mirror of
https://github.com/wassname/arXiv_abstract_bot.git
synced 2026-06-27 15:14:19 +08:00
only posts 1h old and >10 points
This commit is contained in:
@@ -2,6 +2,7 @@
|
||||
.arxiv_bot.*
|
||||
.vscode/*
|
||||
vars_copy.sh
|
||||
vars_*.sh
|
||||
|
||||
# Byte-compiled / optimized / DLL files
|
||||
__pycache__/
|
||||
|
||||
+62
-55
@@ -17,7 +17,7 @@ logger = get_logger()
|
||||
# from https://github.com/arxiv-vanity/arxiv-vanity/blob/master/arxiv_vanity/scraper/arxiv_ids.py
|
||||
ARXIV_ID_PATTERN = r'([a-z\-]+(?:\.[A-Z]{2})?/\d{7}|\d+\.\d+)(v\d+)?'
|
||||
ARXIV_URL_RE = re.compile(r'arxiv.org/[^\/]+/({})(\.pdf)?'.format(ARXIV_ID_PATTERN), re.I)
|
||||
# OPENREVIEW_URL_RE = re.compile(r'openreview.net/./', re.I)
|
||||
OPENREVIEW_URL_RE = re.compile(r'openreview.net/', re.I)
|
||||
# OPENREVIEW_URL_RE = re.compile(r'distill.pub/./', re.I)
|
||||
|
||||
r = get_bot()
|
||||
@@ -25,14 +25,16 @@ r = get_bot()
|
||||
# source subreddits
|
||||
subreddits = [
|
||||
r.subreddit('machinelearning'),
|
||||
# r.subreddit('reinforcementlearning')
|
||||
# r.subreddit('LanguageTechnology')
|
||||
r.subreddit('reinforcementlearning')
|
||||
r.subreddit('LanguageTechnology')
|
||||
]
|
||||
# target_subreddit = r.subreddit('mlresearch')
|
||||
# target_subreddit = r.subreddit('testingground4bots')
|
||||
|
||||
SLEEP = 600
|
||||
LIMIT_CHECK=20
|
||||
LIMIT_CHECK = 20
|
||||
MIN_SECONDS = 60 * 60
|
||||
MIN_SCORE = 10
|
||||
|
||||
|
||||
if r.read_only == False:
|
||||
@@ -45,68 +47,73 @@ def comment():
|
||||
try:
|
||||
all_posts = subreddit.new(limit=LIMIT_CHECK)
|
||||
for post in all_posts:
|
||||
match = ARXIV_URL_RE.search(post.url)
|
||||
if match:
|
||||
arxiv_id = match.group(1)
|
||||
match = ARXIV_URL_RE.search(post.url) or OPENREVIEW_URL_RE.search(post.url)
|
||||
|
||||
ts = time.time() - post.created_utc
|
||||
if match and (post.score > MIN_SCORE) and (ts > MIN_SECONDS):
|
||||
# arxiv_id = match.group(1)
|
||||
|
||||
# crosspost
|
||||
print('found', arxiv_id)
|
||||
|
||||
# print('found', arxiv_id)
|
||||
|
||||
if cache.get(post.id) and cache.get(post.id) is 'T':
|
||||
print ("Parsed this post already: %s"%(post.permalink))
|
||||
print("Parsed this post already: %s. %s" % (post.permalink, post.id))
|
||||
continue
|
||||
else:
|
||||
xpost(['r/researchml'], post)
|
||||
print("posting", post, post.id, post.score, ts)
|
||||
post.crosspost('researchml')
|
||||
# xpost(['r/researchml'], post)
|
||||
cache[post.id]='T'
|
||||
time.sleep(10)
|
||||
time.sleep(60)
|
||||
except Exception as error:
|
||||
logger.error("Failed to scrape")
|
||||
print(error)
|
||||
|
||||
def xpost(subs, originalpost):
|
||||
# originalpost = where.submission
|
||||
newtitle = "(X-Post r/" + str(originalpost.subreddit.display_name) + ") " + originalpost.title
|
||||
print("New post: " + str(newtitle))
|
||||
link = "https://www.reddit.com" + str(originalpost.permalink)
|
||||
workedsubs = []
|
||||
failedsubs = []
|
||||
wasError = False
|
||||
for workingsub in subs:
|
||||
exists = True
|
||||
try:
|
||||
r.subreddits.search_by_name(workingsub[2:], exact=True)
|
||||
except NotFound:
|
||||
logging.error("Failed to post")
|
||||
exists = False
|
||||
if exists == True:
|
||||
subreddit = r.subreddit(workingsub[2:])
|
||||
try:
|
||||
subreddit.submit(newtitle, url=link, resubmit=True, send_replies=False)
|
||||
workedsubs.append(str(workingsub))
|
||||
print("Posting: " + str(newtitle) + " to " + str(workingsub))
|
||||
except praw.exceptions.APIException:
|
||||
logging.error("Failed to post")
|
||||
wasError = True
|
||||
break
|
||||
else:
|
||||
failedsubs.append(str(workingsub))
|
||||
if not wasError:
|
||||
print(workedsubs,failedsubs)
|
||||
# reply(workedsubs,failedsubs,where)
|
||||
pass
|
||||
else:
|
||||
response = ""
|
||||
if workedsubs:
|
||||
response = "I was able to crosspost in "
|
||||
for i in workedsubs:
|
||||
response = response + str(i) + " and "
|
||||
response = response[:-5] + ", but I was rate-limited on the others."
|
||||
print(response)
|
||||
else:
|
||||
response = "Sorry, I was rate-limited, and I couldn't post."
|
||||
print(response)
|
||||
# where.reply(str(response) + " Make sure to give me karma to prevent that in the future.")
|
||||
# def xpost(subs, originalpost):
|
||||
# # TODO native xport
|
||||
# # originalpost = where.submission
|
||||
# newtitle = "(X-Post r/" + str(originalpost.subreddit.display_name) + ") " + originalpost.title
|
||||
# print("New post: " + str(newtitle))
|
||||
# link = "https://www.reddit.com" + str(originalpost.permalink)
|
||||
# workedsubs = []
|
||||
# failedsubs = []
|
||||
# wasError = False
|
||||
# for workingsub in subs:
|
||||
# exists = True
|
||||
# try:
|
||||
# r.subreddits.search_by_name(workingsub[2:], exact=True)
|
||||
# except NotFound:
|
||||
# logging.error("Failed to post")
|
||||
# exists = False
|
||||
# if exists == True:
|
||||
# subreddit = r.subreddit(workingsub[2:])
|
||||
# try:
|
||||
# submission.crosspost(subreddit)
|
||||
# subreddit.submit(newtitle, url=link, resubmit=True, send_replies=False)
|
||||
# workedsubs.append(str(workingsub))
|
||||
# print("Posting: " + str(newtitle) + " to " + str(workingsub))
|
||||
# except praw.exceptions.APIException:
|
||||
# logging.error("Failed to post")
|
||||
# wasError = True
|
||||
# break
|
||||
# else:
|
||||
# failedsubs.append(str(workingsub))
|
||||
# if not wasError:
|
||||
# print(workedsubs,failedsubs)
|
||||
# # reply(workedsubs,failedsubs,where)
|
||||
# pass
|
||||
# else:
|
||||
# response = ""
|
||||
# if workedsubs:
|
||||
# response = "I was able to crosspost in "
|
||||
# for i in workedsubs:
|
||||
# response = response + str(i) + " and "
|
||||
# response = response[:-5] + ", but I was rate-limited on the others."
|
||||
# print(response)
|
||||
# else:
|
||||
# response = "Sorry, I was rate-limited, and I couldn't post."
|
||||
# print(response)
|
||||
# # where.reply(str(response) + " Make sure to give me karma to prevent that in the future.")
|
||||
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user