mirror of
https://github.com/simon987/od-database.git
synced 2025-04-19 10:26:44 +00:00
Minor adjustments
This commit is contained in:
parent
5fdf35ab56
commit
6cdc4b87d0
@ -56,11 +56,11 @@ for comment in subreddit.comments(limit=50):
|
|||||||
|
|
||||||
if website and not scanned:
|
if website and not scanned:
|
||||||
# in progress
|
# in progress
|
||||||
|
print(url)
|
||||||
print("In progress")
|
print("In progress")
|
||||||
continue
|
continue
|
||||||
|
|
||||||
if website and db.website_has_been_scanned(url):
|
if website and db.website_has_been_scanned(url):
|
||||||
bot.log_crawl(comment.id)
|
|
||||||
handle_exact_repost(website.id, comment)
|
handle_exact_repost(website.id, comment)
|
||||||
continue
|
continue
|
||||||
|
|
||||||
@ -70,13 +70,11 @@ for comment in subreddit.comments(limit=50):
|
|||||||
print("Parent in progress")
|
print("Parent in progress")
|
||||||
continue
|
continue
|
||||||
if website_id and db.website_has_been_scanned(url):
|
if website_id and db.website_has_been_scanned(url):
|
||||||
bot.log_crawl(comment.id)
|
|
||||||
handle_subdir_repost(website_id, comment)
|
handle_subdir_repost(website_id, comment)
|
||||||
continue
|
continue
|
||||||
|
|
||||||
if not od_util.is_valid_url(url):
|
if not od_util.is_valid_url(url):
|
||||||
print("Skipping reddit comment: Invalid url")
|
print("Skipping reddit comment: Invalid url")
|
||||||
bot.log_crawl(comment.id)
|
|
||||||
bot.reply(comment, "Hello, " + str(comment.author) + ". Unfortunately it seems that the link you "
|
bot.reply(comment, "Hello, " + str(comment.author) + ". Unfortunately it seems that the link you "
|
||||||
"provided: `" + url + "` is not valid. Make sure that you include the"
|
"provided: `" + url + "` is not valid. Make sure that you include the"
|
||||||
"'`http(s)://` prefix. \n")
|
"'`http(s)://` prefix. \n")
|
||||||
@ -84,24 +82,21 @@ for comment in subreddit.comments(limit=50):
|
|||||||
|
|
||||||
if od_util.is_blacklisted(url):
|
if od_util.is_blacklisted(url):
|
||||||
print("Skipping reddit comment: blacklisted")
|
print("Skipping reddit comment: blacklisted")
|
||||||
bot.log_crawl(comment.id)
|
|
||||||
bot.reply(comment, "Hello, " + str(comment.author) + ". Unfortunately my programmer has "
|
bot.reply(comment, "Hello, " + str(comment.author) + ". Unfortunately my programmer has "
|
||||||
"blacklisted this website. If you think that this is an error, please "
|
"blacklisted this website. If you think that this is an error, please "
|
||||||
"[contact him](https://www.reddit.com/message/compose?to=Hexahedr_n)")
|
"[contact him](https://old.reddit.com/message/compose?to=Hexahedr_n)")
|
||||||
continue
|
continue
|
||||||
|
|
||||||
if not od_util.is_od(url):
|
if not od_util.is_od(url):
|
||||||
print("Skipping reddit comment: Not an OD")
|
print("Skipping reddit comment: Not an OD")
|
||||||
print(url)
|
print(url)
|
||||||
bot.log_crawl(comment.id)
|
|
||||||
bot.reply(comment, "Hello, " + str(comment.author) + ". Unfortunately it seems that the link you "
|
bot.reply(comment, "Hello, " + str(comment.author) + ". Unfortunately it seems that the link you "
|
||||||
"provided: `" + url + "` does not point to an open directory. This could also"
|
"provided: `" + url + "` does not point to an open directory. This could also"
|
||||||
" mean that the website is not responding (in which case, feel free to retry in "
|
" mean that the website is not responding (in which case, feel free to retry in "
|
||||||
"a few minutes). If you think that this is an error, please "
|
"a few minutes). If you think that this is an error, please "
|
||||||
"[contact my programmer](https://www.reddit.com/message/compose?to=Hexahedr_n)")
|
"[contact my programmer](https://old.reddit.com/message/compose?to=Hexahedr_n)")
|
||||||
continue
|
continue
|
||||||
|
|
||||||
bot.log_crawl(comment.id)
|
|
||||||
web_id = db.insert_website(Website(url, "localhost", "reddit_bot"))
|
web_id = db.insert_website(Website(url, "localhost", "reddit_bot"))
|
||||||
db.enqueue(web_id, reddit_comment_id=comment.id, priority=2) # Medium priority for reddit comments
|
db.enqueue(web_id, reddit_comment_id=comment.id, priority=2) # Medium priority for reddit comments
|
||||||
print("Queued comment post: " + str(web_id))
|
print("Queued comment post: " + str(web_id))
|
||||||
@ -122,7 +117,6 @@ for s in submissions:
|
|||||||
website = db.get_website_by_url(url)
|
website = db.get_website_by_url(url)
|
||||||
|
|
||||||
if website:
|
if website:
|
||||||
bot.log_crawl(s.id)
|
|
||||||
handle_exact_repost(website.id, s)
|
handle_exact_repost(website.id, s)
|
||||||
|
|
||||||
website_id = db.website_exists(url)
|
website_id = db.website_exists(url)
|
||||||
@ -146,7 +140,6 @@ for s in submissions:
|
|||||||
bot.log_crawl(s.id)
|
bot.log_crawl(s.id)
|
||||||
continue
|
continue
|
||||||
|
|
||||||
bot.log_crawl(s.id)
|
|
||||||
web_id = db.insert_website(Website(url, "localhost", "reddit_bot"))
|
web_id = db.insert_website(Website(url, "localhost", "reddit_bot"))
|
||||||
db.enqueue(web_id, reddit_post_id=s.id, priority=3) # Higher priority for reddit posts
|
db.enqueue(web_id, reddit_post_id=s.id, priority=3) # Higher priority for reddit posts
|
||||||
print("Queued reddit post: " + str(web_id))
|
print("Queued reddit post: " + str(web_id))
|
||||||
|
@ -43,9 +43,9 @@ class RedditBot:
|
|||||||
try:
|
try:
|
||||||
# Double check has_crawled
|
# Double check has_crawled
|
||||||
if not self.has_crawled(reddit_obj.id):
|
if not self.has_crawled(reddit_obj.id):
|
||||||
# reddit_obj.reply(comment)
|
reddit_obj.reply(comment)
|
||||||
print("Skipping comment " + comment)
|
|
||||||
self.log_crawl(reddit_obj.id)
|
self.log_crawl(reddit_obj.id)
|
||||||
|
print("Reply to " + reddit_obj.id)
|
||||||
break
|
break
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
print("Waiting 5 minutes: " + str(e))
|
print("Waiting 5 minutes: " + str(e))
|
||||||
|
Loading…
x
Reference in New Issue
Block a user