Added manual mode and HTTPS support

This commit is contained in:
simon
2018-02-07 19:51:06 -05:00
parent 8e1f4543fd
commit a2f671f0f5
13 changed files with 217 additions and 143 deletions

View File

@@ -39,56 +39,42 @@ class TaskQueueTest(TestCase):
if os.path.isfile("task_queue_test.txt"):
os.remove("task_queue_test.txt")
def test_push_pop_test(self):
if os.path.isfile("task_queue_test.txt"):
os.remove("task_queue_test.txt")
tq = TaskQueue("task_queue_test.txt")
tq.push(CrawTask("http://awebsite.com/", "postid", "a title"))
task1 = tq.pop()
self.assertEqual(tq.pop(), None)
self.assertEqual(task1.url, "http://awebsite.com/")
self.assertEqual(task1.post_id, "postid")
def test_persistence(self):
if os.path.isfile("task_queue_test.txt"):
os.remove("task_queue_test.txt")
tq = TaskQueue("task_queue_test.txt")
tq.push(CrawTask("http://awebsite.com/", "postid", "a title"))
tq2 = TaskQueue("task_queue_test.txt")
task = tq2.pop()
self.assertEqual(task.url, "http://awebsite.com/")
self.assertEqual(task.post_id, "postid")
def test_multiple_tasks(self):
if os.path.isfile("task_queue_test.txt"):
os.remove("task_queue_test.txt")
tq = TaskQueue("task_queue_test.txt")
tq.push(CrawTask("http://awebsite.com/", "postid", "a title"))
tq.push(CrawTask("http://awebsite.com/", "postid", "a title"))
tq.push(CrawTask("http://awebsite.com/", "postid", "a title"))
self.assertIsNotNone(tq.pop())
self.assertIsNotNone(tq.pop())
self.assertIsNotNone(tq.pop())
self.assertIsNone(tq.pop())
def test_is_queued(self):
if os.path.isfile("task_queue_test.txt"):
os.remove("task_queue_test.txt")
tq = TaskQueue("task_queue_test.txt")
tq.push(CrawTask("http://awebsite.com/", "postid", "a title"))
self.assertTrue(tq.is_queued("postid"))
self.assertFalse(tq.is_queued("123456"))
# def test_push_pop_test(self):
#
# if os.path.isfile("task_queue_test.txt"):
# os.remove("task_queue_test.txt")
#
# tq = TaskQueue("task_queue_test.txt")
# tq.push(CrawTask(dict()))
#
# task1 = tq.pop()
#
# self.assertEqual(tq.pop(), None)
# self.assertEqual(task1.submission.url, "http://awebsite.com/")
# self.assertEqual(task1.submission.post_id, "postid")
#
# def test_multiple_tasks(self):
# if os.path.isfile("task_queue_test.txt"):
# os.remove("task_queue_test.txt")
#
# tq = TaskQueue("task_queue_test.txt")
#
# tq.push(CrawTask(dict()))
# tq.push(CrawTask(dict()))
# tq.push(CrawTask(dict()))
#
# self.assertIsNotNone(tq.pop())
# self.assertIsNotNone(tq.pop())
# self.assertIsNotNone(tq.pop())
# self.assertIsNone(tq.pop())
#
# def test_is_queued(self):
# if os.path.isfile("task_queue_test.txt"):
# os.remove("task_queue_test.txt")
#
# tq = TaskQueue("task_queue_test.txt")
#
# tq.push(CrawTask({id: "postid"}))
#
# self.assertTrue(tq.is_queued("postid"))
# self.assertFalse(tq.is_queued("123456"))