Crawl tasks are now fetched by the crawlers instead of pushed by the server

2025-12-15 23:59:05 +00:00 · 2018-07-14 17:31:18 -04:00
parent d9e9f53f92
commit fe1d29aaea
20 changed files with 376 additions and 749 deletions
--- a/README.md
+++ b/README.md
@@ -22,9 +22,6 @@ FLASK_SECRET = ""
 RESULTS_PER_PAGE = (25, 50, 100, 250, 500, 1000)
 # Headers for http crawler
 HEADERS = {}
-# Token for the crawl server, used by the server to communicate to the crawl server
-CRAWL_SERVER_TOKEN = ""
-CRAWL_SERVER_PORT = 5001
 # Number of crawler instances (one per task)
 CRAWL_SERVER_PROCESSES = 3
 # Number of threads per crawler instance
@@ -33,6 +30,9 @@ CRAWL_SERVER_THREADS = 20
 SUBMIT_FTP = False
 # Allow http(s) websites in /submit
 SUBMIT_HTTP = True
+
+SERVER_URL = "http://localhost/api"
+API_TOKEN = "5817926d-f2f9-4422-a411-a98f1bfe4b6c"
 ```

 ## Running the crawl server