Update the URL queue earlier

This commit is contained in:
Daoud Clarke 2022-12-31 23:37:59 +00:00
parent 0d33b4f68f
commit 7c14cd99f8
2 changed files with 5 additions and 1 deletion

View file

@@ -24,6 +24,10 @@ def run(data_path: str, url_queue: Queue):
url_db.create_tables()
initialize_url_queue(url_queue)
try:
update_url_queue(url_queue)
except Exception:
logger.exception("Error updating URL queue")
historical.run()
index_path = Path(data_path) / INDEX_NAME
batch_cache = BatchCache(Path(data_path) / BATCH_DIR_NAME)

View file

@@ -4,7 +4,7 @@ from mwmbl.crawler.app import get_batches_for_date
from mwmbl.database import Database
from mwmbl.indexer.indexdb import BatchInfo, BatchStatus, IndexDatabase
-DAYS = 66
+DAYS = 20
def run():