Update the URL queue earlier
This commit is contained in:
parent
0d33b4f68f
commit
7c14cd99f8
2 changed files with 5 additions and 1 deletion
|
@@ -24,6 +24,10 @@ def run(data_path: str, url_queue: Queue):
|
|||
url_db.create_tables()
|
||||
|
||||
initialize_url_queue(url_queue)
|
||||
try:
|
||||
update_url_queue(url_queue)
|
||||
except Exception:
|
||||
logger.exception("Error updating URL queue")
|
||||
historical.run()
|
||||
index_path = Path(data_path) / INDEX_NAME
|
||||
batch_cache = BatchCache(Path(data_path) / BATCH_DIR_NAME)
|
||||
|
|
|
@@ -4,7 +4,7 @@ from mwmbl.crawler.app import get_batches_for_date
|
|||
from mwmbl.database import Database
|
||||
from mwmbl.indexer.indexdb import BatchInfo, BatchStatus, IndexDatabase
|
||||
|
||||
-DAYS = 66
|
||||
+DAYS = 20
|
||||
|
||||
|
||||
def run():
|
||||
|
|
Loading…
Reference in a new issue