From 4883632e373370d282c9ce1a0dfb713ea4fb4a64 Mon Sep 17 00:00:00 2001 From: ImBenji Date: Sat, 18 Apr 2026 14:05:29 +0100 Subject: [PATCH] add Google News integration and enhance crawler capabilities --- config.json | 3 +-- src/scheduler.js | 3 ++- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/config.json b/config.json index 7eee522..e9b36a1 100644 --- a/config.json +++ b/config.json @@ -42,8 +42,7 @@ "googleNews": "0 * * * *" }, "contentBackfill": { - "cron": "0 * * * *", - "batchSize": -1 + "concurrency": 10 }, "googleNews": { "queries": [ diff --git a/src/scheduler.js b/src/scheduler.js index 32c3c5c..8ad2eba 100644 --- a/src/scheduler.js +++ b/src/scheduler.js @@ -97,7 +97,8 @@ function startScheduler() { } try { - await backfillMissingContent(); + const concurrency = Number(config.contentBackfill?.concurrency) || 5; + await backfillMissingContent(-1, concurrency); } catch (error) { console.error('content backfill failed:', error); }