Reduce parallelism to avoid overwhelming server with 404s

2025-12-27 17:26:44 +00:00 · 2025-12-27 17:26:44 +00:00 · 069205946a
commit 069205946a
parent 73529bec16
1 changed file with 1 addition and 1 deletion
--- a/emblem5/ai/fetch-scans.py
+++ b/emblem5/ai/fetch-scans.py
@@ -65,7 +65,7 @@ class ScanDataFetcher(object):
        if sample_rate:
            fetch_backlog = random.sample(fetch_backlog, int(len(fetch_backlog) * sample_rate))
        logger.info(f'fetch_backlog: {len(fetch_backlog)}')
-        pool = mp.Pool(mp.cpu_count() * 4)
+        pool = mp.Pool(min(8, mp.cpu_count()))
        counts = defaultdict(int)
        for r in tqdm(pool.imap_unordered(self.fetch_one_scan, fetch_backlog), total=len(fetch_backlog)):
            counts[r] += 1