From fd5a7eac87a6067c0362971160b9844e57c61303 Mon Sep 17 00:00:00 2001
From: Viktor Lofgren
Date: Mon, 30 Oct 2023 11:34:16 +0100
Subject: [PATCH] (crawler) Exit crawler retriever on thread interrupted

---
 .../java/nu/marginalia/crawl/retreival/CrawlerRetreiver.java | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/code/processes/crawling-process/src/main/java/nu/marginalia/crawl/retreival/CrawlerRetreiver.java b/code/processes/crawling-process/src/main/java/nu/marginalia/crawl/retreival/CrawlerRetreiver.java
index 42f5960e..e569d1cf 100644
--- a/code/processes/crawling-process/src/main/java/nu/marginalia/crawl/retreival/CrawlerRetreiver.java
+++ b/code/processes/crawling-process/src/main/java/nu/marginalia/crawl/retreival/CrawlerRetreiver.java
@@ -149,7 +149,8 @@ public class CrawlerRetreiver {
 
         while (!crawlFrontier.isEmpty()
                 && !crawlFrontier.isCrawlDepthReached()
-                && errorCount < MAX_ERRORS)
+                && errorCount < MAX_ERRORS
+                && !Thread.interrupted())
         {
             var top = crawlFrontier.takeNextUrl();
 