From 17db23c2c1ef4460ec90750cde1d9f411f2ef15a Mon Sep 17 00:00:00 2001 From: Viktor Lofgren Date: Fri, 7 Jul 2023 19:44:57 +0200 Subject: [PATCH] Minor: Better error handling in crawled domain reader --- .../java/nu/marginalia/crawling/io/CrawledDomainReader.java | 2 +- .../main/java/nu/marginalia/crawl/CrawlJobExtractorMain.java | 2 -- 2 files changed, 1 insertion(+), 3 deletions(-) diff --git a/code/process-models/crawling-model/src/main/java/nu/marginalia/crawling/io/CrawledDomainReader.java b/code/process-models/crawling-model/src/main/java/nu/marginalia/crawling/io/CrawledDomainReader.java index 47dec05f..9c293af7 100644 --- a/code/process-models/crawling-model/src/main/java/nu/marginalia/crawling/io/CrawledDomainReader.java +++ b/code/process-models/crawling-model/src/main/java/nu/marginalia/crawling/io/CrawledDomainReader.java @@ -64,7 +64,7 @@ public class CrawledDomainReader { return Optional.of(read(path)); } catch (Exception ex) { - logger.warn("Failed to read domain", ex); + logger.warn("Failed to read domain " + path, ex); return Optional.empty(); } } diff --git a/code/tools/crawl-job-extractor/src/main/java/nu/marginalia/crawl/CrawlJobExtractorMain.java b/code/tools/crawl-job-extractor/src/main/java/nu/marginalia/crawl/CrawlJobExtractorMain.java index e8de4de6..e898293b 100644 --- a/code/tools/crawl-job-extractor/src/main/java/nu/marginalia/crawl/CrawlJobExtractorMain.java +++ b/code/tools/crawl-job-extractor/src/main/java/nu/marginalia/crawl/CrawlJobExtractorMain.java @@ -1,6 +1,5 @@ package nu.marginalia.crawl; -import com.zaxxer.hikari.HikariDataSource; import nu.marginalia.crawling.model.spec.CrawlingSpecification; import nu.marginalia.model.EdgeDomain; import nu.marginalia.db.DomainBlacklistImpl; @@ -10,7 +9,6 @@ import nu.marginalia.service.module.DatabaseModule; import java.io.IOException; import java.nio.file.Files; import java.nio.file.Path; -import java.sql.SQLException; import java.util.*; import java.util.stream.Stream;