diff --git a/marginalia_nu/src/main/java/nu/marginalia/wmsa/edge/converting/ConverterMain.java b/marginalia_nu/src/main/java/nu/marginalia/wmsa/edge/converting/ConverterMain.java index 61ff0b00..973554d2 100644 --- a/marginalia_nu/src/main/java/nu/marginalia/wmsa/edge/converting/ConverterMain.java +++ b/marginalia_nu/src/main/java/nu/marginalia/wmsa/edge/converting/ConverterMain.java @@ -1,18 +1,19 @@ package nu.marginalia.wmsa.edge.converting; -import com.google.gson.*; +import com.google.common.base.Strings; +import com.google.gson.Gson; import com.google.inject.Guice; import com.google.inject.Inject; import com.google.inject.Injector; +import nu.marginalia.util.ParallelPipe; import nu.marginalia.wmsa.edge.converting.interpreter.Instruction; import nu.marginalia.wmsa.edge.converting.processor.DomainProcessor; import nu.marginalia.wmsa.edge.converting.processor.InstructionsCompiler; import nu.marginalia.wmsa.edge.crawling.CrawlPlanLoader; import nu.marginalia.wmsa.edge.crawling.CrawledDomainReader; -import nu.marginalia.wmsa.edge.crawling.WorkLog; import nu.marginalia.wmsa.edge.crawling.CrawlerSpecificationLoader; +import nu.marginalia.wmsa.edge.crawling.WorkLog; import nu.marginalia.wmsa.edge.crawling.model.CrawledDomain; -import nu.marginalia.util.ParallelPipe; import nu.marginalia.wmsa.edge.model.EdgeCrawlPlan; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -96,6 +97,10 @@ public class ConverterMain { domainToId.forEach((domain, id) -> { String fileName = idToFileName.get(id); + + if (Strings.isNullOrEmpty(fileName)) + return; + Path dest = plan.getCrawledFilePath(fileName); logger.info("{} - {} - {}", domain, id, dest);