From f140e7d7c7b3c621722376a9ee753c8386f2efc9 Mon Sep 17 00:00:00 2001 From: Viktor Lofgren Date: Wed, 21 Jun 2023 17:30:14 +0200 Subject: [PATCH] Use a default tag for unset or invalid generators. --- .../processor/logic/DocumentGeneratorExtractor.java | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/code/processes/converting-process/src/main/java/nu/marginalia/converting/processor/logic/DocumentGeneratorExtractor.java b/code/processes/converting-process/src/main/java/nu/marginalia/converting/processor/logic/DocumentGeneratorExtractor.java index 2f8d5159..f4506100 100644 --- a/code/processes/converting-process/src/main/java/nu/marginalia/converting/processor/logic/DocumentGeneratorExtractor.java +++ b/code/processes/converting-process/src/main/java/nu/marginalia/converting/processor/logic/DocumentGeneratorExtractor.java @@ -9,6 +9,8 @@ import java.util.List; /** Extract keywords for the document meta generator tag */ public class DocumentGeneratorExtractor { + private final String defaultValue = "unset"; + public List generatorCleaned(Document doc) { String generator = doc @@ -19,11 +21,11 @@ public class DocumentGeneratorExtractor { generator = trim(generator); if (generator.isBlank()) - return Collections.emptyList(); + return List.of(defaultValue); String[] parts = StringUtils.split(generator, " ,:!"); if (parts.length == 0) - return Collections.emptyList(); + return List.of(defaultValue); int slashIdx = parts[0].indexOf('/'); if (slashIdx >= 0) { @@ -32,7 +34,7 @@ public class DocumentGeneratorExtractor { } if (parts.length > 3) { - return Collections.emptyList(); // if it's still very long after trim(), it's probably a custom hand written message + return List.of(defaultValue); // if it's still very long after trim(), it's probably a custom hand written message } switch (parts[0]) {