From 78a958e2b058f75a9ae8d6582ab567704d792e53 Mon Sep 17 00:00:00 2001 From: Viktor Lofgren Date: Mon, 20 Jan 2025 18:52:14 +0100 Subject: [PATCH] (crawler) Fix broken test that started failing after the search engine moved to a new domain --- .../CrawlingThenConvertingIntegrationTest.java | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/code/processes/converting-process/test/nu/marginalia/converting/CrawlingThenConvertingIntegrationTest.java b/code/processes/converting-process/test/nu/marginalia/converting/CrawlingThenConvertingIntegrationTest.java index ce1dc66b..d7992ed3 100644 --- a/code/processes/converting-process/test/nu/marginalia/converting/CrawlingThenConvertingIntegrationTest.java +++ b/code/processes/converting-process/test/nu/marginalia/converting/CrawlingThenConvertingIntegrationTest.java @@ -201,23 +201,23 @@ public class CrawlingThenConvertingIntegrationTest { @Test public void crawlRobotsTxt() throws Exception { - var specs = new CrawlerMain.CrawlSpecRecord("search.marginalia.nu", 5, - List.of("https://search.marginalia.nu/search?q=hello+world") + var specs = new CrawlerMain.CrawlSpecRecord("marginalia-search.com", 5, + List.of("https://marginalia-search.com/search?q=hello+world") ); CrawledDomain domain = crawl(specs); assertFalse(domain.doc.isEmpty()); assertEquals("OK", domain.crawlerStatus); - assertEquals("search.marginalia.nu", domain.domain); + assertEquals("marginalia-search.com", domain.domain); Set allUrls = domain.doc.stream().map(doc -> doc.url).collect(Collectors.toSet()); - assertTrue(allUrls.contains("https://search.marginalia.nu/search"), "We expect a record for entities that are forbidden"); + assertTrue(allUrls.contains("https://marginalia-search.com/search"), "We expect a record for entities that are forbidden"); var output = process(); assertNotNull(output); assertFalse(output.documents.isEmpty()); - assertEquals(new EdgeDomain("search.marginalia.nu"), output.domain); + assertEquals(new EdgeDomain("marginalia-search.com"), output.domain); assertEquals(DomainIndexingState.ACTIVE, output.state); for (var doc : output.documents) {