Remove sitemap-related log spam

This commit is contained in:
Viktor Lofgren 2023-06-27 13:59:47 +02:00
parent 7d741ff499
commit d167ad2017
2 changed files with 4 additions and 2 deletions

View File

@@ -225,8 +225,6 @@ public class CrawlerRetreiver {
checkedSitemaps.add(url.path);
crawlFrontier.addAllToQueue(sitemap);
sitemap.forEach(u -> System.out.println("u" + u));
}
logger.info("Queue is now {}", crawlFrontier.queueSize());

View File

@@ -6,6 +6,7 @@ import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import javax.inject.Singleton;
import java.io.FileNotFoundException;
import java.util.*;
@Singleton
@@ -20,6 +21,9 @@ public class SitemapRetriever {
try {
return sitemapToUrls(parser.parseSiteMap(sitemapUrl.asURL()));
}
catch (FileNotFoundException ex) {
return Collections.emptyList();
}
catch (UnknownFormatException ex) {
logger.debug("Unknown sitemap format: {}", sitemapUrl);
return Collections.emptyList();