mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-24 05:18:58 +00:00
Remove sitemap related log spam
This commit is contained in:
parent
7d741ff499
commit
d167ad2017
@@ -225,8 +225,6 @@ public class CrawlerRetreiver {
|
|||||||
checkedSitemaps.add(url.path);
|
checkedSitemaps.add(url.path);
|
||||||
|
|
||||||
crawlFrontier.addAllToQueue(sitemap);
|
crawlFrontier.addAllToQueue(sitemap);
|
||||||
|
|
||||||
sitemap.forEach(u -> System.out.println("u" + u));
|
|
||||||
}
|
}
|
||||||
|
|
||||||
logger.info("Queue is now {}", crawlFrontier.queueSize());
|
logger.info("Queue is now {}", crawlFrontier.queueSize());
|
||||||
|
@@ -6,6 +6,7 @@ import org.slf4j.Logger;
|
|||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
import javax.inject.Singleton;
|
import javax.inject.Singleton;
|
||||||
|
import java.io.FileNotFoundException;
|
||||||
import java.util.*;
|
import java.util.*;
|
||||||
|
|
||||||
@Singleton
|
@Singleton
|
||||||
@@ -20,6 +21,9 @@ public class SitemapRetriever {
|
|||||||
try {
|
try {
|
||||||
return sitemapToUrls(parser.parseSiteMap(sitemapUrl.asURL()));
|
return sitemapToUrls(parser.parseSiteMap(sitemapUrl.asURL()));
|
||||||
}
|
}
|
||||||
|
catch (FileNotFoundException ex) {
|
||||||
|
return Collections.emptyList();
|
||||||
|
}
|
||||||
catch (UnknownFormatException ex) {
|
catch (UnknownFormatException ex) {
|
||||||
logger.debug("Unknown sitemap format: {}", sitemapUrl);
|
logger.debug("Unknown sitemap format: {}", sitemapUrl);
|
||||||
return Collections.emptyList();
|
return Collections.emptyList();
|
||||||
|
Loading…
Reference in New Issue
Block a user