Better SiteWords extraction

This commit is contained in:
Viktor Lofgren 2023-01-30 09:42:46 +01:00
parent 5558af148e
commit 65b0ff26fc

View File

@@ -33,8 +33,7 @@ public class SiteWords {
Set<String> commonSiteWords = new HashSet<>(10);
commonSiteWords.addAll(commonKeywordExtractor.getCommonSiteWords(processedDomain,
-EdgePageWordFlags.Subjects,
-EdgePageWordFlags.TfIdfHigh));
+EdgePageWordFlags.Subjects));
commonSiteWords.addAll(commonKeywordExtractor.getCommonSiteWords(processedDomain,
EdgePageWordFlags.Title));