mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-24 05:18:58 +00:00
Better SiteWords extraction
This commit is contained in:
parent
5558af148e
commit
65b0ff26fc
@@ -33,8 +33,7 @@ public class SiteWords {
|
||||
Set<String> commonSiteWords = new HashSet<>(10);
|
||||
|
||||
commonSiteWords.addAll(commonKeywordExtractor.getCommonSiteWords(processedDomain,
|
||||
EdgePageWordFlags.Subjects,
|
||||
EdgePageWordFlags.TfIdfHigh));
|
||||
EdgePageWordFlags.Subjects));
|
||||
|
||||
commonSiteWords.addAll(commonKeywordExtractor.getCommonSiteWords(processedDomain,
|
||||
EdgePageWordFlags.Title));
|
||||
|
Loading…
Reference in New Issue
Block a user