mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-23 21:18:58 +00:00
Tidy up
This commit is contained in:
parent
495e6a1639
commit
65aee9419d
@ -17,44 +17,21 @@ import java.util.stream.IntStream;
|
|||||||
import it.unimi.dsi.fastutil.ints.IntArrays;
|
import it.unimi.dsi.fastutil.ints.IntArrays;
|
||||||
|
|
||||||
public abstract class RankingAlgorithm {
|
public abstract class RankingAlgorithm {
|
||||||
final TIntObjectHashMap<RankingDomainData> domainsById = new TIntObjectHashMap<>();
|
protected final TIntObjectHashMap<RankingDomainData> domainsById = new TIntObjectHashMap<>();
|
||||||
final TIntIntHashMap domainIndexToId = new TIntIntHashMap();
|
protected final TIntIntHashMap domainIndexToId = new TIntIntHashMap();
|
||||||
final TIntIntHashMap domainIdToIndex = new TIntIntHashMap();
|
protected final TIntIntHashMap domainIdToIndex = new TIntIntHashMap();
|
||||||
|
|
||||||
TIntArrayList[] linkDataSrc2Dest;
|
protected TIntArrayList[] linkDataSrc2Dest;
|
||||||
TIntArrayList[] linkDataDest2Src;
|
protected TIntArrayList[] linkDataDest2Src;
|
||||||
|
|
||||||
public final Set<String> originDomains = new HashSet<>();
|
public final Set<String> originDomains = new HashSet<>();
|
||||||
public final Set<Integer> originDomainIds = new HashSet<>();
|
public final Set<Integer> originDomainIds = new HashSet<>();
|
||||||
|
|
||||||
private int maxKnownUrls = Integer.MAX_VALUE;
|
private int maxKnownUrls = Integer.MAX_VALUE;
|
||||||
|
|
||||||
private static final boolean getNames = true;
|
|
||||||
|
|
||||||
private final Logger logger = LoggerFactory.getLogger(getClass());
|
private final Logger logger = LoggerFactory.getLogger(getClass());
|
||||||
private RankingDomainFetcher domains;
|
|
||||||
|
|
||||||
public static void main(String... args) throws IOException {
|
private final RankingDomainFetcher domains;
|
||||||
var ds = new DatabaseModule().provideConnection();
|
|
||||||
var domains = new RankingDomainFetcher(ds, new EdgeDomainBlacklistImpl(ds));
|
|
||||||
|
|
||||||
var rpr = new BuggyReversePageRank(domains, "wiki.xxiivv.com");
|
|
||||||
var spr = new BuggyStandardPageRank(domains, "memex.marginalia.nu");
|
|
||||||
|
|
||||||
var rankVector = spr.pageRankVector();
|
|
||||||
var norm = rankVector.norm();
|
|
||||||
rpr.pageRank(i -> rankVector.get(i) / norm, 25).forEach(i -> {
|
|
||||||
System.out.println(spr.domainNameFromId(i));
|
|
||||||
return true;
|
|
||||||
});
|
|
||||||
}
|
|
||||||
|
|
||||||
public String domainNameFromId(int id) {
|
|
||||||
return domainsById.get(id).name;
|
|
||||||
}
|
|
||||||
public boolean isPeripheral(int id) {
|
|
||||||
return domainsById.get(id).peripheral;
|
|
||||||
}
|
|
||||||
|
|
||||||
public RankingAlgorithm(RankingDomainFetcher domains, String... origins) {
|
public RankingAlgorithm(RankingDomainFetcher domains, String... origins) {
|
||||||
this.domains = domains;
|
this.domains = domains;
|
||||||
|
Loading…
Reference in New Issue
Block a user