mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-24 05:18:58 +00:00
(crawler) Set more lenient parameters for recrawl
This commit is contained in:
parent
fd5a7eac87
commit
8f74dbdbb4
@@ -227,9 +227,9 @@ public class CrawlerRetreiver {
|
|||||||
continue;
|
continue;
|
||||||
|
|
||||||
|
|
||||||
if (recrawled > 10
|
if (recrawled > 5
|
||||||
&& retained > 0.9 * recrawled
|
&& retained > 0.9 * recrawled
|
||||||
&& Math.random() < 0.75)
|
&& Math.random() < 0.9)
|
||||||
{
|
{
|
||||||
// Since it looks like most of these documents haven't changed,
|
// Since it looks like most of these documents haven't changed,
|
||||||
// we'll load the documents directly; but we do this in a random
|
// we'll load the documents directly; but we do this in a random
|
||||||
|
Loading…
Reference in New Issue
Block a user