mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-23 13:09:00 +00:00
(crawler) Set more lenient parameters for recrawl
This commit is contained in:
parent
fd5a7eac87
commit
8f74dbdbb4
@@ -227,9 +227,9 @@ public class CrawlerRetreiver {
|
||||
continue;
|
||||
|
||||
|
||||
if (recrawled > 10
|
||||
if (recrawled > 5
|
||||
&& retained > 0.9 * recrawled
|
||||
&& Math.random() < 0.75)
|
||||
&& Math.random() < 0.9)
|
||||
{
|
||||
// Since it looks like most of these documents haven't changed,
|
||||
// we'll load the documents directly; but we do this in a random
|
||||
|
Loading…
Reference in New Issue
Block a user