mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-24 05:18:58 +00:00

This update eliminates all occurrences of the OpenNLP token model from the setup script, configuration, and test files, as this model file is no longer used.
38 lines
1.3 KiB
Java
38 lines
1.3 KiB
Java
package nu.marginalia.util;
|
|
|
|
import nu.marginalia.LanguageModels;
|
|
import nu.marginalia.WmsaHome;
|
|
|
|
import java.nio.file.Files;
|
|
import java.nio.file.Path;
|
|
import java.util.Optional;
|
|
|
|
public class TestLanguageModels {
|
|
private static final Path LANGUAGE_MODELS_DEFAULT = WmsaHome.getHomePath().resolve("model");
|
|
|
|
public static Path getLanguageModelsPath() {
|
|
final Path languageModelsHome = Optional.ofNullable(System.getenv("LANGUAGE_MODELS_HOME"))
|
|
.map(Path::of)
|
|
.orElse(LANGUAGE_MODELS_DEFAULT);
|
|
|
|
if (!Files.isDirectory(languageModelsHome)) {
|
|
throw new IllegalStateException("Could not find $LANGUAGE_MODELS_HOME, see doc/language-models.md");
|
|
}
|
|
return languageModelsHome;
|
|
}
|
|
|
|
public static LanguageModels getLanguageModels() {
|
|
|
|
var languageModelsHome = getLanguageModelsPath();
|
|
|
|
return new LanguageModels(
|
|
languageModelsHome.resolve("tfreq-new-algo3.bin"),
|
|
languageModelsHome.resolve("opennlp-sentence.bin"),
|
|
languageModelsHome.resolve("English.RDR"),
|
|
languageModelsHome.resolve("English.DICT"),
|
|
languageModelsHome.resolve("lid.176.ftz"),
|
|
languageModelsHome.resolve("segments.bin")
|
|
);
|
|
}
|
|
}
|