mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-02-24 05:18:58 +00:00

Refactoring keyword extraction to extract span information. Modifying the intermediate storage of converted data to use the new slop library, which allows for easier storage of ad-hoc binary data like spans and positions. This is a bit of a katamari damacy commit that ended up dragging along a bunch of other fairly tangentially related changes that are hard to break out into separate commits after the fact. Will push as-is to get back to being able to do more isolated work.
64 lines
1.9 KiB
Groovy
64 lines
1.9 KiB
Groovy
// Gradle plugins applied to this module: Java compilation, the runnable
// application distribution, and the JVM test suite plugin.
plugins {
    id('java')

    id('application')

    id('jvm-test-suite')
}
|
|
|
|
// Pin the Java toolchain to the JVM version declared on the root project
// (rootProject.ext.jvmVersion).
java {
    toolchain {
        languageVersion = JavaLanguageVersion.of(rootProject.ext.jvmVersion)
    }
}
|
|
|
|
// Configuration for the 'application' plugin.
application {
    // Fully qualified name of the entry-point class.
    mainClass.set('nu.marginalia.tools.ExperimentRunnerMain')

    // Name given to the application.
    applicationName = 'experiment-runner'
}
|
|
|
|
// Turn off the distZip task for this module (its 'enabled' flag is set to false).
tasks.distZip.enabled = false
|
|
|
|
// Apply the srcsets.gradle script found in the root project's directory.
// NOTE(review): the script's contents are not visible here; presumably it
// defines the source set layout -- confirm against the script itself.
apply from: "$rootProject.projectDir/srcsets.gradle"
|
|
|
|
// Module dependencies. Declaration order is kept exactly as in the original.
dependencies {
    // In-repo projects: third-party sources, common modules, libraries, processes.
    implementation(project(':third-party:rdrpostagger'))
    implementation(project(':third-party:porterstemmer'))
    implementation(project(':code:common:db'))
    implementation(project(':code:common:model'))
    implementation(project(':code:common:config'))
    implementation(project(':code:common:process'))
    implementation(project(':code:common:service'))
    implementation(project(':code:libraries:language-processing'))
    implementation(project(':code:libraries:term-frequency-dict'))
    implementation(project(':code:processes:converting-process'))
    implementation(project(':code:processes:crawling-process:model'))

    // In-repo feature modules (plus the commons-codec third-party project).
    implementation(project(':third-party:commons-codec'))
    implementation(project(':code:features-crawl:link-parser'))
    implementation(project(':code:features-convert:adblock'))
    implementation(project(':code:features-convert:anchor-keywords'))
    implementation(project(':code:features-convert:topic-detection'))
    implementation(project(':code:features-convert:keyword-extraction'))

    // Entries resolved through the 'libs' version catalog.
    implementation(libs.bundles.slf4j)
    implementation(libs.notnull)

    implementation(libs.guava)
    // Guice is added with the com.google.guava group excluded from its
    // transitive dependencies; guava is declared directly above.
    implementation(dependencies.create(libs.guice.get()) {
        exclude(group: 'com.google.guava')
    })
    implementation(libs.jsoup)
    implementation(libs.trove)
    implementation(libs.fastutil)

    implementation(libs.bundles.nlp)
    implementation(libs.commons.lang3)
    implementation(libs.bundles.mariadb)

    // Test-only dependencies.
    testImplementation(libs.bundles.slf4j.test)
    testImplementation(libs.bundles.junit)
    testImplementation(libs.mockito)
}
|
|
|