2023-03-04 12:19:01 +00:00
|
|
|
// Gradle plugins applied to this module.
plugins {
    id('java')
    id('application')
    id('jvm-test-suite')
}
|
|
|
|
|
|
|
|
// Select the Java toolchain from the jvmVersion extra property defined on the root project.
java {
    toolchain {
        languageVersion = JavaLanguageVersion.of(rootProject.ext.jvmVersion)
    }
}
|
|
|
|
|
|
|
|
// Application plugin settings: the distribution name and the entry-point class.
application {
    applicationName = 'crawler-process'
    mainClass.set('nu.marginalia.crawl.CrawlerMain')
}
|
|
|
|
|
2023-03-11 10:34:51 +00:00
|
|
|
// Disable the distZip task. tasks.named() configures it lazily, so the task is
// not created during configuration just to flip this flag.
tasks.named('distZip') {
    enabled = false
}
|
|
|
|
|
2024-02-23 15:13:40 +00:00
|
|
|
// Pull in the srcsets.gradle script located in the root project directory.
apply(from: "$rootProject.projectDir/srcsets.gradle")
|
|
|
|
|
2023-03-04 12:19:01 +00:00
|
|
|
// Dependencies of this module.
// Each entry is declared exactly once; a repeated declaration of
// ':code:processes:crawling-process:model' has been removed.
dependencies {
    // Modules from this build
    implementation project(':code:common:db')
    implementation project(':code:common:model')
    implementation project(':code:common:config')
    implementation project(':code:common:service')
    implementation project(':code:libraries:blocking-thread-pool')
    implementation project(':code:index:api')
    implementation project(':code:processes:process-mq-api')
    implementation project(':code:libraries:message-queue')
    implementation project(':code:libraries:language-processing')
    implementation project(':code:libraries:easy-lsh')
    implementation project(':code:processes:crawling-process:model')

    implementation project(':code:processes:converting-process:ft-anchor-keywords')
    implementation project(':code:processes:crawling-process:ft-crawl-blocklist')
    implementation project(':code:processes:crawling-process:ft-link-parser')
    implementation project(':code:processes:crawling-process:ft-content-type')
    implementation project(':third-party:commons-codec')

    // Libraries resolved through the `libs` version catalog
    implementation libs.bundles.slf4j

    implementation libs.notnull
    implementation libs.guava
    implementation libs.sqlite

    // Guice is added with the 'com.google.guava' group excluded from what it
    // pulls in; guava is declared directly above.
    implementation dependencies.create(libs.guice.get()) {
        exclude group: 'com.google.guava'
    }
    implementation libs.gson
    implementation libs.zstd
    implementation libs.jwarc
    implementation libs.crawlercommons
    implementation libs.jsoup
    implementation libs.opencsv
    implementation libs.fastutil

    implementation libs.bundles.mariadb

    // Test-only dependencies
    testImplementation libs.bundles.slf4j.test
    testImplementation libs.bundles.junit
    testImplementation libs.mockito

    testImplementation project(':code:processes:test-data')
}
|
|
|
|
|