2023-03-04 13:19:01 +01:00
|
|
|
// Name of the root Gradle project.
rootProject.name = 'marginalia.nu'

// Core service modules.
include(
        'code:services-core:index-service',
        'code:services-core:assistant-service',
        'code:services-core:control-service',
        'code:services-core:query-service',
        'code:services-core:executor-service'
)

// Application service modules.
include(
        'code:services-application:search-service',
        'code:services-application:api-service',
        'code:services-application:dating-service',
        'code:services-application:explorer-service'
)
|
2023-03-04 13:19:01 +01:00
|
|
|
|
2023-03-07 17:14:32 +01:00
|
|
|
// Library modules, registered in the same order as before.
include(
        'code:libraries:array',
        'code:libraries:geo-ip',
        'code:libraries:btree',
        'code:libraries:easy-lsh',
        'code:libraries:guarded-regex',
        'code:libraries:big-string',
        'code:libraries:random-write-funnel',
        'code:libraries:next-prime',
        'code:libraries:blocking-thread-pool',
        'code:libraries:braille-block-punch-cards',
        'code:libraries:language-processing',
        'code:libraries:term-frequency-dict',
        'code:libraries:test-helpers'
)

include('code:libraries:message-queue')
|
|
|
|
|
2023-03-12 10:50:31 +01:00
|
|
|
// Search, query-side and ranking feature modules.
include(
        'code:features-search:screenshots',
        'code:features-search:random-websites',
        'code:features-search:feedlot-client',
        'code:features-qs:query-parser',
        'code:features-index:result-ranking'
)

// Conversion feature modules.
include(
        'code:features-convert:adblock',
        'code:features-convert:anchor-keywords',
        'code:features-convert:data-extractors',
        'code:features-convert:stackexchange-xml',
        'code:features-convert:pubdate',
        'code:features-convert:summary-extraction',
        'code:features-convert:keyword-extraction',
        'code:features-convert:topic-detection'
)

// Crawl feature modules.
include(
        'code:features-crawl:crawl-blocklist',
        'code:features-crawl:link-parser',
        'code:features-crawl:content-type'
)

// Index feature modules.
include(
        'code:features-index:index-journal',
        'code:features-index:index-query',
        'code:features-index:index-forward',
        'code:features-index:index-reverse',
        'code:features-index:domain-ranking'
)
|
2023-03-04 13:19:01 +01:00
|
|
|
|
2023-10-24 11:09:12 +02:00
|
|
|
// API modules.
include(
        'code:api:actor-api',
        'code:api:query-api',
        'code:api:index-api',
        'code:api:assistant-api',
        'code:api:process-mqapi',
        'code:api:executor-api'
)
|
2023-03-12 11:42:07 +01:00
|
|
|
|
2023-03-07 17:14:32 +01:00
|
|
|
// Common modules.
include(
        'code:common:service-discovery',
        'code:common:service-client',
        'code:common:db',
        'code:common:linkdb',
        'code:common:service',
        'code:common:config',
        'code:common:model',
        'code:common:renderer',
        'code:common:process'
)
|
2023-03-04 13:19:01 +01:00
|
|
|
|
2023-03-13 17:39:53 +01:00
|
|
|
// Process modules.
include(
        'code:processes:converting-process',
        'code:processes:crawling-process',
        'code:processes:loading-process',
        'code:processes:index-constructor-process',
        'code:processes:test-data',
        'code:processes:website-adjacencies-calculator'
)

// Process model modules.
include(
        'code:process-models:crawling-model',
        'code:process-models:work-log',
        'code:process-models:crawl-spec',
        'code:process-models:processed-data'
)
|
2023-03-12 10:50:31 +01:00
|
|
|
|
2023-03-17 16:03:11 +01:00
|
|
|
// Tool modules.
include(
        'code:tools:term-frequency-extractor',
        'code:tools:experiment-runner',
        'code:tools:screenshot-capture-tool',
        'code:tools:load-test',
        'code:tools:crawl-data-unfcker'
)
|
2023-03-17 16:03:11 +01:00
|
|
|
|
2023-03-12 10:04:48 +01:00
|
|
|
// Third-party modules kept under the third-party project path.
include(
        'third-party:porterstemmer',
        'third-party:symspell',
        'third-party:rdrpostagger',
        'third-party:openzim',
        'third-party:count-min-sketch',
        'third-party:monkey-patch-opennlp',
        'third-party:monkey-patch-gson',
        'third-party:commons-codec',
        'third-party:parquet-floor',
        'third-party:encyclopedia-marginalia-nu'
)
|
2023-03-12 10:04:48 +01:00
|
|
|
|
2023-03-04 13:19:01 +01:00
|
|
|
|
|
|
|
// Central dependency configuration: declares the artifact repositories and
// the `libs` version catalog (library aliases and bundles) for the build.
dependencyResolutionManagement {

    repositories {
        mavenLocal()
        maven { url "https://artifactory.cronapp.io/public-release/" }
        maven { url "https://repo1.maven.org/maven2/" }
        maven { url "https://www2.ph.ed.ac.uk/maven2/" }
        // NOTE(review): jitpack.io is declared here as a plain repository and
        // again below as an exclusive-content repository. This plain entry
        // presumably still lets other modules resolve from JitPack; confirm
        // whether it is still needed.
        maven { url "https://jitpack.io/" }
        exclusiveContent {
            forRepository {
                maven {
                    url = uri("https://jitpack.io")
                }
            }
            filter {
                // Only use JitPack for the `gson-record-type-adapter-factory` library
                includeModule("com.github.Marcono1234", "gson-record-type-adapter-factory")
            }
        }
    }

    versionCatalogs {
        libs {
            library('lombok', 'org.projectlombok', 'lombok').version('1.18.30')
            library('mariadb-client', 'org.mariadb.jdbc', 'mariadb-java-client').version('3.0.6')
            library('hikaricp', 'com.zaxxer:HikariCP:5.0.1')

            library('spark', 'com.sparkjava', 'spark-core').version('2.9.4')
            library('guice', 'com.google.inject', 'guice').version('7.0.0')
            library('guava', 'com.google.guava', 'guava').version('32.0.1-jre')
            library('protobuf', 'com.google.protobuf', 'protobuf-java').version('3.16.3')
            library('grpc-protobuf', 'io.grpc', 'grpc-protobuf').version('1.49.2')
            library('grpc-stub', 'io.grpc', 'grpc-stub').version('1.49.2')
            library('grpc-netty', 'io.grpc', 'grpc-netty-shaded').version('1.49.2')
            library('rxjava', 'io.reactivex.rxjava3', 'rxjava').version('3.1.6')

            library('prometheus', 'io.prometheus', 'simpleclient').version('0.16.0')
            library('prometheus-servlet', 'io.prometheus', 'simpleclient_servlet').version('0.16.0')
            library('prometheus-server', 'io.prometheus', 'simpleclient_httpserver').version('0.16.0')
            library('prometheus-hotspot', 'io.prometheus', 'simpleclient_hotspot').version('0.16.0')

            // NOTE(review): slf4j-api is pinned to 1.7.36 while slf4j-jdk14 is
            // 2.0.3; confirm this version split is intentional.
            library('slf4j.api', 'org.slf4j', 'slf4j-api').version('1.7.36')
            library('slf4j.jdk14', 'org.slf4j', 'slf4j-jdk14').version('2.0.3')

            library('log4j.api', 'org.apache.logging.log4j', 'log4j-api').version('2.17.2')
            library('log4j.core', 'org.apache.logging.log4j', 'log4j-core').version('2.17.2')
            library('log4j.slf4j', 'org.apache.logging.log4j', 'log4j-slf4j-impl').version('2.17.2')

            library('notnull', 'org.jetbrains', 'annotations').version('24.0.0')

            library('trove', 'net.sf.trove4j', 'trove4j').version('3.0.3')
            library('fastutil', 'it.unimi.dsi', 'fastutil').version('8.5.8')

            library('hll', 'net.agkn', 'hll').version('1.6.0')
            library('duckdb', 'org.duckdb', 'duckdb_jdbc').version('0.9.1')
            library('okhttp3', 'com.squareup.okhttp3', 'okhttp').version('4.11.0')

            library('jwarc', 'org.netpreserve', 'jwarc').version('0.28.5')

            library('httpcomponents.core', 'org.apache.httpcomponents', 'httpcore').version('4.4.15')
            library('httpcomponents.client', 'org.apache.httpcomponents', 'httpclient').version('4.5.13')
            library('commons.net', 'commons-net', 'commons-net').version('3.9.0')
            library('commons.lang3', 'org.apache.commons', 'commons-lang3').version('3.12.0')
            library('commons.compress', 'org.apache.commons', 'commons-compress').version('1.25.0')
            library('commons.io', 'commons-io', 'commons-io').version('2.11.0')
            library('commons.codec', 'commons-codec', 'commons-codec').version('1.16.0')

            library('ffi', 'com.github.jnr', 'jnr-ffi').version('2.2.12')
            library('databind', 'com.fasterxml.jackson.core', 'jackson-databind').version('2.13.5')

            library('crawlercommons', 'com.github.crawler-commons', 'crawler-commons').version('1.3')

            library('stanford.corenlp', 'edu.stanford.nlp', 'stanford-corenlp').version('4.4.0')
            library('opennlp', 'org.apache.opennlp', 'opennlp-tools').version('1.9.4')
            library('fasttext', 'com.github.vinhkhuc', 'jfasttext').version('0.5')
            library('roaringbitmap', 'org.roaringbitmap', 'RoaringBitmap').version('0.9.32')
            library('opencsv', 'com.opencsv', 'opencsv').version('5.6')
            library('bucket4j', 'com.github.vladimir-bukhtoyarov', 'bucket4j-core').version('7.5.0')

            library('gson', 'com.google.code.gson', 'gson').version('2.10.1')
            library('gson-type-adapter', 'com.github.Marcono1234', 'gson-record-type-adapter-factory').version('0.2.0')

            library('zstd', 'com.github.luben', 'zstd-jni').version('1.5.2-2')
            library('lz4', 'org.lz4', 'lz4-java').version('1.8.0')
            library('xz', 'org.tukaani', 'xz').version('1.9')

            library('flyway.core', 'org.flywaydb', 'flyway-core').version('10.4.1')
            library('flyway.mysql', 'org.flywaydb', 'flyway-mysql').version('10.4.1')

            library('jsoup', 'org.jsoup', 'jsoup').version('1.15.3')
            library('snakeyaml', 'org.yaml', 'snakeyaml').version('1.33') // Known CVE, but this library only parses internal config files so it's fine

            library('junit.jupiter', 'org.junit.jupiter', 'junit-jupiter-api').version('5.8.2')
            // Pinned to the same version as junit-jupiter-api. This was an empty
            // version string, which left the engine version to be supplied by
            // whatever else constrained it during resolution.
            library('junit.jupiter.engine', 'org.junit.jupiter', 'junit-jupiter-engine').version('5.8.2')
            library('mockito', 'org.mockito', 'mockito-junit-jupiter').version('4.5.1')

            library('selenium.chrome', 'org.seleniumhq.selenium', 'selenium-chrome-driver').version('4.8.3')
            library('selenium.java', 'org.seleniumhq.selenium', 'selenium-java').version('4.8.3')

            library('handlebars', 'com.github.jknack', 'handlebars').version('4.3.1')
            library('handlebars.markdown', 'com.github.jknack', 'handlebars-markdown').version('4.2.1')

            library('sqlite', 'org.xerial', 'sqlite-jdbc').version('3.41.2.2')
            library('javax.annotation', 'javax.annotation', 'javax.annotation-api').version('1.3.2')
            library('parquet-column', 'org.apache.parquet', 'parquet-column').version('1.13.1')
            library('parquet-hadoop', 'org.apache.parquet', 'parquet-hadoop').version('1.13.1')

            // Bundles group the library aliases declared above under one name.
            bundle('slf4j', ['slf4j.api', 'log4j.api', 'log4j.core', 'log4j.slf4j'])
            bundle('slf4j.test', ['slf4j.jdk14'])
            bundle('prometheus', ['prometheus', 'prometheus-servlet', 'prometheus-server', 'prometheus-hotspot'])
            bundle('mariadb', ['mariadb-client', 'hikaricp'])
            bundle('nlp', ['stanford.corenlp', 'opennlp', 'fasttext'])
            bundle('selenium', ['selenium.chrome', 'selenium.java'])
            bundle('handlebars', ['handlebars', 'handlebars.markdown'])
            bundle('grpc', ['protobuf', 'grpc-stub', 'grpc-protobuf', 'grpc-netty'])
            bundle('gson', ['gson', 'gson-type-adapter'])
            bundle('httpcomponents', ['httpcomponents.core', 'httpcomponents.client'])
            bundle('parquet', ['parquet-column', 'parquet-hadoop'])
            bundle('junit', ['junit.jupiter', 'junit.jupiter.engine'])
            bundle('flyway', ['flyway.core', 'flyway.mysql'])
        }
    }
}
|