Ecosyste.ms: Repos
An open API service providing repository metadata for many open source software ecosystems.
GitHub / chatnoir-eu / chatnoir-copycat
CopyCat is a resource for deduplication in TREC-style experimental setups.
JSON API: https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/chatnoir-eu%2Fchatnoir-copycat
Stars: 7
Forks: 0
Open Issues: 1
License: MIT
Language: Arc
Repo Size: 69.8 MB
Dependencies: 201
Created: about 3 years ago
Updated: over 1 year ago
Last pushed: over 2 years ago
Last synced: about 1 year ago
Files
Loading...
Readme
Loading...
Dependencies
- org.apache.hadoop:hadoop-client 2.7.3 provided
- org.apache.spark:spark-core_2.11 2.4.3 provided
- org.projectlombok:lombok 1.18.8 provided
- commons-collections:commons-collections 3.2.2
- de.webis.chatnoir2:chatnoir2-mapfile-generator 1.0-SNAPSHOT
- de.webis.corpora:webis-uuid 1.0
- de.webis:trec-ndd 1.0-SNAPSHOT
- net.sourceforge.argparse4j:argparse4j 0.8.1
- org.apache.logging.log4j:log4j-slf4j-impl 2.13.3
- org.elasticsearch.client:elasticsearch-rest-high-level-client 6.7.1
- org.netpreserve.commons:webarchive-commons 1.1.9
- com.approvaltests:approvaltests 3.2.0 test
- com.google.code.gson:gson 2.8.5 test
- com.holdenkarau:spark-testing-base_2.11 2.4.5_0.14.0 test
- junit:junit 4.11 test
- org.mockito:mockito-all 1.10.19 test
- org.powermock:powermock-api-mockito 1.7.4 test
- org.powermock:powermock-core 1.7.4 test
- org.apache.hadoop:hadoop-client 2.7.3 provided
- org.apache.spark:spark-core_2.11 2.4.3 provided
- org.projectlombok:lombok 1.18.8 provided
- client.netspeak:netspeak-client 1.3.5
- de.webis.aitools:aitools3-aq-algebra 1.0
- de.webis.aitools:aitools3-aq-check 1.0
- de.webis.aitools:aitools3-ir-fingerprinting 1.0
- de.webis.aitools:wstud-aitools3-ir-fingerprinting-simhash 1.0
- de.webis.chatnoir2:chatnoir2-indexer 1.0-SNAPSHOT
- de.webis.chatnoir2:chatnoir2-mapfile-generator 1.0-SNAPSHOT
- de.webis.chatnoir2:chatnoir2-webclient 2.0.0-SNAPSHOT-MAIK
- de.webis.corpora:webis-uuid 1.0
- de.webis:trec-ndd 1.0-SNAPSHOT
- info.debatty:java-lsh 0.12
- net.sf.trove4j:trove4j 3.0.3
- net.sourceforge.argparse4j:argparse4j 0.8.1
- org.elasticsearch.client:transport 6.4.1
- com.approvaltests:approvaltests 3.2.0 test
- com.google.code.gson:gson 2.8.5 test
- com.holdenkarau:spark-testing-base_2.11 2.4.5_0.14.0 test
- junit:junit 4.11 test
- org.mockito:mockito-all 1.10.19 test
- org.powermock:powermock-api-mockito 1.7.4 test
- org.powermock:powermock-core 1.7.4 test
copycat-cli/pom.xml
maven
- org.projectlombok:lombok 1.18.8 provided
- de.webis.chatnoir2:chatnoir2-webclient 2.0.0-SNAPSHOT-MAIK
- de.webis:copycat-anserini-integration 1.0-SNAPSHOT
- de.webis:copycat-spark 1.0-SNAPSHOT
- org.apache.hadoop:hadoop-client 2.7.3
- org.jgrapht:jgrapht-core 1.4.0
- com.approvaltests:approvaltests 3.2.0 test
- com.google.code.gson:gson 2.8.5 test
- junit:junit 4.11 test
- org.projectlombok:lombok 1.18.8 provided
- commons-io:commons-io 2.8.0
- de.webis:copycat-interfaces 1.0-SNAPSHOT
- org.apache.lucene:lucene-core 8.3.0
- com.approvaltests:approvaltests 3.2.0 test
- com.google.code.gson:gson 2.8.5 test
- junit:junit 4.11 test
- org.projectlombok:lombok 1.18.8 provided
- com.google.guava:guava 14.0
- de.l3s.boilerpipe:boilerpipe 1.1.0
- de.webis:copycat-interfaces 1.0-SNAPSHOT
- io.anserini:anserini 0.5.1
- net.htmlparser.jericho:jericho-html 3.4
- net.jodah:failsafe 2.4.0
- net.sourceforge.argparse4j:argparse4j 0.8.1
- org.apache.lucene:lucene-analyzers-common 7.4.0
- org.apache.lucene:lucene-benchmark 7.4.0
- org.apache.lucene:lucene-core 7.4.0
- org.buildobjects:jproc 2.3.0
- com.approvaltests:approvaltests 3.2.0 test
- com.google.code.gson:gson 2.8.5 test
- junit:junit 4.11 test
- de.webis:trec-ndd 1.0-SNAPSHOT provided
- org.apache.commons:commons-lang3 3.5 provided
- org.projectlombok:lombok 1.18.8 provided
- de.l3s.boilerpipe:boilerpipe 1.1.0
- net.htmlparser.jericho:jericho-html 3.4
copycat-spark/pom.xml
maven
- org.apache.hadoop:hadoop-client 2.7.3 provided
- org.apache.spark:spark-core_2.11 2.4.3 provided
- org.projectlombok:lombok 1.18.8 provided
- client.netspeak:netspeak-client 1.3.5
- de.webis.aitools:aitools3-aq-algebra 1.0
- de.webis.aitools:aitools3-aq-check 1.0
- de.webis.aitools:aitools3-ir-fingerprinting 1.0
- de.webis.aitools:wstud-aitools3-ir-fingerprinting-simhash 1.0
- de.webis.chatnoir2:chatnoir2-indexer 1.0-SNAPSHOT
- de.webis.chatnoir2:chatnoir2-mapfile-generator 1.0-SNAPSHOT
- de.webis.chatnoir2:chatnoir2-webclient 2.0.0-SNAPSHOT-MAIK
- de.webis.corpora:webis-uuid 1.0
- de.webis:copycat-document-preprocessing 1.0-SNAPSHOT
- de.webis:copycat-interfaces 1.0-SNAPSHOT
- de.webis:trec-ndd 1.0-SNAPSHOT
- info.debatty:java-lsh 0.12
- net.sf.trove4j:trove4j 3.0.3
- net.sourceforge.argparse4j:argparse4j 0.8.1
- org.elasticsearch.client:transport 6.4.1
- com.approvaltests:approvaltests 3.2.0 test
- com.google.code.gson:gson 2.8.5 test
- com.holdenkarau:spark-testing-base_2.11 2.4.5_0.14.0 test
- junit:junit 4.11 test
- org.mockito:mockito-all 1.10.19 test
- org.powermock:powermock-api-mockito 1.7.4 test
- org.powermock:powermock-core 1.7.4 test
- approvaltests * develop
- certifi 2020.6.20 develop
- elasticsearch 7.9.1 develop
- nose * develop
- numpy 1.19.2 develop
- pandas 1.1.3 develop
- pipfile-requirements * develop
- python-dateutil 2.8.1 develop
- pytz 2020.1 develop
- six 1.15.0 develop
- urllib3 1.25.10 develop
- certifi 2020.6.20
- elasticsearch 7.9.1
- numpy 1.19.2
- pandas 1.1.3
- python-dateutil 2.8.1
- pytz 2020.1
- six 1.15.0
- urllib3 1.25.10
- approvaltests * develop
- nose * develop
- pandas 1.0.2 develop
- pipfile-requirements * develop
- pandas 1.0.2
- tqdm *
- trectools <0.0.38
- approvaltests ==0.2.7 develop
- attrs ==20.2.0 develop
- importlib-metadata ==2.0.0 develop
- iniconfig ==1.0.1 develop
- nose ==1.3.7 develop
- numpy ==1.19.2 develop
- packaging ==20.4 develop
- pandas ==1.1.2 develop
- pipfile-requirements ==0.3.0 develop
- pluggy ==0.13.1 develop
- py ==1.9.0 develop
- pyparsing ==2.4.7 develop
- pyperclip ==1.5.27 develop
- pytest ==6.1.1 develop
- python-dateutil ==2.8.1 develop
- pytz ==2020.1 develop
- six ==1.15.0 develop
- toml ==0.10.1 develop
- zipp ==3.3.0 develop
- beautifulsoup4 ==4.9.3
- bs4 ==0.0.1
- certifi ==2020.6.20
- cycler ==0.10.0
- joblib ==0.17.0
- kiwisolver ==1.2.0
- lxml ==4.5.2
- matplotlib ==3.3.2
- numpy ==1.19.2
- pandas ==1.1.2
- pillow ==7.2.0
- pyparsing ==2.4.7
- python-dateutil ==2.8.1
- pytz ==2020.1
- sarge ==0.1.6
- scikit-learn ==0.23.2
- scipy ==1.5.2
- six ==1.15.0
- soupsieve ==2.0.1
- threadpoolctl ==2.1.0
- tqdm ==4.50.0
- trectools ==0.0.37
- approvaltests ==0.2.7 develop
- attrs ==20.2.0 develop
- certifi ==2020.6.20 develop
- elasticsearch ==7.9.1 develop
- importlib-metadata ==2.0.0 develop
- iniconfig ==1.0.1 develop
- nose ==1.3.7 develop
- numpy ==1.19.2 develop
- packaging ==20.4 develop
- pandas ==1.1.3 develop
- pipfile-requirements ==0.3.0 develop
- pluggy ==0.13.1 develop
- py ==1.9.0 develop
- pyparsing ==2.4.7 develop
- pyperclip ==1.5.27 develop
- pytest ==6.1.1 develop
- python-dateutil ==2.8.1 develop
- pytz ==2020.1 develop
- six ==1.15.0 develop
- toml ==0.10.1 develop
- urllib3 ==1.25.10 develop
- zipp ==3.3.0 develop
- certifi ==2020.6.20
- elasticsearch ==7.9.1
- numpy ==1.19.2
- pandas ==1.1.3
- python-dateutil ==2.8.1
- pytz ==2020.1
- six ==1.15.0
- urllib3 ==1.25.10