.devcontainer.json
.gitignore
Dockerfile
LICENSE
Makefile
README.md
pyproject.toml
.github/dependabot.yml
.github/release.yml
.github/workflows/ci.yml
assets/banner.png
data/.gitignore
data/README.md
data/publish-all-runs-of-team.py
data/update-leaderboard.py
data/rank-distillm/README.md
data/rank-distillm/config.json
data/rank-distillm/dataset-metadata.json
data/rank-distillm/dataset-metadata.yml
data/rank-distillm/rank_distillm.py
data/rank-distillm/subsample.json
data/trec-18-web/README.md
data/trec-18-web/config.json
data/trec-18-web/dataset-metadata.json
data/trec-18-web/dataset-metadata.yml
data/trec-18-web/subsample.json
data/trec-19-web/README.md
data/trec-19-web/config.json
data/trec-19-web/dataset-metadata.json
data/trec-19-web/dataset-metadata.yml
data/trec-19-web/subsample.json
data/trec-20-web/README.md
data/trec-20-web/config.json
data/trec-20-web/dataset-metadata.json
data/trec-20-web/dataset-metadata.yml
data/trec-20-web/subsample.json
data/trec-21-web/README.md
data/trec-21-web/config.json
data/trec-21-web/dataset-metadata.json
data/trec-21-web/dataset-metadata.yml
data/trec-21-web/subsample.json
data/trec-22-web/README.md
data/trec-22-web/config.json
data/trec-22-web/dataset-metadata.json
data/trec-22-web/dataset-metadata.yml
data/trec-22-web/subsample.json
data/trec-23-web/README.md
data/trec-23-web/config.json
data/trec-23-web/dataset-metadata.json
data/trec-23-web/dataset-metadata.yml
data/trec-23-web/subsample.json
data/trec-28-deep-learning-docs/config.json
data/trec-28-deep-learning-docs/subsample.json
data/trec-28-deep-learning-passages/README.md
data/trec-28-deep-learning-passages/config.json
data/trec-28-deep-learning-passages/dataset-metadata.json
data/trec-28-deep-learning-passages/dataset-metadata.yml
data/trec-28-deep-learning-passages/subsample.json
data/trec-28-misinfo/README.md
data/trec-28-misinfo/config.json
data/trec-28-misinfo/dataset-metadata.json
data/trec-28-misinfo/dataset-metadata.yml
data/trec-28-misinfo/subsample.json
data/trec-29-deep-learning-docs/config.json
data/trec-29-deep-learning-docs/subsample.json
data/trec-29-deep-learning-passages/README.md
data/trec-29-deep-learning-passages/config.json
data/trec-29-deep-learning-passages/dataset-metadata.json
data/trec-29-deep-learning-passages/dataset-metadata.yml
data/trec-29-deep-learning-passages/subsample.json
data/trec-33-rag/README.md
data/trec-33-rag/config.json
data/trec-33-rag/dataset-metadata.json
data/trec-33-rag/dataset-metadata.yml
data/trec-33-rag/subsample.json
data/trec-robust-2004-fold-1/README.md
data/trec-robust-2004-fold-1/config.json
data/trec-robust-2004-fold-1/dataset-metadata.json
data/trec-robust-2004-fold-1/dataset-metadata.yml
data/trec-robust-2004-fold-1/subsample.json
data/trec-robust-2004-fold-2/README.md
data/trec-robust-2004-fold-2/config.json
data/trec-robust-2004-fold-2/dataset-metadata.json
data/trec-robust-2004-fold-2/dataset-metadata.yml
data/trec-robust-2004-fold-2/subsample.json
data/trec-robust-2004-fold-3/README.md
data/trec-robust-2004-fold-3/config.json
data/trec-robust-2004-fold-3/dataset-metadata.json
data/trec-robust-2004-fold-3/dataset-metadata.yml
data/trec-robust-2004-fold-3/subsample.json
data/trec-robust-2004-fold-4/README.md
data/trec-robust-2004-fold-4/config.json
data/trec-robust-2004-fold-4/dataset-metadata.json
data/trec-robust-2004-fold-4/dataset-metadata.yml
data/trec-robust-2004-fold-4/subsample.json
data/trec-robust-2004-fold-5/README.md
data/trec-robust-2004-fold-5/config.json
data/trec-robust-2004-fold-5/dataset-metadata.json
data/trec-robust-2004-fold-5/dataset-metadata.yml
data/trec-robust-2004-fold-5/subsample.json
lsr_benchmark/__init__.py
lsr_benchmark/chatnoir.py
lsr_benchmark/click.py
lsr_benchmark/irds.py
lsr_benchmark.egg-info/PKG-INFO
lsr_benchmark.egg-info/SOURCES.txt
lsr_benchmark.egg-info/dependency_links.txt
lsr_benchmark.egg-info/entry_points.txt
lsr_benchmark.egg-info/requires.txt
lsr_benchmark.egg-info/top_level.txt
lsr_benchmark/_commands/__init__.py
lsr_benchmark/_commands/_download.py
lsr_benchmark/_commands/_evaluate.py
lsr_benchmark/_commands/_retrieval.py
lsr_benchmark/corpus/__init__.py
lsr_benchmark/corpus/corpus_subsampling.py
lsr_benchmark/corpus/segmentation.py
lsr_benchmark/datasets/__init__.py
lsr_benchmark/datasets/overview.json
step-02-embedding-approaches/README.md
step-02-embedding-approaches/bge-m3/.devcontainer.json
step-02-embedding-approaches/bge-m3/Dockerfile
step-02-embedding-approaches/bge-m3/README.md
step-02-embedding-approaches/bge-m3/access-bge-ir-embeddings.py
step-02-embedding-approaches/bge-m3/bgem3.py
step-02-embedding-approaches/bge-m3/requirements.txt
step-02-embedding-approaches/lexical/.devcontainer.json
step-02-embedding-approaches/lexical/Dockerfile
step-02-embedding-approaches/lexical/README.md
step-02-embedding-approaches/lexical/requirements.txt
step-02-embedding-approaches/lexical/run-pyterrier.py
step-02-embedding-approaches/lightning-ir/.devcontainer.json
step-02-embedding-approaches/lightning-ir/Dockerfile
step-02-embedding-approaches/lightning-ir/README.md
step-02-embedding-approaches/lightning-ir/access-lightning-ir-embeddings.py
step-02-embedding-approaches/lightning-ir/lightning-ir.py
step-02-embedding-approaches/lightning-ir/requirements.txt
step-03-retrieval-approaches/README.md
step-03-retrieval-approaches/duckdb/.devcontainer.json
step-03-retrieval-approaches/duckdb/Dockerfile
step-03-retrieval-approaches/duckdb/README.md
step-03-retrieval-approaches/duckdb/requirements.txt
step-03-retrieval-approaches/duckdb/run-duckdb.py
step-03-retrieval-approaches/kannolo/.devcontainer.json
step-03-retrieval-approaches/kannolo/Dockerfile
step-03-retrieval-approaches/kannolo/README.md
step-03-retrieval-approaches/kannolo/build-and-search-kannolo-index.py
step-03-retrieval-approaches/kannolo/requirements.txt
step-03-retrieval-approaches/lexical/pyterrier-naive/.devcontainer.json
step-03-retrieval-approaches/lexical/pyterrier-naive/Dockerfile
step-03-retrieval-approaches/lexical/pyterrier-naive/README.md
step-03-retrieval-approaches/lexical/pyterrier-naive/requirements.txt
step-03-retrieval-approaches/lexical/pyterrier-naive/run-pyterrier.py
step-03-retrieval-approaches/lexical/pyterrier-pisa/.devcontainer.json
step-03-retrieval-approaches/lexical/pyterrier-pisa/Dockerfile
step-03-retrieval-approaches/lexical/pyterrier-pisa/README.md
step-03-retrieval-approaches/lexical/pyterrier-pisa/requirements.txt
step-03-retrieval-approaches/lexical/pyterrier-pisa/run-pyterrier-pisa.py
step-03-retrieval-approaches/naive-search/Dockerfile
step-03-retrieval-approaches/naive-search/README.md
step-03-retrieval-approaches/naive-search/build-and-search-naive-index.py
step-03-retrieval-approaches/naive-search/requirements.txt
step-03-retrieval-approaches/pyserini-lsr/.devcontainer.json
step-03-retrieval-approaches/pyserini-lsr/Dockerfile
step-03-retrieval-approaches/pyserini-lsr/README.md
step-03-retrieval-approaches/pyserini-lsr/requirements.txt
step-03-retrieval-approaches/pyserini-lsr/run-pyserini-lsr.py
step-03-retrieval-approaches/pyterrier-splade/.devcontainer.json
step-03-retrieval-approaches/pyterrier-splade/Dockerfile
step-03-retrieval-approaches/pyterrier-splade/README.md
step-03-retrieval-approaches/pyterrier-splade/requirements.txt
step-03-retrieval-approaches/pyterrier-splade/run-pyterrier-splade.py
step-03-retrieval-approaches/pyterrier-splade-pisa/.devcontainer.json
step-03-retrieval-approaches/pyterrier-splade-pisa/Dockerfile
step-03-retrieval-approaches/pyterrier-splade-pisa/README.md
step-03-retrieval-approaches/pyterrier-splade-pisa/requirements.txt
step-03-retrieval-approaches/pyterrier-splade-pisa/run-pyterrier-splade.py
step-03-retrieval-approaches/pytorch-naive/.devcontainer.json
step-03-retrieval-approaches/pytorch-naive/Dockerfile
step-03-retrieval-approaches/pytorch-naive/README.md
step-03-retrieval-approaches/pytorch-naive/requirements.txt
step-03-retrieval-approaches/pytorch-naive/search-pytorch-index.py
step-03-retrieval-approaches/seismic/.devcontainer.json
step-03-retrieval-approaches/seismic/Dockerfile
step-03-retrieval-approaches/seismic/README.md
step-03-retrieval-approaches/seismic/build-and-search-seismic-index.py
step-03-retrieval-approaches/seismic/requirements.txt
step-04-evaluation/README.md
step-04-evaluation/analysis-in-progress.ipynb
step-04-evaluation/analyze-embeddings.ipynb
step-04-evaluation/analyze-lsr-vs-lexical-efficiency.ipynb
step-04-evaluation/evaluation-in-progress.jsonl.gz
step-04-evaluation/lsr-vs-lexical-evaluation.jsonl.gz
step-04-evaluation/lsr-vs-lexical.jsonl.gz
step-04-evaluation/results-in-progress.jsonl.gz
test/TestPassageChunking.test_chunking.approved.json
test/test_access_to_private_datasets.py
test/test_irds_integration.py
test/test_irds_integration_to_pyterrier.py
test/test_load_embeddings.py
test/test_passage_chunking.py
test/test_run_pool_corpus_sampler.py
test/resources/example-dl-01.json
test/resources/example-dl-02.json
test/resources/load_resources.sh
test/resources/example-dataset/corpus.jsonl.gz
test/resources/example-dataset/qrels.txt
test/resources/example-dataset/queries.jsonl
tutorials/README.md
tutorials/tutorial-access-raw-data.ipynb
tutorials/tutorial-embedding-models.ipynb
tutorials/tutorial-pre-computed-resources.ipynb
tutorials/tutorial-retrieval-engines.ipynb