├── README.md ├── __init__.py ├── densify ├── __init__.py ├── densify_corpus.py ├── densify_query.py └── output_vector.py ├── docs ├── aggretriever │ ├── beir-eval.md │ └── msmarco-passage-train-eval.md └── dhr │ ├── beir-eval.md │ ├── densify_exp.md │ └── msmarco-passage-train-eval.md ├── fig ├── aggretriever.png ├── aggretriever_teaser.png ├── densification.png └── single_model_fusion.png ├── retrieval ├── __init__.py ├── evaluation │ ├── __init__.py │ └── custom_metrics.py ├── gip_retrieval.py ├── index.py ├── merge.result.py ├── quantize_index.py ├── rcap_eval.py └── util.py └── tevatron ├── Aggretriever ├── __init__.py ├── modeling.py └── utils.py ├── ColBERT └── modeling.py ├── DHR ├── __init__.py ├── modeling.py └── utils.py ├── Dense ├── __init__.py └── modeling.py ├── __init__.py ├── arguments.py ├── data.py ├── datasets ├── __init__.py ├── beir │ ├── __init__.py │ ├── encode_and_retrieval.py │ ├── preprocess.py │ └── sentence_bert.py ├── dataset.py └── preprocessor.py ├── driver ├── __init__.py ├── encode.py ├── eval.py ├── jax_encode.py ├── jax_train.py └── train.py ├── faiss_retriever ├── __init__.py ├── __main__.py ├── reducer.py └── retriever.py ├── loss.py ├── preprocessor ├── __init__.py └── preprocessor_tsv.py ├── tevax ├── __init__.py ├── loss.py └── training.py ├── trainer.py └── utils ├── __init__.py ├── convert_from_dpr.py ├── data_reader.py ├── format ├── __init__.py └── convert_result_to_trec.py ├── metrics.py ├── tokenize_corpus.py └── tokenize_query.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/README.md -------------------------------------------------------------------------------- /__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /densify/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /densify/densify_corpus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/densify/densify_corpus.py -------------------------------------------------------------------------------- /densify/densify_query.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/densify/densify_query.py -------------------------------------------------------------------------------- /densify/output_vector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/densify/output_vector.py -------------------------------------------------------------------------------- /docs/aggretriever/beir-eval.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/docs/aggretriever/beir-eval.md -------------------------------------------------------------------------------- /docs/aggretriever/msmarco-passage-train-eval.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/docs/aggretriever/msmarco-passage-train-eval.md -------------------------------------------------------------------------------- /docs/dhr/beir-eval.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/docs/dhr/beir-eval.md -------------------------------------------------------------------------------- /docs/dhr/densify_exp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/docs/dhr/densify_exp.md -------------------------------------------------------------------------------- /docs/dhr/msmarco-passage-train-eval.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/docs/dhr/msmarco-passage-train-eval.md -------------------------------------------------------------------------------- /fig/aggretriever.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/fig/aggretriever.png -------------------------------------------------------------------------------- /fig/aggretriever_teaser.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/fig/aggretriever_teaser.png -------------------------------------------------------------------------------- /fig/densification.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/fig/densification.png -------------------------------------------------------------------------------- /fig/single_model_fusion.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/fig/single_model_fusion.png -------------------------------------------------------------------------------- /retrieval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /retrieval/evaluation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /retrieval/evaluation/custom_metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/retrieval/evaluation/custom_metrics.py -------------------------------------------------------------------------------- /retrieval/gip_retrieval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/retrieval/gip_retrieval.py -------------------------------------------------------------------------------- /retrieval/index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/retrieval/index.py -------------------------------------------------------------------------------- /retrieval/merge.result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/retrieval/merge.result.py -------------------------------------------------------------------------------- /retrieval/quantize_index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/retrieval/quantize_index.py -------------------------------------------------------------------------------- /retrieval/rcap_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/retrieval/rcap_eval.py -------------------------------------------------------------------------------- /retrieval/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/retrieval/util.py -------------------------------------------------------------------------------- /tevatron/Aggretriever/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/Aggretriever/modeling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/Aggretriever/modeling.py -------------------------------------------------------------------------------- /tevatron/Aggretriever/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/Aggretriever/utils.py -------------------------------------------------------------------------------- /tevatron/ColBERT/modeling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/ColBERT/modeling.py -------------------------------------------------------------------------------- /tevatron/DHR/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/DHR/modeling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/DHR/modeling.py -------------------------------------------------------------------------------- /tevatron/DHR/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/DHR/utils.py -------------------------------------------------------------------------------- /tevatron/Dense/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/Dense/modeling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/Dense/modeling.py -------------------------------------------------------------------------------- /tevatron/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/arguments.py -------------------------------------------------------------------------------- /tevatron/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/data.py -------------------------------------------------------------------------------- /tevatron/datasets/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/datasets/__init__.py -------------------------------------------------------------------------------- /tevatron/datasets/beir/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/datasets/beir/encode_and_retrieval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/datasets/beir/encode_and_retrieval.py -------------------------------------------------------------------------------- /tevatron/datasets/beir/preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/datasets/beir/preprocess.py -------------------------------------------------------------------------------- /tevatron/datasets/beir/sentence_bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/datasets/beir/sentence_bert.py -------------------------------------------------------------------------------- /tevatron/datasets/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/datasets/dataset.py -------------------------------------------------------------------------------- /tevatron/datasets/preprocessor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/datasets/preprocessor.py -------------------------------------------------------------------------------- /tevatron/driver/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/driver/encode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/driver/encode.py -------------------------------------------------------------------------------- /tevatron/driver/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/driver/eval.py -------------------------------------------------------------------------------- /tevatron/driver/jax_encode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/driver/jax_encode.py -------------------------------------------------------------------------------- /tevatron/driver/jax_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/driver/jax_train.py -------------------------------------------------------------------------------- /tevatron/driver/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/driver/train.py -------------------------------------------------------------------------------- /tevatron/faiss_retriever/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/faiss_retriever/__init__.py -------------------------------------------------------------------------------- /tevatron/faiss_retriever/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/faiss_retriever/__main__.py -------------------------------------------------------------------------------- /tevatron/faiss_retriever/reducer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/faiss_retriever/reducer.py -------------------------------------------------------------------------------- /tevatron/faiss_retriever/retriever.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/faiss_retriever/retriever.py -------------------------------------------------------------------------------- /tevatron/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/loss.py -------------------------------------------------------------------------------- /tevatron/preprocessor/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/preprocessor/__init__.py -------------------------------------------------------------------------------- /tevatron/preprocessor/preprocessor_tsv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/preprocessor/preprocessor_tsv.py -------------------------------------------------------------------------------- /tevatron/tevax/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/tevax/__init__.py -------------------------------------------------------------------------------- /tevatron/tevax/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/tevax/loss.py -------------------------------------------------------------------------------- /tevatron/tevax/training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/tevax/training.py -------------------------------------------------------------------------------- /tevatron/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/trainer.py -------------------------------------------------------------------------------- /tevatron/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/utils/convert_from_dpr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/utils/convert_from_dpr.py -------------------------------------------------------------------------------- /tevatron/utils/data_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/utils/data_reader.py -------------------------------------------------------------------------------- /tevatron/utils/format/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tevatron/utils/format/convert_result_to_trec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/utils/format/convert_result_to_trec.py -------------------------------------------------------------------------------- /tevatron/utils/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/utils/metrics.py -------------------------------------------------------------------------------- /tevatron/utils/tokenize_corpus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/utils/tokenize_corpus.py -------------------------------------------------------------------------------- /tevatron/utils/tokenize_query.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/dhr/HEAD/tevatron/utils/tokenize_query.py --------------------------------------------------------------------------------