├── .gitignore ├── LICENSE ├── README.md ├── docs └── arguments.md ├── examples ├── configs │ └── xsum.json ├── notebooks │ └── indexing_tutorial.ipynb └── scripts │ ├── gradio-demo.py │ ├── index-push-pull.py │ └── xsum-demo.py ├── pyproject.toml ├── src └── spacerini │ ├── __init__.py │ ├── cli.py │ ├── data │ ├── __init__.py │ ├── __main__.py │ ├── load.py │ └── utils.py │ ├── frontend │ ├── __init__.py │ ├── __main__.py │ ├── local.py │ └── space.py │ ├── index │ ├── __init__.py │ ├── encode.py │ ├── index.py │ └── utils.py │ ├── prebuilt.py │ ├── preprocess │ ├── __init__.py │ ├── __main__.py │ ├── tokenize.py │ └── utils.py │ ├── search │ ├── __init__.py │ └── utils.py │ └── spacerini_utils │ ├── __init__.py │ ├── index.py │ └── search.py ├── templates ├── gradio │ ├── cookiecutter.json │ └── {{ cookiecutter.local_app }} │ │ ├── .gitattributes │ │ ├── README.md │ │ ├── app.py │ │ ├── data │ │ └── .gitkeep │ │ ├── index │ │ └── .gitkeep │ │ ├── packages.txt │ │ └── requirements.txt ├── gradio_roots_temp │ ├── cookiecutter.json │ └── {{ cookiecutter.local_app }} │ │ ├── .gitattributes │ │ ├── README.md │ │ ├── app.py │ │ ├── index │ │ └── .gitkeep │ │ ├── packages.txt │ │ └── requirements.txt └── streamlit │ ├── cookiecutter.json │ └── {{ cookiecutter.module_slug }} │ ├── .gitattributes │ ├── README.md │ ├── app.py │ ├── index │ └── .gitkeep │ ├── packages.txt │ └── requirements.txt └── tests ├── __init__.py ├── data └── sample_documents.jsonl ├── test_data.py ├── test_index.py └── tests └── test_frontend.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/README.md -------------------------------------------------------------------------------- /docs/arguments.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/docs/arguments.md -------------------------------------------------------------------------------- /examples/configs/xsum.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/examples/configs/xsum.json -------------------------------------------------------------------------------- /examples/notebooks/indexing_tutorial.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/examples/notebooks/indexing_tutorial.ipynb -------------------------------------------------------------------------------- /examples/scripts/gradio-demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/examples/scripts/gradio-demo.py -------------------------------------------------------------------------------- /examples/scripts/index-push-pull.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/examples/scripts/index-push-pull.py -------------------------------------------------------------------------------- /examples/scripts/xsum-demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/examples/scripts/xsum-demo.py -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/pyproject.toml -------------------------------------------------------------------------------- /src/spacerini/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/__init__.py -------------------------------------------------------------------------------- /src/spacerini/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/cli.py -------------------------------------------------------------------------------- /src/spacerini/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/data/__init__.py -------------------------------------------------------------------------------- /src/spacerini/data/__main__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/spacerini/data/load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/data/load.py -------------------------------------------------------------------------------- /src/spacerini/data/utils.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/spacerini/frontend/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/frontend/__init__.py -------------------------------------------------------------------------------- /src/spacerini/frontend/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/frontend/__main__.py -------------------------------------------------------------------------------- /src/spacerini/frontend/local.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/frontend/local.py -------------------------------------------------------------------------------- /src/spacerini/frontend/space.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/frontend/space.py -------------------------------------------------------------------------------- /src/spacerini/index/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/index/__init__.py -------------------------------------------------------------------------------- /src/spacerini/index/encode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/index/encode.py -------------------------------------------------------------------------------- /src/spacerini/index/index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/index/index.py -------------------------------------------------------------------------------- /src/spacerini/index/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/index/utils.py -------------------------------------------------------------------------------- /src/spacerini/prebuilt.py: -------------------------------------------------------------------------------- 1 | EXAMPLES = { 2 | 'xsum', 3 | } -------------------------------------------------------------------------------- /src/spacerini/preprocess/__init__.py: -------------------------------------------------------------------------------- 1 | from . import tokenize, utils -------------------------------------------------------------------------------- /src/spacerini/preprocess/__main__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/spacerini/preprocess/tokenize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/preprocess/tokenize.py -------------------------------------------------------------------------------- /src/spacerini/preprocess/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/preprocess/utils.py -------------------------------------------------------------------------------- /src/spacerini/search/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/search/__init__.py -------------------------------------------------------------------------------- /src/spacerini/search/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/search/utils.py -------------------------------------------------------------------------------- /src/spacerini/spacerini_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/spacerini/spacerini_utils/index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/spacerini_utils/index.py -------------------------------------------------------------------------------- /src/spacerini/spacerini_utils/search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/src/spacerini/spacerini_utils/search.py -------------------------------------------------------------------------------- /templates/gradio/cookiecutter.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio/cookiecutter.json -------------------------------------------------------------------------------- /templates/gradio/{{ cookiecutter.local_app }}/.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio/{{ cookiecutter.local_app }}/.gitattributes -------------------------------------------------------------------------------- /templates/gradio/{{ cookiecutter.local_app }}/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio/{{ cookiecutter.local_app }}/README.md -------------------------------------------------------------------------------- /templates/gradio/{{ cookiecutter.local_app }}/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio/{{ cookiecutter.local_app }}/app.py -------------------------------------------------------------------------------- /templates/gradio/{{ cookiecutter.local_app }}/data/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /templates/gradio/{{ cookiecutter.local_app }}/index/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /templates/gradio/{{ cookiecutter.local_app }}/packages.txt: -------------------------------------------------------------------------------- 1 | default-jdk 2 | -------------------------------------------------------------------------------- /templates/gradio/{{ cookiecutter.local_app }}/requirements.txt: -------------------------------------------------------------------------------- 1 | pyserini 2 | datasets 3 | faiss-cpu 4 | torch -------------------------------------------------------------------------------- /templates/gradio_roots_temp/cookiecutter.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio_roots_temp/cookiecutter.json -------------------------------------------------------------------------------- /templates/gradio_roots_temp/{{ cookiecutter.local_app }}/.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio_roots_temp/{{ cookiecutter.local_app }}/.gitattributes -------------------------------------------------------------------------------- /templates/gradio_roots_temp/{{ cookiecutter.local_app }}/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio_roots_temp/{{ cookiecutter.local_app }}/README.md -------------------------------------------------------------------------------- /templates/gradio_roots_temp/{{ cookiecutter.local_app }}/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/gradio_roots_temp/{{ cookiecutter.local_app }}/app.py -------------------------------------------------------------------------------- /templates/gradio_roots_temp/{{ cookiecutter.local_app }}/index/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /templates/gradio_roots_temp/{{ cookiecutter.local_app }}/packages.txt: -------------------------------------------------------------------------------- 1 | default-jdk 2 | -------------------------------------------------------------------------------- /templates/gradio_roots_temp/{{ cookiecutter.local_app }}/requirements.txt: -------------------------------------------------------------------------------- 1 | pyserini 2 | datasets 3 | faiss-cpu 4 | torch -------------------------------------------------------------------------------- /templates/streamlit/cookiecutter.json: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /templates/streamlit/{{ cookiecutter.module_slug }}/.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/streamlit/{{ cookiecutter.module_slug }}/.gitattributes -------------------------------------------------------------------------------- /templates/streamlit/{{ cookiecutter.module_slug }}/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/streamlit/{{ cookiecutter.module_slug }}/README.md -------------------------------------------------------------------------------- /templates/streamlit/{{ cookiecutter.module_slug }}/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/templates/streamlit/{{ cookiecutter.module_slug }}/app.py -------------------------------------------------------------------------------- /templates/streamlit/{{ cookiecutter.module_slug }}/index/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /templates/streamlit/{{ cookiecutter.module_slug }}/packages.txt: -------------------------------------------------------------------------------- 1 | default-jdk 2 | -------------------------------------------------------------------------------- /templates/streamlit/{{ cookiecutter.module_slug }}/requirements.txt: -------------------------------------------------------------------------------- 1 | pyserini 2 | faiss-cpu 3 | torch -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/data/sample_documents.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/tests/data/sample_documents.jsonl -------------------------------------------------------------------------------- /tests/test_data.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/test_index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/castorini/hf-spacerini/HEAD/tests/test_index.py -------------------------------------------------------------------------------- /tests/tests/test_frontend.py: -------------------------------------------------------------------------------- 1 | --------------------------------------------------------------------------------