├── .gitignore ├── LICENSE ├── README.md ├── add_meta_from_domain.py ├── backup ├── ollama-gen │ ├── Modelfile │ ├── create.sh │ └── out ├── train10.json ├── train11.json ├── train12.json ├── train13.json ├── train15.json ├── train16.json ├── train17.json ├── train18.json ├── train19.json ├── train2.json ├── train21.json ├── train22.json ├── train23.json ├── train24.json ├── train25.json ├── train26.json ├── train27.json ├── train28.json ├── train29.json ├── train30.json ├── train31.json ├── train4.json ├── train5.json ├── train6.json ├── train7.json ├── train8.json └── train9.json ├── data_tool.py ├── example.md ├── example.md.json ├── example.txt ├── extract_json.py ├── extract_json_mapping.py ├── generate_prompt.py ├── generate_synthetic_data.py ├── gpt4-data ├── train10.json ├── train11.json ├── train12.json ├── train13.json ├── train15.json ├── train16.json ├── train17.json ├── train18.json ├── train19.json ├── train2.json ├── train21.json ├── train22.json ├── train23.json ├── train24.json ├── train25.json ├── train26.json ├── train27.json ├── train28.json ├── train29.json ├── train30.json ├── train31.json ├── train4.json ├── train5.json ├── train6.json ├── train7.json ├── train8.json └── train9.json ├── json_sampler.py ├── merge_data.py ├── ollama-gen ├── Modelfile ├── create.sh └── sample.txt ├── out.txt ├── stat_data.py ├── template.txt ├── test.json ├── test2.json ├── test_extract_mappings.py └── validate_data.py /.gitignore: -------------------------------------------------------------------------------- 1 | __* 2 | venv 3 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/README.md -------------------------------------------------------------------------------- /add_meta_from_domain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/add_meta_from_domain.py -------------------------------------------------------------------------------- /backup/ollama-gen/Modelfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/ollama-gen/Modelfile -------------------------------------------------------------------------------- /backup/ollama-gen/create.sh: -------------------------------------------------------------------------------- 1 | ollama create es-synth -f ./Modelfile 2 | 3 | -------------------------------------------------------------------------------- /backup/ollama-gen/out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/ollama-gen/out -------------------------------------------------------------------------------- /backup/train10.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train10.json -------------------------------------------------------------------------------- /backup/train11.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train11.json -------------------------------------------------------------------------------- /backup/train12.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train12.json -------------------------------------------------------------------------------- /backup/train13.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train13.json -------------------------------------------------------------------------------- /backup/train15.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train15.json -------------------------------------------------------------------------------- /backup/train16.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train16.json -------------------------------------------------------------------------------- /backup/train17.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train17.json -------------------------------------------------------------------------------- /backup/train18.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train18.json -------------------------------------------------------------------------------- /backup/train19.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train19.json -------------------------------------------------------------------------------- /backup/train2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train2.json -------------------------------------------------------------------------------- /backup/train21.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train21.json -------------------------------------------------------------------------------- /backup/train22.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train22.json -------------------------------------------------------------------------------- /backup/train23.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train23.json -------------------------------------------------------------------------------- /backup/train24.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train24.json -------------------------------------------------------------------------------- /backup/train25.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train25.json -------------------------------------------------------------------------------- /backup/train26.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train26.json -------------------------------------------------------------------------------- /backup/train27.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train27.json -------------------------------------------------------------------------------- /backup/train28.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train28.json -------------------------------------------------------------------------------- /backup/train29.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train29.json -------------------------------------------------------------------------------- /backup/train30.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train30.json -------------------------------------------------------------------------------- /backup/train31.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train31.json -------------------------------------------------------------------------------- /backup/train4.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train4.json -------------------------------------------------------------------------------- /backup/train5.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train5.json -------------------------------------------------------------------------------- /backup/train6.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train6.json -------------------------------------------------------------------------------- /backup/train7.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train7.json -------------------------------------------------------------------------------- /backup/train8.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train8.json -------------------------------------------------------------------------------- /backup/train9.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/backup/train9.json -------------------------------------------------------------------------------- /data_tool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/data_tool.py -------------------------------------------------------------------------------- /example.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/example.md -------------------------------------------------------------------------------- /example.md.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/example.md.json -------------------------------------------------------------------------------- /example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/example.txt -------------------------------------------------------------------------------- /extract_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/extract_json.py -------------------------------------------------------------------------------- /extract_json_mapping.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/extract_json_mapping.py -------------------------------------------------------------------------------- /generate_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/generate_prompt.py -------------------------------------------------------------------------------- /generate_synthetic_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/generate_synthetic_data.py -------------------------------------------------------------------------------- /gpt4-data/train10.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train10.json -------------------------------------------------------------------------------- /gpt4-data/train11.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train11.json -------------------------------------------------------------------------------- /gpt4-data/train12.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train12.json -------------------------------------------------------------------------------- /gpt4-data/train13.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train13.json -------------------------------------------------------------------------------- /gpt4-data/train15.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train15.json -------------------------------------------------------------------------------- /gpt4-data/train16.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train16.json -------------------------------------------------------------------------------- /gpt4-data/train17.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train17.json -------------------------------------------------------------------------------- /gpt4-data/train18.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train18.json -------------------------------------------------------------------------------- /gpt4-data/train19.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train19.json -------------------------------------------------------------------------------- /gpt4-data/train2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train2.json -------------------------------------------------------------------------------- /gpt4-data/train21.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train21.json -------------------------------------------------------------------------------- /gpt4-data/train22.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train22.json -------------------------------------------------------------------------------- /gpt4-data/train23.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train23.json -------------------------------------------------------------------------------- /gpt4-data/train24.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train24.json -------------------------------------------------------------------------------- /gpt4-data/train25.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train25.json -------------------------------------------------------------------------------- /gpt4-data/train26.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train26.json -------------------------------------------------------------------------------- /gpt4-data/train27.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train27.json -------------------------------------------------------------------------------- /gpt4-data/train28.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train28.json -------------------------------------------------------------------------------- /gpt4-data/train29.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train29.json -------------------------------------------------------------------------------- /gpt4-data/train30.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train30.json -------------------------------------------------------------------------------- /gpt4-data/train31.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train31.json -------------------------------------------------------------------------------- /gpt4-data/train4.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train4.json -------------------------------------------------------------------------------- /gpt4-data/train5.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train5.json -------------------------------------------------------------------------------- /gpt4-data/train6.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train6.json -------------------------------------------------------------------------------- /gpt4-data/train7.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train7.json -------------------------------------------------------------------------------- /gpt4-data/train8.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train8.json -------------------------------------------------------------------------------- /gpt4-data/train9.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/gpt4-data/train9.json -------------------------------------------------------------------------------- /json_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/json_sampler.py -------------------------------------------------------------------------------- /merge_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/merge_data.py -------------------------------------------------------------------------------- /ollama-gen/Modelfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/ollama-gen/Modelfile -------------------------------------------------------------------------------- /ollama-gen/create.sh: -------------------------------------------------------------------------------- 1 | ollama create es-synth -f ./Modelfile 2 | 3 | -------------------------------------------------------------------------------- /ollama-gen/sample.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/ollama-gen/sample.txt -------------------------------------------------------------------------------- /out.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/out.txt -------------------------------------------------------------------------------- /stat_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/stat_data.py -------------------------------------------------------------------------------- /template.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/template.txt -------------------------------------------------------------------------------- /test.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/test.json -------------------------------------------------------------------------------- /test2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/test2.json -------------------------------------------------------------------------------- /test_extract_mappings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/test_extract_mappings.py -------------------------------------------------------------------------------- /validate_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/queelius/elasticsearch-lm/HEAD/validate_data.py --------------------------------------------------------------------------------