├── data ├── Readme.md ├── SuperBEIR │ └── SuperBEIR-categories-with-rationales.json ├── WikiQuestions-2.0.json ├── WikiQuestions-builder.py ├── WikiQuestions.json ├── duplicate-answer.py ├── wiki-abstract-titles.json └── wiki-answerable-questions.json ├── docs ├── 1_run_test.md ├── 2_result_visualization.md └── task-zoo.md ├── notebooks ├── OPRO-Compiled-JSON-Mode.ipynb └── StructuredRAG_Experimental_Visualization.ipynb ├── poetry.lock ├── pyproject.toml ├── readme.md ├── related-works.md ├── setup.py ├── structured_rag ├── mock_gfl │ ├── __init__.py │ ├── dspy_program.py │ ├── dspy_signatures.py │ ├── fstring_program.py │ ├── fstring_prompts.py │ └── modal_vllm_outlines │ │ ├── download_llama.py │ │ ├── modal_web_server.py │ │ ├── quick_setup_test.py │ │ ├── readme.md │ │ ├── setup.sh │ │ └── vllm_outlines_setup.py ├── models.py ├── readme.md └── run_test │ ├── __init__.py │ ├── readme.md │ ├── result_visualization │ ├── aggregate_result_jsons.py │ ├── boxplot_success_rates_per_model.png │ ├── boxplot_success_rates_per_task.png │ ├── compute_averages.py │ ├── dspy_error_analysis.py │ ├── new_aggregate_result_jsons.py │ ├── success_rate_heatmap.png │ ├── success_rates.png │ ├── success_rates_per_test.png │ ├── visualize.py │ └── visualize_single_result.py │ ├── results │ ├── 10-6-24 │ │ ├── AssessAnswerability-gpt-4o-2024-08-06-dspy.json │ │ ├── AssessAnswerability-gpt-4o-2024-08-06-dspy_NO_OPRO_JSON.json │ │ ├── AssessAnswerability-gpt-4o-2024-08-06-dspy_WITH_OPRO_JSON.json │ │ ├── AssessAnswerability-gpt-4o-2024-08-06-fstring.json │ │ ├── AssessAnswerability-gpt-4o-2024-08-06-fstring_with_structured_outputs.json │ │ └── AssessAnswerability-gpt-4o-2024-08-06-fstring_without_structured_outputs.json │ ├── 9-26-24 │ │ ├── AssessAnswerability-llama3.2:3b-instruct-fp16-dspy.json │ │ └── AssessAnswerability-llama3.2:3b-instruct-fp16-fstring.json │ ├── Gemini-1.5-Pro-9-11-24 │ │ ├── AssessAnswerability-gemini-1.5-pro-dspy.json │ │ ├── AssessAnswerability-gemini-1.5-pro-fstring.json │ │ ├── GenerateAnswer-gemini-1.5-pro-dspy.json │ │ ├── GenerateAnswer-gemini-1.5-pro-fstring.json │ │ ├── GenerateAnswerWithConfidence-gemini-1.5-pro-dspy.json │ │ ├── GenerateAnswerWithConfidence-gemini-1.5-pro-fstring.json │ │ ├── GenerateAnswersWithConfidence-gemini-1.5-pro-dspy.json │ │ ├── GenerateAnswersWithConfidence-gemini-1.5-pro-fstring.json │ │ ├── ParaphraseQuestions-gemini-1.5-pro-dspy.json │ │ ├── ParaphraseQuestions-gemini-1.5-pro-fstring.json │ │ ├── RAGAS-gemini-1.5-pro-dspy.json │ │ ├── RAGAS-gemini-1.5-pro-fstring.json │ │ ├── RateContext-gemini-1.5-pro-dspy.json │ │ └── RateContext-gemini-1.5-pro-fstring.json │ ├── batch-9-13-24 │ │ ├── AssessAnswerability-BATCH-llama3-8b-instruct-Modal.json │ │ ├── GenerateAnswer-BATCH-llama3-8b-instruct-Modal.json │ │ ├── GenerateAnswerWithConfidence-BATCH-llama3-8b-instruct-Modal.json │ │ ├── GenerateAnswersWithConfidence-BATCH-llama3-8b-instruct-Modal.json │ │ ├── ParaphraseQuestions-BATCH-llama3-8b-instruct-Modal.json │ │ ├── RAGAS-BATCH-llama3-8b-instruct-Modal.json │ │ └── RateContext-BATCH-llama3-8b-instruct-Modal.json │ ├── experimental-results-8-26-24 │ │ ├── aggregated_results-8-26-24.json │ │ ├── model_comparison.png │ │ ├── model_comparison_results-trial-1.png │ │ ├── model_comparison_results-trial-2.png │ │ ├── trial-1 │ │ │ ├── AssessAnswerability-gemini-1.5-pro.json │ │ │ ├── AssessAnswerability-llama3:instruct.json │ │ │ ├── GenerateAnswer-gemini-1.5-pro.json │ │ │ ├── GenerateAnswer-llama3:instruct.json │ │ │ ├── GenerateAnswerWithConfidence-gemini-1.5-pro.json │ │ │ ├── GenerateAnswerWithConfidence-llama3:instruct.json │ │ │ ├── GenerateAnswersWithConfidence-gemini-1.5-pro.json │ │ │ ├── GenerateAnswersWithConfidence-llama3:instruct.json │ │ │ ├── ParaphraseQuestions-gemini-1.5-pro.json │ │ │ ├── ParaphraseQuestions-llama3:instruct.json │ │ │ ├── RateContext-gemini-1.5-pro.json │ │ │ └── RateContext-llama3:instruct.json │ │ └── trial-2 │ │ │ ├── AssessAnswerability-gemini-1.5-pro.json │ │ │ ├── AssessAnswerability-llama3:instruct.json │ │ │ ├── GenerateAnswer-gemini-1.5-pro.json │ │ │ ├── GenerateAnswer-llama3:instruct.json │ │ │ ├── GenerateAnswerWithConfidence-gemini-1.5-pro.json │ │ │ ├── GenerateAnswerWithConfidence-llama3:instruct.json │ │ │ ├── GenerateAnswersWithConfidence-gemini-1.5-pro.json │ │ │ ├── GenerateAnswersWithConfidence-llama3:instruct.json │ │ │ ├── ParaphraseQuestions-gemini-1.5-pro.json │ │ │ ├── ParaphraseQuestions-llama3:instruct.json │ │ │ ├── RateContext-gemini-1.5-pro.json │ │ │ └── RateContext-llama3:instruct.json │ ├── experimental-results-9-11-24 │ │ ├── AssessAnswerability-claude-3-5-sonnet-20240620-dspy.json │ │ ├── AssessAnswerability-claude-3-5-sonnet-20240620-fstring.json │ │ ├── AssessAnswerability-gemini-1.5-pro-dspy.json │ │ ├── AssessAnswerability-gemini-1.5-pro-fstring.json │ │ ├── AssessAnswerability-gpt-4o-dspy.json │ │ ├── AssessAnswerability-gpt-4o-fstring.json │ │ ├── AssessAnswerability-llama3:instruct-dspy.json │ │ ├── AssessAnswerability-llama3:instruct-fstring.json │ │ ├── GenerateAnswer-claude-3-5-sonnet-20240620-dspy.json │ │ ├── GenerateAnswer-claude-3-5-sonnet-20240620-fstring.json │ │ ├── GenerateAnswer-gemini-1.5-pro-dspy.json │ │ ├── GenerateAnswer-gemini-1.5-pro-fstring.json │ │ ├── GenerateAnswer-gpt-4o-dspy.json │ │ ├── GenerateAnswer-gpt-4o-fstring.json │ │ ├── GenerateAnswer-llama3:instruct-dspy.json │ │ ├── GenerateAnswer-llama3:instruct-fstring.json │ │ ├── GenerateAnswerWithConfidence-claude-3-5-sonnet-20240620-dspy.json │ │ ├── GenerateAnswerWithConfidence-claude-3-5-sonnet-20240620-fstring.json │ │ ├── GenerateAnswerWithConfidence-gemini-1.5-pro-dspy.json │ │ ├── GenerateAnswerWithConfidence-gemini-1.5-pro-fstring.json │ │ ├── GenerateAnswerWithConfidence-gpt-4o-dspy.json │ │ ├── GenerateAnswerWithConfidence-gpt-4o-fstring.json │ │ ├── GenerateAnswerWithConfidence-llama3:instruct-dspy.json │ │ ├── GenerateAnswerWithConfidence-llama3:instruct-fstring.json │ │ ├── GenerateAnswersWithConfidence-claude-3-5-sonnet-20240620-dspy.json │ │ ├── GenerateAnswersWithConfidence-claude-3-5-sonnet-20240620-fstring.json │ │ ├── GenerateAnswersWithConfidence-gemini-1.5-pro-dspy.json │ │ ├── GenerateAnswersWithConfidence-gemini-1.5-pro-fstring.json │ │ ├── GenerateAnswersWithConfidence-gpt-4o-dspy.json │ │ ├── GenerateAnswersWithConfidence-gpt-4o-fstring.json │ │ ├── GenerateAnswersWithConfidence-llama3:instruct-dspy.json │ │ ├── GenerateAnswersWithConfidence-llama3:instruct-fstring.json │ │ ├── ParaphraseQuestions-claude-3-5-sonnet-20240620-dspy.json │ │ ├── ParaphraseQuestions-claude-3-5-sonnet-20240620-fstring.json │ │ ├── ParaphraseQuestions-gemini-1.5-pro-dspy.json │ │ ├── ParaphraseQuestions-gemini-1.5-pro-fstring.json │ │ ├── ParaphraseQuestions-gpt-4o-dspy.json │ │ ├── ParaphraseQuestions-gpt-4o-fstring.json │ │ ├── ParaphraseQuestions-llama3:instruct-dspy.json │ │ ├── ParaphraseQuestions-llama3:instruct-fstring.json │ │ ├── RAGAS-claude-3-5-sonnet-20240620-dspy.json │ │ ├── RAGAS-claude-3-5-sonnet-20240620-fstring.json │ │ ├── RAGAS-gemini-1.5-pro-dspy.json │ │ ├── RAGAS-gemini-1.5-pro-fstring.json │ │ ├── RAGAS-gpt-4o-dspy.json │ │ ├── RAGAS-gpt-4o-fstring.json │ │ ├── RAGAS-llama3:instruct-dspy.json │ │ ├── RAGAS-llama3:instruct-fstring.json │ │ ├── RateContext-claude-3-5-sonnet-20240620-dspy.json │ │ ├── RateContext-claude-3-5-sonnet-20240620-fstring.json │ │ ├── RateContext-gemini-1.5-pro-dspy.json │ │ ├── RateContext-gemini-1.5-pro-fstring.json │ │ ├── RateContext-gpt-4o-dspy.json │ │ ├── RateContext-gpt-4o-fstring.json │ │ ├── RateContext-llama3:instruct-dspy.json │ │ └── RateContext-llama3:instruct-fstring.json │ └── results │ │ ├── AssessAnswerability-gpt-4o-dspy_NO_OPRO_JSON-2024-11-29.json │ │ ├── AssessAnswerability-gpt-4o-dspy_WITH_OPRO_JSON-2024-11-29.json │ │ ├── AssessAnswerability-gpt-4o-fstring_with_structured_outputs-2024-11-29.json │ │ └── AssessAnswerability-gpt-4o-fstring_without_structured_outputs-2024-11-29.json │ ├── run_scripts │ ├── experiment-log.md │ ├── results │ │ ├── 9-25-24 │ │ │ ├── AssessAnswerability-llama3:instruct-dspy.json │ │ │ └── AssessAnswerability-llama3:instruct-fstring.json │ │ ├── AssessAnswerability-BATCH-llama3-8b-instruct-Modal.json │ │ ├── ClassifyDocumentWithRationale-Modal-vLLM.json │ │ └── GenerateAnswer-BATCH-llama3.2-1b-instruct-Modal.json │ ├── run_batch_test.py │ └── run_test.py │ └── utils_and_metrics │ ├── __pycache__ │ ├── helpers.cpython-310.pyc │ └── metrics.cpython-310.pyc │ ├── count-tokens.py │ ├── helpers.py │ └── metrics.py └── test-cost.md /data/Readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/Readme.md -------------------------------------------------------------------------------- /data/SuperBEIR/SuperBEIR-categories-with-rationales.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/SuperBEIR/SuperBEIR-categories-with-rationales.json -------------------------------------------------------------------------------- /data/WikiQuestions-2.0.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/WikiQuestions-2.0.json -------------------------------------------------------------------------------- /data/WikiQuestions-builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/WikiQuestions-builder.py -------------------------------------------------------------------------------- /data/WikiQuestions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/WikiQuestions.json -------------------------------------------------------------------------------- /data/duplicate-answer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/duplicate-answer.py -------------------------------------------------------------------------------- /data/wiki-abstract-titles.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/wiki-abstract-titles.json -------------------------------------------------------------------------------- /data/wiki-answerable-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/data/wiki-answerable-questions.json -------------------------------------------------------------------------------- /docs/1_run_test.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/docs/1_run_test.md -------------------------------------------------------------------------------- /docs/2_result_visualization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/docs/2_result_visualization.md -------------------------------------------------------------------------------- /docs/task-zoo.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/docs/task-zoo.md -------------------------------------------------------------------------------- /notebooks/OPRO-Compiled-JSON-Mode.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/notebooks/OPRO-Compiled-JSON-Mode.ipynb -------------------------------------------------------------------------------- /notebooks/StructuredRAG_Experimental_Visualization.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/notebooks/StructuredRAG_Experimental_Visualization.ipynb -------------------------------------------------------------------------------- /poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/poetry.lock -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/pyproject.toml -------------------------------------------------------------------------------- /readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/readme.md -------------------------------------------------------------------------------- /related-works.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/related-works.md -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/setup.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/__init__.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/dspy_program.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/dspy_program.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/dspy_signatures.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/dspy_signatures.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/fstring_program.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/fstring_program.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/fstring_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/fstring_prompts.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/modal_vllm_outlines/download_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/modal_vllm_outlines/download_llama.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/modal_vllm_outlines/modal_web_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/modal_vllm_outlines/modal_web_server.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/modal_vllm_outlines/quick_setup_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/modal_vllm_outlines/quick_setup_test.py -------------------------------------------------------------------------------- /structured_rag/mock_gfl/modal_vllm_outlines/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/modal_vllm_outlines/readme.md -------------------------------------------------------------------------------- /structured_rag/mock_gfl/modal_vllm_outlines/setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/modal_vllm_outlines/setup.sh -------------------------------------------------------------------------------- /structured_rag/mock_gfl/modal_vllm_outlines/vllm_outlines_setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/mock_gfl/modal_vllm_outlines/vllm_outlines_setup.py -------------------------------------------------------------------------------- /structured_rag/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/models.py -------------------------------------------------------------------------------- /structured_rag/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/readme.md -------------------------------------------------------------------------------- /structured_rag/run_test/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /structured_rag/run_test/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/readme.md -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/aggregate_result_jsons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/aggregate_result_jsons.py -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/boxplot_success_rates_per_model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/boxplot_success_rates_per_model.png -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/boxplot_success_rates_per_task.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/boxplot_success_rates_per_task.png -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/compute_averages.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/compute_averages.py -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/dspy_error_analysis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/dspy_error_analysis.py -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/new_aggregate_result_jsons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/new_aggregate_result_jsons.py -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/success_rate_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/success_rate_heatmap.png -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/success_rates.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/success_rates.png -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/success_rates_per_test.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/success_rates_per_test.png -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/visualize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/visualize.py -------------------------------------------------------------------------------- /structured_rag/run_test/result_visualization/visualize_single_result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/result_visualization/visualize_single_result.py -------------------------------------------------------------------------------- /structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-dspy_NO_OPRO_JSON.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-dspy_NO_OPRO_JSON.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-dspy_WITH_OPRO_JSON.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-dspy_WITH_OPRO_JSON.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-fstring_with_structured_outputs.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-fstring_with_structured_outputs.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-fstring_without_structured_outputs.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/10-6-24/AssessAnswerability-gpt-4o-2024-08-06-fstring_without_structured_outputs.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/9-26-24/AssessAnswerability-llama3.2:3b-instruct-fp16-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/9-26-24/AssessAnswerability-llama3.2:3b-instruct-fp16-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/9-26-24/AssessAnswerability-llama3.2:3b-instruct-fp16-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/9-26-24/AssessAnswerability-llama3.2:3b-instruct-fp16-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/AssessAnswerability-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/AssessAnswerability-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/AssessAnswerability-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/AssessAnswerability-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswer-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswer-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswer-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswer-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/ParaphraseQuestions-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/ParaphraseQuestions-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/ParaphraseQuestions-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/ParaphraseQuestions-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RAGAS-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RAGAS-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RAGAS-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RAGAS-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RateContext-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RateContext-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RateContext-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/Gemini-1.5-Pro-9-11-24/RateContext-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/batch-9-13-24/AssessAnswerability-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/batch-9-13-24/AssessAnswerability-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/batch-9-13-24/GenerateAnswer-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/batch-9-13-24/GenerateAnswer-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/batch-9-13-24/GenerateAnswerWithConfidence-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/batch-9-13-24/GenerateAnswerWithConfidence-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/batch-9-13-24/GenerateAnswersWithConfidence-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/batch-9-13-24/GenerateAnswersWithConfidence-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/batch-9-13-24/ParaphraseQuestions-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/batch-9-13-24/ParaphraseQuestions-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/batch-9-13-24/RAGAS-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/batch-9-13-24/RAGAS-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/batch-9-13-24/RateContext-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/batch-9-13-24/RateContext-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/aggregated_results-8-26-24.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/aggregated_results-8-26-24.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/model_comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/model_comparison.png -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/model_comparison_results-trial-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/model_comparison_results-trial-1.png -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/model_comparison_results-trial-2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/model_comparison_results-trial-2.png -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/AssessAnswerability-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/AssessAnswerability-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/AssessAnswerability-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/AssessAnswerability-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswer-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswer-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswer-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswer-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswerWithConfidence-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswerWithConfidence-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswerWithConfidence-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswerWithConfidence-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswersWithConfidence-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswersWithConfidence-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswersWithConfidence-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/GenerateAnswersWithConfidence-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/ParaphraseQuestions-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/ParaphraseQuestions-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/ParaphraseQuestions-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/ParaphraseQuestions-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/RateContext-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/RateContext-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-1/RateContext-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-1/RateContext-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/AssessAnswerability-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/AssessAnswerability-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/AssessAnswerability-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/AssessAnswerability-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswer-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswer-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswer-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswer-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswerWithConfidence-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswerWithConfidence-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswerWithConfidence-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswerWithConfidence-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswersWithConfidence-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswersWithConfidence-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswersWithConfidence-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/GenerateAnswersWithConfidence-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/ParaphraseQuestions-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/ParaphraseQuestions-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/ParaphraseQuestions-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/ParaphraseQuestions-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/RateContext-gemini-1.5-pro.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/RateContext-gemini-1.5-pro.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-8-26-24/trial-2/RateContext-llama3:instruct.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-8-26-24/trial-2/RateContext-llama3:instruct.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-claude-3-5-sonnet-20240620-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-claude-3-5-sonnet-20240620-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-claude-3-5-sonnet-20240620-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-claude-3-5-sonnet-20240620-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gpt-4o-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gpt-4o-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gpt-4o-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-gpt-4o-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/AssessAnswerability-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-claude-3-5-sonnet-20240620-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-claude-3-5-sonnet-20240620-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-claude-3-5-sonnet-20240620-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-claude-3-5-sonnet-20240620-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gpt-4o-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gpt-4o-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gpt-4o-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-gpt-4o-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswer-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-claude-3-5-sonnet-20240620-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-claude-3-5-sonnet-20240620-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-claude-3-5-sonnet-20240620-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-claude-3-5-sonnet-20240620-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gpt-4o-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gpt-4o-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gpt-4o-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-gpt-4o-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswerWithConfidence-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-claude-3-5-sonnet-20240620-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-claude-3-5-sonnet-20240620-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-claude-3-5-sonnet-20240620-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-claude-3-5-sonnet-20240620-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gpt-4o-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gpt-4o-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gpt-4o-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-gpt-4o-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/GenerateAnswersWithConfidence-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-claude-3-5-sonnet-20240620-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-claude-3-5-sonnet-20240620-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-claude-3-5-sonnet-20240620-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-claude-3-5-sonnet-20240620-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gpt-4o-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gpt-4o-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gpt-4o-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-gpt-4o-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/ParaphraseQuestions-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-claude-3-5-sonnet-20240620-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-claude-3-5-sonnet-20240620-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-claude-3-5-sonnet-20240620-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-claude-3-5-sonnet-20240620-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gpt-4o-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gpt-4o-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gpt-4o-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-gpt-4o-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RAGAS-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-claude-3-5-sonnet-20240620-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-claude-3-5-sonnet-20240620-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-claude-3-5-sonnet-20240620-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-claude-3-5-sonnet-20240620-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gemini-1.5-pro-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gemini-1.5-pro-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gemini-1.5-pro-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gemini-1.5-pro-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gpt-4o-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gpt-4o-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gpt-4o-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-gpt-4o-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/experimental-results-9-11-24/RateContext-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/experimental-results-9-11-24/RateContext-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-dspy_NO_OPRO_JSON-2024-11-29.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-dspy_NO_OPRO_JSON-2024-11-29.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-dspy_WITH_OPRO_JSON-2024-11-29.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-dspy_WITH_OPRO_JSON-2024-11-29.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-fstring_with_structured_outputs-2024-11-29.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-fstring_with_structured_outputs-2024-11-29.json -------------------------------------------------------------------------------- /structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-fstring_without_structured_outputs-2024-11-29.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/results/results/AssessAnswerability-gpt-4o-fstring_without_structured_outputs-2024-11-29.json -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/experiment-log.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/experiment-log.md -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/results/9-25-24/AssessAnswerability-llama3:instruct-dspy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/results/9-25-24/AssessAnswerability-llama3:instruct-dspy.json -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/results/9-25-24/AssessAnswerability-llama3:instruct-fstring.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/results/9-25-24/AssessAnswerability-llama3:instruct-fstring.json -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/results/AssessAnswerability-BATCH-llama3-8b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/results/AssessAnswerability-BATCH-llama3-8b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/results/ClassifyDocumentWithRationale-Modal-vLLM.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/results/ClassifyDocumentWithRationale-Modal-vLLM.json -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/results/GenerateAnswer-BATCH-llama3.2-1b-instruct-Modal.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/results/GenerateAnswer-BATCH-llama3.2-1b-instruct-Modal.json -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/run_batch_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/run_batch_test.py -------------------------------------------------------------------------------- /structured_rag/run_test/run_scripts/run_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/run_scripts/run_test.py -------------------------------------------------------------------------------- /structured_rag/run_test/utils_and_metrics/__pycache__/helpers.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/utils_and_metrics/__pycache__/helpers.cpython-310.pyc -------------------------------------------------------------------------------- /structured_rag/run_test/utils_and_metrics/__pycache__/metrics.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/utils_and_metrics/__pycache__/metrics.cpython-310.pyc -------------------------------------------------------------------------------- /structured_rag/run_test/utils_and_metrics/count-tokens.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/utils_and_metrics/count-tokens.py -------------------------------------------------------------------------------- /structured_rag/run_test/utils_and_metrics/helpers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/utils_and_metrics/helpers.py -------------------------------------------------------------------------------- /structured_rag/run_test/utils_and_metrics/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/structured_rag/run_test/utils_and_metrics/metrics.py -------------------------------------------------------------------------------- /test-cost.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/weaviate/structured-rag/HEAD/test-cost.md --------------------------------------------------------------------------------