├── .gitignore ├── .gitmodules ├── Cerebras-Dragon-DocChat ├── README.md ├── convert_embedding_checkpoint.py ├── create_train_dataset.py ├── dragon_converter.py ├── embedding_eval │ ├── README.md │ ├── arguments.py │ ├── dataset.py │ └── evaluate.py ├── example_usage │ ├── main.py │ ├── sample_document_1.md │ └── sample_document_2.md ├── train.sh └── train_configs │ └── params_train.yaml ├── Cerebras-Llama3-DocChat ├── README.md ├── cerebras_datasets │ ├── download.sh │ └── numina_math_cot.yaml ├── chatrag_eval │ ├── README.md │ ├── arguments.py │ ├── dataset.py │ ├── eval_all.sh │ ├── evaluation_utils.py │ ├── get_scores.py │ ├── metrics.py │ └── run_generation_vllm.py ├── convert_llm_checkpoint.py ├── create_train_dataset.py ├── example_usage │ ├── main.py │ └── sample_document.md ├── train.sh └── train_configs │ ├── stage_1.yaml │ └── stage_2.yaml ├── README.md ├── SkgInstruct └── download.sh └── setup.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/.gitmodules -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/README.md -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/convert_embedding_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/convert_embedding_checkpoint.py -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/create_train_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/create_train_dataset.py -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/dragon_converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/dragon_converter.py -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/embedding_eval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/embedding_eval/README.md -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/embedding_eval/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/embedding_eval/arguments.py -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/embedding_eval/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/embedding_eval/dataset.py -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/embedding_eval/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/embedding_eval/evaluate.py -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/example_usage/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/example_usage/main.py -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/example_usage/sample_document_1.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/example_usage/sample_document_1.md -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/example_usage/sample_document_2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/example_usage/sample_document_2.md -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/train.sh -------------------------------------------------------------------------------- /Cerebras-Dragon-DocChat/train_configs/params_train.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Dragon-DocChat/train_configs/params_train.yaml -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/README.md -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/cerebras_datasets/download.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/cerebras_datasets/download.sh -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/cerebras_datasets/numina_math_cot.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/cerebras_datasets/numina_math_cot.yaml -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/README.md -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/arguments.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/dataset.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/eval_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/eval_all.sh -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/evaluation_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/evaluation_utils.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/get_scores.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/get_scores.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/metrics.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/chatrag_eval/run_generation_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/chatrag_eval/run_generation_vllm.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/convert_llm_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/convert_llm_checkpoint.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/create_train_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/create_train_dataset.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/example_usage/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/example_usage/main.py -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/example_usage/sample_document.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/example_usage/sample_document.md -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/train.sh -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/train_configs/stage_1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/train_configs/stage_1.yaml -------------------------------------------------------------------------------- /Cerebras-Llama3-DocChat/train_configs/stage_2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/Cerebras-Llama3-DocChat/train_configs/stage_2.yaml -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/README.md -------------------------------------------------------------------------------- /SkgInstruct/download.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/SkgInstruct/download.sh -------------------------------------------------------------------------------- /setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Cerebras/DocChat/HEAD/setup.sh --------------------------------------------------------------------------------