├── .gitattributes ├── .gitignore ├── LICENSE ├── README.md ├── all_results.md ├── data ├── 42dot │ └── 42dot_LLM-SFT-1.3B │ │ ├── alpaca-eval-ko.json │ │ ├── alpaca-eval-ko_helpful.json │ │ ├── gpt4evol.json │ │ ├── gpt4evol.json_helpful.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ ├── ko-ethical-questions.json_safety.json │ │ ├── ko-ethical-questions_helpful.json │ │ ├── pku-saferlhf-ko.json │ │ ├── pku-saferlhf-ko.json_safety.json │ │ └── pku-saferlhf-ko_helpful.json ├── GT │ ├── alpaca-eval-ko_helpful.json │ ├── gpt4evol_helpful.json │ └── ko-ethical-questions_safety.json ├── KT-AI │ └── midm-bitext-S-7B-inst-v1 │ │ ├── alpaca-eval-ko.json │ │ ├── alpaca-eval-ko_helpful.json │ │ ├── gpt4evol.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ ├── ko-ethical-questions_helpful.json │ │ └── ko-ethical-questions_safety.json ├── beomi │ ├── KoAlpaca-Polyglot-12.8B │ │ ├── gpt4evol.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ ├── ko-ethical-questions_helpful.json │ │ └── ko-ethical-questions_safety.json │ └── KoAlpaca-Polyglot-5.8B │ │ ├── alpaca-eval-ko.json │ │ └── alpaca-eval-ko_helpful.json ├── gemma-2b-it │ ├── alpaca-eval-ko.json │ ├── alpaca-eval-ko_helpful.json │ ├── ko-ethical-questions.json │ └── ko-ethical-questions_safety.json ├── gemma-7b-it │ ├── alpaca-eval-ko.json │ ├── alpaca-eval-ko_helpful.json │ ├── ko-ethical-questions.json │ └── ko-ethical-questions_safety.json ├── heegyu │ ├── 42dot-SFT-DPO-v0.1-steps-126664 │ │ ├── gpt4evol.json │ │ ├── gpt4evol.json_helpful.json │ │ ├── ko-ethical-questions.json │ │ ├── ko-ethical-questions.json_safety.json │ │ ├── pku-saferlhf-ko.json │ │ └── pku-saferlhf-ko.json_safety.json │ ├── 42dot-SFT-DPO-v0.1-steps-189996 │ │ ├── gpt4evol.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ └── ko-ethical-questions_safety.json │ ├── 42dot-SFT-DPO-v0.1-steps-253328 │ │ ├── gpt4evol.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ └── ko-ethical-questions_safety.json │ ├── 42dot-SFT-DPO-v0.1-steps-63332 │ │ ├── gpt4evol.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ └── ko-ethical-questions_safety.json │ └── Yi-ko-6B-OKI-v20231124-2e-5-epoch-1 │ │ ├── gpt4evol.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ └── ko-ethical-questions_safety.json ├── hyeogi │ └── Yi-6b-dpo-v0.2 │ │ ├── gpt4evol.json │ │ └── ko-ethical-questions.json ├── kfkas │ └── Llama-2-ko-7b-Chat │ │ ├── alpaca-eval-ko.json │ │ └── alpaca-eval-ko_helpful.json ├── logicker │ └── SkkuDataScience-10.7B-v5 │ │ └── gpt4evol.json ├── maywell │ └── Synatra-Yi-Ko-6B │ │ ├── alpaca-eval-ko.json │ │ ├── alpaca-eval-ko_helpful.json │ │ ├── gpt4evol.json │ │ ├── gpt4evol_helpful.json │ │ ├── ko-ethical-questions.json │ │ └── ko-ethical-questions_safety.json └── nlpai-lab │ ├── kullm-polyglot-12.8b-v3 │ ├── alpaca-eval-ko.json │ ├── alpaca-eval-ko_helpful.json │ ├── gpt4evol.json │ ├── gpt4evol_helpful.json │ ├── ko-ethical-questions.json │ └── ko-ethical-questions_safety.json │ └── kullm-polyglot-5.8b-v2 │ ├── alpaca-eval-ko.json │ ├── alpaca-eval-ko_helpful.json │ ├── gpt4evol.json │ ├── gpt4evol_helpful.json │ ├── ko-ethical-questions.json │ ├── ko-ethical-questions_helpful.json │ └── ko-ethical-questions_safety.json ├── eval.py ├── eval_batch.py ├── eval_gt.py ├── generate.py ├── heegyu └── Yi-ko-6B-OKI-v20231124-2e-5-epoch-1 │ ├── gpt4evol.json │ ├── gpt4evol_helpful.json │ ├── ko-ethical-questions.json │ └── ko-ethical-questions_safety.json ├── img ├── llama_evaluator.jpeg └── llama_judge.jpeg ├── make_md.py ├── prompt_templates.py ├── question_datasets.py ├── requirements.txt └── script ├── 42dot-dpo.sh ├── 42dot.sh ├── README.md ├── alpacaeval.sh ├── eval_batch.sh ├── eval_gt.sh ├── gemma.sh ├── heegyu-yi-ko.sh ├── hyeogi-Yi-6b-dpo-v0.2.sh ├── koalpaca.sh ├── kullm.sh ├── midm.sh ├── skkuds.sh └── synatra.sh /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/.gitattributes -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/README.md -------------------------------------------------------------------------------- /all_results.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/all_results.md -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/gpt4evol.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/gpt4evol.json_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/gpt4evol.json_helpful.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/ko-ethical-questions.json_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/ko-ethical-questions.json_safety.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/ko-ethical-questions_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/ko-ethical-questions_helpful.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/pku-saferlhf-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/pku-saferlhf-ko.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/pku-saferlhf-ko.json_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/pku-saferlhf-ko.json_safety.json -------------------------------------------------------------------------------- /data/42dot/42dot_LLM-SFT-1.3B/pku-saferlhf-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/42dot/42dot_LLM-SFT-1.3B/pku-saferlhf-ko_helpful.json -------------------------------------------------------------------------------- /data/GT/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/GT/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/GT/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/GT/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/GT/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/GT/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/KT-AI/midm-bitext-S-7B-inst-v1/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/KT-AI/midm-bitext-S-7B-inst-v1/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/KT-AI/midm-bitext-S-7B-inst-v1/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/KT-AI/midm-bitext-S-7B-inst-v1/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/KT-AI/midm-bitext-S-7B-inst-v1/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/KT-AI/midm-bitext-S-7B-inst-v1/gpt4evol.json -------------------------------------------------------------------------------- /data/KT-AI/midm-bitext-S-7B-inst-v1/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/KT-AI/midm-bitext-S-7B-inst-v1/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/KT-AI/midm-bitext-S-7B-inst-v1/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/KT-AI/midm-bitext-S-7B-inst-v1/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/KT-AI/midm-bitext-S-7B-inst-v1/ko-ethical-questions_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/KT-AI/midm-bitext-S-7B-inst-v1/ko-ethical-questions_helpful.json -------------------------------------------------------------------------------- /data/KT-AI/midm-bitext-S-7B-inst-v1/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/KT-AI/midm-bitext-S-7B-inst-v1/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/beomi/KoAlpaca-Polyglot-12.8B/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/beomi/KoAlpaca-Polyglot-12.8B/gpt4evol.json -------------------------------------------------------------------------------- /data/beomi/KoAlpaca-Polyglot-12.8B/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/beomi/KoAlpaca-Polyglot-12.8B/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/beomi/KoAlpaca-Polyglot-12.8B/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/beomi/KoAlpaca-Polyglot-12.8B/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/beomi/KoAlpaca-Polyglot-12.8B/ko-ethical-questions_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/beomi/KoAlpaca-Polyglot-12.8B/ko-ethical-questions_helpful.json -------------------------------------------------------------------------------- /data/beomi/KoAlpaca-Polyglot-12.8B/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/beomi/KoAlpaca-Polyglot-12.8B/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/beomi/KoAlpaca-Polyglot-5.8B/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/beomi/KoAlpaca-Polyglot-5.8B/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/beomi/KoAlpaca-Polyglot-5.8B/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/beomi/KoAlpaca-Polyglot-5.8B/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/gemma-2b-it/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-2b-it/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/gemma-2b-it/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-2b-it/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/gemma-2b-it/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-2b-it/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/gemma-2b-it/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-2b-it/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/gemma-7b-it/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-7b-it/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/gemma-7b-it/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-7b-it/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/gemma-7b-it/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-7b-it/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/gemma-7b-it/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/gemma-7b-it/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/gpt4evol.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/gpt4evol.json_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/gpt4evol.json_helpful.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/ko-ethical-questions.json_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/ko-ethical-questions.json_safety.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/pku-saferlhf-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/pku-saferlhf-ko.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/pku-saferlhf-ko.json_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-126664/pku-saferlhf-ko.json_safety.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/gpt4evol.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-189996/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/gpt4evol.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-253328/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/gpt4evol.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/42dot-SFT-DPO-v0.1-steps-63332/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol.json -------------------------------------------------------------------------------- /data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/hyeogi/Yi-6b-dpo-v0.2/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/hyeogi/Yi-6b-dpo-v0.2/gpt4evol.json -------------------------------------------------------------------------------- /data/hyeogi/Yi-6b-dpo-v0.2/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/hyeogi/Yi-6b-dpo-v0.2/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/kfkas/Llama-2-ko-7b-Chat/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/kfkas/Llama-2-ko-7b-Chat/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/kfkas/Llama-2-ko-7b-Chat/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/kfkas/Llama-2-ko-7b-Chat/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/logicker/SkkuDataScience-10.7B-v5/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/logicker/SkkuDataScience-10.7B-v5/gpt4evol.json -------------------------------------------------------------------------------- /data/maywell/Synatra-Yi-Ko-6B/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/maywell/Synatra-Yi-Ko-6B/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/maywell/Synatra-Yi-Ko-6B/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/maywell/Synatra-Yi-Ko-6B/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/maywell/Synatra-Yi-Ko-6B/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/maywell/Synatra-Yi-Ko-6B/gpt4evol.json -------------------------------------------------------------------------------- /data/maywell/Synatra-Yi-Ko-6B/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/maywell/Synatra-Yi-Ko-6B/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/maywell/Synatra-Yi-Ko-6B/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/maywell/Synatra-Yi-Ko-6B/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/maywell/Synatra-Yi-Ko-6B/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/maywell/Synatra-Yi-Ko-6B/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-12.8b-v3/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-12.8b-v3/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-12.8b-v3/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-12.8b-v3/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-12.8b-v3/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-12.8b-v3/gpt4evol.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-12.8b-v3/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-12.8b-v3/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-12.8b-v3/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-12.8b-v3/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-12.8b-v3/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-12.8b-v3/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-5.8b-v2/alpaca-eval-ko.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-5.8b-v2/alpaca-eval-ko.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-5.8b-v2/alpaca-eval-ko_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-5.8b-v2/alpaca-eval-ko_helpful.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-5.8b-v2/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-5.8b-v2/gpt4evol.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-5.8b-v2/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-5.8b-v2/gpt4evol_helpful.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-5.8b-v2/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-5.8b-v2/ko-ethical-questions.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-5.8b-v2/ko-ethical-questions_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-5.8b-v2/ko-ethical-questions_helpful.json -------------------------------------------------------------------------------- /data/nlpai-lab/kullm-polyglot-5.8b-v2/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/data/nlpai-lab/kullm-polyglot-5.8b-v2/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/eval.py -------------------------------------------------------------------------------- /eval_batch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/eval_batch.py -------------------------------------------------------------------------------- /eval_gt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/eval_gt.py -------------------------------------------------------------------------------- /generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/generate.py -------------------------------------------------------------------------------- /heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol.json -------------------------------------------------------------------------------- /heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol_helpful.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/gpt4evol_helpful.json -------------------------------------------------------------------------------- /heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions.json -------------------------------------------------------------------------------- /heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions_safety.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/heegyu/Yi-ko-6B-OKI-v20231124-2e-5-epoch-1/ko-ethical-questions_safety.json -------------------------------------------------------------------------------- /img/llama_evaluator.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/img/llama_evaluator.jpeg -------------------------------------------------------------------------------- /img/llama_judge.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/img/llama_judge.jpeg -------------------------------------------------------------------------------- /make_md.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/make_md.py -------------------------------------------------------------------------------- /prompt_templates.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/prompt_templates.py -------------------------------------------------------------------------------- /question_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/question_datasets.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | fire 2 | transformers 3 | datasets 4 | jsonlines -------------------------------------------------------------------------------- /script/42dot-dpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/42dot-dpo.sh -------------------------------------------------------------------------------- /script/42dot.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/42dot.sh -------------------------------------------------------------------------------- /script/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/README.md -------------------------------------------------------------------------------- /script/alpacaeval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/alpacaeval.sh -------------------------------------------------------------------------------- /script/eval_batch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/eval_batch.sh -------------------------------------------------------------------------------- /script/eval_gt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/eval_gt.sh -------------------------------------------------------------------------------- /script/gemma.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/gemma.sh -------------------------------------------------------------------------------- /script/heegyu-yi-ko.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/heegyu-yi-ko.sh -------------------------------------------------------------------------------- /script/hyeogi-Yi-6b-dpo-v0.2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/hyeogi-Yi-6b-dpo-v0.2.sh -------------------------------------------------------------------------------- /script/koalpaca.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/koalpaca.sh -------------------------------------------------------------------------------- /script/kullm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/kullm.sh -------------------------------------------------------------------------------- /script/midm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/midm.sh -------------------------------------------------------------------------------- /script/skkuds.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/skkuds.sh -------------------------------------------------------------------------------- /script/synatra.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/HeegyuKim/ko-rm-judge/HEAD/script/synatra.sh --------------------------------------------------------------------------------