├── .DS_Store ├── .gitignore ├── LICENSE ├── README.md ├── data └── sample │ ├── round_1.json │ ├── round_2.json │ ├── round_3.json │ └── round_4.json ├── index.html ├── media ├── banner.png ├── baseline_comparison.png ├── combined_em_score_plots.png ├── dice_band.png ├── dice_score.png ├── multi_round.png ├── pipeline.png ├── results.png ├── single_round_four_parties.png └── tool_graph.png ├── outputs ├── all_rounds │ ├── round_1.json │ └── round_2.json ├── inf_vllm │ └── llama_3_2_3b_instruct │ │ ├── llama_3_2_3b_instruct_round_1.json │ │ ├── llama_3_2_3b_instruct_round_2.json │ │ ├── llama_3_2_3b_instruct_round_3.json │ │ └── llama_3_2_3b_instruct_round_4.json └── selected_round │ └── round_4.json ├── pyproject.toml ├── scripts ├── gen_all_round.sh ├── gen_selected_round.sh └── inf_vllm.sh ├── src ├── __init__.py ├── agent │ └── base.py ├── colorlog.py ├── config.py ├── get_dice_score.py ├── graph │ ├── sample_subgraph.py │ ├── tool_docs.json │ ├── tool_graph.json │ ├── utils.py │ └── visualize_graph.py ├── inference │ ├── __init__.py │ ├── inference_vllm.py │ └── utils.py ├── main.py ├── prompt │ ├── base.py │ ├── domain_prompt.py │ └── inference_prompt.py ├── utils │ ├── few_shot_params.py │ └── utils.py └── validation │ ├── main.py │ ├── prompt │ ├── Coherence.txt │ ├── Dialogue_Consistency.txt │ ├── Eristic.txt │ ├── Fluency.txt │ ├── Humanness.txt │ ├── Inquiry_and_Information_Seeking.txt │ ├── Persona_Consistency.txt │ ├── Persuassion_Deliberation_and_Negotiation.txt │ └── Relevance.txt │ ├── rule_based_val.ipynb │ └── utils.py ├── static ├── css │ ├── bulma-carousel.min.css │ ├── bulma-slider.min.css │ ├── bulma.css.map.txt │ ├── bulma.min.css │ ├── fontawesome.all.min.css │ └── index.css ├── images │ ├── LinkedIn_icon.svg │ ├── favicon.ico │ ├── github-mark.svg │ ├── huggingface_logo-noborder.svg │ └── x_logo.png └── js │ ├── bulma-carousel.js │ ├── bulma-carousel.min.js │ ├── bulma-slider.js │ ├── bulma-slider.min.js │ ├── fontawesome.all.min.js │ └── index.js └── uv.lock /.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/.DS_Store -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/README.md -------------------------------------------------------------------------------- /data/sample/round_1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/data/sample/round_1.json -------------------------------------------------------------------------------- /data/sample/round_2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/data/sample/round_2.json -------------------------------------------------------------------------------- /data/sample/round_3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/data/sample/round_3.json -------------------------------------------------------------------------------- /data/sample/round_4.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/data/sample/round_4.json -------------------------------------------------------------------------------- /index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/index.html -------------------------------------------------------------------------------- /media/banner.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/banner.png -------------------------------------------------------------------------------- /media/baseline_comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/baseline_comparison.png -------------------------------------------------------------------------------- /media/combined_em_score_plots.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/combined_em_score_plots.png -------------------------------------------------------------------------------- /media/dice_band.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/dice_band.png -------------------------------------------------------------------------------- /media/dice_score.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/dice_score.png -------------------------------------------------------------------------------- /media/multi_round.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/multi_round.png -------------------------------------------------------------------------------- /media/pipeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/pipeline.png -------------------------------------------------------------------------------- /media/results.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/results.png -------------------------------------------------------------------------------- /media/single_round_four_parties.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/single_round_four_parties.png -------------------------------------------------------------------------------- /media/tool_graph.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/media/tool_graph.png -------------------------------------------------------------------------------- /outputs/all_rounds/round_1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/outputs/all_rounds/round_1.json -------------------------------------------------------------------------------- /outputs/all_rounds/round_2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/outputs/all_rounds/round_2.json -------------------------------------------------------------------------------- /outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_1.json -------------------------------------------------------------------------------- /outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_2.json -------------------------------------------------------------------------------- /outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_3.json -------------------------------------------------------------------------------- /outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_4.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/outputs/inf_vllm/llama_3_2_3b_instruct/llama_3_2_3b_instruct_round_4.json -------------------------------------------------------------------------------- /outputs/selected_round/round_4.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/outputs/selected_round/round_4.json -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/pyproject.toml -------------------------------------------------------------------------------- /scripts/gen_all_round.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/scripts/gen_all_round.sh -------------------------------------------------------------------------------- /scripts/gen_selected_round.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/scripts/gen_selected_round.sh -------------------------------------------------------------------------------- /scripts/inf_vllm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/scripts/inf_vllm.sh -------------------------------------------------------------------------------- /src/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/agent/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/agent/base.py -------------------------------------------------------------------------------- /src/colorlog.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/colorlog.py -------------------------------------------------------------------------------- /src/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/config.py -------------------------------------------------------------------------------- /src/get_dice_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/get_dice_score.py -------------------------------------------------------------------------------- /src/graph/sample_subgraph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/graph/sample_subgraph.py -------------------------------------------------------------------------------- /src/graph/tool_docs.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/graph/tool_docs.json -------------------------------------------------------------------------------- /src/graph/tool_graph.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/graph/tool_graph.json -------------------------------------------------------------------------------- /src/graph/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/graph/utils.py -------------------------------------------------------------------------------- /src/graph/visualize_graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/graph/visualize_graph.py -------------------------------------------------------------------------------- /src/inference/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/inference/inference_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/inference/inference_vllm.py -------------------------------------------------------------------------------- /src/inference/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/inference/utils.py -------------------------------------------------------------------------------- /src/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/main.py -------------------------------------------------------------------------------- /src/prompt/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/prompt/base.py -------------------------------------------------------------------------------- /src/prompt/domain_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/prompt/domain_prompt.py -------------------------------------------------------------------------------- /src/prompt/inference_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/prompt/inference_prompt.py -------------------------------------------------------------------------------- /src/utils/few_shot_params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/utils/few_shot_params.py -------------------------------------------------------------------------------- /src/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/utils/utils.py -------------------------------------------------------------------------------- /src/validation/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/main.py -------------------------------------------------------------------------------- /src/validation/prompt/Coherence.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Coherence.txt -------------------------------------------------------------------------------- /src/validation/prompt/Dialogue_Consistency.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Dialogue_Consistency.txt -------------------------------------------------------------------------------- /src/validation/prompt/Eristic.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Eristic.txt -------------------------------------------------------------------------------- /src/validation/prompt/Fluency.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Fluency.txt -------------------------------------------------------------------------------- /src/validation/prompt/Humanness.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Humanness.txt -------------------------------------------------------------------------------- /src/validation/prompt/Inquiry_and_Information_Seeking.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Inquiry_and_Information_Seeking.txt -------------------------------------------------------------------------------- /src/validation/prompt/Persona_Consistency.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Persona_Consistency.txt -------------------------------------------------------------------------------- /src/validation/prompt/Persuassion_Deliberation_and_Negotiation.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Persuassion_Deliberation_and_Negotiation.txt -------------------------------------------------------------------------------- /src/validation/prompt/Relevance.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/prompt/Relevance.txt -------------------------------------------------------------------------------- /src/validation/rule_based_val.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/rule_based_val.ipynb -------------------------------------------------------------------------------- /src/validation/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/src/validation/utils.py -------------------------------------------------------------------------------- /static/css/bulma-carousel.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/css/bulma-carousel.min.css -------------------------------------------------------------------------------- /static/css/bulma-slider.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/css/bulma-slider.min.css -------------------------------------------------------------------------------- /static/css/bulma.css.map.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/css/bulma.css.map.txt -------------------------------------------------------------------------------- /static/css/bulma.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/css/bulma.min.css -------------------------------------------------------------------------------- /static/css/fontawesome.all.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/css/fontawesome.all.min.css -------------------------------------------------------------------------------- /static/css/index.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/css/index.css -------------------------------------------------------------------------------- /static/images/LinkedIn_icon.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/images/LinkedIn_icon.svg -------------------------------------------------------------------------------- /static/images/favicon.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/images/favicon.ico -------------------------------------------------------------------------------- /static/images/github-mark.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/images/github-mark.svg -------------------------------------------------------------------------------- /static/images/huggingface_logo-noborder.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/images/huggingface_logo-noborder.svg -------------------------------------------------------------------------------- /static/images/x_logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/images/x_logo.png -------------------------------------------------------------------------------- /static/js/bulma-carousel.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/js/bulma-carousel.js -------------------------------------------------------------------------------- /static/js/bulma-carousel.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/js/bulma-carousel.min.js -------------------------------------------------------------------------------- /static/js/bulma-slider.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/js/bulma-slider.js -------------------------------------------------------------------------------- /static/js/bulma-slider.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/js/bulma-slider.min.js -------------------------------------------------------------------------------- /static/js/fontawesome.all.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/js/fontawesome.all.min.js -------------------------------------------------------------------------------- /static/js/index.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/static/js/index.js -------------------------------------------------------------------------------- /uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/snuhcc/DICE-Bench/HEAD/uv.lock --------------------------------------------------------------------------------