├── .DS_Store ├── LICENSE ├── README.md ├── configs ├── .DS_Store ├── axolotl │ ├── axolotl-train-qwen2-7b-wildchat-250k-llama31-8b.sbatch │ ├── rewild-sft.yaml │ └── wildchat-250k-llama31-8b.yaml └── open-instruct │ ├── dpo-qwen2572b-athene70b-jdg-Llama3-Factuality-AllenAI-fmt-dpo-8b.yaml │ └── open-instruct-train-dpo-qal3f.sbatch ├── model_responses ├── .DS_Store ├── judged │ └── qwen-2.5-72b-resps │ │ ├── 100.html │ │ ├── 101.html │ │ ├── 102.html │ │ ├── 103.html │ │ ├── 104.html │ │ ├── 105.html │ │ ├── 106.html │ │ ├── 107.html │ │ ├── 108.html │ │ ├── 109.html │ │ ├── 110.html │ │ ├── 111.html │ │ ├── 112.html │ │ ├── 113.html │ │ ├── 114.html │ │ ├── 115.html │ │ ├── 116.html │ │ ├── 117.html │ │ ├── 118.html │ │ ├── 119.html │ │ ├── 120.html │ │ ├── 121.html │ │ ├── 122.html │ │ ├── 123.html │ │ ├── 124.html │ │ ├── 125.html │ │ ├── 126.html │ │ ├── 127.html │ │ ├── 128.html │ │ ├── 129.html │ │ ├── 130.html │ │ ├── 131.html │ │ ├── 132.html │ │ ├── 133.html │ │ ├── 134.html │ │ ├── 135.html │ │ ├── 136.html │ │ ├── 137.html │ │ ├── 138.html │ │ ├── 139.html │ │ ├── 140.html │ │ ├── 141.html │ │ ├── 142.html │ │ ├── 143.html │ │ ├── 144.html │ │ ├── 145.html │ │ ├── 146.html │ │ ├── 147.html │ │ ├── 148.html │ │ ├── 149.html │ │ ├── 150.html │ │ ├── 151.html │ │ ├── 152.html │ │ ├── 153.html │ │ ├── 154.html │ │ ├── 155.html │ │ ├── 156.html │ │ ├── 157.html │ │ ├── 158.html │ │ ├── 159.html │ │ ├── 160.html │ │ ├── 81.html │ │ ├── 82.html │ │ ├── 83.html │ │ ├── 84.html │ │ ├── 85.html │ │ ├── 86.html │ │ ├── 87.html │ │ ├── 88.html │ │ ├── 89.html │ │ ├── 90.html │ │ ├── 91.html │ │ ├── 92.html │ │ ├── 93.html │ │ ├── 94.html │ │ ├── 95.html │ │ ├── 96.html │ │ ├── 97.html │ │ ├── 98.html │ │ └── 99.html └── pairwise │ ├── .DS_Store │ └── llama3.3-qwen2.5-comparison │ ├── comparison_105698.html │ ├── comparison_105717.html │ ├── comparison_109076.html │ ├── comparison_109944.html │ ├── comparison_112014.html │ ├── comparison_11250.html │ ├── comparison_114658.html │ ├── comparison_117364.html │ ├── comparison_11960.html │ ├── comparison_122729.html │ ├── comparison_123953.html │ ├── comparison_127758.html │ ├── comparison_130789.html │ ├── comparison_130823.html │ ├── comparison_132088.html │ ├── comparison_133033.html │ ├── comparison_133040.html │ ├── comparison_134263.html │ ├── comparison_138860.html │ ├── comparison_139963.html │ ├── comparison_1411.html │ ├── comparison_141145.html │ ├── comparison_14605.html │ ├── comparison_14607.html │ ├── comparison_148423.html │ ├── comparison_150942.html │ ├── comparison_152118.html │ ├── comparison_152965.html │ ├── comparison_15602.html │ ├── comparison_156220.html │ ├── comparison_156524.html │ ├── comparison_156967.html │ ├── comparison_156988.html │ ├── comparison_158549.html │ ├── comparison_158764.html │ ├── comparison_159381.html │ ├── comparison_159668.html │ ├── comparison_160096.html │ ├── comparison_163591.html │ ├── comparison_16853.html │ ├── comparison_172794.html │ ├── comparison_17477.html │ ├── comparison_175185.html │ ├── comparison_177760.html │ ├── comparison_178692.html │ ├── comparison_181887.html │ ├── comparison_184524.html │ ├── comparison_184769.html │ ├── comparison_186268.html │ ├── comparison_186967.html │ ├── comparison_190331.html │ ├── comparison_202475.html │ ├── comparison_205171.html │ ├── comparison_23832.html │ ├── comparison_2436.html │ ├── comparison_27671.html │ ├── comparison_28726.html │ ├── comparison_29099.html │ ├── comparison_3057.html │ ├── comparison_30610.html │ ├── comparison_30752.html │ ├── comparison_32095.html │ ├── comparison_36269.html │ ├── comparison_36657.html │ ├── comparison_37247.html │ ├── comparison_38813.html │ ├── comparison_39763.html │ ├── comparison_40069.html │ ├── comparison_40705.html │ ├── comparison_41374.html │ ├── comparison_41527.html │ ├── comparison_42090.html │ ├── comparison_45141.html │ ├── comparison_45316.html │ ├── comparison_45364.html │ ├── comparison_46759.html │ ├── comparison_47345.html │ ├── comparison_48282.html │ ├── comparison_49569.html │ ├── comparison_51335.html │ ├── comparison_51456.html │ ├── comparison_53200.html │ ├── comparison_53729.html │ ├── comparison_59128.html │ ├── comparison_61163.html │ ├── comparison_65833.html │ ├── comparison_71631.html │ ├── comparison_77141.html │ ├── comparison_82196.html │ ├── comparison_83618.html │ ├── comparison_84755.html │ ├── comparison_86413.html │ ├── comparison_90081.html │ ├── comparison_91098.html │ ├── comparison_91519.html │ ├── comparison_93768.html │ ├── comparison_95683.html │ ├── comparison_95922.html │ ├── comparison_96705.html │ └── comparison_98868.html ├── notebooks ├── conversation_processing.ipynb ├── mt_bench_jsonl_to_html.ipynb ├── plotting.ipynb └── textual_similarity.ipynb ├── src ├── .DS_Store ├── core │ ├── generate_model_responses.py │ ├── judgment.py │ └── utils.py ├── requirements.txt └── util │ ├── length_control.py │ ├── random_sample_viewer.py │ └── remove_cols_from_hf_dataset.py └── tables ├── combined_preferences.csv ├── english_only_conv_hash.csv └── wc50m_results.xlsx /.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/.DS_Store -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/README.md -------------------------------------------------------------------------------- /configs/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/configs/.DS_Store -------------------------------------------------------------------------------- /configs/axolotl/axolotl-train-qwen2-7b-wildchat-250k-llama31-8b.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/configs/axolotl/axolotl-train-qwen2-7b-wildchat-250k-llama31-8b.sbatch -------------------------------------------------------------------------------- /configs/axolotl/rewild-sft.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/configs/axolotl/rewild-sft.yaml -------------------------------------------------------------------------------- /configs/axolotl/wildchat-250k-llama31-8b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/configs/axolotl/wildchat-250k-llama31-8b.yaml -------------------------------------------------------------------------------- /configs/open-instruct/dpo-qwen2572b-athene70b-jdg-Llama3-Factuality-AllenAI-fmt-dpo-8b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/configs/open-instruct/dpo-qwen2572b-athene70b-jdg-Llama3-Factuality-AllenAI-fmt-dpo-8b.yaml -------------------------------------------------------------------------------- /configs/open-instruct/open-instruct-train-dpo-qal3f.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/configs/open-instruct/open-instruct-train-dpo-qal3f.sbatch -------------------------------------------------------------------------------- /model_responses/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/.DS_Store -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/100.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/100.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/101.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/101.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/102.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/102.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/103.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/103.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/104.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/104.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/105.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/105.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/106.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/106.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/107.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/107.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/108.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/108.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/109.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/109.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/110.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/110.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/111.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/111.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/112.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/112.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/113.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/113.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/114.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/114.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/115.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/115.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/116.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/116.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/117.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/117.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/118.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/118.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/119.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/119.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/120.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/120.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/121.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/121.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/122.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/122.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/123.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/123.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/124.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/124.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/125.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/125.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/126.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/126.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/127.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/127.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/128.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/128.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/129.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/129.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/130.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/130.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/131.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/131.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/132.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/132.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/133.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/133.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/134.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/134.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/135.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/135.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/136.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/136.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/137.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/137.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/138.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/138.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/139.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/139.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/140.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/140.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/141.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/141.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/142.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/142.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/143.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/143.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/144.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/144.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/145.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/145.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/146.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/146.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/147.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/147.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/148.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/148.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/149.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/149.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/150.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/150.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/151.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/151.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/152.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/152.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/153.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/153.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/154.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/154.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/155.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/155.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/156.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/156.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/157.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/157.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/158.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/158.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/159.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/159.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/160.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/160.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/81.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/81.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/82.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/82.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/83.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/83.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/84.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/84.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/85.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/85.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/86.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/86.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/87.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/87.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/88.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/88.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/89.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/89.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/90.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/90.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/91.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/91.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/92.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/92.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/93.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/93.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/94.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/94.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/95.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/95.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/96.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/96.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/97.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/97.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/98.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/98.html -------------------------------------------------------------------------------- /model_responses/judged/qwen-2.5-72b-resps/99.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/judged/qwen-2.5-72b-resps/99.html -------------------------------------------------------------------------------- /model_responses/pairwise/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/.DS_Store -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_105698.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_105698.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_105717.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_105717.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_109076.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_109076.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_109944.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_109944.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_112014.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_112014.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_11250.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_11250.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_114658.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_114658.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_117364.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_117364.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_11960.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_11960.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_122729.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_122729.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_123953.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_123953.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_127758.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_127758.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_130789.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_130789.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_130823.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_130823.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_132088.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_132088.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_133033.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_133033.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_133040.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_133040.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_134263.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_134263.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_138860.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_138860.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_139963.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_139963.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_1411.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_1411.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_141145.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_141145.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_14605.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_14605.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_14607.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_14607.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_148423.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_148423.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_150942.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_150942.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_152118.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_152118.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_152965.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_152965.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_15602.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_15602.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156220.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156220.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156524.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156524.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156967.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156967.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156988.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_156988.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_158549.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_158549.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_158764.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_158764.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_159381.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_159381.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_159668.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_159668.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_160096.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_160096.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_163591.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_163591.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_16853.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_16853.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_172794.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_172794.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_17477.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_17477.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_175185.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_175185.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_177760.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_177760.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_178692.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_178692.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_181887.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_181887.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_184524.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_184524.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_184769.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_184769.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_186268.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_186268.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_186967.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_186967.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_190331.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_190331.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_202475.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_202475.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_205171.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_205171.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_23832.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_23832.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_2436.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_2436.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_27671.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_27671.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_28726.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_28726.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_29099.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_29099.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_3057.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_3057.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_30610.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_30610.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_30752.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_30752.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_32095.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_32095.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_36269.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_36269.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_36657.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_36657.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_37247.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_37247.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_38813.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_38813.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_39763.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_39763.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_40069.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_40069.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_40705.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_40705.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_41374.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_41374.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_41527.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_41527.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_42090.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_42090.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_45141.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_45141.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_45316.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_45316.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_45364.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_45364.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_46759.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_46759.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_47345.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_47345.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_48282.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_48282.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_49569.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_49569.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_51335.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_51335.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_51456.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_51456.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_53200.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_53200.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_53729.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_53729.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_59128.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_59128.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_61163.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_61163.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_65833.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_65833.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_71631.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_71631.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_77141.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_77141.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_82196.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_82196.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_83618.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_83618.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_84755.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_84755.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_86413.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_86413.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_90081.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_90081.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_91098.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_91098.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_91519.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_91519.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_93768.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_93768.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_95683.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_95683.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_95922.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_95922.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_96705.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_96705.html -------------------------------------------------------------------------------- /model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_98868.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/model_responses/pairwise/llama3.3-qwen2.5-comparison/comparison_98868.html -------------------------------------------------------------------------------- /notebooks/conversation_processing.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/notebooks/conversation_processing.ipynb -------------------------------------------------------------------------------- /notebooks/mt_bench_jsonl_to_html.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/notebooks/mt_bench_jsonl_to_html.ipynb -------------------------------------------------------------------------------- /notebooks/plotting.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/notebooks/plotting.ipynb -------------------------------------------------------------------------------- /notebooks/textual_similarity.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/notebooks/textual_similarity.ipynb -------------------------------------------------------------------------------- /src/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/.DS_Store -------------------------------------------------------------------------------- /src/core/generate_model_responses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/core/generate_model_responses.py -------------------------------------------------------------------------------- /src/core/judgment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/core/judgment.py -------------------------------------------------------------------------------- /src/core/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/core/utils.py -------------------------------------------------------------------------------- /src/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/requirements.txt -------------------------------------------------------------------------------- /src/util/length_control.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/util/length_control.py -------------------------------------------------------------------------------- /src/util/random_sample_viewer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/util/random_sample_viewer.py -------------------------------------------------------------------------------- /src/util/remove_cols_from_hf_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/src/util/remove_cols_from_hf_dataset.py -------------------------------------------------------------------------------- /tables/combined_preferences.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/tables/combined_preferences.csv -------------------------------------------------------------------------------- /tables/english_only_conv_hash.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/tables/english_only_conv_hash.csv -------------------------------------------------------------------------------- /tables/wc50m_results.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/penfever/wildchat-50m/HEAD/tables/wc50m_results.xlsx --------------------------------------------------------------------------------