├── .gitignore ├── Dockerfile ├── LICENSE ├── README.md ├── assets ├── dataset-on-hf-lg.svg ├── dataset-on-hf-md.svg ├── explainer_figure.png ├── model-on-hf-lg.svg └── model-on-hf-md.svg ├── experiments ├── ambiguous_generate.py ├── calibration_tune.py ├── classifier_tune.py ├── cluster.py ├── embedding_tune.py ├── evaluate.py ├── evaluate_logits.py ├── fine_tune.py ├── generate.py ├── play.py ├── publish.py ├── temperature_scale.py └── train_embedding_only.py ├── llm ├── __init__.py ├── datasets │ ├── __init__.py │ ├── hf │ │ ├── __init__.py │ │ ├── anli.py │ │ ├── arc.py │ │ ├── boolq.py │ │ ├── cb.py │ │ ├── commonsense_qa.py │ │ ├── copa.py │ │ ├── cosmos_qa.py │ │ ├── gsm8k.py │ │ ├── hellaswag.py │ │ ├── math_qa.py │ │ ├── mmlu.py │ │ ├── mmlu_pro.py │ │ ├── multirc.py │ │ ├── obqa.py │ │ ├── piqa.py │ │ ├── sciq.py │ │ ├── siqa.py │ │ ├── snli.py │ │ ├── story_cloze.py │ │ ├── trec.py │ │ ├── truthful_qa.py │ │ ├── winogrande.py │ │ └── wsc.py │ ├── llm_data_utils.py │ ├── llm_utils_oe.py │ ├── offline │ │ ├── __init__.py │ │ ├── combined.py │ │ ├── mmlu_offline.py │ │ ├── mmlu_pro_offline.py │ │ ├── modiste.py │ │ ├── offline.py │ │ └── offline_logits.py │ ├── registry.py │ └── utils.py ├── distributed │ ├── __init__.py │ └── accelerate.py ├── eval │ ├── __init__.py │ ├── classifier.py │ ├── common.py │ ├── oe.py │ ├── query.py │ ├── third_party │ │ ├── __init__.py │ │ └── calibration.py │ └── utils.py ├── logging.py ├── models │ ├── __init__.py │ ├── llama2.py │ ├── llama3.py │ ├── llm_model_utils.py │ ├── mistral.py │ ├── mlp.py │ ├── mpnet.py │ ├── openai.py │ ├── peft │ │ ├── __init__.py │ │ ├── classifier_head.py │ │ ├── lora.py │ │ ├── prompt_tuning.py │ │ ├── temperature_scaling.py │ │ └── utils.py │ ├── qwen.py │ └── registry.py ├── random.py ├── trainer │ ├── __init__.py │ ├── calibration_tune.py │ ├── classification_tune.py │ ├── embedding_tune.py │ ├── fine_tune.py │ └── utils.py └── utils │ ├── __init__.py │ └── generate_utils.py ├── notebooks ├── .gitignore ├── all_plots.ipynb ├── cleanup_offline.ipynb ├── eval_mmlu_ct_oe.ipynb ├── eval_mmlu_oe.ipynb ├── eval_mmlu_oe_verb1s.ipynb ├── eval_mmlu_oe_verb1s2g.ipynb ├── mmlu_pro.ipynb ├── results │ ├── .gitignore │ ├── classifier_results.csv │ ├── classifier_ts_results.csv │ ├── eval-mmlu_choice-base-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-base │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-ct-oe_transfer │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-ct-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-ct │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-ct_embed-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-ct_embed │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-ct_probe-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-ct_probe │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-logits_ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-lora_probe-oe_transfer │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-lora_probe-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_choice-lora_probe │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-base-cross │ │ ├── llama2-7b.csv │ │ └── mistral-7b.csv │ ├── eval-mmlu_oe-base-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-base │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct-choice_transfer │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct-cross_train │ │ ├── llama2-7b.csv │ │ └── mistral-7b.csv │ ├── eval-mmlu_oe-ct-human │ │ ├── llama2-7b.csv │ │ └── mistral-7b.csv │ ├── eval-mmlu_oe-ct-ts-cross │ │ ├── llama2-7b.csv │ │ └── mistral-7b.csv │ ├── eval-mmlu_oe-ct-ts-scale │ │ ├── md │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ │ ├── sm │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ │ ├── xs │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ │ └── xxs │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_embed-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_embed │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_embed_oai-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_embed_oai │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_nokl-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_probe-cross_train │ │ ├── llama2-7b.csv │ │ └── mistral-7b.csv │ ├── eval-mmlu_oe-ct_probe-human │ │ ├── llama2-7b.csv │ │ └── mistral-7b.csv │ ├── eval-mmlu_oe-ct_probe-ts-cross │ │ ├── llama2-7b.csv │ │ └── mistral-7b.csv │ ├── eval-mmlu_oe-ct_probe-ts-scale │ │ ├── md │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ │ ├── sm │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ │ ├── xs │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ │ └── xxs │ │ │ ├── llama2-13b.csv │ │ │ ├── llama2-13b_chat.csv │ │ │ ├── llama2-7b.csv │ │ │ ├── llama2-7b_chat.csv │ │ │ ├── mistral-7b.csv │ │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_probe-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-ct_probe │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-lora_probe-choice_transfer │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-lora_probe-ts │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval-mmlu_oe-lora_probe │ │ ├── llama2-13b.csv │ │ ├── llama2-13b_chat.csv │ │ ├── llama2-7b.csv │ │ ├── llama2-7b_chat.csv │ │ ├── mistral-7b.csv │ │ └── mistral-7b_instruct.csv │ ├── eval_7b-all_200k-mmlu.csv │ ├── eval_all_20k_uniform-13b_chat.csv │ ├── eval_mmlu-13b_chat-ct.csv │ ├── eval_mmlu-13b_chat-mcq2oe.csv │ ├── eval_mmlu-13b_chat-verb1s1g.csv │ ├── eval_mmlu-13b_chat-verb1s2g.csv │ ├── eval_mmlu-13b_chat-verb1s4g.csv │ ├── eval_mmlu-13b_chat-verb2s1CoT.csv │ ├── eval_mmlu-13b_chat-verb2s1g.csv │ ├── eval_mmlu-13b_chat-verb2s2g.csv │ ├── eval_mmlu-13b_chat-verb2s4g.csv │ ├── eval_mmlu-7b-cc.csv │ ├── eval_mmlu-7b-it-cs.csv │ ├── eval_mmlu-7b-it-temp.csv │ ├── eval_mmlu-7b-sub_200k-ut.csv │ ├── eval_mmlu-7b.csv │ ├── eval_mmlu-7b_instruct-ct.csv │ ├── oe_sampling.csv │ ├── sampling_results.csv │ └── ve_results.csv ├── user-study.ipynb ├── viz_conf_distribution.ipynb ├── viz_features.ipynb ├── viz_imp_oe.ipynb └── viz_mmlu.ipynb ├── pyproject.toml ├── requirements-base.txt ├── requirements-dev.txt └── requirements.txt /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/.gitignore -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/Dockerfile -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/README.md -------------------------------------------------------------------------------- /assets/dataset-on-hf-lg.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/assets/dataset-on-hf-lg.svg -------------------------------------------------------------------------------- /assets/dataset-on-hf-md.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/assets/dataset-on-hf-md.svg -------------------------------------------------------------------------------- /assets/explainer_figure.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/assets/explainer_figure.png -------------------------------------------------------------------------------- /assets/model-on-hf-lg.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/assets/model-on-hf-lg.svg -------------------------------------------------------------------------------- /assets/model-on-hf-md.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/assets/model-on-hf-md.svg -------------------------------------------------------------------------------- /experiments/ambiguous_generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/ambiguous_generate.py -------------------------------------------------------------------------------- /experiments/calibration_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/calibration_tune.py -------------------------------------------------------------------------------- /experiments/classifier_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/classifier_tune.py -------------------------------------------------------------------------------- /experiments/cluster.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/cluster.py -------------------------------------------------------------------------------- /experiments/embedding_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/embedding_tune.py -------------------------------------------------------------------------------- /experiments/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/evaluate.py -------------------------------------------------------------------------------- /experiments/evaluate_logits.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/evaluate_logits.py -------------------------------------------------------------------------------- /experiments/fine_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/fine_tune.py -------------------------------------------------------------------------------- /experiments/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/generate.py -------------------------------------------------------------------------------- /experiments/play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/play.py -------------------------------------------------------------------------------- /experiments/publish.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/publish.py -------------------------------------------------------------------------------- /experiments/temperature_scale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/temperature_scale.py -------------------------------------------------------------------------------- /experiments/train_embedding_only.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/experiments/train_embedding_only.py -------------------------------------------------------------------------------- /llm/__init__.py: -------------------------------------------------------------------------------- 1 | __version__ = "0.1.0" 2 | -------------------------------------------------------------------------------- /llm/datasets/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/__init__.py -------------------------------------------------------------------------------- /llm/datasets/hf/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/__init__.py -------------------------------------------------------------------------------- /llm/datasets/hf/anli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/anli.py -------------------------------------------------------------------------------- /llm/datasets/hf/arc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/arc.py -------------------------------------------------------------------------------- /llm/datasets/hf/boolq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/boolq.py -------------------------------------------------------------------------------- /llm/datasets/hf/cb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/cb.py -------------------------------------------------------------------------------- /llm/datasets/hf/commonsense_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/commonsense_qa.py -------------------------------------------------------------------------------- /llm/datasets/hf/copa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/copa.py -------------------------------------------------------------------------------- /llm/datasets/hf/cosmos_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/cosmos_qa.py -------------------------------------------------------------------------------- /llm/datasets/hf/gsm8k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/gsm8k.py -------------------------------------------------------------------------------- /llm/datasets/hf/hellaswag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/hellaswag.py -------------------------------------------------------------------------------- /llm/datasets/hf/math_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/math_qa.py -------------------------------------------------------------------------------- /llm/datasets/hf/mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/mmlu.py -------------------------------------------------------------------------------- /llm/datasets/hf/mmlu_pro.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/mmlu_pro.py -------------------------------------------------------------------------------- /llm/datasets/hf/multirc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/multirc.py -------------------------------------------------------------------------------- /llm/datasets/hf/obqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/obqa.py -------------------------------------------------------------------------------- /llm/datasets/hf/piqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/piqa.py -------------------------------------------------------------------------------- /llm/datasets/hf/sciq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/sciq.py -------------------------------------------------------------------------------- /llm/datasets/hf/siqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/siqa.py -------------------------------------------------------------------------------- /llm/datasets/hf/snli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/snli.py -------------------------------------------------------------------------------- /llm/datasets/hf/story_cloze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/story_cloze.py -------------------------------------------------------------------------------- /llm/datasets/hf/trec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/trec.py -------------------------------------------------------------------------------- /llm/datasets/hf/truthful_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/truthful_qa.py -------------------------------------------------------------------------------- /llm/datasets/hf/winogrande.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/winogrande.py -------------------------------------------------------------------------------- /llm/datasets/hf/wsc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/hf/wsc.py -------------------------------------------------------------------------------- /llm/datasets/llm_data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/llm_data_utils.py -------------------------------------------------------------------------------- /llm/datasets/llm_utils_oe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/llm_utils_oe.py -------------------------------------------------------------------------------- /llm/datasets/offline/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/offline/__init__.py -------------------------------------------------------------------------------- /llm/datasets/offline/combined.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/offline/combined.py -------------------------------------------------------------------------------- /llm/datasets/offline/mmlu_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/offline/mmlu_offline.py -------------------------------------------------------------------------------- /llm/datasets/offline/mmlu_pro_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/offline/mmlu_pro_offline.py -------------------------------------------------------------------------------- /llm/datasets/offline/modiste.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/offline/modiste.py -------------------------------------------------------------------------------- /llm/datasets/offline/offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/offline/offline.py -------------------------------------------------------------------------------- /llm/datasets/offline/offline_logits.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/offline/offline_logits.py -------------------------------------------------------------------------------- /llm/datasets/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/registry.py -------------------------------------------------------------------------------- /llm/datasets/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/datasets/utils.py -------------------------------------------------------------------------------- /llm/distributed/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/distributed/__init__.py -------------------------------------------------------------------------------- /llm/distributed/accelerate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/distributed/accelerate.py -------------------------------------------------------------------------------- /llm/eval/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/eval/__init__.py -------------------------------------------------------------------------------- /llm/eval/classifier.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/eval/classifier.py -------------------------------------------------------------------------------- /llm/eval/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/eval/common.py -------------------------------------------------------------------------------- /llm/eval/oe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/eval/oe.py -------------------------------------------------------------------------------- /llm/eval/query.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/eval/query.py -------------------------------------------------------------------------------- /llm/eval/third_party/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /llm/eval/third_party/calibration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/eval/third_party/calibration.py -------------------------------------------------------------------------------- /llm/eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/eval/utils.py -------------------------------------------------------------------------------- /llm/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/logging.py -------------------------------------------------------------------------------- /llm/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/__init__.py -------------------------------------------------------------------------------- /llm/models/llama2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/llama2.py -------------------------------------------------------------------------------- /llm/models/llama3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/llama3.py -------------------------------------------------------------------------------- /llm/models/llm_model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/llm_model_utils.py -------------------------------------------------------------------------------- /llm/models/mistral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/mistral.py -------------------------------------------------------------------------------- /llm/models/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/mlp.py -------------------------------------------------------------------------------- /llm/models/mpnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/mpnet.py -------------------------------------------------------------------------------- /llm/models/openai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/openai.py -------------------------------------------------------------------------------- /llm/models/peft/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/peft/__init__.py -------------------------------------------------------------------------------- /llm/models/peft/classifier_head.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/peft/classifier_head.py -------------------------------------------------------------------------------- /llm/models/peft/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/peft/lora.py -------------------------------------------------------------------------------- /llm/models/peft/prompt_tuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/peft/prompt_tuning.py -------------------------------------------------------------------------------- /llm/models/peft/temperature_scaling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/peft/temperature_scaling.py -------------------------------------------------------------------------------- /llm/models/peft/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/peft/utils.py -------------------------------------------------------------------------------- /llm/models/qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/qwen.py -------------------------------------------------------------------------------- /llm/models/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/models/registry.py -------------------------------------------------------------------------------- /llm/random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/random.py -------------------------------------------------------------------------------- /llm/trainer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/trainer/__init__.py -------------------------------------------------------------------------------- /llm/trainer/calibration_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/trainer/calibration_tune.py -------------------------------------------------------------------------------- /llm/trainer/classification_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/trainer/classification_tune.py -------------------------------------------------------------------------------- /llm/trainer/embedding_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/trainer/embedding_tune.py -------------------------------------------------------------------------------- /llm/trainer/fine_tune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/trainer/fine_tune.py -------------------------------------------------------------------------------- /llm/trainer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/trainer/utils.py -------------------------------------------------------------------------------- /llm/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /llm/utils/generate_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/llm/utils/generate_utils.py -------------------------------------------------------------------------------- /notebooks/.gitignore: -------------------------------------------------------------------------------- 1 | *_tmp*.ipynb -------------------------------------------------------------------------------- /notebooks/all_plots.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/all_plots.ipynb -------------------------------------------------------------------------------- /notebooks/cleanup_offline.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/cleanup_offline.ipynb -------------------------------------------------------------------------------- /notebooks/eval_mmlu_ct_oe.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/eval_mmlu_ct_oe.ipynb -------------------------------------------------------------------------------- /notebooks/eval_mmlu_oe.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/eval_mmlu_oe.ipynb -------------------------------------------------------------------------------- /notebooks/eval_mmlu_oe_verb1s.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/eval_mmlu_oe_verb1s.ipynb -------------------------------------------------------------------------------- /notebooks/eval_mmlu_oe_verb1s2g.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/eval_mmlu_oe_verb1s2g.ipynb -------------------------------------------------------------------------------- /notebooks/mmlu_pro.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/mmlu_pro.ipynb -------------------------------------------------------------------------------- /notebooks/results/.gitignore: -------------------------------------------------------------------------------- 1 | *raw.csv -------------------------------------------------------------------------------- /notebooks/results/classifier_results.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/classifier_results.csv -------------------------------------------------------------------------------- /notebooks/results/classifier_ts_results.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/classifier_ts_results.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-base/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-base/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-oe_transfer/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-oe_transfer/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-oe_transfer/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-oe_transfer/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-oe_transfer/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_embed/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_embed/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-ct_probe/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-ct_probe/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-logits_ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-logits_ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-logits_ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-logits_ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-logits_ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-logits_ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-logits_ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-logits_ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-logits_ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-logits_ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-logits_ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-logits_ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-oe_transfer/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_choice-lora_probe/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_choice-lora_probe/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-cross/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-cross/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-cross/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-cross/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-base/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-base/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-choice_transfer/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-choice_transfer/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-choice_transfer/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-choice_transfer/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-choice_transfer/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-cross_train/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-cross_train/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-cross_train/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-cross_train/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-human/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-human/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-human/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-human/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-cross/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-cross/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-cross/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-cross/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/md/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/md/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/md/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/md/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/md/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/sm/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xs/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts-scale/xxs/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_embed_oai/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_embed_oai/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_nokl-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_nokl-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_nokl-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_nokl-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_nokl-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-cross_train/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-cross_train/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-cross_train/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-cross_train/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-human/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-human/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-human/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-human/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-cross/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-cross/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-cross/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-cross/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/md/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/sm/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xs/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts-scale/xxs/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-ct_probe/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-ct_probe/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-choice_transfer/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-ts/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-ts/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-ts/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe-ts/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe-ts/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe/llama2-13b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe/llama2-13b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe/llama2-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe/llama2-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe/llama2-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe/llama2-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe/llama2-7b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe/llama2-7b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe/mistral-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe/mistral-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval-mmlu_oe-lora_probe/mistral-7b_instruct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval-mmlu_oe-lora_probe/mistral-7b_instruct.csv -------------------------------------------------------------------------------- /notebooks/results/eval_7b-all_200k-mmlu.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_7b-all_200k-mmlu.csv -------------------------------------------------------------------------------- /notebooks/results/eval_all_20k_uniform-13b_chat.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_all_20k_uniform-13b_chat.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-ct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-ct.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-mcq2oe.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-mcq2oe.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-verb1s1g.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-verb1s1g.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-verb1s2g.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-verb1s2g.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-verb1s4g.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-verb1s4g.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-verb2s1CoT.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-verb2s1CoT.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-verb2s1g.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-verb2s1g.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-verb2s2g.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-verb2s2g.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-13b_chat-verb2s4g.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-13b_chat-verb2s4g.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-7b-cc.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-7b-cc.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-7b-it-cs.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-7b-it-cs.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-7b-it-temp.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-7b-it-temp.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-7b-sub_200k-ut.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-7b-sub_200k-ut.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-7b.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-7b.csv -------------------------------------------------------------------------------- /notebooks/results/eval_mmlu-7b_instruct-ct.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/eval_mmlu-7b_instruct-ct.csv -------------------------------------------------------------------------------- /notebooks/results/oe_sampling.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/oe_sampling.csv -------------------------------------------------------------------------------- /notebooks/results/sampling_results.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/sampling_results.csv -------------------------------------------------------------------------------- /notebooks/results/ve_results.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/results/ve_results.csv -------------------------------------------------------------------------------- /notebooks/user-study.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/user-study.ipynb -------------------------------------------------------------------------------- /notebooks/viz_conf_distribution.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/viz_conf_distribution.ipynb -------------------------------------------------------------------------------- /notebooks/viz_features.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/viz_features.ipynb -------------------------------------------------------------------------------- /notebooks/viz_imp_oe.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/viz_imp_oe.ipynb -------------------------------------------------------------------------------- /notebooks/viz_mmlu.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/notebooks/viz_mmlu.ipynb -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements-base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/requirements-base.txt -------------------------------------------------------------------------------- /requirements-dev.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/requirements-dev.txt -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/activatedgeek/calibration-tuning/HEAD/requirements.txt --------------------------------------------------------------------------------