├── .DS_Store ├── .gitignore ├── LICENSE ├── README.md ├── assets ├── inference_pipeline.png ├── listwise_model_input.png └── pointwise_model_input.png ├── code ├── awq_quantization.py ├── eval_ranker_listwise.py ├── eval_ranker_pointwise.py ├── generate_llm_reasoner.py ├── llm_embedding │ ├── eedi_dataset.py │ ├── eedi_loader.py │ ├── eedi_model.py │ └── eedi_optimizer.py ├── llm_reasoner │ ├── eedi_dataset.py │ ├── eedi_loader.py │ └── eedi_optimizer.py ├── merge_adapter.py ├── ranker_listwise │ ├── ranker_dataset.py │ ├── ranker_loader.py │ ├── ranker_model.py │ └── ranker_optimizer.py ├── ranker_pointwise │ ├── ranker_dataset.py │ ├── ranker_loader.py │ ├── ranker_model.py │ └── ranker_optimizer.py ├── train_llm_embedding.py ├── train_llm_reasoner.py ├── train_ranker_listwise.py ├── train_ranker_pointwise.py └── utils │ ├── metric_utils.py │ ├── ranker_data_prep.py │ ├── ranker_oof_prep.py │ ├── retriever_utils.py │ └── train_utils.py ├── conf ├── conf_ranker_prep.yaml ├── llm_embedding │ ├── conf_bge.yaml │ ├── conf_intfloat.yaml │ ├── conf_qwen14b_finetune.yaml │ └── conf_qwen14b_pretrain.yaml ├── llm_reasoner │ ├── conf_reasoner_14b.yaml │ ├── conf_reasoner_32b.yaml │ └── conf_reasoner_7b.yaml ├── ranker_listwise │ ├── conf_listwise_72b.yaml │ └── conf_listwise_infer.yaml ├── ranker_pointwise │ ├── conf_pointwise_14b.yaml │ ├── conf_pointwise_32b.yaml │ ├── conf_pointwise_72b.yaml │ ├── conf_pointwise_infer_14b.yaml │ ├── conf_pointwise_infer_32b.yaml │ └── conf_pointwise_infer_72b.yaml └── synthetic │ ├── conf_cot_claude.yaml │ ├── conf_eval_oai.yaml │ └── conf_gen_claude.yaml ├── download_datasets.py ├── requirements.txt ├── ruff.toml └── synthetic ├── cot_claude.py ├── generate_claude.py └── judge_oai.py /.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/.DS_Store -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/README.md -------------------------------------------------------------------------------- /assets/inference_pipeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/assets/inference_pipeline.png -------------------------------------------------------------------------------- /assets/listwise_model_input.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/assets/listwise_model_input.png -------------------------------------------------------------------------------- /assets/pointwise_model_input.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/assets/pointwise_model_input.png -------------------------------------------------------------------------------- /code/awq_quantization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/awq_quantization.py -------------------------------------------------------------------------------- /code/eval_ranker_listwise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/eval_ranker_listwise.py -------------------------------------------------------------------------------- /code/eval_ranker_pointwise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/eval_ranker_pointwise.py -------------------------------------------------------------------------------- /code/generate_llm_reasoner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/generate_llm_reasoner.py -------------------------------------------------------------------------------- /code/llm_embedding/eedi_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/llm_embedding/eedi_dataset.py -------------------------------------------------------------------------------- /code/llm_embedding/eedi_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/llm_embedding/eedi_loader.py -------------------------------------------------------------------------------- /code/llm_embedding/eedi_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/llm_embedding/eedi_model.py -------------------------------------------------------------------------------- /code/llm_embedding/eedi_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/llm_embedding/eedi_optimizer.py -------------------------------------------------------------------------------- /code/llm_reasoner/eedi_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/llm_reasoner/eedi_dataset.py -------------------------------------------------------------------------------- /code/llm_reasoner/eedi_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/llm_reasoner/eedi_loader.py -------------------------------------------------------------------------------- /code/llm_reasoner/eedi_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/llm_reasoner/eedi_optimizer.py -------------------------------------------------------------------------------- /code/merge_adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/merge_adapter.py -------------------------------------------------------------------------------- /code/ranker_listwise/ranker_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_listwise/ranker_dataset.py -------------------------------------------------------------------------------- /code/ranker_listwise/ranker_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_listwise/ranker_loader.py -------------------------------------------------------------------------------- /code/ranker_listwise/ranker_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_listwise/ranker_model.py -------------------------------------------------------------------------------- /code/ranker_listwise/ranker_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_listwise/ranker_optimizer.py -------------------------------------------------------------------------------- /code/ranker_pointwise/ranker_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_pointwise/ranker_dataset.py -------------------------------------------------------------------------------- /code/ranker_pointwise/ranker_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_pointwise/ranker_loader.py -------------------------------------------------------------------------------- /code/ranker_pointwise/ranker_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_pointwise/ranker_model.py -------------------------------------------------------------------------------- /code/ranker_pointwise/ranker_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/ranker_pointwise/ranker_optimizer.py -------------------------------------------------------------------------------- /code/train_llm_embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/train_llm_embedding.py -------------------------------------------------------------------------------- /code/train_llm_reasoner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/train_llm_reasoner.py -------------------------------------------------------------------------------- /code/train_ranker_listwise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/train_ranker_listwise.py -------------------------------------------------------------------------------- /code/train_ranker_pointwise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/train_ranker_pointwise.py -------------------------------------------------------------------------------- /code/utils/metric_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/utils/metric_utils.py -------------------------------------------------------------------------------- /code/utils/ranker_data_prep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/utils/ranker_data_prep.py -------------------------------------------------------------------------------- /code/utils/ranker_oof_prep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/utils/ranker_oof_prep.py -------------------------------------------------------------------------------- /code/utils/retriever_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/utils/retriever_utils.py -------------------------------------------------------------------------------- /code/utils/train_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/code/utils/train_utils.py -------------------------------------------------------------------------------- /conf/conf_ranker_prep.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/conf_ranker_prep.yaml -------------------------------------------------------------------------------- /conf/llm_embedding/conf_bge.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/llm_embedding/conf_bge.yaml -------------------------------------------------------------------------------- /conf/llm_embedding/conf_intfloat.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/llm_embedding/conf_intfloat.yaml -------------------------------------------------------------------------------- /conf/llm_embedding/conf_qwen14b_finetune.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/llm_embedding/conf_qwen14b_finetune.yaml -------------------------------------------------------------------------------- /conf/llm_embedding/conf_qwen14b_pretrain.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/llm_embedding/conf_qwen14b_pretrain.yaml -------------------------------------------------------------------------------- /conf/llm_reasoner/conf_reasoner_14b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/llm_reasoner/conf_reasoner_14b.yaml -------------------------------------------------------------------------------- /conf/llm_reasoner/conf_reasoner_32b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/llm_reasoner/conf_reasoner_32b.yaml -------------------------------------------------------------------------------- /conf/llm_reasoner/conf_reasoner_7b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/llm_reasoner/conf_reasoner_7b.yaml -------------------------------------------------------------------------------- /conf/ranker_listwise/conf_listwise_72b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_listwise/conf_listwise_72b.yaml -------------------------------------------------------------------------------- /conf/ranker_listwise/conf_listwise_infer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_listwise/conf_listwise_infer.yaml -------------------------------------------------------------------------------- /conf/ranker_pointwise/conf_pointwise_14b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_pointwise/conf_pointwise_14b.yaml -------------------------------------------------------------------------------- /conf/ranker_pointwise/conf_pointwise_32b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_pointwise/conf_pointwise_32b.yaml -------------------------------------------------------------------------------- /conf/ranker_pointwise/conf_pointwise_72b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_pointwise/conf_pointwise_72b.yaml -------------------------------------------------------------------------------- /conf/ranker_pointwise/conf_pointwise_infer_14b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_pointwise/conf_pointwise_infer_14b.yaml -------------------------------------------------------------------------------- /conf/ranker_pointwise/conf_pointwise_infer_32b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_pointwise/conf_pointwise_infer_32b.yaml -------------------------------------------------------------------------------- /conf/ranker_pointwise/conf_pointwise_infer_72b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/ranker_pointwise/conf_pointwise_infer_72b.yaml -------------------------------------------------------------------------------- /conf/synthetic/conf_cot_claude.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/synthetic/conf_cot_claude.yaml -------------------------------------------------------------------------------- /conf/synthetic/conf_eval_oai.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/synthetic/conf_eval_oai.yaml -------------------------------------------------------------------------------- /conf/synthetic/conf_gen_claude.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/conf/synthetic/conf_gen_claude.yaml -------------------------------------------------------------------------------- /download_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/download_datasets.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/requirements.txt -------------------------------------------------------------------------------- /ruff.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/ruff.toml -------------------------------------------------------------------------------- /synthetic/cot_claude.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/synthetic/cot_claude.py -------------------------------------------------------------------------------- /synthetic/generate_claude.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/synthetic/generate_claude.py -------------------------------------------------------------------------------- /synthetic/judge_oai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rbiswasfc/eedi-mining-misconceptions/HEAD/synthetic/judge_oai.py --------------------------------------------------------------------------------