├── ReadMe.md ├── assets ├── Ass05-grpo-alg.png ├── ass01-test.png ├── ass02.JPG ├── ass05-SFT_alg.png ├── ass05-expert-iteartion-for-math-alg.png ├── ass05-grpo-test.png ├── ass05-sft-test.png └── note-website.png ├── assignment1-basics ├── .gitignore ├── CHANGELOG.md ├── LICENSE ├── README.md ├── cs336_basics │ ├── __init__.py │ ├── data.py │ ├── loss.py │ ├── model │ │ ├── modules.py │ │ ├── rope.py │ │ └── transformer.py │ ├── optimizer.py │ ├── tokenizer │ │ ├── pretokenization_regular_pattern.py │ │ ├── tokenizer.py │ │ └── utils.py │ └── utils.py ├── cs336_spring2025_assignment1_basics.pdf ├── make_submission.sh ├── profile.html ├── profile.json ├── pyproject.toml ├── simple_bpe.ipynb ├── tests │ ├── __init__.py │ ├── _snapshots │ │ ├── test_4d_scaled_dot_product_attention.npz │ │ ├── test_adamw.npz │ │ ├── test_embedding.npz │ │ ├── test_linear.npz │ │ ├── test_multihead_self_attention.npz │ │ ├── test_multihead_self_attention_with_rope.npz │ │ ├── test_positionwise_feedforward.npz │ │ ├── test_rmsnorm.npz │ │ ├── test_rope.npz │ │ ├── test_scaled_dot_product_attention.npz │ │ ├── test_swiglu.npz │ │ ├── test_train_bpe_special_tokens.pkl │ │ ├── test_transformer_block.npz │ │ ├── test_transformer_lm.npz │ │ └── test_transformer_lm_truncated_input.npz │ ├── adapters.py │ ├── common.py │ ├── conftest.py │ ├── fixtures │ │ ├── address.txt │ │ ├── corpus.en │ │ ├── german.txt │ │ ├── gpt2_merges.txt │ │ ├── gpt2_vocab.json │ │ ├── special_token_double_newlines_non_whitespace.txt │ │ ├── special_token_trailing_newlines.txt │ │ ├── tinystories_sample.txt │ │ ├── tinystories_sample_5M.txt │ │ ├── train-bpe-reference-merges.txt │ │ ├── train-bpe-reference-vocab.json │ │ └── ts_tests │ │ │ ├── model.pt │ │ │ └── model_config.json │ ├── test_data.py │ ├── test_model.py │ ├── test_nn_utils.py │ ├── test_optimizer.py │ ├── test_serialization.py │ ├── test_tokenizer.py │ └── test_train_bpe.py └── uv.lock ├── assignment2-systems ├── CHANGELOG.md ├── LICENSE ├── README.md ├── cs336-basics │ ├── README.md │ ├── cs336_basics │ │ ├── __init__.py │ │ ├── data.py │ │ ├── model.py │ │ ├── nn_utils.py │ │ └── optimizer.py │ └── pyproject.toml ├── cs336_spring2025_assignment2_systems.pdf ├── cs336_systems │ ├── __init__.py │ ├── benchmark │ │ └── benchmark.py │ ├── flash_attn │ │ ├── flash_attn_pytorch.py │ │ └── flash_attn_triton.py │ └── parallel │ │ ├── ddp.py │ │ └── optimizer.py ├── pyproject.toml ├── test_and_make_submission.sh ├── tests │ ├── __init__.py │ ├── adapters.py │ ├── common.py │ ├── conftest.py │ ├── fixtures │ │ ├── ddp_test_data.pt │ │ └── ddp_test_labels.pt │ ├── test_attention.py │ ├── test_ddp.py │ ├── test_ddp_individual_parameters.py │ └── test_sharded_optimizer.py └── uv.lock ├── assignment4-data ├── CHANGELOG.md ├── LICENSE ├── README.md ├── cs336-basics │ ├── README.md │ ├── configs │ │ ├── config.yaml │ │ └── experiment │ │ │ └── your_data.yaml │ ├── cs336_basics │ │ ├── __init__.py │ │ ├── data.py │ │ ├── ddp_utils.py │ │ ├── model.py │ │ ├── optimizer.py │ │ └── train_config.py │ ├── pyproject.toml │ ├── scripts │ │ ├── generate_with_gpt2_tok.py │ │ └── train.py │ └── uv.lock ├── cs336_data │ └── __init__.py ├── cs336_spring2025_assignment4_data.pdf ├── get_assets.sh ├── pyproject.toml ├── test_and_make_submission.sh ├── tests │ ├── __init__.py │ ├── adapters.py │ ├── common.py │ ├── fixtures │ │ ├── documents_line_deduplicated │ │ │ ├── doc1.txt │ │ │ ├── doc2.txt │ │ │ ├── doc3.txt │ │ │ ├── doc4.txt │ │ │ └── doc5.txt │ │ ├── documents_with_fuzzy_duplicates │ │ │ ├── pytorch_license.txt │ │ │ ├── rails_mit_license.txt │ │ │ └── react_mit_license.txt │ │ ├── documents_with_line_duplicates │ │ │ ├── doc1.txt │ │ │ ├── doc2.txt │ │ │ ├── doc3.txt │ │ │ ├── doc4.txt │ │ │ └── doc5.txt │ │ ├── high_quality_wiki_reference.txt │ │ ├── low_quality_cc.txt │ │ ├── moby.html │ │ └── moby_extracted.txt │ ├── test_deduplication.py │ ├── test_extract.py │ ├── test_langid.py │ ├── test_pii.py │ ├── test_quality.py │ └── test_toxicity.py └── uv.lock └── assignment5-alignment ├── CHANGELOG.md ├── README.md ├── cs336_alignment ├── __init__.py ├── data_utils.py ├── drgrpo_grader.py ├── evaluate.py ├── grpo.py ├── prompts │ ├── alpaca_sft.prompt │ ├── question_only.prompt │ ├── r1_zero.prompt │ └── zero_shot_system_prompt.prompt ├── sft_utils.py ├── utils.py └── vllm_utils.py ├── cs336_spring2025_assignment5_alignment.pdf ├── cs336_spring2025_assignment5_supplement_safety_rlhf.pdf ├── data ├── alpaca_eval │ └── alpaca_eval.jsonl ├── gsm8k │ ├── test.jsonl │ └── train.jsonl ├── mmlu │ ├── README.txt │ ├── dev │ │ ├── abstract_algebra_dev.csv │ │ ├── anatomy_dev.csv │ │ ├── astronomy_dev.csv │ │ ├── business_ethics_dev.csv │ │ ├── clinical_knowledge_dev.csv │ │ ├── college_biology_dev.csv │ │ ├── college_chemistry_dev.csv │ │ ├── college_computer_science_dev.csv │ │ ├── college_mathematics_dev.csv │ │ ├── college_medicine_dev.csv │ │ ├── college_physics_dev.csv │ │ ├── computer_security_dev.csv │ │ ├── conceptual_physics_dev.csv │ │ ├── econometrics_dev.csv │ │ ├── electrical_engineering_dev.csv │ │ ├── elementary_mathematics_dev.csv │ │ ├── formal_logic_dev.csv │ │ ├── global_facts_dev.csv │ │ ├── high_school_biology_dev.csv │ │ ├── high_school_chemistry_dev.csv │ │ ├── high_school_computer_science_dev.csv │ │ ├── high_school_european_history_dev.csv │ │ ├── high_school_geography_dev.csv │ │ ├── high_school_government_and_politics_dev.csv │ │ ├── high_school_macroeconomics_dev.csv │ │ ├── high_school_mathematics_dev.csv │ │ ├── high_school_microeconomics_dev.csv │ │ ├── high_school_physics_dev.csv │ │ ├── high_school_psychology_dev.csv │ │ ├── high_school_statistics_dev.csv │ │ ├── high_school_us_history_dev.csv │ │ ├── high_school_world_history_dev.csv │ │ ├── human_aging_dev.csv │ │ ├── human_sexuality_dev.csv │ │ ├── international_law_dev.csv │ │ ├── jurisprudence_dev.csv │ │ ├── logical_fallacies_dev.csv │ │ ├── machine_learning_dev.csv │ │ ├── management_dev.csv │ │ ├── marketing_dev.csv │ │ ├── medical_genetics_dev.csv │ │ ├── miscellaneous_dev.csv │ │ ├── moral_disputes_dev.csv │ │ ├── moral_scenarios_dev.csv │ │ ├── nutrition_dev.csv │ │ ├── philosophy_dev.csv │ │ ├── prehistory_dev.csv │ │ ├── professional_accounting_dev.csv │ │ ├── professional_law_dev.csv │ │ ├── professional_medicine_dev.csv │ │ ├── professional_psychology_dev.csv │ │ ├── public_relations_dev.csv │ │ ├── security_studies_dev.csv │ │ ├── sociology_dev.csv │ │ ├── us_foreign_policy_dev.csv │ │ ├── virology_dev.csv │ │ └── world_religions_dev.csv │ ├── possibly_contaminated_urls.txt │ ├── test │ │ ├── abstract_algebra_test.csv │ │ ├── anatomy_test.csv │ │ ├── astronomy_test.csv │ │ ├── business_ethics_test.csv │ │ ├── clinical_knowledge_test.csv │ │ ├── college_biology_test.csv │ │ ├── college_chemistry_test.csv │ │ ├── college_computer_science_test.csv │ │ ├── college_mathematics_test.csv │ │ ├── college_medicine_test.csv │ │ ├── college_physics_test.csv │ │ ├── computer_security_test.csv │ │ ├── conceptual_physics_test.csv │ │ ├── econometrics_test.csv │ │ ├── electrical_engineering_test.csv │ │ ├── elementary_mathematics_test.csv │ │ ├── formal_logic_test.csv │ │ ├── global_facts_test.csv │ │ ├── high_school_biology_test.csv │ │ ├── high_school_chemistry_test.csv │ │ ├── high_school_computer_science_test.csv │ │ ├── high_school_european_history_test.csv │ │ ├── high_school_geography_test.csv │ │ ├── high_school_government_and_politics_test.csv │ │ ├── high_school_macroeconomics_test.csv │ │ ├── high_school_mathematics_test.csv │ │ ├── high_school_microeconomics_test.csv │ │ ├── high_school_physics_test.csv │ │ ├── high_school_psychology_test.csv │ │ ├── high_school_statistics_test.csv │ │ ├── high_school_us_history_test.csv │ │ ├── high_school_world_history_test.csv │ │ ├── human_aging_test.csv │ │ ├── human_sexuality_test.csv │ │ ├── international_law_test.csv │ │ ├── jurisprudence_test.csv │ │ ├── logical_fallacies_test.csv │ │ ├── machine_learning_test.csv │ │ ├── management_test.csv │ │ ├── marketing_test.csv │ │ ├── medical_genetics_test.csv │ │ ├── miscellaneous_test.csv │ │ ├── moral_disputes_test.csv │ │ ├── moral_scenarios_test.csv │ │ ├── nutrition_test.csv │ │ ├── philosophy_test.csv │ │ ├── prehistory_test.csv │ │ ├── professional_accounting_test.csv │ │ ├── professional_law_test.csv │ │ ├── professional_medicine_test.csv │ │ ├── professional_psychology_test.csv │ │ ├── public_relations_test.csv │ │ ├── security_studies_test.csv │ │ ├── sociology_test.csv │ │ ├── us_foreign_policy_test.csv │ │ ├── virology_test.csv │ │ └── world_religions_test.csv │ └── val │ │ ├── abstract_algebra_val.csv │ │ ├── anatomy_val.csv │ │ ├── astronomy_val.csv │ │ ├── business_ethics_val.csv │ │ ├── clinical_knowledge_val.csv │ │ ├── college_biology_val.csv │ │ ├── college_chemistry_val.csv │ │ ├── college_computer_science_val.csv │ │ ├── college_mathematics_val.csv │ │ ├── college_medicine_val.csv │ │ ├── college_physics_val.csv │ │ ├── computer_security_val.csv │ │ ├── conceptual_physics_val.csv │ │ ├── econometrics_val.csv │ │ ├── electrical_engineering_val.csv │ │ ├── elementary_mathematics_val.csv │ │ ├── formal_logic_val.csv │ │ ├── global_facts_val.csv │ │ ├── high_school_biology_val.csv │ │ ├── high_school_chemistry_val.csv │ │ ├── high_school_computer_science_val.csv │ │ ├── high_school_european_history_val.csv │ │ ├── high_school_geography_val.csv │ │ ├── high_school_government_and_politics_val.csv │ │ ├── high_school_macroeconomics_val.csv │ │ ├── high_school_mathematics_val.csv │ │ ├── high_school_microeconomics_val.csv │ │ ├── high_school_physics_val.csv │ │ ├── high_school_psychology_val.csv │ │ ├── high_school_statistics_val.csv │ │ ├── high_school_us_history_val.csv │ │ ├── high_school_world_history_val.csv │ │ ├── human_aging_val.csv │ │ ├── human_sexuality_val.csv │ │ ├── international_law_val.csv │ │ ├── jurisprudence_val.csv │ │ ├── logical_fallacies_val.csv │ │ ├── machine_learning_val.csv │ │ ├── management_val.csv │ │ ├── marketing_val.csv │ │ ├── medical_genetics_val.csv │ │ ├── miscellaneous_val.csv │ │ ├── moral_disputes_val.csv │ │ ├── moral_scenarios_val.csv │ │ ├── nutrition_val.csv │ │ ├── philosophy_val.csv │ │ ├── prehistory_val.csv │ │ ├── professional_accounting_val.csv │ │ ├── professional_law_val.csv │ │ ├── professional_medicine_val.csv │ │ ├── professional_psychology_val.csv │ │ ├── public_relations_val.csv │ │ ├── security_studies_val.csv │ │ ├── sociology_val.csv │ │ ├── us_foreign_policy_val.csv │ │ ├── virology_val.csv │ │ └── world_religions_val.csv └── simple_safety_tests │ └── simple_safety_tests.csv ├── download_model.py ├── pyproject.toml ├── scripts ├── alpaca_eval_vllm_llama3_3_70b_fn │ ├── alpaca_eval_fn.txt │ └── configs.yaml ├── eval.sh └── evaluate_safety.py ├── test_and_make_submission.sh ├── tests ├── __init__.py ├── _snapshots │ ├── test_compute_entropy.npz │ ├── test_compute_group_normalized_rewards_no_normalize_by_std.npz │ ├── test_compute_group_normalized_rewards_normalize_by_std.npz │ ├── test_compute_grpo_clip_loss_large_cliprange.npz │ ├── test_compute_grpo_clip_loss_small_cliprange.npz │ ├── test_compute_naive_policy_gradient_loss.npz │ ├── test_compute_policy_gradient_loss_grpo_clip.npz │ ├── test_compute_policy_gradient_loss_no_baseline.npz │ ├── test_compute_policy_gradient_loss_reinforce_with_baseline.npz │ ├── test_get_response_log_probs.npz │ ├── test_grpo_microbatch_train_step_grpo_clip.npz │ ├── test_grpo_microbatch_train_step_grpo_clip_10_steps.npz │ ├── test_masked_mean_dim0.npz │ ├── test_masked_mean_dim1.npz │ ├── test_masked_mean_dimNone.npz │ ├── test_masked_mean_dimlast.npz │ ├── test_masked_normalize_dim0.npz │ ├── test_masked_normalize_dim1.npz │ ├── test_masked_normalize_dimNone.npz │ ├── test_masked_normalize_dimlast.npz │ ├── test_sft_microbatch_train_step.npz │ ├── test_sft_microbatch_train_step_10_steps.npz │ ├── test_sft_microbatch_train_step_normalize.npz │ └── test_tokenize_prompt_and_output.npz ├── adapters.py ├── common.py ├── conftest.py ├── fixtures │ ├── .gitkeep │ ├── Meta-Llama-3-8B │ │ ├── special_tokens_map.json │ │ ├── tokenizer.json │ │ └── tokenizer_config.json │ ├── sft_sample.jsonl │ ├── tiny-gpt2-ref │ │ ├── config.json │ │ ├── generation_config.json │ │ └── model.safetensors │ ├── tiny-gpt2 │ │ ├── config.json │ │ ├── generation_config.json │ │ └── model.safetensors │ └── tokenized_sft_sample.json ├── test_data.py ├── test_dpo.py ├── test_grpo.py ├── test_metrics.py └── test_sft.py ├── train_ei.py ├── train_grpo.py ├── train_sft.py └── uv.lock /ReadMe.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/ReadMe.md -------------------------------------------------------------------------------- /assets/Ass05-grpo-alg.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/Ass05-grpo-alg.png -------------------------------------------------------------------------------- /assets/ass01-test.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/ass01-test.png -------------------------------------------------------------------------------- /assets/ass02.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/ass02.JPG -------------------------------------------------------------------------------- /assets/ass05-SFT_alg.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/ass05-SFT_alg.png -------------------------------------------------------------------------------- /assets/ass05-expert-iteartion-for-math-alg.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/ass05-expert-iteartion-for-math-alg.png -------------------------------------------------------------------------------- /assets/ass05-grpo-test.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/ass05-grpo-test.png -------------------------------------------------------------------------------- /assets/ass05-sft-test.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/ass05-sft-test.png -------------------------------------------------------------------------------- /assets/note-website.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assets/note-website.png -------------------------------------------------------------------------------- /assignment1-basics/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/.gitignore -------------------------------------------------------------------------------- /assignment1-basics/CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/CHANGELOG.md -------------------------------------------------------------------------------- /assignment1-basics/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/LICENSE -------------------------------------------------------------------------------- /assignment1-basics/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/README.md -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/__init__.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/data.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/loss.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/model/modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/model/modules.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/model/rope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/model/rope.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/model/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/model/transformer.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/optimizer.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/tokenizer/pretokenization_regular_pattern.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/tokenizer/pretokenization_regular_pattern.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/tokenizer/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/tokenizer/tokenizer.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/tokenizer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/tokenizer/utils.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_basics/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_basics/utils.py -------------------------------------------------------------------------------- /assignment1-basics/cs336_spring2025_assignment1_basics.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/cs336_spring2025_assignment1_basics.pdf -------------------------------------------------------------------------------- /assignment1-basics/make_submission.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/make_submission.sh -------------------------------------------------------------------------------- /assignment1-basics/profile.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/profile.html -------------------------------------------------------------------------------- /assignment1-basics/profile.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/profile.json -------------------------------------------------------------------------------- /assignment1-basics/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/pyproject.toml -------------------------------------------------------------------------------- /assignment1-basics/simple_bpe.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/simple_bpe.ipynb -------------------------------------------------------------------------------- /assignment1-basics/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_4d_scaled_dot_product_attention.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_4d_scaled_dot_product_attention.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_adamw.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_adamw.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_embedding.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_embedding.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_linear.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_linear.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_multihead_self_attention.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_multihead_self_attention.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_multihead_self_attention_with_rope.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_multihead_self_attention_with_rope.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_positionwise_feedforward.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_positionwise_feedforward.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_rmsnorm.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_rmsnorm.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_rope.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_rope.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_scaled_dot_product_attention.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_scaled_dot_product_attention.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_swiglu.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_swiglu.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_train_bpe_special_tokens.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_train_bpe_special_tokens.pkl -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_transformer_block.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_transformer_block.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_transformer_lm.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_transformer_lm.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/_snapshots/test_transformer_lm_truncated_input.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/_snapshots/test_transformer_lm_truncated_input.npz -------------------------------------------------------------------------------- /assignment1-basics/tests/adapters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/adapters.py -------------------------------------------------------------------------------- /assignment1-basics/tests/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/common.py -------------------------------------------------------------------------------- /assignment1-basics/tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/conftest.py -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/address.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/address.txt -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/corpus.en: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/corpus.en -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/german.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/german.txt -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/gpt2_merges.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/gpt2_merges.txt -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/gpt2_vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/gpt2_vocab.json -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/special_token_double_newlines_non_whitespace.txt: -------------------------------------------------------------------------------- 1 | <|endoftext|> 2 | 3 | testing! -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/special_token_trailing_newlines.txt: -------------------------------------------------------------------------------- 1 | <|endoftext|> 2 | 3 | -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/tinystories_sample.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/tinystories_sample.txt -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/tinystories_sample_5M.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/tinystories_sample_5M.txt -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/train-bpe-reference-merges.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/train-bpe-reference-merges.txt -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/train-bpe-reference-vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/train-bpe-reference-vocab.json -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/ts_tests/model.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/ts_tests/model.pt -------------------------------------------------------------------------------- /assignment1-basics/tests/fixtures/ts_tests/model_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/fixtures/ts_tests/model_config.json -------------------------------------------------------------------------------- /assignment1-basics/tests/test_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/test_data.py -------------------------------------------------------------------------------- /assignment1-basics/tests/test_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/test_model.py -------------------------------------------------------------------------------- /assignment1-basics/tests/test_nn_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/test_nn_utils.py -------------------------------------------------------------------------------- /assignment1-basics/tests/test_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/test_optimizer.py -------------------------------------------------------------------------------- /assignment1-basics/tests/test_serialization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/test_serialization.py -------------------------------------------------------------------------------- /assignment1-basics/tests/test_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/test_tokenizer.py -------------------------------------------------------------------------------- /assignment1-basics/tests/test_train_bpe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/tests/test_train_bpe.py -------------------------------------------------------------------------------- /assignment1-basics/uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment1-basics/uv.lock -------------------------------------------------------------------------------- /assignment2-systems/CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/CHANGELOG.md -------------------------------------------------------------------------------- /assignment2-systems/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/LICENSE -------------------------------------------------------------------------------- /assignment2-systems/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/README.md -------------------------------------------------------------------------------- /assignment2-systems/cs336-basics/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336-basics/README.md -------------------------------------------------------------------------------- /assignment2-systems/cs336-basics/cs336_basics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment2-systems/cs336-basics/cs336_basics/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336-basics/cs336_basics/data.py -------------------------------------------------------------------------------- /assignment2-systems/cs336-basics/cs336_basics/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336-basics/cs336_basics/model.py -------------------------------------------------------------------------------- /assignment2-systems/cs336-basics/cs336_basics/nn_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336-basics/cs336_basics/nn_utils.py -------------------------------------------------------------------------------- /assignment2-systems/cs336-basics/cs336_basics/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336-basics/cs336_basics/optimizer.py -------------------------------------------------------------------------------- /assignment2-systems/cs336-basics/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336-basics/pyproject.toml -------------------------------------------------------------------------------- /assignment2-systems/cs336_spring2025_assignment2_systems.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336_spring2025_assignment2_systems.pdf -------------------------------------------------------------------------------- /assignment2-systems/cs336_systems/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336_systems/__init__.py -------------------------------------------------------------------------------- /assignment2-systems/cs336_systems/benchmark/benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336_systems/benchmark/benchmark.py -------------------------------------------------------------------------------- /assignment2-systems/cs336_systems/flash_attn/flash_attn_pytorch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336_systems/flash_attn/flash_attn_pytorch.py -------------------------------------------------------------------------------- /assignment2-systems/cs336_systems/flash_attn/flash_attn_triton.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336_systems/flash_attn/flash_attn_triton.py -------------------------------------------------------------------------------- /assignment2-systems/cs336_systems/parallel/ddp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336_systems/parallel/ddp.py -------------------------------------------------------------------------------- /assignment2-systems/cs336_systems/parallel/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/cs336_systems/parallel/optimizer.py -------------------------------------------------------------------------------- /assignment2-systems/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/pyproject.toml -------------------------------------------------------------------------------- /assignment2-systems/test_and_make_submission.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/test_and_make_submission.sh -------------------------------------------------------------------------------- /assignment2-systems/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment2-systems/tests/adapters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/adapters.py -------------------------------------------------------------------------------- /assignment2-systems/tests/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/common.py -------------------------------------------------------------------------------- /assignment2-systems/tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/conftest.py -------------------------------------------------------------------------------- /assignment2-systems/tests/fixtures/ddp_test_data.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/fixtures/ddp_test_data.pt -------------------------------------------------------------------------------- /assignment2-systems/tests/fixtures/ddp_test_labels.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/fixtures/ddp_test_labels.pt -------------------------------------------------------------------------------- /assignment2-systems/tests/test_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/test_attention.py -------------------------------------------------------------------------------- /assignment2-systems/tests/test_ddp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/test_ddp.py -------------------------------------------------------------------------------- /assignment2-systems/tests/test_ddp_individual_parameters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/test_ddp_individual_parameters.py -------------------------------------------------------------------------------- /assignment2-systems/tests/test_sharded_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/tests/test_sharded_optimizer.py -------------------------------------------------------------------------------- /assignment2-systems/uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment2-systems/uv.lock -------------------------------------------------------------------------------- /assignment4-data/CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/CHANGELOG.md -------------------------------------------------------------------------------- /assignment4-data/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/LICENSE -------------------------------------------------------------------------------- /assignment4-data/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/README.md -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/README.md -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/configs/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/configs/config.yaml -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/configs/experiment/your_data.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/configs/experiment/your_data.yaml -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/cs336_basics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/cs336_basics/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/cs336_basics/data.py -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/cs336_basics/ddp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/cs336_basics/ddp_utils.py -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/cs336_basics/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/cs336_basics/model.py -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/cs336_basics/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/cs336_basics/optimizer.py -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/cs336_basics/train_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/cs336_basics/train_config.py -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/pyproject.toml -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/scripts/generate_with_gpt2_tok.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/scripts/generate_with_gpt2_tok.py -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/scripts/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/scripts/train.py -------------------------------------------------------------------------------- /assignment4-data/cs336-basics/uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336-basics/uv.lock -------------------------------------------------------------------------------- /assignment4-data/cs336_data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336_data/__init__.py -------------------------------------------------------------------------------- /assignment4-data/cs336_spring2025_assignment4_data.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/cs336_spring2025_assignment4_data.pdf -------------------------------------------------------------------------------- /assignment4-data/get_assets.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/get_assets.sh -------------------------------------------------------------------------------- /assignment4-data/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/pyproject.toml -------------------------------------------------------------------------------- /assignment4-data/test_and_make_submission.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/test_and_make_submission.sh -------------------------------------------------------------------------------- /assignment4-data/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment4-data/tests/adapters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/adapters.py -------------------------------------------------------------------------------- /assignment4-data/tests/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/common.py -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_line_deduplicated/doc1.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_line_deduplicated/doc2.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_line_deduplicated/doc3.txt: -------------------------------------------------------------------------------- 1 | - back 2 | 3 | -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_line_deduplicated/doc4.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_line_deduplicated/doc5.txt: -------------------------------------------------------------------------------- 1 | Document 5 doesn't have any line-level duplicates. 2 | -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_fuzzy_duplicates/pytorch_license.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/documents_with_fuzzy_duplicates/pytorch_license.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_fuzzy_duplicates/rails_mit_license.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/documents_with_fuzzy_duplicates/rails_mit_license.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_fuzzy_duplicates/react_mit_license.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/documents_with_fuzzy_duplicates/react_mit_license.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_line_duplicates/doc1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/documents_with_line_duplicates/doc1.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_line_duplicates/doc2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/documents_with_line_duplicates/doc2.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_line_duplicates/doc3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/documents_with_line_duplicates/doc3.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_line_duplicates/doc4.txt: -------------------------------------------------------------------------------- 1 | - home 2 | - menu 3 | 4 | -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/documents_with_line_duplicates/doc5.txt: -------------------------------------------------------------------------------- 1 | Document 5 doesn't have any line-level duplicates. 2 | -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/high_quality_wiki_reference.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/high_quality_wiki_reference.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/low_quality_cc.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/low_quality_cc.txt -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/moby.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/moby.html -------------------------------------------------------------------------------- /assignment4-data/tests/fixtures/moby_extracted.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/fixtures/moby_extracted.txt -------------------------------------------------------------------------------- /assignment4-data/tests/test_deduplication.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/test_deduplication.py -------------------------------------------------------------------------------- /assignment4-data/tests/test_extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/test_extract.py -------------------------------------------------------------------------------- /assignment4-data/tests/test_langid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/test_langid.py -------------------------------------------------------------------------------- /assignment4-data/tests/test_pii.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/test_pii.py -------------------------------------------------------------------------------- /assignment4-data/tests/test_quality.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/test_quality.py -------------------------------------------------------------------------------- /assignment4-data/tests/test_toxicity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/tests/test_toxicity.py -------------------------------------------------------------------------------- /assignment4-data/uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment4-data/uv.lock -------------------------------------------------------------------------------- /assignment5-alignment/CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/CHANGELOG.md -------------------------------------------------------------------------------- /assignment5-alignment/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/README.md -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/data_utils.py -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/drgrpo_grader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/drgrpo_grader.py -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/evaluate.py -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/grpo.py -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/prompts/alpaca_sft.prompt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/prompts/alpaca_sft.prompt -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/prompts/question_only.prompt: -------------------------------------------------------------------------------- 1 | {question} -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/prompts/r1_zero.prompt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/prompts/r1_zero.prompt -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/prompts/zero_shot_system_prompt.prompt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/prompts/zero_shot_system_prompt.prompt -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/sft_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/sft_utils.py -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/utils.py -------------------------------------------------------------------------------- /assignment5-alignment/cs336_alignment/vllm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_alignment/vllm_utils.py -------------------------------------------------------------------------------- /assignment5-alignment/cs336_spring2025_assignment5_alignment.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_spring2025_assignment5_alignment.pdf -------------------------------------------------------------------------------- /assignment5-alignment/cs336_spring2025_assignment5_supplement_safety_rlhf.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/cs336_spring2025_assignment5_supplement_safety_rlhf.pdf -------------------------------------------------------------------------------- /assignment5-alignment/data/alpaca_eval/alpaca_eval.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/alpaca_eval/alpaca_eval.jsonl -------------------------------------------------------------------------------- /assignment5-alignment/data/gsm8k/test.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/gsm8k/test.jsonl -------------------------------------------------------------------------------- /assignment5-alignment/data/gsm8k/train.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/gsm8k/train.jsonl -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/README.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/README.txt -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/abstract_algebra_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/abstract_algebra_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/anatomy_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/anatomy_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/astronomy_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/astronomy_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/business_ethics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/business_ethics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/clinical_knowledge_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/clinical_knowledge_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/college_biology_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/college_biology_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/college_chemistry_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/college_chemistry_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/college_computer_science_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/college_computer_science_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/college_mathematics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/college_mathematics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/college_medicine_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/college_medicine_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/college_physics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/college_physics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/computer_security_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/computer_security_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/conceptual_physics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/conceptual_physics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/econometrics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/econometrics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/electrical_engineering_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/electrical_engineering_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/elementary_mathematics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/elementary_mathematics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/formal_logic_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/formal_logic_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/global_facts_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/global_facts_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_biology_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_biology_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_chemistry_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_chemistry_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_computer_science_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_computer_science_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_european_history_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_european_history_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_geography_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_geography_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_government_and_politics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_government_and_politics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_macroeconomics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_macroeconomics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_mathematics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_mathematics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_microeconomics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_microeconomics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_physics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_physics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_psychology_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_psychology_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_statistics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_statistics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_us_history_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_us_history_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/high_school_world_history_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/high_school_world_history_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/human_aging_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/human_aging_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/human_sexuality_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/human_sexuality_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/international_law_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/international_law_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/jurisprudence_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/jurisprudence_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/logical_fallacies_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/logical_fallacies_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/machine_learning_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/machine_learning_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/management_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/management_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/marketing_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/marketing_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/medical_genetics_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/medical_genetics_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/miscellaneous_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/miscellaneous_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/moral_disputes_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/moral_disputes_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/moral_scenarios_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/moral_scenarios_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/nutrition_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/nutrition_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/philosophy_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/philosophy_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/prehistory_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/prehistory_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/professional_accounting_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/professional_accounting_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/professional_law_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/professional_law_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/professional_medicine_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/professional_medicine_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/professional_psychology_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/professional_psychology_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/public_relations_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/public_relations_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/security_studies_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/security_studies_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/sociology_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/sociology_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/us_foreign_policy_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/us_foreign_policy_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/virology_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/virology_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/dev/world_religions_dev.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/dev/world_religions_dev.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/possibly_contaminated_urls.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/possibly_contaminated_urls.txt -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/abstract_algebra_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/abstract_algebra_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/anatomy_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/anatomy_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/astronomy_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/astronomy_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/business_ethics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/business_ethics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/clinical_knowledge_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/clinical_knowledge_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/college_biology_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/college_biology_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/college_chemistry_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/college_chemistry_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/college_computer_science_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/college_computer_science_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/college_mathematics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/college_mathematics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/college_medicine_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/college_medicine_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/college_physics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/college_physics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/computer_security_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/computer_security_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/conceptual_physics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/conceptual_physics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/econometrics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/econometrics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/electrical_engineering_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/electrical_engineering_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/elementary_mathematics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/elementary_mathematics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/formal_logic_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/formal_logic_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/global_facts_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/global_facts_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_biology_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_biology_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_chemistry_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_chemistry_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_computer_science_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_computer_science_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_european_history_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_european_history_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_geography_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_geography_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_government_and_politics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_government_and_politics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_macroeconomics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_macroeconomics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_mathematics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_mathematics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_microeconomics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_microeconomics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_physics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_physics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_psychology_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_psychology_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_statistics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_statistics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_us_history_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_us_history_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/high_school_world_history_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/high_school_world_history_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/human_aging_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/human_aging_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/human_sexuality_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/human_sexuality_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/international_law_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/international_law_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/jurisprudence_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/jurisprudence_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/logical_fallacies_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/logical_fallacies_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/machine_learning_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/machine_learning_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/management_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/management_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/marketing_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/marketing_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/medical_genetics_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/medical_genetics_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/miscellaneous_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/miscellaneous_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/moral_disputes_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/moral_disputes_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/moral_scenarios_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/moral_scenarios_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/nutrition_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/nutrition_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/philosophy_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/philosophy_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/prehistory_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/prehistory_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/professional_accounting_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/professional_accounting_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/professional_law_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/professional_law_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/professional_medicine_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/professional_medicine_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/professional_psychology_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/professional_psychology_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/public_relations_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/public_relations_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/security_studies_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/security_studies_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/sociology_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/sociology_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/us_foreign_policy_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/us_foreign_policy_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/virology_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/virology_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/test/world_religions_test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/test/world_religions_test.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/abstract_algebra_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/abstract_algebra_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/anatomy_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/anatomy_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/astronomy_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/astronomy_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/business_ethics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/business_ethics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/clinical_knowledge_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/clinical_knowledge_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/college_biology_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/college_biology_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/college_chemistry_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/college_chemistry_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/college_computer_science_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/college_computer_science_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/college_mathematics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/college_mathematics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/college_medicine_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/college_medicine_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/college_physics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/college_physics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/computer_security_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/computer_security_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/conceptual_physics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/conceptual_physics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/econometrics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/econometrics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/electrical_engineering_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/electrical_engineering_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/elementary_mathematics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/elementary_mathematics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/formal_logic_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/formal_logic_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/global_facts_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/global_facts_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_biology_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_biology_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_chemistry_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_chemistry_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_computer_science_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_computer_science_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_european_history_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_european_history_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_geography_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_geography_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_government_and_politics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_government_and_politics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_macroeconomics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_macroeconomics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_mathematics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_mathematics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_microeconomics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_microeconomics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_physics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_physics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_psychology_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_psychology_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_statistics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_statistics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_us_history_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_us_history_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/high_school_world_history_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/high_school_world_history_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/human_aging_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/human_aging_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/human_sexuality_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/human_sexuality_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/international_law_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/international_law_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/jurisprudence_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/jurisprudence_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/logical_fallacies_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/logical_fallacies_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/machine_learning_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/machine_learning_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/management_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/management_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/marketing_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/marketing_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/medical_genetics_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/medical_genetics_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/miscellaneous_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/miscellaneous_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/moral_disputes_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/moral_disputes_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/moral_scenarios_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/moral_scenarios_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/nutrition_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/nutrition_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/philosophy_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/philosophy_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/prehistory_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/prehistory_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/professional_accounting_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/professional_accounting_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/professional_law_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/professional_law_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/professional_medicine_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/professional_medicine_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/professional_psychology_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/professional_psychology_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/public_relations_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/public_relations_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/security_studies_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/security_studies_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/sociology_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/sociology_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/us_foreign_policy_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/us_foreign_policy_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/virology_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/virology_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/mmlu/val/world_religions_val.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/mmlu/val/world_religions_val.csv -------------------------------------------------------------------------------- /assignment5-alignment/data/simple_safety_tests/simple_safety_tests.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/data/simple_safety_tests/simple_safety_tests.csv -------------------------------------------------------------------------------- /assignment5-alignment/download_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/download_model.py -------------------------------------------------------------------------------- /assignment5-alignment/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/pyproject.toml -------------------------------------------------------------------------------- /assignment5-alignment/scripts/alpaca_eval_vllm_llama3_3_70b_fn/alpaca_eval_fn.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/scripts/alpaca_eval_vllm_llama3_3_70b_fn/alpaca_eval_fn.txt -------------------------------------------------------------------------------- /assignment5-alignment/scripts/alpaca_eval_vllm_llama3_3_70b_fn/configs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/scripts/alpaca_eval_vllm_llama3_3_70b_fn/configs.yaml -------------------------------------------------------------------------------- /assignment5-alignment/scripts/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/scripts/eval.sh -------------------------------------------------------------------------------- /assignment5-alignment/scripts/evaluate_safety.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/scripts/evaluate_safety.py -------------------------------------------------------------------------------- /assignment5-alignment/test_and_make_submission.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/test_and_make_submission.sh -------------------------------------------------------------------------------- /assignment5-alignment/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_entropy.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_entropy.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_group_normalized_rewards_no_normalize_by_std.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_group_normalized_rewards_no_normalize_by_std.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_group_normalized_rewards_normalize_by_std.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_group_normalized_rewards_normalize_by_std.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_grpo_clip_loss_large_cliprange.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_grpo_clip_loss_large_cliprange.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_grpo_clip_loss_small_cliprange.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_grpo_clip_loss_small_cliprange.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_naive_policy_gradient_loss.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_naive_policy_gradient_loss.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_policy_gradient_loss_grpo_clip.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_policy_gradient_loss_grpo_clip.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_policy_gradient_loss_no_baseline.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_policy_gradient_loss_no_baseline.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_compute_policy_gradient_loss_reinforce_with_baseline.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_compute_policy_gradient_loss_reinforce_with_baseline.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_get_response_log_probs.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_get_response_log_probs.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_grpo_microbatch_train_step_grpo_clip.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_grpo_microbatch_train_step_grpo_clip.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_grpo_microbatch_train_step_grpo_clip_10_steps.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_grpo_microbatch_train_step_grpo_clip_10_steps.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_mean_dim0.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_mean_dim0.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_mean_dim1.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_mean_dim1.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_mean_dimNone.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_mean_dimNone.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_mean_dimlast.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_mean_dimlast.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_normalize_dim0.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_normalize_dim0.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_normalize_dim1.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_normalize_dim1.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_normalize_dimNone.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_normalize_dimNone.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_masked_normalize_dimlast.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_masked_normalize_dimlast.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_sft_microbatch_train_step.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_sft_microbatch_train_step.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_sft_microbatch_train_step_10_steps.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_sft_microbatch_train_step_10_steps.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_sft_microbatch_train_step_normalize.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_sft_microbatch_train_step_normalize.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/_snapshots/test_tokenize_prompt_and_output.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/_snapshots/test_tokenize_prompt_and_output.npz -------------------------------------------------------------------------------- /assignment5-alignment/tests/adapters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/adapters.py -------------------------------------------------------------------------------- /assignment5-alignment/tests/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/common.py -------------------------------------------------------------------------------- /assignment5-alignment/tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/conftest.py -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/Meta-Llama-3-8B/special_tokens_map.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/Meta-Llama-3-8B/special_tokens_map.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/Meta-Llama-3-8B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/Meta-Llama-3-8B/tokenizer.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/Meta-Llama-3-8B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/Meta-Llama-3-8B/tokenizer_config.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/sft_sample.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/sft_sample.jsonl -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/tiny-gpt2-ref/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/tiny-gpt2-ref/config.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/tiny-gpt2-ref/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/tiny-gpt2-ref/generation_config.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/tiny-gpt2-ref/model.safetensors: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/tiny-gpt2-ref/model.safetensors -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/tiny-gpt2/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/tiny-gpt2/config.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/tiny-gpt2/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/tiny-gpt2/generation_config.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/tiny-gpt2/model.safetensors: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/tiny-gpt2/model.safetensors -------------------------------------------------------------------------------- /assignment5-alignment/tests/fixtures/tokenized_sft_sample.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/fixtures/tokenized_sft_sample.json -------------------------------------------------------------------------------- /assignment5-alignment/tests/test_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/test_data.py -------------------------------------------------------------------------------- /assignment5-alignment/tests/test_dpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/test_dpo.py -------------------------------------------------------------------------------- /assignment5-alignment/tests/test_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/test_grpo.py -------------------------------------------------------------------------------- /assignment5-alignment/tests/test_metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/test_metrics.py -------------------------------------------------------------------------------- /assignment5-alignment/tests/test_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/tests/test_sft.py -------------------------------------------------------------------------------- /assignment5-alignment/train_ei.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/train_ei.py -------------------------------------------------------------------------------- /assignment5-alignment/train_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/train_grpo.py -------------------------------------------------------------------------------- /assignment5-alignment/train_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/train_sft.py -------------------------------------------------------------------------------- /assignment5-alignment/uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YYZhang2025/Stanford-CS336/HEAD/assignment5-alignment/uv.lock --------------------------------------------------------------------------------