├── .github └── workflows │ ├── headers.yml │ └── style.yml ├── .gitignore ├── .gitmodules ├── .licenserc.yaml ├── .pre-commit-config.yaml ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── LICENSE ├── README.md ├── gh-pages ├── README.md ├── _config.yaml └── workshop │ └── COLM_2025 │ ├── README.md │ └── ram2.jpeg ├── projects ├── README.md ├── co-improvement.pdf ├── cocomix │ ├── README.md │ ├── cocomix.png │ ├── conf │ │ ├── config.yaml │ │ ├── config_eval.yaml │ │ ├── ddp.yaml │ │ ├── fsdp_bf16.yaml │ │ └── setup │ │ │ ├── gpt2_1b_cocomix.yaml │ │ │ ├── gpt2_1b_ntp.yaml │ │ │ ├── gpt2_386m_cocomix.yaml │ │ │ ├── gpt2_386m_ntp.yaml │ │ │ ├── gpt2_69m_cocomix.yaml │ │ │ └── gpt2_69m_ntp.yaml │ ├── data │ │ ├── __init__.py │ │ ├── data.py │ │ └── openwebtext_preprocess │ │ │ ├── prepare.py │ │ │ └── readme.md │ ├── main.py │ ├── models │ │ ├── __init__.py │ │ ├── concept_extractor.py │ │ ├── modeling_gpt2_cocomix.py │ │ └── sparse_autoencoder │ │ │ ├── __init__.py │ │ │ ├── kernels.py │ │ │ ├── loss.py │ │ │ ├── model.py │ │ │ └── paths.py │ ├── requirements.txt │ ├── slurm_bash │ │ └── slurm_multi.sh │ ├── test.py │ ├── train │ │ ├── __init__.py │ │ ├── train_func │ │ │ ├── __init__.py │ │ │ ├── cocomix.py │ │ │ └── ntp.py │ │ └── trainer.py │ └── utils.py ├── cope │ ├── README.md │ ├── eval.py │ ├── figures │ │ ├── CoPE.png │ │ └── counting_task.png │ ├── requirements.txt │ ├── run.sh │ ├── scripts │ │ └── count_data_gen.py │ ├── src │ │ ├── cope │ │ │ └── context_position.py │ │ ├── data │ │ │ ├── __init__.py │ │ │ ├── constants.py │ │ │ ├── data_collator.py │ │ │ ├── simple.py │ │ │ └── tokenizer.py │ │ ├── main.py │ │ ├── models │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── relative_position.py │ │ │ ├── simple_transformer.py │ │ │ └── transformer.py │ │ ├── trainer.py │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── checkpoint.py │ │ │ ├── distributed.py │ │ │ ├── logger.py │ │ │ └── world.py │ └── train.py ├── length_instruct │ ├── README.md │ └── fig.png ├── mta │ ├── README.md │ ├── __init__.py │ ├── configs │ │ ├── 1B_baseline.yaml │ │ ├── 1B_mta.yaml │ │ ├── 1B_talking_heads.yaml │ │ ├── 300M_baseline.yaml │ │ ├── 300M_mta.yaml │ │ ├── 300M_talking_heads.yaml │ │ ├── 550M_baseline.yaml │ │ ├── 550M_mta.yaml │ │ ├── 550M_talking_heads.yaml │ │ ├── 830M_baseline.yaml │ │ ├── 830M_mta.yaml │ │ └── 830M_talking_heads.yaml │ ├── data.py │ ├── eval.py │ ├── figures │ │ └── attn_schema.png │ ├── generate.py │ ├── mta_transformer.py │ ├── single_json.py │ ├── tokenizer.py │ ├── toy_task │ │ ├── README.md │ │ ├── configs │ │ │ ├── find_block_base.yaml │ │ │ └── find_block_mta.yaml │ │ └── generate_data.py │ ├── train.py │ └── transformer.py ├── otb │ ├── .gitignore │ ├── LICENSE │ ├── README.md │ ├── eval.py │ ├── evals │ │ ├── math_eval.py │ │ ├── overthink_eval.py │ │ ├── token_eval.py │ │ └── underthink_eval.py │ ├── figures │ │ └── otb.png │ ├── generate.py │ ├── otb_creation │ │ ├── __init__.py │ │ ├── create_overthink.py │ │ ├── create_underthink.py │ │ ├── data │ │ │ ├── overthink_bench.jsonl │ │ │ └── underthink_bench.pkl │ │ ├── filter_overthink.py │ │ └── prompts.py │ ├── otbench │ │ ├── __init__.py │ │ └── cli.py │ ├── prepare.py │ ├── requirements.txt │ ├── setup.py │ └── utils.py ├── sd-ra-it │ ├── README.md │ ├── configs │ │ ├── dpo_70b.yaml │ │ ├── dpo_8b.yaml │ │ ├── sft_70b.yaml │ │ └── sft_8b.yaml │ └── scripts │ │ ├── create_self_demo_train_set.sh │ │ ├── data │ │ └── io_to_qas_format.py │ │ ├── eval.py │ │ ├── generate.py │ │ ├── get_demos.py │ │ ├── prompt_optimization.py │ │ ├── relevance.py │ │ └── reward_model_gemma.py ├── self_notes │ ├── README.md │ ├── fig_method.png │ ├── fig_rel.png │ └── toy_story │ │ ├── constants.py │ │ ├── graph.py │ │ ├── main.py │ │ ├── relation.py │ │ ├── rules.py │ │ └── world.py └── self_taught_evaluator │ ├── README.md │ ├── data │ ├── prompts │ │ ├── eval_plan.prompt │ │ └── worse_response.prompt │ └── training_data.yaml │ ├── figures │ └── self_taught_dpo.png │ ├── run_inference_wvllm.sh │ ├── run_rewardbench.sh │ ├── src │ ├── __init__.py │ ├── load_dpo_data_from_hf.py │ ├── prepare_dpo_data.py │ ├── prepare_sft_data.py │ ├── requirements.txt │ ├── run_model.py │ └── utils.py │ └── training_configs │ ├── dpo_training.yaml │ └── sft_training.yaml ├── ram ├── __init__.py ├── data.py └── data_utils.py └── setup.py /.github/workflows/headers.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/.github/workflows/headers.yml -------------------------------------------------------------------------------- /.github/workflows/style.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/.github/workflows/style.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/.gitmodules -------------------------------------------------------------------------------- /.licenserc.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/.licenserc.yaml -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/README.md -------------------------------------------------------------------------------- /gh-pages/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/gh-pages/README.md -------------------------------------------------------------------------------- /gh-pages/_config.yaml: -------------------------------------------------------------------------------- 1 | name: RAM @ Meta AI 2 | title: null 3 | -------------------------------------------------------------------------------- /gh-pages/workshop/COLM_2025/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/gh-pages/workshop/COLM_2025/README.md -------------------------------------------------------------------------------- /gh-pages/workshop/COLM_2025/ram2.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/gh-pages/workshop/COLM_2025/ram2.jpeg -------------------------------------------------------------------------------- /projects/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/README.md -------------------------------------------------------------------------------- /projects/co-improvement.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/co-improvement.pdf -------------------------------------------------------------------------------- /projects/cocomix/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/README.md -------------------------------------------------------------------------------- /projects/cocomix/cocomix.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/cocomix.png -------------------------------------------------------------------------------- /projects/cocomix/conf/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/config.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/config_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/config_eval.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/ddp.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/ddp.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/fsdp_bf16.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/fsdp_bf16.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/setup/gpt2_1b_cocomix.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/setup/gpt2_1b_cocomix.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/setup/gpt2_1b_ntp.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/setup/gpt2_1b_ntp.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/setup/gpt2_386m_cocomix.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/setup/gpt2_386m_cocomix.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/setup/gpt2_386m_ntp.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/setup/gpt2_386m_ntp.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/setup/gpt2_69m_cocomix.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/setup/gpt2_69m_cocomix.yaml -------------------------------------------------------------------------------- /projects/cocomix/conf/setup/gpt2_69m_ntp.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/conf/setup/gpt2_69m_ntp.yaml -------------------------------------------------------------------------------- /projects/cocomix/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/data/__init__.py -------------------------------------------------------------------------------- /projects/cocomix/data/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/data/data.py -------------------------------------------------------------------------------- /projects/cocomix/data/openwebtext_preprocess/prepare.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/data/openwebtext_preprocess/prepare.py -------------------------------------------------------------------------------- /projects/cocomix/data/openwebtext_preprocess/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/data/openwebtext_preprocess/readme.md -------------------------------------------------------------------------------- /projects/cocomix/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/main.py -------------------------------------------------------------------------------- /projects/cocomix/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/__init__.py -------------------------------------------------------------------------------- /projects/cocomix/models/concept_extractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/concept_extractor.py -------------------------------------------------------------------------------- /projects/cocomix/models/modeling_gpt2_cocomix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/modeling_gpt2_cocomix.py -------------------------------------------------------------------------------- /projects/cocomix/models/sparse_autoencoder/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/sparse_autoencoder/__init__.py -------------------------------------------------------------------------------- /projects/cocomix/models/sparse_autoencoder/kernels.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/sparse_autoencoder/kernels.py -------------------------------------------------------------------------------- /projects/cocomix/models/sparse_autoencoder/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/sparse_autoencoder/loss.py -------------------------------------------------------------------------------- /projects/cocomix/models/sparse_autoencoder/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/sparse_autoencoder/model.py -------------------------------------------------------------------------------- /projects/cocomix/models/sparse_autoencoder/paths.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/models/sparse_autoencoder/paths.py -------------------------------------------------------------------------------- /projects/cocomix/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/requirements.txt -------------------------------------------------------------------------------- /projects/cocomix/slurm_bash/slurm_multi.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/slurm_bash/slurm_multi.sh -------------------------------------------------------------------------------- /projects/cocomix/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/test.py -------------------------------------------------------------------------------- /projects/cocomix/train/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/train/__init__.py -------------------------------------------------------------------------------- /projects/cocomix/train/train_func/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/train/train_func/__init__.py -------------------------------------------------------------------------------- /projects/cocomix/train/train_func/cocomix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/train/train_func/cocomix.py -------------------------------------------------------------------------------- /projects/cocomix/train/train_func/ntp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/train/train_func/ntp.py -------------------------------------------------------------------------------- /projects/cocomix/train/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/train/trainer.py -------------------------------------------------------------------------------- /projects/cocomix/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cocomix/utils.py -------------------------------------------------------------------------------- /projects/cope/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/README.md -------------------------------------------------------------------------------- /projects/cope/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/eval.py -------------------------------------------------------------------------------- /projects/cope/figures/CoPE.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/figures/CoPE.png -------------------------------------------------------------------------------- /projects/cope/figures/counting_task.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/figures/counting_task.png -------------------------------------------------------------------------------- /projects/cope/requirements.txt: -------------------------------------------------------------------------------- 1 | submitit==1.5.1 2 | transformers 3 | wandb==0.17.4 4 | -------------------------------------------------------------------------------- /projects/cope/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/run.sh -------------------------------------------------------------------------------- /projects/cope/scripts/count_data_gen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/scripts/count_data_gen.py -------------------------------------------------------------------------------- /projects/cope/src/cope/context_position.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/cope/context_position.py -------------------------------------------------------------------------------- /projects/cope/src/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/data/__init__.py -------------------------------------------------------------------------------- /projects/cope/src/data/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/data/constants.py -------------------------------------------------------------------------------- /projects/cope/src/data/data_collator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/data/data_collator.py -------------------------------------------------------------------------------- /projects/cope/src/data/simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/data/simple.py -------------------------------------------------------------------------------- /projects/cope/src/data/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/data/tokenizer.py -------------------------------------------------------------------------------- /projects/cope/src/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/main.py -------------------------------------------------------------------------------- /projects/cope/src/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/models/__init__.py -------------------------------------------------------------------------------- /projects/cope/src/models/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/models/base.py -------------------------------------------------------------------------------- /projects/cope/src/models/relative_position.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/models/relative_position.py -------------------------------------------------------------------------------- /projects/cope/src/models/simple_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/models/simple_transformer.py -------------------------------------------------------------------------------- /projects/cope/src/models/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/models/transformer.py -------------------------------------------------------------------------------- /projects/cope/src/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/trainer.py -------------------------------------------------------------------------------- /projects/cope/src/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/utils/__init__.py -------------------------------------------------------------------------------- /projects/cope/src/utils/checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/utils/checkpoint.py -------------------------------------------------------------------------------- /projects/cope/src/utils/distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/utils/distributed.py -------------------------------------------------------------------------------- /projects/cope/src/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/utils/logger.py -------------------------------------------------------------------------------- /projects/cope/src/utils/world.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/src/utils/world.py -------------------------------------------------------------------------------- /projects/cope/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/cope/train.py -------------------------------------------------------------------------------- /projects/length_instruct/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/length_instruct/README.md -------------------------------------------------------------------------------- /projects/length_instruct/fig.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/length_instruct/fig.png -------------------------------------------------------------------------------- /projects/mta/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/README.md -------------------------------------------------------------------------------- /projects/mta/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/__init__.py -------------------------------------------------------------------------------- /projects/mta/configs/1B_baseline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/1B_baseline.yaml -------------------------------------------------------------------------------- /projects/mta/configs/1B_mta.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/1B_mta.yaml -------------------------------------------------------------------------------- /projects/mta/configs/1B_talking_heads.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/1B_talking_heads.yaml -------------------------------------------------------------------------------- /projects/mta/configs/300M_baseline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/300M_baseline.yaml -------------------------------------------------------------------------------- /projects/mta/configs/300M_mta.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/300M_mta.yaml -------------------------------------------------------------------------------- /projects/mta/configs/300M_talking_heads.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/300M_talking_heads.yaml -------------------------------------------------------------------------------- /projects/mta/configs/550M_baseline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/550M_baseline.yaml -------------------------------------------------------------------------------- /projects/mta/configs/550M_mta.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/550M_mta.yaml -------------------------------------------------------------------------------- /projects/mta/configs/550M_talking_heads.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/550M_talking_heads.yaml -------------------------------------------------------------------------------- /projects/mta/configs/830M_baseline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/830M_baseline.yaml -------------------------------------------------------------------------------- /projects/mta/configs/830M_mta.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/830M_mta.yaml -------------------------------------------------------------------------------- /projects/mta/configs/830M_talking_heads.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/configs/830M_talking_heads.yaml -------------------------------------------------------------------------------- /projects/mta/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/data.py -------------------------------------------------------------------------------- /projects/mta/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/eval.py -------------------------------------------------------------------------------- /projects/mta/figures/attn_schema.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/figures/attn_schema.png -------------------------------------------------------------------------------- /projects/mta/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/generate.py -------------------------------------------------------------------------------- /projects/mta/mta_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/mta_transformer.py -------------------------------------------------------------------------------- /projects/mta/single_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/single_json.py -------------------------------------------------------------------------------- /projects/mta/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/tokenizer.py -------------------------------------------------------------------------------- /projects/mta/toy_task/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/toy_task/README.md -------------------------------------------------------------------------------- /projects/mta/toy_task/configs/find_block_base.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/toy_task/configs/find_block_base.yaml -------------------------------------------------------------------------------- /projects/mta/toy_task/configs/find_block_mta.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/toy_task/configs/find_block_mta.yaml -------------------------------------------------------------------------------- /projects/mta/toy_task/generate_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/toy_task/generate_data.py -------------------------------------------------------------------------------- /projects/mta/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/train.py -------------------------------------------------------------------------------- /projects/mta/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/mta/transformer.py -------------------------------------------------------------------------------- /projects/otb/.gitignore: -------------------------------------------------------------------------------- 1 | data* 2 | *.egg-info 3 | nohup.out 4 | final_outputs 5 | __pycache__ -------------------------------------------------------------------------------- /projects/otb/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/LICENSE -------------------------------------------------------------------------------- /projects/otb/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/README.md -------------------------------------------------------------------------------- /projects/otb/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/eval.py -------------------------------------------------------------------------------- /projects/otb/evals/math_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/evals/math_eval.py -------------------------------------------------------------------------------- /projects/otb/evals/overthink_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/evals/overthink_eval.py -------------------------------------------------------------------------------- /projects/otb/evals/token_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/evals/token_eval.py -------------------------------------------------------------------------------- /projects/otb/evals/underthink_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/evals/underthink_eval.py -------------------------------------------------------------------------------- /projects/otb/figures/otb.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/figures/otb.png -------------------------------------------------------------------------------- /projects/otb/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/generate.py -------------------------------------------------------------------------------- /projects/otb/otb_creation/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otb_creation/__init__.py -------------------------------------------------------------------------------- /projects/otb/otb_creation/create_overthink.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otb_creation/create_overthink.py -------------------------------------------------------------------------------- /projects/otb/otb_creation/create_underthink.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otb_creation/create_underthink.py -------------------------------------------------------------------------------- /projects/otb/otb_creation/data/overthink_bench.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otb_creation/data/overthink_bench.jsonl -------------------------------------------------------------------------------- /projects/otb/otb_creation/data/underthink_bench.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otb_creation/data/underthink_bench.pkl -------------------------------------------------------------------------------- /projects/otb/otb_creation/filter_overthink.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otb_creation/filter_overthink.py -------------------------------------------------------------------------------- /projects/otb/otb_creation/prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otb_creation/prompts.py -------------------------------------------------------------------------------- /projects/otb/otbench/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otbench/__init__.py -------------------------------------------------------------------------------- /projects/otb/otbench/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/otbench/cli.py -------------------------------------------------------------------------------- /projects/otb/prepare.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/prepare.py -------------------------------------------------------------------------------- /projects/otb/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/requirements.txt -------------------------------------------------------------------------------- /projects/otb/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/setup.py -------------------------------------------------------------------------------- /projects/otb/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/otb/utils.py -------------------------------------------------------------------------------- /projects/sd-ra-it/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/README.md -------------------------------------------------------------------------------- /projects/sd-ra-it/configs/dpo_70b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/configs/dpo_70b.yaml -------------------------------------------------------------------------------- /projects/sd-ra-it/configs/dpo_8b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/configs/dpo_8b.yaml -------------------------------------------------------------------------------- /projects/sd-ra-it/configs/sft_70b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/configs/sft_70b.yaml -------------------------------------------------------------------------------- /projects/sd-ra-it/configs/sft_8b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/configs/sft_8b.yaml -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/create_self_demo_train_set.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/create_self_demo_train_set.sh -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/data/io_to_qas_format.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/data/io_to_qas_format.py -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/eval.py -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/generate.py -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/get_demos.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/get_demos.py -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/prompt_optimization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/prompt_optimization.py -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/relevance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/relevance.py -------------------------------------------------------------------------------- /projects/sd-ra-it/scripts/reward_model_gemma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/sd-ra-it/scripts/reward_model_gemma.py -------------------------------------------------------------------------------- /projects/self_notes/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/README.md -------------------------------------------------------------------------------- /projects/self_notes/fig_method.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/fig_method.png -------------------------------------------------------------------------------- /projects/self_notes/fig_rel.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/fig_rel.png -------------------------------------------------------------------------------- /projects/self_notes/toy_story/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/toy_story/constants.py -------------------------------------------------------------------------------- /projects/self_notes/toy_story/graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/toy_story/graph.py -------------------------------------------------------------------------------- /projects/self_notes/toy_story/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/toy_story/main.py -------------------------------------------------------------------------------- /projects/self_notes/toy_story/relation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/toy_story/relation.py -------------------------------------------------------------------------------- /projects/self_notes/toy_story/rules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/toy_story/rules.py -------------------------------------------------------------------------------- /projects/self_notes/toy_story/world.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_notes/toy_story/world.py -------------------------------------------------------------------------------- /projects/self_taught_evaluator/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/README.md -------------------------------------------------------------------------------- /projects/self_taught_evaluator/data/prompts/eval_plan.prompt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/data/prompts/eval_plan.prompt -------------------------------------------------------------------------------- /projects/self_taught_evaluator/data/prompts/worse_response.prompt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/data/prompts/worse_response.prompt -------------------------------------------------------------------------------- /projects/self_taught_evaluator/data/training_data.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/data/training_data.yaml -------------------------------------------------------------------------------- /projects/self_taught_evaluator/figures/self_taught_dpo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/figures/self_taught_dpo.png -------------------------------------------------------------------------------- /projects/self_taught_evaluator/run_inference_wvllm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/run_inference_wvllm.sh -------------------------------------------------------------------------------- /projects/self_taught_evaluator/run_rewardbench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/run_rewardbench.sh -------------------------------------------------------------------------------- /projects/self_taught_evaluator/src/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/src/__init__.py -------------------------------------------------------------------------------- /projects/self_taught_evaluator/src/load_dpo_data_from_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/src/load_dpo_data_from_hf.py -------------------------------------------------------------------------------- /projects/self_taught_evaluator/src/prepare_dpo_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/src/prepare_dpo_data.py -------------------------------------------------------------------------------- /projects/self_taught_evaluator/src/prepare_sft_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/src/prepare_sft_data.py -------------------------------------------------------------------------------- /projects/self_taught_evaluator/src/requirements.txt: -------------------------------------------------------------------------------- 1 | vllm 2 | fastchat 3 | fire 4 | rewardbench 5 | accelerate 6 | -------------------------------------------------------------------------------- /projects/self_taught_evaluator/src/run_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/src/run_model.py -------------------------------------------------------------------------------- /projects/self_taught_evaluator/src/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/src/utils.py -------------------------------------------------------------------------------- /projects/self_taught_evaluator/training_configs/dpo_training.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/training_configs/dpo_training.yaml -------------------------------------------------------------------------------- /projects/self_taught_evaluator/training_configs/sft_training.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/projects/self_taught_evaluator/training_configs/sft_training.yaml -------------------------------------------------------------------------------- /ram/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/ram/__init__.py -------------------------------------------------------------------------------- /ram/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/ram/data.py -------------------------------------------------------------------------------- /ram/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/ram/data_utils.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/RAM/HEAD/setup.py --------------------------------------------------------------------------------