├── CHANGELOG.md ├── LICENSE ├── Makefile ├── README.md ├── apex_setup.py ├── assets ├── bytedance.jpeg ├── memv2.jpeg ├── result.jpeg └── tdqkr.jpeg ├── checkpoints └── official │ ├── OLMo-1B.csv │ ├── OLMo-7B-0424.csv │ ├── OLMo-7B-0724.csv │ ├── OLMo-7B-Twin-2T.csv │ └── OLMo-7B.csv ├── configs ├── amberish1-weka.yaml ├── amberish13-weka.yaml ├── amberish7-weka.yaml ├── amberish70-weka.yaml ├── c4-extra-tiny-debug.yaml ├── c4-large.yaml ├── c4-medium.yaml ├── c4-small.yaml ├── c4-tiny.yaml ├── exps │ └── OLMoE-1B-7B-0906_reproduce.yml ├── llama7-s3.yaml ├── llama7.yaml ├── llamaish1-s3.yaml ├── llamaish7-s3.yaml ├── mcli │ ├── .gitignore │ ├── ananya-1b-ib.yaml │ ├── ananya-1b.yaml │ ├── harvest_hostnames.yaml │ ├── mitchish-final.yaml │ ├── mitchish-instruct.yml │ ├── mitchish.yaml │ ├── mitchish1.yaml │ ├── mitchish7.yaml │ ├── mitchish70-from160510.yaml │ ├── mitchish70.yaml │ ├── mosaic-ananya-1b.yaml │ ├── olmo7-ablation-baseline.yaml │ ├── olmo7-ablation-dedupedocs.yaml │ ├── olmo7-ablation-dolma17.yaml │ ├── v1-mix-medium-mitch-ish.yaml │ ├── v1-mix-medium.yaml │ ├── v1_5-mix-medium-mitch-ish.yaml │ └── v1_5-mix-medium.yaml ├── mitchish-instruct.yaml ├── mitchish1-s3.yaml ├── mitchish35.yaml ├── mitchish50.yaml ├── mitchish65-s3.yaml ├── mitchish65.yaml ├── mitchish7-llamainit-s3.yaml ├── mitchish7-s3.yaml ├── mitchish70-s3.yaml ├── mitchish70.yaml ├── official │ ├── OLMo-1B.yaml │ ├── OLMo-7B-0424.yaml │ ├── OLMo-7B-0724.yaml │ ├── OLMo-7B.yaml │ └── OLMoE-7B-A1B.yaml ├── olmo-small-ablation.yaml ├── olmo7-ablation-baseline.yaml ├── olmo7-ablation-dedupedocs.yaml ├── olmo7-ablation-dedupeparas.yaml ├── olmo7-ablation-dolma17.yaml ├── olmo7-ablation-final2.yaml ├── olmo7-ablation-refheavy.yaml ├── peteish1-weka.yaml ├── peteish7-weka.yaml ├── pile-llamaish7-s3.yaml ├── pile-llamaish7.yaml ├── tiny-llamaish-s3.yaml ├── tiny │ ├── OLMo-150M.yaml │ ├── OLMo-20M.yaml │ ├── OLMo-300M.yaml │ ├── OLMo-60M.yaml │ └── OLMo-700M.yaml ├── v1-mix-medium-mitch-ish-s3.yaml ├── v1-mix-medium-mitch-ish.yaml ├── v1-mix-medium-s3.yaml ├── v1-mix-medium.yaml ├── v1-mix-small-s3.yaml ├── v1-mix-small.yaml ├── v1_5-mix-medium-mitch-ish-s3.yaml ├── v1_5-mix-medium-mitch-ish.yaml └── v1_5-mix-medium-s3.yaml ├── conftest.py ├── docker ├── Dockerfile.base ├── Dockerfile.gantry ├── Dockerfile.lumi └── Dockerfile.test ├── docs ├── Checkpoints.md ├── Kempner.md ├── LUMI.md ├── NOTES.md ├── RELEASE_PROCESS.md ├── Safetensors.md └── TRAINLOG.md ├── evaluation ├── README.md ├── __init__.py ├── empty_workspace.py ├── experiments │ ├── evaluation_2023_07_26.jsonnet │ ├── task_sets │ │ ├── eval_suite_ppl_val_v2_small.libsonnet │ │ ├── eval_suite_ppl_val_v3.libsonnet │ │ ├── eval_suite_ppl_val_v3_small.libsonnet │ │ ├── gen_tasks.libsonnet │ │ ├── rc20_tasks.libsonnet │ │ ├── summary_tasks.libsonnet │ │ ├── task_utils.libsonnet │ │ └── test_sets │ │ │ ├── test_eval_suite_ppl_val_v2_small.libsonnet │ │ │ ├── test_gen_tasks.libsonnet │ │ │ └── test_rc20_tasks.libsonnet │ ├── test_config.jsonnet │ └── utils.libsonnet ├── requirements.txt ├── see_available_tasks.py ├── steps │ ├── __init__.py │ ├── get_model.py │ ├── run_catwalk.py │ └── wandb_metrics.py └── tango-in-beaker.yml ├── fuse_ops ├── __init__.py ├── fused_glu.cpp ├── fused_glu.cu ├── fused_index.py ├── fused_lookup.cpp ├── fused_lookup.cu ├── fused_topk.cpp ├── fused_topk.cu ├── scatter_add.py ├── test_fused_lookup.py ├── test_glu.py ├── test_scatter_add.py ├── unsorted_segment_sum.cpp └── unsorted_segment_sum.cu ├── hf_olmo ├── __init__.py ├── configuration_olmo.py ├── convert_olmo_to_hf.py ├── modeling_olmo.py ├── pyproject.toml ├── requirements.txt └── tokenization_olmo_fast.py ├── inference ├── NOTES.md ├── README.md ├── __init__.py ├── compression │ ├── dependencies │ │ └── AutoGPTQ │ │ │ ├── .gitignore │ │ │ ├── LICENSE │ │ │ ├── README.md │ │ │ ├── README_zh.md │ │ │ ├── auto_gptq │ │ │ ├── __init__.py │ │ │ ├── eval_tasks │ │ │ │ ├── __init__.py │ │ │ │ ├── _base.py │ │ │ │ ├── _utils │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── classification_utils.py │ │ │ │ │ └── generation_utils.py │ │ │ │ ├── language_modeling_task.py │ │ │ │ ├── sequence_classification_task.py │ │ │ │ └── text_summarization_task.py │ │ │ ├── modeling │ │ │ │ ├── __init__.py │ │ │ │ ├── _base.py │ │ │ │ ├── _const.py │ │ │ │ ├── _utils.py │ │ │ │ ├── auto.py │ │ │ │ ├── baichuan.py │ │ │ │ ├── bloom.py │ │ │ │ ├── codegen.py │ │ │ │ ├── gpt2.py │ │ │ │ ├── gpt_bigcode.py │ │ │ │ ├── gpt_neox.py │ │ │ │ ├── gptj.py │ │ │ │ ├── internlm.py │ │ │ │ ├── llama.py │ │ │ │ ├── moss.py │ │ │ │ ├── olmo.py │ │ │ │ ├── opt.py │ │ │ │ ├── qwen.py │ │ │ │ └── rw.py │ │ │ ├── nn_modules │ │ │ │ ├── __init__.py │ │ │ │ ├── _fused_base.py │ │ │ │ ├── fused_gptj_attn.py │ │ │ │ ├── fused_llama_attn.py │ │ │ │ ├── fused_llama_mlp.py │ │ │ │ ├── qlinear │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── qlinear_cuda.py │ │ │ │ │ ├── qlinear_cuda_old.py │ │ │ │ │ ├── qlinear_exllama.py │ │ │ │ │ └── qlinear_triton.py │ │ │ │ └── triton_utils │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── custom_autotune.py │ │ │ │ │ ├── kernels.py │ │ │ │ │ └── mixin.py │ │ │ ├── quantization │ │ │ │ ├── __init__.py │ │ │ │ ├── gptq.py │ │ │ │ └── quantizer.py │ │ │ └── utils │ │ │ │ ├── __init__.py │ │ │ │ ├── data_utils.py │ │ │ │ ├── import_utils.py │ │ │ │ ├── peft_utils.py │ │ │ │ └── perplexity_utils.py │ │ │ ├── autogptq_extension │ │ │ ├── cuda_256 │ │ │ │ ├── autogptq_cuda_256.cpp │ │ │ │ └── autogptq_cuda_kernel_256.cu │ │ │ ├── cuda_64 │ │ │ │ ├── autogptq_cuda_64.cpp │ │ │ │ └── autogptq_cuda_kernel_64.cu │ │ │ ├── exllama │ │ │ │ ├── cu_compat.cuh │ │ │ │ ├── cuda_buffers.cu │ │ │ │ ├── cuda_buffers.cuh │ │ │ │ ├── cuda_func │ │ │ │ │ ├── column_remap.cu │ │ │ │ │ ├── column_remap.cuh │ │ │ │ │ ├── q4_matmul.cu │ │ │ │ │ ├── q4_matmul.cuh │ │ │ │ │ ├── q4_matrix.cu │ │ │ │ │ └── q4_matrix.cuh │ │ │ │ ├── exllama_ext.cpp │ │ │ │ ├── hip_compat.cuh │ │ │ │ ├── matrix.cuh │ │ │ │ ├── tuning.h │ │ │ │ └── util.cuh │ │ │ └── qigen │ │ │ │ ├── generate.py │ │ │ │ ├── intrin.py │ │ │ │ ├── mmm.cpp │ │ │ │ └── template.py │ │ │ ├── docs │ │ │ ├── NEWS_OR_UPDATE.md │ │ │ └── tutorial │ │ │ │ ├── 01-Quick-Start.md │ │ │ │ └── 02-Advanced-Model-Loading-and-Best-Practice.md │ │ │ ├── examples │ │ │ ├── README.md │ │ │ ├── benchmark │ │ │ │ ├── generation_speed.py │ │ │ │ └── perplexity.py │ │ │ ├── evaluation │ │ │ │ ├── run_language_modeling_task.py │ │ │ │ ├── run_sequence_classification_task.py │ │ │ │ └── run_text_summarization_task.py │ │ │ ├── peft │ │ │ │ ├── peft_adalora_clm_instruction_tuning.py │ │ │ │ ├── peft_adaption_prompt_clm_instruction_tuning.py │ │ │ │ └── peft_lora_clm_instruction_tuning.py │ │ │ └── quantization │ │ │ │ ├── basic_usage.py │ │ │ │ ├── basic_usage_gpt_xl.py │ │ │ │ ├── basic_usage_wikitext2.py │ │ │ │ ├── dataset │ │ │ │ └── alpaca_data_cleaned.json │ │ │ │ └── quant_with_alpaca.py │ │ │ ├── setup.py │ │ │ └── tests │ │ │ └── test_q4.py │ ├── olmo_gptq_class.py │ ├── run_olmo_quantization.sh │ └── run_quantization.py ├── efficiency │ ├── dependencies │ │ ├── efficiency-pentathlon │ │ │ ├── .dockerignore │ │ │ ├── Dockerfile │ │ │ ├── LICENSE │ │ │ ├── README.md │ │ │ ├── eb_gantry │ │ │ │ ├── __init__.py │ │ │ │ ├── __main__.py │ │ │ │ ├── aliases.py │ │ │ │ ├── constants.py │ │ │ │ ├── entrypoint.sh │ │ │ │ ├── exceptions.py │ │ │ │ ├── py.typed │ │ │ │ ├── util.py │ │ │ │ └── version.py │ │ │ ├── efficiency_benchmark │ │ │ │ ├── __init__.py │ │ │ │ ├── __main__.py │ │ │ │ ├── dependencies │ │ │ │ │ ├── __init__.py │ │ │ │ │ └── lm_eval │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ ├── base.py │ │ │ │ │ │ ├── datasets │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ ├── arithmetic │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── arithmetic.py │ │ │ │ │ │ ├── asdiv │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── asdiv.py │ │ │ │ │ │ ├── coqa │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── coqa.py │ │ │ │ │ │ ├── drop │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── drop.py │ │ │ │ │ │ ├── headqa │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── headqa.py │ │ │ │ │ │ ├── hendrycks_ethics │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── hendrycks_ethics.py │ │ │ │ │ │ ├── hendrycks_math │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── hendrycks_math.py │ │ │ │ │ │ ├── lambada_openai │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── lambada_openai.py │ │ │ │ │ │ ├── logiqa │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── logiqa.py │ │ │ │ │ │ ├── mutual │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── mutual.py │ │ │ │ │ │ ├── pile │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── pile.py │ │ │ │ │ │ ├── quac │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── quac.py │ │ │ │ │ │ ├── sat_analogies │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── sat_analogies.py │ │ │ │ │ │ ├── triviaqa │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── triviaqa.py │ │ │ │ │ │ ├── unscramble │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── unscramble.py │ │ │ │ │ │ └── wikitext │ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ │ └── wikitext.py │ │ │ │ │ │ ├── decontamination │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ ├── archiver.py │ │ │ │ │ │ ├── decontaminate.py │ │ │ │ │ │ └── janitor.py │ │ │ │ │ │ ├── evaluator.py │ │ │ │ │ │ ├── metrics.py │ │ │ │ │ │ ├── models │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ ├── dummy.py │ │ │ │ │ │ ├── gpt2.py │ │ │ │ │ │ ├── gpt3.py │ │ │ │ │ │ └── textsynth.py │ │ │ │ │ │ ├── tasks │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ ├── anli.py │ │ │ │ │ │ ├── arc.py │ │ │ │ │ │ ├── arithmetic.py │ │ │ │ │ │ ├── asdiv.py │ │ │ │ │ │ ├── blimp.py │ │ │ │ │ │ ├── cbt.py │ │ │ │ │ │ ├── coqa.py │ │ │ │ │ │ ├── drop.py │ │ │ │ │ │ ├── glue.py │ │ │ │ │ │ ├── gsm8k.py │ │ │ │ │ │ ├── headqa.py │ │ │ │ │ │ ├── hellaswag.py │ │ │ │ │ │ ├── hendrycks_ethics.py │ │ │ │ │ │ ├── hendrycks_math.py │ │ │ │ │ │ ├── hendrycks_test.py │ │ │ │ │ │ ├── lambada.py │ │ │ │ │ │ ├── lambada_cloze.py │ │ │ │ │ │ ├── lambada_multilingual.py │ │ │ │ │ │ ├── logiqa.py │ │ │ │ │ │ ├── mathqa.py │ │ │ │ │ │ ├── mc_taco.py │ │ │ │ │ │ ├── mutual.py │ │ │ │ │ │ ├── naturalqs.py │ │ │ │ │ │ ├── openbookqa.py │ │ │ │ │ │ ├── pile.py │ │ │ │ │ │ ├── piqa.py │ │ │ │ │ │ ├── prost.py │ │ │ │ │ │ ├── pubmedqa.py │ │ │ │ │ │ ├── qa4mre.py │ │ │ │ │ │ ├── qasper.py │ │ │ │ │ │ ├── quac.py │ │ │ │ │ │ ├── race.py │ │ │ │ │ │ ├── sat.py │ │ │ │ │ │ ├── sciq.py │ │ │ │ │ │ ├── squad.py │ │ │ │ │ │ ├── storycloze.py │ │ │ │ │ │ ├── superglue.py │ │ │ │ │ │ ├── swag.py │ │ │ │ │ │ ├── translation.py │ │ │ │ │ │ ├── triviaqa.py │ │ │ │ │ │ ├── truthfulqa.py │ │ │ │ │ │ ├── unscramble.py │ │ │ │ │ │ ├── webqs.py │ │ │ │ │ │ ├── wikitext.py │ │ │ │ │ │ ├── winogrande.py │ │ │ │ │ │ └── wsc273.py │ │ │ │ │ │ └── utils.py │ │ │ │ ├── efficiency │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── power_monitor.py │ │ │ │ │ └── profiler.py │ │ │ │ ├── metrics │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── accuracy.py │ │ │ │ │ ├── bleu.py │ │ │ │ │ ├── entropy.py │ │ │ │ │ └── perplexity.py │ │ │ │ ├── stdio_wrapper.py │ │ │ │ ├── steps.py │ │ │ │ ├── tango_utils │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── det_hash.py │ │ │ │ │ └── sequences.py │ │ │ │ ├── task.py │ │ │ │ ├── tasks │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── efficiency_benchmark.py │ │ │ │ │ ├── eleuther.py │ │ │ │ │ ├── huggingface.py │ │ │ │ │ ├── metaicl.py │ │ │ │ │ ├── mrqa.py │ │ │ │ │ ├── p3.py │ │ │ │ │ ├── raft.py │ │ │ │ │ └── t5.py │ │ │ │ └── utils.py │ │ │ ├── profile.d │ │ │ │ ├── aliases.sh │ │ │ │ ├── conda.sh │ │ │ │ ├── env.sh │ │ │ │ ├── path.sh │ │ │ │ └── prompt.sh │ │ │ ├── requirements.txt │ │ │ ├── scripts │ │ │ │ ├── process_data.py │ │ │ │ ├── process_raft.sh │ │ │ │ └── process_wmt.sh │ │ │ └── setup.py │ │ └── previous_version │ │ │ ├── efficiency_benchmark │ │ │ ├── __init__.py │ │ │ ├── __main__.py │ │ │ ├── dependencies │ │ │ │ ├── __init__.py │ │ │ │ └── lm_eval │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── base.py │ │ │ │ │ ├── datasets │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── arithmetic │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── arithmetic.py │ │ │ │ │ ├── asdiv │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── asdiv.py │ │ │ │ │ ├── coqa │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── coqa.py │ │ │ │ │ ├── drop │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── drop.py │ │ │ │ │ ├── headqa │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── headqa.py │ │ │ │ │ ├── hendrycks_ethics │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── hendrycks_ethics.py │ │ │ │ │ ├── hendrycks_math │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── hendrycks_math.py │ │ │ │ │ ├── lambada_openai │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── lambada_openai.py │ │ │ │ │ ├── logiqa │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── logiqa.py │ │ │ │ │ ├── mutual │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── mutual.py │ │ │ │ │ ├── pile │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── pile.py │ │ │ │ │ ├── quac │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── quac.py │ │ │ │ │ ├── sat_analogies │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── sat_analogies.py │ │ │ │ │ ├── triviaqa │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── triviaqa.py │ │ │ │ │ ├── unscramble │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── unscramble.py │ │ │ │ │ └── wikitext │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ └── wikitext.py │ │ │ │ │ ├── decontamination │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── archiver.py │ │ │ │ │ ├── decontaminate.py │ │ │ │ │ └── janitor.py │ │ │ │ │ ├── evaluator.py │ │ │ │ │ ├── metrics.py │ │ │ │ │ ├── models │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── dummy.py │ │ │ │ │ ├── gpt2.py │ │ │ │ │ ├── gpt3.py │ │ │ │ │ └── textsynth.py │ │ │ │ │ ├── tasks │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── anli.py │ │ │ │ │ ├── arc.py │ │ │ │ │ ├── arithmetic.py │ │ │ │ │ ├── asdiv.py │ │ │ │ │ ├── blimp.py │ │ │ │ │ ├── cbt.py │ │ │ │ │ ├── coqa.py │ │ │ │ │ ├── drop.py │ │ │ │ │ ├── glue.py │ │ │ │ │ ├── gsm8k.py │ │ │ │ │ ├── headqa.py │ │ │ │ │ ├── hellaswag.py │ │ │ │ │ ├── hendrycks_ethics.py │ │ │ │ │ ├── hendrycks_math.py │ │ │ │ │ ├── hendrycks_test.py │ │ │ │ │ ├── lambada.py │ │ │ │ │ ├── lambada_cloze.py │ │ │ │ │ ├── lambada_multilingual.py │ │ │ │ │ ├── logiqa.py │ │ │ │ │ ├── mathqa.py │ │ │ │ │ ├── mc_taco.py │ │ │ │ │ ├── mutual.py │ │ │ │ │ ├── naturalqs.py │ │ │ │ │ ├── openbookqa.py │ │ │ │ │ ├── pile.py │ │ │ │ │ ├── piqa.py │ │ │ │ │ ├── prost.py │ │ │ │ │ ├── pubmedqa.py │ │ │ │ │ ├── qa4mre.py │ │ │ │ │ ├── qasper.py │ │ │ │ │ ├── quac.py │ │ │ │ │ ├── race.py │ │ │ │ │ ├── sat.py │ │ │ │ │ ├── sciq.py │ │ │ │ │ ├── squad.py │ │ │ │ │ ├── storycloze.py │ │ │ │ │ ├── superglue.py │ │ │ │ │ ├── swag.py │ │ │ │ │ ├── translation.py │ │ │ │ │ ├── triviaqa.py │ │ │ │ │ ├── truthfulqa.py │ │ │ │ │ ├── unscramble.py │ │ │ │ │ ├── webqs.py │ │ │ │ │ ├── wikitext.py │ │ │ │ │ ├── winogrande.py │ │ │ │ │ └── wsc273.py │ │ │ │ │ └── utils.py │ │ │ ├── efficiency │ │ │ │ ├── __init__.py │ │ │ │ ├── power_monitor.py │ │ │ │ └── profiler.py │ │ │ ├── metrics │ │ │ │ ├── __init__.py │ │ │ │ ├── accuracy.py │ │ │ │ ├── bleu.py │ │ │ │ ├── entropy.py │ │ │ │ └── perplexity.py │ │ │ ├── stdio_wrapper.py │ │ │ ├── steps.py │ │ │ ├── tango_utils │ │ │ │ ├── __init__.py │ │ │ │ ├── det_hash.py │ │ │ │ └── sequences.py │ │ │ ├── task.py │ │ │ ├── tasks │ │ │ │ ├── __init__.py │ │ │ │ ├── efficiency_benchmark.py │ │ │ │ ├── eleuther.py │ │ │ │ ├── huggingface.py │ │ │ │ ├── metaicl.py │ │ │ │ ├── mrqa.py │ │ │ │ ├── p3.py │ │ │ │ ├── raft.py │ │ │ │ └── t5.py │ │ │ └── utils.py │ │ │ ├── efficiency_requirements.txt │ │ │ ├── olmo_efficiency.py │ │ │ └── olmo_efficiency.sh │ ├── run_efficiency_benchmark.py │ └── run_efficiency_benchmark.sh ├── eval │ ├── __init__.py │ ├── dispatch_openai_requests.py │ ├── mmlu │ │ ├── __init__.py │ │ ├── categories.py │ │ ├── eval_on_mmlu.sh │ │ └── run_eval.py │ ├── requirements.txt │ └── utils.py └── requirements.txt ├── launch.sh ├── olmo ├── __init__.py ├── aliases.py ├── beam_search.py ├── checkpoint.py ├── config.py ├── data │ ├── __init__.py │ ├── collator.py │ ├── iterable_dataset.py │ ├── memmap_dataset.py │ ├── named_data_mixes.py │ └── util.py ├── eval │ ├── __init__.py │ ├── downstream.py │ └── evaluator.py ├── exceptions.py ├── initialization.py ├── memory_parallel.py ├── memory_plus_layer.py ├── model.py ├── optim.py ├── product_key │ ├── colwise_embedding_bag.py │ ├── memory.py │ └── xformer_embeddingbag.py ├── py.typed ├── safetensors_util.py ├── tokenizer.py ├── torch_util.py ├── train.py ├── ultramem_layer.py ├── ultramem_layer_v2.py ├── util.py └── version.py ├── olmo_data ├── __init__.py ├── data.py ├── hf_datasets │ ├── ai2_arc │ │ ├── ARC-Challenge │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ └── ARC-Easy │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── allenai │ │ └── basic_arithmetic │ │ │ └── none │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── boolq │ │ └── none │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── glue │ │ ├── mrpc │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ ├── rte │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ └── sst2 │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── hails │ │ └── mmlu_no_train │ │ │ ├── abstract_algebra │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── anatomy │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── astronomy │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── business_ethics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── clinical_knowledge │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── college_biology │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── college_chemistry │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── college_computer_science │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── college_mathematics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── college_medicine │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── college_physics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── computer_security │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── conceptual_physics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── econometrics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── electrical_engineering │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── elementary_mathematics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── formal_logic │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── global_facts │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_biology │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_chemistry │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_computer_science │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_european_history │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_geography │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_government_and_politics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_macroeconomics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_mathematics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_microeconomics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_physics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_psychology │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_statistics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_us_history │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── high_school_world_history │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── human_aging │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── human_sexuality │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── international_law │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── jurisprudence │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── logical_fallacies │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── machine_learning │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── management │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── marketing │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── medical_genetics │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── miscellaneous │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── moral_disputes │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── moral_scenarios │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── nutrition │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── philosophy │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── prehistory │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── professional_accounting │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── professional_law │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── professional_medicine │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── professional_psychology │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── public_relations │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── security_studies │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── sociology │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── us_foreign_policy │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── virology │ │ │ ├── dev │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ ├── test │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ │ └── world_religions │ │ │ ├── dev │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ │ │ ├── test │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── hellaswag │ │ └── none │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── nq_open │ │ └── none │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── openbookqa │ │ └── main │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── piqa │ │ └── plain_text │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── sciq │ │ └── none │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── social_i_qa │ │ └── none │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── super_glue │ │ ├── cb │ │ │ └── validation │ │ │ │ ├── data-00000-of-00001.arrow │ │ │ │ ├── dataset_info.json │ │ │ │ └── state.json │ │ └── copa │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── tau │ │ └── commonsense_qa │ │ │ └── none │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ ├── trivia_qa │ │ └── rc.wikipedia.nocontext │ │ │ └── validation │ │ │ ├── data-00000-of-00001.arrow │ │ │ ├── dataset_info.json │ │ │ └── state.json │ └── winogrande │ │ └── winogrande_xl │ │ └── validation │ │ ├── data-00000-of-00001.arrow │ │ ├── dataset_info.json │ │ └── state.json ├── oe_eval_tasks │ ├── arc_challenge │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── arc_easy │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── boolq │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── copa │ │ └── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── copycolors │ │ ├── 10way │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── xl_10way │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── csqa │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── hellaswag │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── openbookqa │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── piqa │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── sciq │ │ └── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ ├── socialiqa │ │ ├── mc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ │ ├── config.json │ │ │ └── requests.jsonl.gz │ └── winogrande │ │ ├── mc_5shot │ │ ├── config.json │ │ └── requests.jsonl.gz │ │ ├── rc_0shot │ │ ├── config.json │ │ └── requests.jsonl.gz │ │ └── rc_5shot │ │ ├── config.json │ │ └── requests.jsonl.gz └── tokenizers │ ├── allenai_eleuther-ai-gpt-neox-20b-pii-special.json │ └── allenai_gpt-neox-olmo-dolma-v1_5.json ├── pyproject.toml ├── run.sh ├── run_memory_plus.sh ├── run_moe.sh ├── run_ultramem_v1.sh ├── run_ultramem_v2.sh ├── scripts ├── add_code_eval.py ├── beaker │ ├── amberish │ │ ├── amberish1-8k-cham-launch.sh │ │ ├── amberish1-8k-cham.sh │ │ ├── amberish1-8k-doc-mask-cham-launch.sh │ │ ├── amberish1-8k-doc-mask-cham-rtheta-launch.sh │ │ ├── amberish1-8k-doc-mask-cham-rtheta.sh │ │ ├── amberish1-8k-doc-mask-cham.sh │ │ ├── amberish1-chameleon-launch.sh │ │ ├── amberish1-chameleon.sh │ │ ├── amberish1-emb-init-1-launch.sh │ │ ├── amberish1-emb-init-1.sh │ │ ├── amberish1-launch.sh │ │ ├── amberish1-selective-updates-launch.sh │ │ ├── amberish1-selective-updates.sh │ │ ├── amberish1-wd-all-launch.sh │ │ ├── amberish1-wd-all.sh │ │ ├── amberish1-z-loss-launch.sh │ │ ├── amberish1-z-loss.sh │ │ ├── amberish1.sh │ │ ├── amberish7-launch.sh │ │ ├── amberish7.sh │ │ ├── amberish70-launch.sh │ │ └── amberish70.sh │ ├── beaker_interactive.sh │ ├── chameleon │ │ ├── llamaish1-launch.sh │ │ ├── llamaish1-normal-launch.sh │ │ ├── llamaish1-normal-qk-norm-reorder-zloss-launch.sh │ │ ├── llamaish1-normal-qk-norm-reorder-zloss.sh │ │ ├── llamaish1-normal.sh │ │ ├── llamaish1-qk-norm-reorder-launch.sh │ │ ├── llamaish1-qk-norm-reorder-zloss-launch.sh │ │ ├── llamaish1-qk-norm-reorder-zloss.sh │ │ ├── llamaish1-qk-norm-reorder.sh │ │ ├── llamaish1.sh │ │ ├── llamaish7-normal-qk-norm-reorder-zloss-launch.sh │ │ ├── llamaish7-normal-qk-norm-reorder-zloss.sh │ │ ├── llamaish7-qk-norm-launch.sh │ │ ├── llamaish7-qk-norm-reorder-launch.sh │ │ ├── llamaish7-qk-norm-reorder-zloss-launch.sh │ │ ├── llamaish7-qk-norm-reorder-zloss.sh │ │ ├── llamaish7-qk-norm-reorder.sh │ │ └── llamaish7-qk-norm.sh │ ├── ib-ananya-1b.sh │ ├── ladder-launch.sh │ ├── ladder.sh │ ├── llamaish7-launch.sh │ ├── llamaish7-normal-launch.sh │ ├── llamaish7-normal.sh │ ├── llamaish7.sh │ ├── mitch-ish-7b.sh │ ├── mitchish65.sh │ ├── mitchish7-launch.sh │ ├── mitchish7-llamainit-launch.sh │ ├── mitchish7-llamainit.sh │ ├── mitchish7.sh │ ├── mitchish70-from160510-launch.sh │ ├── mitchish70-from160510.sh │ ├── mitchish70-launch.sh │ ├── mitchish70-loadtest-launch.sh │ ├── mitchish70-loadtest.sh │ ├── mitchish70.sh │ ├── olmo-small-ablation-on-gantry.sh │ ├── olmo7-ablation-baseline.sh │ ├── olmo7-ablation-dedupeparas.sh │ ├── olmo7-ablation-final2.sh │ ├── olmo7-ablation-refheavy.sh │ ├── peteish │ │ ├── peteish1-launch.sh │ │ ├── peteish1.sh │ │ ├── peteish7-launch.sh │ │ └── peteish7.sh │ ├── pile-llamaish7-launch.sh │ ├── pile-llamaish7.sh │ ├── tiny-llamaish-launch.sh │ ├── tiny-llamaish.sh │ ├── tiny │ │ ├── gantry-script.sh │ │ └── torchrun-script.sh │ ├── unshard-launch.sh │ ├── unshard.sh │ └── warm_hf_cache.sh ├── compare_model_state.py ├── compare_module_outputs.py ├── compare_wandb_configs.py ├── convert_olmo_to_hf_new.py ├── convert_pt_to_safetensors.py ├── init_config.py ├── inspect_train_data.py ├── kempner │ ├── llama7.sh │ ├── log_into_node.sh │ ├── mitch-ish-7b.sh │ └── v1-mix-small.sh ├── ladder.ipynb ├── ladder.py ├── list_evals_from_oe_eval.py ├── lumi │ ├── c4-large-on-lumi.sh │ ├── c4-medium-on-lumi.sh │ ├── c4-small-on-lumi.sh │ ├── llama7.sh │ ├── log_into_node.sh │ ├── lumi-interactive.sh │ ├── mitch-ish-7b.sh │ ├── mitchish65-randomseed.sh │ ├── mitchish65.sh │ ├── mitchish70.sh │ ├── olmo-small-ablation-on-lumi.sh │ ├── olmo7-ablations.sh │ ├── pile-llamaish7.sh │ ├── v1-mix-medium-on-lumi.sh │ └── v1-mix-small-on-lumi.sh ├── mcli │ ├── manage_run.py │ └── unshard_mitchish70.sh ├── prepare_changelog.py ├── prepare_memmap_dataset.py ├── prepare_tulu_data.py ├── pyspy_all_nodes.sh ├── pyspy_all_processes.sh ├── release.sh ├── release_notes.py ├── run_dataloader.py ├── run_with_environment.sh ├── s3_unshard_to_hf.py ├── show_model_size.py ├── split_gz.py ├── storage_cleaner.py ├── test_entrypoint.sh ├── train.py ├── unshard.py └── wandb_change_group.py ├── test_fixtures ├── c4-sample.01.json.gz ├── c4-sample.02.json.gz ├── c4-sample.03.json.gz ├── evaluation │ └── ppl-test-data │ │ ├── 4chan │ │ └── val │ │ │ └── 4chan_00000000.jsonl.gz │ │ └── c4_100_domains │ │ └── val │ │ └── c4_100_domains_5_www.theguardian.com_00000000.jsonl.gz ├── test-olmo-model │ ├── config.json │ ├── config.yaml │ ├── model.pt │ ├── pytorch_model.bin │ ├── special_tokens_map.json │ ├── tokenizer.json │ └── tokenizer_config.json ├── train_tiny.yaml └── train_tiny_with_evaluator.yaml └── tests ├── __init__.py ├── beam_search_test.py ├── checkpoint_test.py ├── config_test.py ├── data ├── __init__.py ├── collator_test.py ├── iterable_dataset_test.py ├── memmap_dataset_test.py └── util_test.py ├── ddp_checkpoint_test.py ├── eval └── downstream_test.py ├── grad_norm_test.py ├── hf_olmo ├── __init__.py ├── configuration_olmo_test.py ├── hf_olmo_test.py ├── hf_pipeline_test.py ├── modeling_olmo_test.py └── tokenization_olmo_fast_test.py ├── initialization_test.py ├── model_test.py ├── optim_test.py ├── tokenizer_test.py ├── torch_util_test.py ├── train_test.py └── util_test.py /CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/CHANGELOG.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/README.md -------------------------------------------------------------------------------- /apex_setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/apex_setup.py -------------------------------------------------------------------------------- /assets/bytedance.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/assets/bytedance.jpeg -------------------------------------------------------------------------------- /assets/memv2.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/assets/memv2.jpeg -------------------------------------------------------------------------------- /assets/result.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/assets/result.jpeg -------------------------------------------------------------------------------- /assets/tdqkr.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/assets/tdqkr.jpeg -------------------------------------------------------------------------------- /checkpoints/official/OLMo-1B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/checkpoints/official/OLMo-1B.csv -------------------------------------------------------------------------------- /checkpoints/official/OLMo-7B-0424.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/checkpoints/official/OLMo-7B-0424.csv -------------------------------------------------------------------------------- /checkpoints/official/OLMo-7B-0724.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/checkpoints/official/OLMo-7B-0724.csv -------------------------------------------------------------------------------- /checkpoints/official/OLMo-7B-Twin-2T.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/checkpoints/official/OLMo-7B-Twin-2T.csv -------------------------------------------------------------------------------- /checkpoints/official/OLMo-7B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/checkpoints/official/OLMo-7B.csv -------------------------------------------------------------------------------- /configs/amberish1-weka.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/amberish1-weka.yaml -------------------------------------------------------------------------------- /configs/amberish13-weka.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/amberish13-weka.yaml -------------------------------------------------------------------------------- /configs/amberish7-weka.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/amberish7-weka.yaml -------------------------------------------------------------------------------- /configs/amberish70-weka.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/amberish70-weka.yaml -------------------------------------------------------------------------------- /configs/c4-extra-tiny-debug.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/c4-extra-tiny-debug.yaml -------------------------------------------------------------------------------- /configs/c4-large.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/c4-large.yaml -------------------------------------------------------------------------------- /configs/c4-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/c4-medium.yaml -------------------------------------------------------------------------------- /configs/c4-small.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/c4-small.yaml -------------------------------------------------------------------------------- /configs/c4-tiny.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/c4-tiny.yaml -------------------------------------------------------------------------------- /configs/exps/OLMoE-1B-7B-0906_reproduce.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/exps/OLMoE-1B-7B-0906_reproduce.yml -------------------------------------------------------------------------------- /configs/llama7-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/llama7-s3.yaml -------------------------------------------------------------------------------- /configs/llama7.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/llama7.yaml -------------------------------------------------------------------------------- /configs/llamaish1-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/llamaish1-s3.yaml -------------------------------------------------------------------------------- /configs/llamaish7-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/llamaish7-s3.yaml -------------------------------------------------------------------------------- /configs/mcli/.gitignore: -------------------------------------------------------------------------------- 1 | petew-* 2 | -------------------------------------------------------------------------------- /configs/mcli/ananya-1b-ib.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/ananya-1b-ib.yaml -------------------------------------------------------------------------------- /configs/mcli/ananya-1b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/ananya-1b.yaml -------------------------------------------------------------------------------- /configs/mcli/harvest_hostnames.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/harvest_hostnames.yaml -------------------------------------------------------------------------------- /configs/mcli/mitchish-final.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mitchish-final.yaml -------------------------------------------------------------------------------- /configs/mcli/mitchish-instruct.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mitchish-instruct.yml -------------------------------------------------------------------------------- /configs/mcli/mitchish.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mitchish.yaml -------------------------------------------------------------------------------- /configs/mcli/mitchish1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mitchish1.yaml -------------------------------------------------------------------------------- /configs/mcli/mitchish7.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mitchish7.yaml -------------------------------------------------------------------------------- /configs/mcli/mitchish70-from160510.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mitchish70-from160510.yaml -------------------------------------------------------------------------------- /configs/mcli/mitchish70.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mitchish70.yaml -------------------------------------------------------------------------------- /configs/mcli/mosaic-ananya-1b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/mosaic-ananya-1b.yaml -------------------------------------------------------------------------------- /configs/mcli/olmo7-ablation-baseline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/olmo7-ablation-baseline.yaml -------------------------------------------------------------------------------- /configs/mcli/olmo7-ablation-dedupedocs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/olmo7-ablation-dedupedocs.yaml -------------------------------------------------------------------------------- /configs/mcli/olmo7-ablation-dolma17.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/olmo7-ablation-dolma17.yaml -------------------------------------------------------------------------------- /configs/mcli/v1-mix-medium-mitch-ish.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/v1-mix-medium-mitch-ish.yaml -------------------------------------------------------------------------------- /configs/mcli/v1-mix-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/v1-mix-medium.yaml -------------------------------------------------------------------------------- /configs/mcli/v1_5-mix-medium-mitch-ish.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/v1_5-mix-medium-mitch-ish.yaml -------------------------------------------------------------------------------- /configs/mcli/v1_5-mix-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mcli/v1_5-mix-medium.yaml -------------------------------------------------------------------------------- /configs/mitchish-instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish-instruct.yaml -------------------------------------------------------------------------------- /configs/mitchish1-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish1-s3.yaml -------------------------------------------------------------------------------- /configs/mitchish35.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish35.yaml -------------------------------------------------------------------------------- /configs/mitchish50.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish50.yaml -------------------------------------------------------------------------------- /configs/mitchish65-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish65-s3.yaml -------------------------------------------------------------------------------- /configs/mitchish65.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish65.yaml -------------------------------------------------------------------------------- /configs/mitchish7-llamainit-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish7-llamainit-s3.yaml -------------------------------------------------------------------------------- /configs/mitchish7-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish7-s3.yaml -------------------------------------------------------------------------------- /configs/mitchish70-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish70-s3.yaml -------------------------------------------------------------------------------- /configs/mitchish70.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/mitchish70.yaml -------------------------------------------------------------------------------- /configs/official/OLMo-1B.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/official/OLMo-1B.yaml -------------------------------------------------------------------------------- /configs/official/OLMo-7B-0424.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/official/OLMo-7B-0424.yaml -------------------------------------------------------------------------------- /configs/official/OLMo-7B-0724.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/official/OLMo-7B-0724.yaml -------------------------------------------------------------------------------- /configs/official/OLMo-7B.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/official/OLMo-7B.yaml -------------------------------------------------------------------------------- /configs/official/OLMoE-7B-A1B.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/official/OLMoE-7B-A1B.yaml -------------------------------------------------------------------------------- /configs/olmo-small-ablation.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/olmo-small-ablation.yaml -------------------------------------------------------------------------------- /configs/olmo7-ablation-baseline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/olmo7-ablation-baseline.yaml -------------------------------------------------------------------------------- /configs/olmo7-ablation-dedupedocs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/olmo7-ablation-dedupedocs.yaml -------------------------------------------------------------------------------- /configs/olmo7-ablation-dedupeparas.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/olmo7-ablation-dedupeparas.yaml -------------------------------------------------------------------------------- /configs/olmo7-ablation-dolma17.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/olmo7-ablation-dolma17.yaml -------------------------------------------------------------------------------- /configs/olmo7-ablation-final2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/olmo7-ablation-final2.yaml -------------------------------------------------------------------------------- /configs/olmo7-ablation-refheavy.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/olmo7-ablation-refheavy.yaml -------------------------------------------------------------------------------- /configs/peteish1-weka.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/peteish1-weka.yaml -------------------------------------------------------------------------------- /configs/peteish7-weka.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/peteish7-weka.yaml -------------------------------------------------------------------------------- /configs/pile-llamaish7-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/pile-llamaish7-s3.yaml -------------------------------------------------------------------------------- /configs/pile-llamaish7.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/pile-llamaish7.yaml -------------------------------------------------------------------------------- /configs/tiny-llamaish-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/tiny-llamaish-s3.yaml -------------------------------------------------------------------------------- /configs/tiny/OLMo-150M.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/tiny/OLMo-150M.yaml -------------------------------------------------------------------------------- /configs/tiny/OLMo-20M.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/tiny/OLMo-20M.yaml -------------------------------------------------------------------------------- /configs/tiny/OLMo-300M.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/tiny/OLMo-300M.yaml -------------------------------------------------------------------------------- /configs/tiny/OLMo-60M.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/tiny/OLMo-60M.yaml -------------------------------------------------------------------------------- /configs/tiny/OLMo-700M.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/tiny/OLMo-700M.yaml -------------------------------------------------------------------------------- /configs/v1-mix-medium-mitch-ish-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1-mix-medium-mitch-ish-s3.yaml -------------------------------------------------------------------------------- /configs/v1-mix-medium-mitch-ish.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1-mix-medium-mitch-ish.yaml -------------------------------------------------------------------------------- /configs/v1-mix-medium-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1-mix-medium-s3.yaml -------------------------------------------------------------------------------- /configs/v1-mix-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1-mix-medium.yaml -------------------------------------------------------------------------------- /configs/v1-mix-small-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1-mix-small-s3.yaml -------------------------------------------------------------------------------- /configs/v1-mix-small.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1-mix-small.yaml -------------------------------------------------------------------------------- /configs/v1_5-mix-medium-mitch-ish-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1_5-mix-medium-mitch-ish-s3.yaml -------------------------------------------------------------------------------- /configs/v1_5-mix-medium-mitch-ish.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1_5-mix-medium-mitch-ish.yaml -------------------------------------------------------------------------------- /configs/v1_5-mix-medium-s3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/configs/v1_5-mix-medium-s3.yaml -------------------------------------------------------------------------------- /conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/conftest.py -------------------------------------------------------------------------------- /docker/Dockerfile.base: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docker/Dockerfile.base -------------------------------------------------------------------------------- /docker/Dockerfile.gantry: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docker/Dockerfile.gantry -------------------------------------------------------------------------------- /docker/Dockerfile.lumi: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docker/Dockerfile.lumi -------------------------------------------------------------------------------- /docker/Dockerfile.test: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docker/Dockerfile.test -------------------------------------------------------------------------------- /docs/Checkpoints.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docs/Checkpoints.md -------------------------------------------------------------------------------- /docs/Kempner.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docs/Kempner.md -------------------------------------------------------------------------------- /docs/LUMI.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docs/LUMI.md -------------------------------------------------------------------------------- /docs/NOTES.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docs/NOTES.md -------------------------------------------------------------------------------- /docs/RELEASE_PROCESS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docs/RELEASE_PROCESS.md -------------------------------------------------------------------------------- /docs/Safetensors.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docs/Safetensors.md -------------------------------------------------------------------------------- /docs/TRAINLOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/docs/TRAINLOG.md -------------------------------------------------------------------------------- /evaluation/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/README.md -------------------------------------------------------------------------------- /evaluation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /evaluation/empty_workspace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/empty_workspace.py -------------------------------------------------------------------------------- /evaluation/experiments/evaluation_2023_07_26.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/evaluation_2023_07_26.jsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/eval_suite_ppl_val_v2_small.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/eval_suite_ppl_val_v2_small.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/eval_suite_ppl_val_v3.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/eval_suite_ppl_val_v3.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/eval_suite_ppl_val_v3_small.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/eval_suite_ppl_val_v3_small.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/gen_tasks.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/gen_tasks.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/rc20_tasks.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/rc20_tasks.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/summary_tasks.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/summary_tasks.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/task_utils.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/task_utils.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/test_sets/test_gen_tasks.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/test_sets/test_gen_tasks.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/task_sets/test_sets/test_rc20_tasks.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/task_sets/test_sets/test_rc20_tasks.libsonnet -------------------------------------------------------------------------------- /evaluation/experiments/test_config.jsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/test_config.jsonnet -------------------------------------------------------------------------------- /evaluation/experiments/utils.libsonnet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/experiments/utils.libsonnet -------------------------------------------------------------------------------- /evaluation/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/requirements.txt -------------------------------------------------------------------------------- /evaluation/see_available_tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/see_available_tasks.py -------------------------------------------------------------------------------- /evaluation/steps/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/steps/__init__.py -------------------------------------------------------------------------------- /evaluation/steps/get_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/steps/get_model.py -------------------------------------------------------------------------------- /evaluation/steps/run_catwalk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/steps/run_catwalk.py -------------------------------------------------------------------------------- /evaluation/steps/wandb_metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/steps/wandb_metrics.py -------------------------------------------------------------------------------- /evaluation/tango-in-beaker.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/evaluation/tango-in-beaker.yml -------------------------------------------------------------------------------- /fuse_ops/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/__init__.py -------------------------------------------------------------------------------- /fuse_ops/fused_glu.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/fused_glu.cpp -------------------------------------------------------------------------------- /fuse_ops/fused_glu.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/fused_glu.cu -------------------------------------------------------------------------------- /fuse_ops/fused_index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/fused_index.py -------------------------------------------------------------------------------- /fuse_ops/fused_lookup.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/fused_lookup.cpp -------------------------------------------------------------------------------- /fuse_ops/fused_lookup.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/fused_lookup.cu -------------------------------------------------------------------------------- /fuse_ops/fused_topk.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/fused_topk.cpp -------------------------------------------------------------------------------- /fuse_ops/fused_topk.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/fused_topk.cu -------------------------------------------------------------------------------- /fuse_ops/scatter_add.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/scatter_add.py -------------------------------------------------------------------------------- /fuse_ops/test_fused_lookup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/test_fused_lookup.py -------------------------------------------------------------------------------- /fuse_ops/test_glu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/test_glu.py -------------------------------------------------------------------------------- /fuse_ops/test_scatter_add.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/test_scatter_add.py -------------------------------------------------------------------------------- /fuse_ops/unsorted_segment_sum.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/unsorted_segment_sum.cpp -------------------------------------------------------------------------------- /fuse_ops/unsorted_segment_sum.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/fuse_ops/unsorted_segment_sum.cu -------------------------------------------------------------------------------- /hf_olmo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/hf_olmo/__init__.py -------------------------------------------------------------------------------- /hf_olmo/configuration_olmo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/hf_olmo/configuration_olmo.py -------------------------------------------------------------------------------- /hf_olmo/convert_olmo_to_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/hf_olmo/convert_olmo_to_hf.py -------------------------------------------------------------------------------- /hf_olmo/modeling_olmo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/hf_olmo/modeling_olmo.py -------------------------------------------------------------------------------- /hf_olmo/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/hf_olmo/pyproject.toml -------------------------------------------------------------------------------- /hf_olmo/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers 2 | -------------------------------------------------------------------------------- /hf_olmo/tokenization_olmo_fast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/hf_olmo/tokenization_olmo_fast.py -------------------------------------------------------------------------------- /inference/NOTES.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/NOTES.md -------------------------------------------------------------------------------- /inference/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/README.md -------------------------------------------------------------------------------- /inference/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/.gitignore -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/LICENSE -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/README.md -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/README_zh.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/README_zh.md -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/__init__.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/eval_tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/eval_tasks/__init__.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/eval_tasks/_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/eval_tasks/_base.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/eval_tasks/_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/__init__.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/_base.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/_const.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/_const.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/_utils.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/auto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/auto.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/baichuan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/baichuan.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/bloom.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/bloom.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/codegen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/codegen.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gpt2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gpt2.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gpt_bigcode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gpt_bigcode.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gpt_neox.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gpt_neox.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gptj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/gptj.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/internlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/internlm.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/llama.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/moss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/moss.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/olmo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/olmo.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/opt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/opt.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/qwen.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/rw.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/modeling/rw.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/nn_modules/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/nn_modules/_fused_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/nn_modules/_fused_base.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/nn_modules/triton_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/quantization/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/quantization/__init__.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/quantization/gptq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/quantization/gptq.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/quantization/quantizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/quantization/quantizer.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/__init__.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/data_utils.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/import_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/import_utils.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/peft_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/peft_utils.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/perplexity_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/auto_gptq/utils/perplexity_utils.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/autogptq_extension/exllama/tuning.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/autogptq_extension/exllama/tuning.h -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/autogptq_extension/exllama/util.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/autogptq_extension/exllama/util.cuh -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/generate.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/intrin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/intrin.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/mmm.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/mmm.cpp -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/autogptq_extension/qigen/template.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/docs/NEWS_OR_UPDATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/docs/NEWS_OR_UPDATE.md -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/docs/tutorial/01-Quick-Start.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/docs/tutorial/01-Quick-Start.md -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/examples/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/examples/README.md -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/examples/benchmark/perplexity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/examples/benchmark/perplexity.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/examples/quantization/basic_usage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/examples/quantization/basic_usage.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/setup.py -------------------------------------------------------------------------------- /inference/compression/dependencies/AutoGPTQ/tests/test_q4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/dependencies/AutoGPTQ/tests/test_q4.py -------------------------------------------------------------------------------- /inference/compression/olmo_gptq_class.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/olmo_gptq_class.py -------------------------------------------------------------------------------- /inference/compression/run_olmo_quantization.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/run_olmo_quantization.sh -------------------------------------------------------------------------------- /inference/compression/run_quantization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/compression/run_quantization.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/.dockerignore: -------------------------------------------------------------------------------- 1 | verify 2 | vhome/ 3 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/Dockerfile -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/LICENSE -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/README.md -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/__init__.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/__main__.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/aliases.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/aliases.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/constants.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/entrypoint.sh -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/py.typed: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/util.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/version.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/eb_gantry/version.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/arithmetic/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/asdiv/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/coqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/drop/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/headqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/hendrycks_ethics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/hendrycks_math/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/lambada_openai/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/logiqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/mutual/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/pile/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/quac/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/sat_analogies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/triviaqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/unscramble/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/datasets/wikitext/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/efficiency_benchmark/dependencies/lm_eval/decontamination/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/profile.d/aliases.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/profile.d/aliases.sh -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/profile.d/conda.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/profile.d/conda.sh -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/profile.d/env.sh: -------------------------------------------------------------------------------- 1 | # Environment variables. 2 | export LANG=en_US.UTF-8 3 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/profile.d/path.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/profile.d/path.sh -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/profile.d/prompt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/profile.d/prompt.sh -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/requirements.txt -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/scripts/process_wmt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/scripts/process_wmt.sh -------------------------------------------------------------------------------- /inference/efficiency/dependencies/efficiency-pentathlon/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/efficiency-pentathlon/setup.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/arithmetic/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/asdiv/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/coqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/drop/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/headqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/hendrycks_ethics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/hendrycks_math/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/lambada_openai/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/logiqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/mutual/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/pile/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/quac/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/sat_analogies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/triviaqa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/unscramble/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/datasets/wikitext/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_benchmark/dependencies/lm_eval/decontamination/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/efficiency_requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/previous_version/efficiency_requirements.txt -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/olmo_efficiency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/previous_version/olmo_efficiency.py -------------------------------------------------------------------------------- /inference/efficiency/dependencies/previous_version/olmo_efficiency.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/dependencies/previous_version/olmo_efficiency.sh -------------------------------------------------------------------------------- /inference/efficiency/run_efficiency_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/run_efficiency_benchmark.py -------------------------------------------------------------------------------- /inference/efficiency/run_efficiency_benchmark.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/efficiency/run_efficiency_benchmark.sh -------------------------------------------------------------------------------- /inference/eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/eval/dispatch_openai_requests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/eval/dispatch_openai_requests.py -------------------------------------------------------------------------------- /inference/eval/mmlu/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /inference/eval/mmlu/categories.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/eval/mmlu/categories.py -------------------------------------------------------------------------------- /inference/eval/mmlu/eval_on_mmlu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/eval/mmlu/eval_on_mmlu.sh -------------------------------------------------------------------------------- /inference/eval/mmlu/run_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/eval/mmlu/run_eval.py -------------------------------------------------------------------------------- /inference/eval/requirements.txt: -------------------------------------------------------------------------------- 1 | openai 2 | -------------------------------------------------------------------------------- /inference/eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/eval/utils.py -------------------------------------------------------------------------------- /inference/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/inference/requirements.txt -------------------------------------------------------------------------------- /launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/launch.sh -------------------------------------------------------------------------------- /olmo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/__init__.py -------------------------------------------------------------------------------- /olmo/aliases.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/aliases.py -------------------------------------------------------------------------------- /olmo/beam_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/beam_search.py -------------------------------------------------------------------------------- /olmo/checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/checkpoint.py -------------------------------------------------------------------------------- /olmo/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/config.py -------------------------------------------------------------------------------- /olmo/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/data/__init__.py -------------------------------------------------------------------------------- /olmo/data/collator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/data/collator.py -------------------------------------------------------------------------------- /olmo/data/iterable_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/data/iterable_dataset.py -------------------------------------------------------------------------------- /olmo/data/memmap_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/data/memmap_dataset.py -------------------------------------------------------------------------------- /olmo/data/named_data_mixes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/data/named_data_mixes.py -------------------------------------------------------------------------------- /olmo/data/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/data/util.py -------------------------------------------------------------------------------- /olmo/eval/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/eval/__init__.py -------------------------------------------------------------------------------- /olmo/eval/downstream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/eval/downstream.py -------------------------------------------------------------------------------- /olmo/eval/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/eval/evaluator.py -------------------------------------------------------------------------------- /olmo/exceptions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/exceptions.py -------------------------------------------------------------------------------- /olmo/initialization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/initialization.py -------------------------------------------------------------------------------- /olmo/memory_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/memory_parallel.py -------------------------------------------------------------------------------- /olmo/memory_plus_layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/memory_plus_layer.py -------------------------------------------------------------------------------- /olmo/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/model.py -------------------------------------------------------------------------------- /olmo/optim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/optim.py -------------------------------------------------------------------------------- /olmo/product_key/colwise_embedding_bag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/product_key/colwise_embedding_bag.py -------------------------------------------------------------------------------- /olmo/product_key/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/product_key/memory.py -------------------------------------------------------------------------------- /olmo/product_key/xformer_embeddingbag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/product_key/xformer_embeddingbag.py -------------------------------------------------------------------------------- /olmo/py.typed: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /olmo/safetensors_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/safetensors_util.py -------------------------------------------------------------------------------- /olmo/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/tokenizer.py -------------------------------------------------------------------------------- /olmo/torch_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/torch_util.py -------------------------------------------------------------------------------- /olmo/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/train.py -------------------------------------------------------------------------------- /olmo/ultramem_layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/ultramem_layer.py -------------------------------------------------------------------------------- /olmo/ultramem_layer_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/ultramem_layer_v2.py -------------------------------------------------------------------------------- /olmo/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/util.py -------------------------------------------------------------------------------- /olmo/version.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo/version.py -------------------------------------------------------------------------------- /olmo_data/__init__.py: -------------------------------------------------------------------------------- 1 | from .data import * 2 | -------------------------------------------------------------------------------- /olmo_data/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/data.py -------------------------------------------------------------------------------- /olmo_data/hf_datasets/ai2_arc/ARC-Challenge/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/ai2_arc/ARC-Challenge/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/ai2_arc/ARC-Challenge/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/ai2_arc/ARC-Challenge/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/ai2_arc/ARC-Easy/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/ai2_arc/ARC-Easy/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/ai2_arc/ARC-Easy/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/ai2_arc/ARC-Easy/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/ai2_arc/ARC-Easy/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/ai2_arc/ARC-Easy/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/allenai/basic_arithmetic/none/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/allenai/basic_arithmetic/none/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/boolq/none/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/boolq/none/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/boolq/none/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/boolq/none/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/boolq/none/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/boolq/none/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/mrpc/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/mrpc/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/mrpc/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/mrpc/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/mrpc/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/mrpc/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/rte/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/rte/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/rte/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/rte/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/rte/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/rte/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/sst2/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/sst2/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/sst2/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/sst2/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/glue/sst2/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/glue/sst2/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/abstract_algebra/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/abstract_algebra/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/abstract_algebra/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/abstract_algebra/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/anatomy/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/astronomy/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/business_ethics/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/business_ethics/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/business_ethics/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/business_ethics/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/clinical_knowledge/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/clinical_knowledge/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/clinical_knowledge/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/clinical_knowledge/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_biology/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_biology/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_biology/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_biology/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_chemistry/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_chemistry/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_chemistry/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_chemistry/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_mathematics/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_mathematics/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_mathematics/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_mathematics/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_medicine/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_medicine/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_medicine/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_medicine/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_physics/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_physics/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/college_physics/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/college_physics/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/computer_security/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/computer_security/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/computer_security/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/computer_security/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/conceptual_physics/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/conceptual_physics/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/conceptual_physics/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/conceptual_physics/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/econometrics/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/formal_logic/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/global_facts/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/high_school_biology/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/high_school_biology/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/high_school_biology/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/high_school_biology/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/high_school_chemistry/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/high_school_chemistry/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/high_school_geography/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/high_school_geography/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/high_school_physics/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/high_school_physics/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/high_school_physics/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/high_school_physics/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/human_aging/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/human_sexuality/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/human_sexuality/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/human_sexuality/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/human_sexuality/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/international_law/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/international_law/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/international_law/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/international_law/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/jurisprudence/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/logical_fallacies/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/logical_fallacies/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/logical_fallacies/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/logical_fallacies/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/machine_learning/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/machine_learning/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/machine_learning/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/machine_learning/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/management/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/management/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/management/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/management/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/management/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/management/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/management/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/management/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/management/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/management/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/marketing/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/marketing/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/marketing/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/marketing/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/marketing/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/marketing/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/marketing/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/marketing/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/marketing/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/marketing/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/medical_genetics/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/medical_genetics/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/medical_genetics/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/medical_genetics/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/miscellaneous/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/moral_disputes/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/moral_scenarios/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/moral_scenarios/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/moral_scenarios/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/moral_scenarios/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/nutrition/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/philosophy/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/prehistory/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/professional_law/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/professional_law/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/professional_law/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/professional_law/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/professional_medicine/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/professional_medicine/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/public_relations/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/public_relations/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/public_relations/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/public_relations/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/security_studies/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/security_studies/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/security_studies/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/security_studies/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/sociology/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/sociology/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/sociology/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/sociology/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/sociology/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/sociology/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/sociology/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/sociology/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/sociology/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/sociology/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/us_foreign_policy/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/us_foreign_policy/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/us_foreign_policy/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/us_foreign_policy/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/virology/dev/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/virology/dev/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/virology/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/virology/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/virology/test/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/virology/test/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/virology/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/virology/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/virology/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/virology/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/world_religions/dev/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/world_religions/dev/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hails/mmlu_no_train/world_religions/test/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hails/mmlu_no_train/world_religions/test/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hellaswag/none/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hellaswag/none/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hellaswag/none/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hellaswag/none/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/hellaswag/none/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/hellaswag/none/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/nq_open/none/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/nq_open/none/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/nq_open/none/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/nq_open/none/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/nq_open/none/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/nq_open/none/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/openbookqa/main/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/openbookqa/main/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/openbookqa/main/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/openbookqa/main/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/openbookqa/main/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/openbookqa/main/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/piqa/plain_text/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/piqa/plain_text/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/piqa/plain_text/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/piqa/plain_text/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/piqa/plain_text/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/piqa/plain_text/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/sciq/none/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/sciq/none/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/sciq/none/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/sciq/none/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/sciq/none/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/sciq/none/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/social_i_qa/none/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/social_i_qa/none/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/social_i_qa/none/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/social_i_qa/none/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/social_i_qa/none/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/social_i_qa/none/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/super_glue/cb/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/super_glue/cb/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/super_glue/cb/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/super_glue/cb/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/super_glue/cb/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/super_glue/cb/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/super_glue/copa/validation/data-00000-of-00001.arrow: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/super_glue/copa/validation/data-00000-of-00001.arrow -------------------------------------------------------------------------------- /olmo_data/hf_datasets/super_glue/copa/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/super_glue/copa/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/super_glue/copa/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/super_glue/copa/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/tau/commonsense_qa/none/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/tau/commonsense_qa/none/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/tau/commonsense_qa/none/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/tau/commonsense_qa/none/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/trivia_qa/rc.wikipedia.nocontext/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/trivia_qa/rc.wikipedia.nocontext/validation/state.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/winogrande/winogrande_xl/validation/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/winogrande/winogrande_xl/validation/dataset_info.json -------------------------------------------------------------------------------- /olmo_data/hf_datasets/winogrande/winogrande_xl/validation/state.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/hf_datasets/winogrande/winogrande_xl/validation/state.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_challenge/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_challenge/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_challenge/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_challenge/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_challenge/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_challenge/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_challenge/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_challenge/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_challenge/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_challenge/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_challenge/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_challenge/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_easy/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_easy/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_easy/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_easy/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_easy/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_easy/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_easy/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_easy/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_easy/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_easy/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/arc_easy/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/arc_easy/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/boolq/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/boolq/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/boolq/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/boolq/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/boolq/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/boolq/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/boolq/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/boolq/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/boolq/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/boolq/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/boolq/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/boolq/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/copa/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/copa/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/copa/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/copa/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/copycolors/10way/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/copycolors/10way/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/copycolors/10way/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/copycolors/10way/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/copycolors/xl_10way/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/copycolors/xl_10way/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/copycolors/xl_10way/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/copycolors/xl_10way/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/csqa/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/csqa/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/csqa/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/csqa/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/csqa/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/csqa/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/csqa/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/csqa/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/csqa/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/csqa/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/csqa/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/csqa/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/hellaswag/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/hellaswag/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/hellaswag/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/hellaswag/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/hellaswag/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/hellaswag/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/hellaswag/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/hellaswag/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/hellaswag/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/hellaswag/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/hellaswag/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/hellaswag/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/openbookqa/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/openbookqa/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/openbookqa/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/openbookqa/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/openbookqa/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/openbookqa/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/openbookqa/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/openbookqa/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/openbookqa/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/openbookqa/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/openbookqa/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/openbookqa/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/piqa/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/piqa/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/piqa/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/piqa/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/piqa/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/piqa/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/piqa/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/piqa/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/piqa/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/piqa/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/piqa/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/piqa/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/sciq/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/sciq/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/sciq/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/sciq/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/socialiqa/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/socialiqa/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/socialiqa/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/socialiqa/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/socialiqa/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/socialiqa/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/socialiqa/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/socialiqa/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/socialiqa/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/socialiqa/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/socialiqa/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/socialiqa/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/winogrande/mc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/winogrande/mc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/winogrande/mc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/winogrande/mc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/winogrande/rc_0shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/winogrande/rc_0shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/winogrande/rc_0shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/winogrande/rc_0shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/winogrande/rc_5shot/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/winogrande/rc_5shot/config.json -------------------------------------------------------------------------------- /olmo_data/oe_eval_tasks/winogrande/rc_5shot/requests.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/oe_eval_tasks/winogrande/rc_5shot/requests.jsonl.gz -------------------------------------------------------------------------------- /olmo_data/tokenizers/allenai_eleuther-ai-gpt-neox-20b-pii-special.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/tokenizers/allenai_eleuther-ai-gpt-neox-20b-pii-special.json -------------------------------------------------------------------------------- /olmo_data/tokenizers/allenai_gpt-neox-olmo-dolma-v1_5.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/olmo_data/tokenizers/allenai_gpt-neox-olmo-dolma-v1_5.json -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/pyproject.toml -------------------------------------------------------------------------------- /run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/run.sh -------------------------------------------------------------------------------- /run_memory_plus.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/run_memory_plus.sh -------------------------------------------------------------------------------- /run_moe.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/run_moe.sh -------------------------------------------------------------------------------- /run_ultramem_v1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/run_ultramem_v1.sh -------------------------------------------------------------------------------- /run_ultramem_v2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/run_ultramem_v2.sh -------------------------------------------------------------------------------- /scripts/add_code_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/add_code_eval.py -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-8k-cham-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-8k-cham-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-8k-cham.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-8k-cham.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-8k-doc-mask-cham-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-8k-doc-mask-cham-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-8k-doc-mask-cham-rtheta-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-8k-doc-mask-cham-rtheta-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-8k-doc-mask-cham-rtheta.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-8k-doc-mask-cham-rtheta.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-8k-doc-mask-cham.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-8k-doc-mask-cham.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-chameleon-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-chameleon-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-chameleon.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-chameleon.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-emb-init-1-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-emb-init-1-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-emb-init-1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-emb-init-1.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-selective-updates-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-selective-updates-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-selective-updates.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-selective-updates.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-wd-all-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-wd-all-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-wd-all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-wd-all.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-z-loss-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-z-loss-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1-z-loss.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1-z-loss.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish1.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish7-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish7-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish7.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish70-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish70-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/amberish/amberish70.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/amberish/amberish70.sh -------------------------------------------------------------------------------- /scripts/beaker/beaker_interactive.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/beaker_interactive.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-normal-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-normal-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-normal-qk-norm-reorder-zloss-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-normal-qk-norm-reorder-zloss-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-normal-qk-norm-reorder-zloss.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-normal-qk-norm-reorder-zloss.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-normal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-normal.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-qk-norm-reorder-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-qk-norm-reorder-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-qk-norm-reorder-zloss-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-qk-norm-reorder-zloss-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-qk-norm-reorder-zloss.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-qk-norm-reorder-zloss.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1-qk-norm-reorder.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1-qk-norm-reorder.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish1.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-normal-qk-norm-reorder-zloss-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-normal-qk-norm-reorder-zloss-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-normal-qk-norm-reorder-zloss.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-normal-qk-norm-reorder-zloss.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-qk-norm-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-qk-norm-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-qk-norm-reorder-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-qk-norm-reorder-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-qk-norm-reorder-zloss-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-qk-norm-reorder-zloss-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-qk-norm-reorder-zloss.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-qk-norm-reorder-zloss.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-qk-norm-reorder.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-qk-norm-reorder.sh -------------------------------------------------------------------------------- /scripts/beaker/chameleon/llamaish7-qk-norm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/chameleon/llamaish7-qk-norm.sh -------------------------------------------------------------------------------- /scripts/beaker/ib-ananya-1b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/ib-ananya-1b.sh -------------------------------------------------------------------------------- /scripts/beaker/ladder-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/ladder-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/ladder.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/ladder.sh -------------------------------------------------------------------------------- /scripts/beaker/llamaish7-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/llamaish7-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/llamaish7-normal-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/llamaish7-normal-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/llamaish7-normal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/llamaish7-normal.sh -------------------------------------------------------------------------------- /scripts/beaker/llamaish7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/llamaish7.sh -------------------------------------------------------------------------------- /scripts/beaker/mitch-ish-7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitch-ish-7b.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish65.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish65.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish7-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish7-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish7-llamainit-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish7-llamainit-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish7-llamainit.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish7-llamainit.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish7.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish70-from160510-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish70-from160510-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish70-from160510.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish70-from160510.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish70-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish70-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish70-loadtest-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish70-loadtest-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish70-loadtest.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish70-loadtest.sh -------------------------------------------------------------------------------- /scripts/beaker/mitchish70.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/mitchish70.sh -------------------------------------------------------------------------------- /scripts/beaker/olmo-small-ablation-on-gantry.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/olmo-small-ablation-on-gantry.sh -------------------------------------------------------------------------------- /scripts/beaker/olmo7-ablation-baseline.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/olmo7-ablation-baseline.sh -------------------------------------------------------------------------------- /scripts/beaker/olmo7-ablation-dedupeparas.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/olmo7-ablation-dedupeparas.sh -------------------------------------------------------------------------------- /scripts/beaker/olmo7-ablation-final2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/olmo7-ablation-final2.sh -------------------------------------------------------------------------------- /scripts/beaker/olmo7-ablation-refheavy.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/olmo7-ablation-refheavy.sh -------------------------------------------------------------------------------- /scripts/beaker/peteish/peteish1-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/peteish/peteish1-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/peteish/peteish1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/peteish/peteish1.sh -------------------------------------------------------------------------------- /scripts/beaker/peteish/peteish7-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/peteish/peteish7-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/peteish/peteish7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/peteish/peteish7.sh -------------------------------------------------------------------------------- /scripts/beaker/pile-llamaish7-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/pile-llamaish7-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/pile-llamaish7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/pile-llamaish7.sh -------------------------------------------------------------------------------- /scripts/beaker/tiny-llamaish-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/tiny-llamaish-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/tiny-llamaish.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/tiny-llamaish.sh -------------------------------------------------------------------------------- /scripts/beaker/tiny/gantry-script.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/tiny/gantry-script.sh -------------------------------------------------------------------------------- /scripts/beaker/tiny/torchrun-script.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/tiny/torchrun-script.sh -------------------------------------------------------------------------------- /scripts/beaker/unshard-launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/unshard-launch.sh -------------------------------------------------------------------------------- /scripts/beaker/unshard.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/unshard.sh -------------------------------------------------------------------------------- /scripts/beaker/warm_hf_cache.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/beaker/warm_hf_cache.sh -------------------------------------------------------------------------------- /scripts/compare_model_state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/compare_model_state.py -------------------------------------------------------------------------------- /scripts/compare_module_outputs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/compare_module_outputs.py -------------------------------------------------------------------------------- /scripts/compare_wandb_configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/compare_wandb_configs.py -------------------------------------------------------------------------------- /scripts/convert_olmo_to_hf_new.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/convert_olmo_to_hf_new.py -------------------------------------------------------------------------------- /scripts/convert_pt_to_safetensors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/convert_pt_to_safetensors.py -------------------------------------------------------------------------------- /scripts/init_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/init_config.py -------------------------------------------------------------------------------- /scripts/inspect_train_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/inspect_train_data.py -------------------------------------------------------------------------------- /scripts/kempner/llama7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/kempner/llama7.sh -------------------------------------------------------------------------------- /scripts/kempner/log_into_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/kempner/log_into_node.sh -------------------------------------------------------------------------------- /scripts/kempner/mitch-ish-7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/kempner/mitch-ish-7b.sh -------------------------------------------------------------------------------- /scripts/kempner/v1-mix-small.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/kempner/v1-mix-small.sh -------------------------------------------------------------------------------- /scripts/ladder.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/ladder.ipynb -------------------------------------------------------------------------------- /scripts/ladder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/ladder.py -------------------------------------------------------------------------------- /scripts/list_evals_from_oe_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/list_evals_from_oe_eval.py -------------------------------------------------------------------------------- /scripts/lumi/c4-large-on-lumi.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/c4-large-on-lumi.sh -------------------------------------------------------------------------------- /scripts/lumi/c4-medium-on-lumi.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/c4-medium-on-lumi.sh -------------------------------------------------------------------------------- /scripts/lumi/c4-small-on-lumi.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/c4-small-on-lumi.sh -------------------------------------------------------------------------------- /scripts/lumi/llama7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/llama7.sh -------------------------------------------------------------------------------- /scripts/lumi/log_into_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/log_into_node.sh -------------------------------------------------------------------------------- /scripts/lumi/lumi-interactive.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/lumi-interactive.sh -------------------------------------------------------------------------------- /scripts/lumi/mitch-ish-7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/mitch-ish-7b.sh -------------------------------------------------------------------------------- /scripts/lumi/mitchish65-randomseed.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/mitchish65-randomseed.sh -------------------------------------------------------------------------------- /scripts/lumi/mitchish65.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/mitchish65.sh -------------------------------------------------------------------------------- /scripts/lumi/mitchish70.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/mitchish70.sh -------------------------------------------------------------------------------- /scripts/lumi/olmo-small-ablation-on-lumi.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/olmo-small-ablation-on-lumi.sh -------------------------------------------------------------------------------- /scripts/lumi/olmo7-ablations.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/olmo7-ablations.sh -------------------------------------------------------------------------------- /scripts/lumi/pile-llamaish7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/pile-llamaish7.sh -------------------------------------------------------------------------------- /scripts/lumi/v1-mix-medium-on-lumi.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/v1-mix-medium-on-lumi.sh -------------------------------------------------------------------------------- /scripts/lumi/v1-mix-small-on-lumi.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/lumi/v1-mix-small-on-lumi.sh -------------------------------------------------------------------------------- /scripts/mcli/manage_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/mcli/manage_run.py -------------------------------------------------------------------------------- /scripts/mcli/unshard_mitchish70.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/mcli/unshard_mitchish70.sh -------------------------------------------------------------------------------- /scripts/prepare_changelog.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/prepare_changelog.py -------------------------------------------------------------------------------- /scripts/prepare_memmap_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/prepare_memmap_dataset.py -------------------------------------------------------------------------------- /scripts/prepare_tulu_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/prepare_tulu_data.py -------------------------------------------------------------------------------- /scripts/pyspy_all_nodes.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/pyspy_all_nodes.sh -------------------------------------------------------------------------------- /scripts/pyspy_all_processes.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/pyspy_all_processes.sh -------------------------------------------------------------------------------- /scripts/release.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/release.sh -------------------------------------------------------------------------------- /scripts/release_notes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/release_notes.py -------------------------------------------------------------------------------- /scripts/run_dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/run_dataloader.py -------------------------------------------------------------------------------- /scripts/run_with_environment.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/run_with_environment.sh -------------------------------------------------------------------------------- /scripts/s3_unshard_to_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/s3_unshard_to_hf.py -------------------------------------------------------------------------------- /scripts/show_model_size.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/show_model_size.py -------------------------------------------------------------------------------- /scripts/split_gz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/split_gz.py -------------------------------------------------------------------------------- /scripts/storage_cleaner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/storage_cleaner.py -------------------------------------------------------------------------------- /scripts/test_entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/test_entrypoint.sh -------------------------------------------------------------------------------- /scripts/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/train.py -------------------------------------------------------------------------------- /scripts/unshard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/unshard.py -------------------------------------------------------------------------------- /scripts/wandb_change_group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/scripts/wandb_change_group.py -------------------------------------------------------------------------------- /test_fixtures/c4-sample.01.json.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/c4-sample.01.json.gz -------------------------------------------------------------------------------- /test_fixtures/c4-sample.02.json.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/c4-sample.02.json.gz -------------------------------------------------------------------------------- /test_fixtures/c4-sample.03.json.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/c4-sample.03.json.gz -------------------------------------------------------------------------------- /test_fixtures/evaluation/ppl-test-data/4chan/val/4chan_00000000.jsonl.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/evaluation/ppl-test-data/4chan/val/4chan_00000000.jsonl.gz -------------------------------------------------------------------------------- /test_fixtures/test-olmo-model/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/test-olmo-model/config.json -------------------------------------------------------------------------------- /test_fixtures/test-olmo-model/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/test-olmo-model/config.yaml -------------------------------------------------------------------------------- /test_fixtures/test-olmo-model/model.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/test-olmo-model/model.pt -------------------------------------------------------------------------------- /test_fixtures/test-olmo-model/pytorch_model.bin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/test-olmo-model/pytorch_model.bin -------------------------------------------------------------------------------- /test_fixtures/test-olmo-model/special_tokens_map.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/test-olmo-model/special_tokens_map.json -------------------------------------------------------------------------------- /test_fixtures/test-olmo-model/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/test-olmo-model/tokenizer.json -------------------------------------------------------------------------------- /test_fixtures/test-olmo-model/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/test-olmo-model/tokenizer_config.json -------------------------------------------------------------------------------- /test_fixtures/train_tiny.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/train_tiny.yaml -------------------------------------------------------------------------------- /test_fixtures/train_tiny_with_evaluator.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/test_fixtures/train_tiny_with_evaluator.yaml -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/beam_search_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/beam_search_test.py -------------------------------------------------------------------------------- /tests/checkpoint_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/checkpoint_test.py -------------------------------------------------------------------------------- /tests/config_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/config_test.py -------------------------------------------------------------------------------- /tests/data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/data/collator_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/data/collator_test.py -------------------------------------------------------------------------------- /tests/data/iterable_dataset_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/data/iterable_dataset_test.py -------------------------------------------------------------------------------- /tests/data/memmap_dataset_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/data/memmap_dataset_test.py -------------------------------------------------------------------------------- /tests/data/util_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/data/util_test.py -------------------------------------------------------------------------------- /tests/ddp_checkpoint_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/ddp_checkpoint_test.py -------------------------------------------------------------------------------- /tests/eval/downstream_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/eval/downstream_test.py -------------------------------------------------------------------------------- /tests/grad_norm_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/grad_norm_test.py -------------------------------------------------------------------------------- /tests/hf_olmo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/hf_olmo/configuration_olmo_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/hf_olmo/configuration_olmo_test.py -------------------------------------------------------------------------------- /tests/hf_olmo/hf_olmo_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/hf_olmo/hf_olmo_test.py -------------------------------------------------------------------------------- /tests/hf_olmo/hf_pipeline_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/hf_olmo/hf_pipeline_test.py -------------------------------------------------------------------------------- /tests/hf_olmo/modeling_olmo_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/hf_olmo/modeling_olmo_test.py -------------------------------------------------------------------------------- /tests/hf_olmo/tokenization_olmo_fast_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/hf_olmo/tokenization_olmo_fast_test.py -------------------------------------------------------------------------------- /tests/initialization_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/initialization_test.py -------------------------------------------------------------------------------- /tests/model_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/model_test.py -------------------------------------------------------------------------------- /tests/optim_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/optim_test.py -------------------------------------------------------------------------------- /tests/tokenizer_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/tokenizer_test.py -------------------------------------------------------------------------------- /tests/torch_util_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/torch_util_test.py -------------------------------------------------------------------------------- /tests/train_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/train_test.py -------------------------------------------------------------------------------- /tests/util_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZihaoHuang-notabot/Ultra-Sparse-Memory-Network/HEAD/tests/util_test.py --------------------------------------------------------------------------------