├── .gitignore ├── LICENSE ├── README.md ├── assets ├── combined_blocks.pdf └── combined_blocks.png ├── exp_scripts ├── baseline_comparison.sh ├── train_long.sh └── trainable_value_proj_gains.sh ├── requirements.txt ├── run_clm.py └── simplified_transformers ├── config ├── config.yaml ├── model │ ├── default-parallel.yaml │ ├── default.yaml │ ├── op.yaml │ ├── skipless-parallel.yaml │ └── skipless.yaml └── train │ └── train.yaml ├── model_utils.py └── train_utils.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/README.md -------------------------------------------------------------------------------- /assets/combined_blocks.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/assets/combined_blocks.pdf -------------------------------------------------------------------------------- /assets/combined_blocks.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/assets/combined_blocks.png -------------------------------------------------------------------------------- /exp_scripts/baseline_comparison.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/exp_scripts/baseline_comparison.sh -------------------------------------------------------------------------------- /exp_scripts/train_long.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/exp_scripts/train_long.sh -------------------------------------------------------------------------------- /exp_scripts/trainable_value_proj_gains.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/exp_scripts/trainable_value_proj_gains.sh -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/requirements.txt -------------------------------------------------------------------------------- /run_clm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/run_clm.py -------------------------------------------------------------------------------- /simplified_transformers/config/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/config/config.yaml -------------------------------------------------------------------------------- /simplified_transformers/config/model/default-parallel.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/config/model/default-parallel.yaml -------------------------------------------------------------------------------- /simplified_transformers/config/model/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/config/model/default.yaml -------------------------------------------------------------------------------- /simplified_transformers/config/model/op.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/config/model/op.yaml -------------------------------------------------------------------------------- /simplified_transformers/config/model/skipless-parallel.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/config/model/skipless-parallel.yaml -------------------------------------------------------------------------------- /simplified_transformers/config/model/skipless.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/config/model/skipless.yaml -------------------------------------------------------------------------------- /simplified_transformers/config/train/train.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/config/train/train.yaml -------------------------------------------------------------------------------- /simplified_transformers/model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/model_utils.py -------------------------------------------------------------------------------- /simplified_transformers/train_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/bobby-he/simplified_transformers/HEAD/simplified_transformers/train_utils.py --------------------------------------------------------------------------------