├── .gitignore ├── BAP ├── BAP.ipynb ├── README.md ├── adapters.py ├── data_loaders.py ├── main.py ├── reward_model.py └── trainer.py ├── README.md ├── ppo ├── adapters.ipynb ├── gpt2withclassfierhead.py ├── ppo.py ├── train.ipynb └── utils.py ├── preprocess_comparisons.py ├── preprocess_tldr_dataset.py ├── requirements.txt ├── straight-through ├── classifier.py ├── straight-though.ipynb └── train.py ├── tuning ├── ds_config.json ├── midtune.py └── train_reward.py └── utils ├── __init__.py └── dataset.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/.gitignore -------------------------------------------------------------------------------- /BAP/BAP.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/BAP/BAP.ipynb -------------------------------------------------------------------------------- /BAP/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/BAP/README.md -------------------------------------------------------------------------------- /BAP/adapters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/BAP/adapters.py -------------------------------------------------------------------------------- /BAP/data_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/BAP/data_loaders.py -------------------------------------------------------------------------------- /BAP/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/BAP/main.py -------------------------------------------------------------------------------- /BAP/reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/BAP/reward_model.py -------------------------------------------------------------------------------- /BAP/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/BAP/trainer.py -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/README.md -------------------------------------------------------------------------------- /ppo/adapters.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/ppo/adapters.ipynb -------------------------------------------------------------------------------- /ppo/gpt2withclassfierhead.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/ppo/gpt2withclassfierhead.py -------------------------------------------------------------------------------- /ppo/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/ppo/ppo.py -------------------------------------------------------------------------------- /ppo/train.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/ppo/train.ipynb -------------------------------------------------------------------------------- /ppo/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/ppo/utils.py -------------------------------------------------------------------------------- /preprocess_comparisons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/preprocess_comparisons.py -------------------------------------------------------------------------------- /preprocess_tldr_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/preprocess_tldr_dataset.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/requirements.txt -------------------------------------------------------------------------------- /straight-through/classifier.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/straight-through/classifier.py -------------------------------------------------------------------------------- /straight-through/straight-though.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/straight-through/straight-though.ipynb -------------------------------------------------------------------------------- /straight-through/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/straight-through/train.py -------------------------------------------------------------------------------- /tuning/ds_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/tuning/ds_config.json -------------------------------------------------------------------------------- /tuning/midtune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/tuning/midtune.py -------------------------------------------------------------------------------- /tuning/train_reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/tuning/train_reward.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/utils/__init__.py -------------------------------------------------------------------------------- /utils/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAGI/summarisation/HEAD/utils/dataset.py --------------------------------------------------------------------------------