├── .gitignore ├── Implementations ├── DistRLOrig │ ├── .idea │ │ ├── DistRLOrig.iml │ │ ├── inspectionProfiles │ │ │ └── profiles_settings.xml │ │ ├── misc.xml │ │ ├── modules.xml │ │ ├── vcs.xml │ │ └── workspace.xml │ └── algorithm1.py ├── learned_weighted_td.py └── weighted_td_learning.py ├── Model ├── .Torchbeast ├── atari_wrappers.py ├── core │ ├── __pycache__ │ │ ├── environment.cpython-37.pyc │ │ ├── file_writer.cpython-37.pyc │ │ ├── prof.cpython-37.pyc │ │ └── vtrace.cpython-37.pyc │ ├── environment.py │ ├── file_writer.py │ ├── prof.py │ └── vtrace.py ├── monobeast.py ├── monobeast_baseline.py ├── monobeast_fb.py ├── monobeast_single_proc.py ├── monobeast_test.py └── requirements.txt ├── README.md ├── StableTransformersReplication ├── dmlab_agent.py ├── implNotes.txt ├── random_agent_dmlab.py ├── training.py ├── transformer_xl.py └── vanillaTransformer.py ├── Transformer-XLCode └── Icon ├── adaptive_span2 ├── adagrad_with_grad_clip.py ├── adaptive_io.py ├── adaptive_span.py ├── config.py ├── data.py ├── get_data.sh ├── get_pretrained.sh ├── main.py ├── models.py ├── persistent_memory.py ├── trainer.py └── utils.py ├── dqn.py ├── old_monobeast_test.py ├── old_transformer_xl.py ├── replayBuffer.py ├── requirements.txt ├── tester.py ├── torchbeast ├── core │ ├── environment.py │ ├── file_writer.py │ ├── prof.py │ └── vtrace.py ├── dmlab30.py ├── dmlab_wrappers.py └── monobeast.py ├── train.py └── transformerDqn.py /.gitignore: -------------------------------------------------------------------------------- 1 | .idea/ 2 | *.xml 3 | Model/logs/ -------------------------------------------------------------------------------- /Implementations/DistRLOrig/.idea/DistRLOrig.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/DistRLOrig/.idea/DistRLOrig.iml -------------------------------------------------------------------------------- /Implementations/DistRLOrig/.idea/inspectionProfiles/profiles_settings.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/DistRLOrig/.idea/inspectionProfiles/profiles_settings.xml -------------------------------------------------------------------------------- /Implementations/DistRLOrig/.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/DistRLOrig/.idea/misc.xml -------------------------------------------------------------------------------- /Implementations/DistRLOrig/.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/DistRLOrig/.idea/modules.xml -------------------------------------------------------------------------------- /Implementations/DistRLOrig/.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/DistRLOrig/.idea/vcs.xml -------------------------------------------------------------------------------- /Implementations/DistRLOrig/.idea/workspace.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/DistRLOrig/.idea/workspace.xml -------------------------------------------------------------------------------- /Implementations/DistRLOrig/algorithm1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/DistRLOrig/algorithm1.py -------------------------------------------------------------------------------- /Implementations/learned_weighted_td.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/learned_weighted_td.py -------------------------------------------------------------------------------- /Implementations/weighted_td_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Implementations/weighted_td_learning.py -------------------------------------------------------------------------------- /Model/.Torchbeast: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Model/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/atari_wrappers.py -------------------------------------------------------------------------------- /Model/core/__pycache__/environment.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/__pycache__/environment.cpython-37.pyc -------------------------------------------------------------------------------- /Model/core/__pycache__/file_writer.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/__pycache__/file_writer.cpython-37.pyc -------------------------------------------------------------------------------- /Model/core/__pycache__/prof.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/__pycache__/prof.cpython-37.pyc -------------------------------------------------------------------------------- /Model/core/__pycache__/vtrace.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/__pycache__/vtrace.cpython-37.pyc -------------------------------------------------------------------------------- /Model/core/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/environment.py -------------------------------------------------------------------------------- /Model/core/file_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/file_writer.py -------------------------------------------------------------------------------- /Model/core/prof.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/prof.py -------------------------------------------------------------------------------- /Model/core/vtrace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/core/vtrace.py -------------------------------------------------------------------------------- /Model/monobeast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/monobeast.py -------------------------------------------------------------------------------- /Model/monobeast_baseline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/monobeast_baseline.py -------------------------------------------------------------------------------- /Model/monobeast_fb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/monobeast_fb.py -------------------------------------------------------------------------------- /Model/monobeast_single_proc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/monobeast_single_proc.py -------------------------------------------------------------------------------- /Model/monobeast_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/monobeast_test.py -------------------------------------------------------------------------------- /Model/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/Model/requirements.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/README.md -------------------------------------------------------------------------------- /StableTransformersReplication/dmlab_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/StableTransformersReplication/dmlab_agent.py -------------------------------------------------------------------------------- /StableTransformersReplication/implNotes.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/StableTransformersReplication/implNotes.txt -------------------------------------------------------------------------------- /StableTransformersReplication/random_agent_dmlab.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /StableTransformersReplication/training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/StableTransformersReplication/training.py -------------------------------------------------------------------------------- /StableTransformersReplication/transformer_xl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/StableTransformersReplication/transformer_xl.py -------------------------------------------------------------------------------- /StableTransformersReplication/vanillaTransformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/StableTransformersReplication/vanillaTransformer.py -------------------------------------------------------------------------------- /Transformer-XLCode/Icon : -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /adaptive_span2/adagrad_with_grad_clip.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/adagrad_with_grad_clip.py -------------------------------------------------------------------------------- /adaptive_span2/adaptive_io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/adaptive_io.py -------------------------------------------------------------------------------- /adaptive_span2/adaptive_span.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/adaptive_span.py -------------------------------------------------------------------------------- /adaptive_span2/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/config.py -------------------------------------------------------------------------------- /adaptive_span2/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/data.py -------------------------------------------------------------------------------- /adaptive_span2/get_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/get_data.sh -------------------------------------------------------------------------------- /adaptive_span2/get_pretrained.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/get_pretrained.sh -------------------------------------------------------------------------------- /adaptive_span2/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/main.py -------------------------------------------------------------------------------- /adaptive_span2/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/models.py -------------------------------------------------------------------------------- /adaptive_span2/persistent_memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/persistent_memory.py -------------------------------------------------------------------------------- /adaptive_span2/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/trainer.py -------------------------------------------------------------------------------- /adaptive_span2/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/adaptive_span2/utils.py -------------------------------------------------------------------------------- /dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/dqn.py -------------------------------------------------------------------------------- /old_monobeast_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/old_monobeast_test.py -------------------------------------------------------------------------------- /old_transformer_xl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/old_transformer_xl.py -------------------------------------------------------------------------------- /replayBuffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/replayBuffer.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/requirements.txt -------------------------------------------------------------------------------- /tester.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/tester.py -------------------------------------------------------------------------------- /torchbeast/core/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/torchbeast/core/environment.py -------------------------------------------------------------------------------- /torchbeast/core/file_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/torchbeast/core/file_writer.py -------------------------------------------------------------------------------- /torchbeast/core/prof.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/torchbeast/core/prof.py -------------------------------------------------------------------------------- /torchbeast/core/vtrace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/torchbeast/core/vtrace.py -------------------------------------------------------------------------------- /torchbeast/dmlab30.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/torchbeast/dmlab30.py -------------------------------------------------------------------------------- /torchbeast/dmlab_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/torchbeast/dmlab_wrappers.py -------------------------------------------------------------------------------- /torchbeast/monobeast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/torchbeast/monobeast.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/train.py -------------------------------------------------------------------------------- /transformerDqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jerrodparker20/adaptive-transformers-in-rl/HEAD/transformerDqn.py --------------------------------------------------------------------------------