├── .gitignore ├── INSTALL.md ├── README.md ├── env ├── __init__.py ├── ale │ ├── __init__.py │ └── ale_env.py ├── arguments.py ├── torcs │ ├── INSTALL.md │ ├── __init__.py │ ├── autostart.sh │ ├── autostart2.sh │ ├── autostart3.sh │ ├── snakeoil3_gym.py │ └── torcs_env.py └── vizdoom │ ├── __init__.py │ └── vizdoom_env.py ├── network_model ├── __init__.py ├── model_neon.py ├── model_tf.py ├── model_tf_a3c.py ├── model_tf_a3c_lstm.py ├── model_tf_async.py └── model_tf_ddpg.py ├── play.py ├── replay_memory.py ├── sampling_manager.py ├── snapshot ├── breakout_a3c.gif ├── breakout_a3c.png ├── hero.gif ├── hero_priority.png ├── space_invaders_a3c.png ├── space_invaders_a3c_lstm.gif └── torcs-1.png ├── test ├── binary_heap │ ├── binary_heap.py │ ├── binary_heap_test.py │ └── prioritizedRL.py ├── replay_memory_test.py └── sampling_manager_test.py ├── train.py └── util.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/.gitignore -------------------------------------------------------------------------------- /INSTALL.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/INSTALL.md -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/README.md -------------------------------------------------------------------------------- /env/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /env/ale/__init__.py: -------------------------------------------------------------------------------- 1 | from ale_env import initialize_args -------------------------------------------------------------------------------- /env/ale/ale_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/ale/ale_env.py -------------------------------------------------------------------------------- /env/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/arguments.py -------------------------------------------------------------------------------- /env/torcs/INSTALL.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/torcs/INSTALL.md -------------------------------------------------------------------------------- /env/torcs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /env/torcs/autostart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/torcs/autostart.sh -------------------------------------------------------------------------------- /env/torcs/autostart2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/torcs/autostart2.sh -------------------------------------------------------------------------------- /env/torcs/autostart3.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/torcs/autostart3.sh -------------------------------------------------------------------------------- /env/torcs/snakeoil3_gym.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/torcs/snakeoil3_gym.py -------------------------------------------------------------------------------- /env/torcs/torcs_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/torcs/torcs_env.py -------------------------------------------------------------------------------- /env/vizdoom/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /env/vizdoom/vizdoom_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/env/vizdoom/vizdoom_env.py -------------------------------------------------------------------------------- /network_model/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /network_model/model_neon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/network_model/model_neon.py -------------------------------------------------------------------------------- /network_model/model_tf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/network_model/model_tf.py -------------------------------------------------------------------------------- /network_model/model_tf_a3c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/network_model/model_tf_a3c.py -------------------------------------------------------------------------------- /network_model/model_tf_a3c_lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/network_model/model_tf_a3c_lstm.py -------------------------------------------------------------------------------- /network_model/model_tf_async.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/network_model/model_tf_async.py -------------------------------------------------------------------------------- /network_model/model_tf_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/network_model/model_tf_ddpg.py -------------------------------------------------------------------------------- /play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/play.py -------------------------------------------------------------------------------- /replay_memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/replay_memory.py -------------------------------------------------------------------------------- /sampling_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/sampling_manager.py -------------------------------------------------------------------------------- /snapshot/breakout_a3c.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/snapshot/breakout_a3c.gif -------------------------------------------------------------------------------- /snapshot/breakout_a3c.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/snapshot/breakout_a3c.png -------------------------------------------------------------------------------- /snapshot/hero.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/snapshot/hero.gif -------------------------------------------------------------------------------- /snapshot/hero_priority.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/snapshot/hero_priority.png -------------------------------------------------------------------------------- /snapshot/space_invaders_a3c.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/snapshot/space_invaders_a3c.png -------------------------------------------------------------------------------- /snapshot/space_invaders_a3c_lstm.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/snapshot/space_invaders_a3c_lstm.gif -------------------------------------------------------------------------------- /snapshot/torcs-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/snapshot/torcs-1.png -------------------------------------------------------------------------------- /test/binary_heap/binary_heap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/test/binary_heap/binary_heap.py -------------------------------------------------------------------------------- /test/binary_heap/binary_heap_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/test/binary_heap/binary_heap_test.py -------------------------------------------------------------------------------- /test/binary_heap/prioritizedRL.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/test/binary_heap/prioritizedRL.py -------------------------------------------------------------------------------- /test/replay_memory_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/test/replay_memory_test.py -------------------------------------------------------------------------------- /test/sampling_manager_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/test/sampling_manager_test.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/train.py -------------------------------------------------------------------------------- /util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/futurecrew/DeepRL/HEAD/util.py --------------------------------------------------------------------------------