├── .gitignore ├── Dockerfile ├── LICENSE ├── README.md ├── deep_rl ├── __init__.py ├── agent │ ├── A2C_agent.py │ ├── BaseAgent.py │ ├── CategoricalDQN_agent.py │ ├── DDPG_agent.py │ ├── DQN_agent.py │ ├── NStepDQN_agent.py │ ├── OptionCritic_agent.py │ ├── PPO_agent.py │ ├── QuantileRegressionDQN_agent.py │ ├── TD3_agent.py │ └── __init__.py ├── component │ ├── __init__.py │ ├── envs.py │ ├── random_process.py │ └── replay.py ├── network │ ├── __init__.py │ ├── network_bodies.py │ ├── network_heads.py │ └── network_utils.py └── utils │ ├── __init__.py │ ├── config.py │ ├── logger.py │ ├── misc.py │ ├── normalizer.py │ ├── plot.py │ ├── schedule.py │ ├── sum_tree.py │ └── torch_utils.py ├── docker_batch.sh ├── docker_build.sh ├── docker_clean.sh ├── docker_python.sh ├── docker_shell.sh ├── docker_stop.sh ├── examples.py ├── images ├── Breakout.png ├── PPO.png └── mujoco_eval.png ├── requirements.txt ├── setup.py ├── template_jobs.py └── template_plot.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/.gitignore -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/Dockerfile -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/README.md -------------------------------------------------------------------------------- /deep_rl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/__init__.py -------------------------------------------------------------------------------- /deep_rl/agent/A2C_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/A2C_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/BaseAgent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/BaseAgent.py -------------------------------------------------------------------------------- /deep_rl/agent/CategoricalDQN_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/CategoricalDQN_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/DDPG_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/DDPG_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/DQN_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/DQN_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/NStepDQN_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/NStepDQN_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/OptionCritic_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/OptionCritic_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/PPO_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/PPO_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/QuantileRegressionDQN_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/QuantileRegressionDQN_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/TD3_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/TD3_agent.py -------------------------------------------------------------------------------- /deep_rl/agent/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/agent/__init__.py -------------------------------------------------------------------------------- /deep_rl/component/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/component/__init__.py -------------------------------------------------------------------------------- /deep_rl/component/envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/component/envs.py -------------------------------------------------------------------------------- /deep_rl/component/random_process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/component/random_process.py -------------------------------------------------------------------------------- /deep_rl/component/replay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/component/replay.py -------------------------------------------------------------------------------- /deep_rl/network/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/network/__init__.py -------------------------------------------------------------------------------- /deep_rl/network/network_bodies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/network/network_bodies.py -------------------------------------------------------------------------------- /deep_rl/network/network_heads.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/network/network_heads.py -------------------------------------------------------------------------------- /deep_rl/network/network_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/network/network_utils.py -------------------------------------------------------------------------------- /deep_rl/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/__init__.py -------------------------------------------------------------------------------- /deep_rl/utils/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/config.py -------------------------------------------------------------------------------- /deep_rl/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/logger.py -------------------------------------------------------------------------------- /deep_rl/utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/misc.py -------------------------------------------------------------------------------- /deep_rl/utils/normalizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/normalizer.py -------------------------------------------------------------------------------- /deep_rl/utils/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/plot.py -------------------------------------------------------------------------------- /deep_rl/utils/schedule.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/schedule.py -------------------------------------------------------------------------------- /deep_rl/utils/sum_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/sum_tree.py -------------------------------------------------------------------------------- /deep_rl/utils/torch_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/deep_rl/utils/torch_utils.py -------------------------------------------------------------------------------- /docker_batch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/docker_batch.sh -------------------------------------------------------------------------------- /docker_build.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/docker_build.sh -------------------------------------------------------------------------------- /docker_clean.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/docker_clean.sh -------------------------------------------------------------------------------- /docker_python.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/docker_python.sh -------------------------------------------------------------------------------- /docker_shell.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/docker_shell.sh -------------------------------------------------------------------------------- /docker_stop.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/docker_stop.sh -------------------------------------------------------------------------------- /examples.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/examples.py -------------------------------------------------------------------------------- /images/Breakout.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/images/Breakout.png -------------------------------------------------------------------------------- /images/PPO.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/images/PPO.png -------------------------------------------------------------------------------- /images/mujoco_eval.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/images/mujoco_eval.png -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/requirements.txt -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/setup.py -------------------------------------------------------------------------------- /template_jobs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/template_jobs.py -------------------------------------------------------------------------------- /template_plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShangtongZhang/DeepRL/HEAD/template_plot.py --------------------------------------------------------------------------------