├── .gitignore ├── .vscode ├── .ropeproject │ └── config.py └── settings.json ├── Actor_Critic ├── a3c.py ├── actor_critic_cartpole.py └── actor_critic_pendulum.py ├── Deep_Deterministic_Policy_Gradient ├── ddpg.py ├── main.py └── memory.py ├── Deep_Q_Network ├── Bootstrapped_DQN │ ├── dqn.py │ ├── main.py │ └── memory.py ├── DQN │ ├── dqn.py │ ├── main.py │ └── memory.py ├── Double_DQN │ ├── dqn.py │ ├── main.py │ └── memory.py ├── Dueling_DQN │ ├── dqn.py │ ├── main.py │ └── memory.py └── Prioritized_DQN │ ├── dqn.py │ ├── main.py │ ├── memory.py │ └── sum_tree.py ├── Proximal_Policy_Optimization ├── main.py └── ppo.py ├── README.md └── Recurrent_Deterministic_Policy_Gradient ├── main.py ├── memory.py └── rdpg.py /.gitignore: -------------------------------------------------------------------------------- 1 | __pycache__ 2 | /Deep_Q_Network/Bootstrapped_DQN_eager -------------------------------------------------------------------------------- /.vscode/.ropeproject/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/.vscode/.ropeproject/config.py -------------------------------------------------------------------------------- /.vscode/settings.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/.vscode/settings.json -------------------------------------------------------------------------------- /Actor_Critic/a3c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Actor_Critic/a3c.py -------------------------------------------------------------------------------- /Actor_Critic/actor_critic_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Actor_Critic/actor_critic_cartpole.py -------------------------------------------------------------------------------- /Actor_Critic/actor_critic_pendulum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Actor_Critic/actor_critic_pendulum.py -------------------------------------------------------------------------------- /Deep_Deterministic_Policy_Gradient/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Deterministic_Policy_Gradient/ddpg.py -------------------------------------------------------------------------------- /Deep_Deterministic_Policy_Gradient/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Deterministic_Policy_Gradient/main.py -------------------------------------------------------------------------------- /Deep_Deterministic_Policy_Gradient/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Deterministic_Policy_Gradient/memory.py -------------------------------------------------------------------------------- /Deep_Q_Network/Bootstrapped_DQN/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Bootstrapped_DQN/dqn.py -------------------------------------------------------------------------------- /Deep_Q_Network/Bootstrapped_DQN/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Bootstrapped_DQN/main.py -------------------------------------------------------------------------------- /Deep_Q_Network/Bootstrapped_DQN/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Bootstrapped_DQN/memory.py -------------------------------------------------------------------------------- /Deep_Q_Network/DQN/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/DQN/dqn.py -------------------------------------------------------------------------------- /Deep_Q_Network/DQN/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/DQN/main.py -------------------------------------------------------------------------------- /Deep_Q_Network/DQN/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/DQN/memory.py -------------------------------------------------------------------------------- /Deep_Q_Network/Double_DQN/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Double_DQN/dqn.py -------------------------------------------------------------------------------- /Deep_Q_Network/Double_DQN/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Double_DQN/main.py -------------------------------------------------------------------------------- /Deep_Q_Network/Double_DQN/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Double_DQN/memory.py -------------------------------------------------------------------------------- /Deep_Q_Network/Dueling_DQN/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Dueling_DQN/dqn.py -------------------------------------------------------------------------------- /Deep_Q_Network/Dueling_DQN/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Dueling_DQN/main.py -------------------------------------------------------------------------------- /Deep_Q_Network/Dueling_DQN/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Dueling_DQN/memory.py -------------------------------------------------------------------------------- /Deep_Q_Network/Prioritized_DQN/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Prioritized_DQN/dqn.py -------------------------------------------------------------------------------- /Deep_Q_Network/Prioritized_DQN/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Prioritized_DQN/main.py -------------------------------------------------------------------------------- /Deep_Q_Network/Prioritized_DQN/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Prioritized_DQN/memory.py -------------------------------------------------------------------------------- /Deep_Q_Network/Prioritized_DQN/sum_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Deep_Q_Network/Prioritized_DQN/sum_tree.py -------------------------------------------------------------------------------- /Proximal_Policy_Optimization/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Proximal_Policy_Optimization/main.py -------------------------------------------------------------------------------- /Proximal_Policy_Optimization/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Proximal_Policy_Optimization/ppo.py -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/README.md -------------------------------------------------------------------------------- /Recurrent_Deterministic_Policy_Gradient/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Recurrent_Deterministic_Policy_Gradient/main.py -------------------------------------------------------------------------------- /Recurrent_Deterministic_Policy_Gradient/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Recurrent_Deterministic_Policy_Gradient/memory.py -------------------------------------------------------------------------------- /Recurrent_Deterministic_Policy_Gradient/rdpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/BlueFisher/Reinforcement-Learning/HEAD/Recurrent_Deterministic_Policy_Gradient/rdpg.py --------------------------------------------------------------------------------