├── README.md ├── p0_taxi-v2 ├── README.md ├── agent.py ├── images │ ├── all_perf.png │ ├── expected_sarsa_algo.png │ ├── expected_sarsa_perf.png │ ├── expected_sarsa_update_rule.png │ ├── sarsa_algo.png │ ├── sarsa_perf.png │ ├── sarsa_update_rule.png │ ├── sarsamax_algo.png │ ├── sarsamax_perf.png │ ├── sarsamax_update_rule.png │ ├── taxi-game.gif │ └── taxi_game_gif.gif ├── main.py └── monitor.py ├── p1_navigation ├── Navigation.ipynb ├── README.md ├── config.json ├── dqn_agent.py ├── main.py ├── model.py ├── report.pdf ├── requirements.txt ├── saved │ └── DQN_exp │ │ └── model_trained_solved.pth └── utils.py ├── p2_continuous_control ├── Continuous_Control.ipynb ├── README.md ├── config.json ├── ddpg_agent.py ├── images │ └── reacher_gif.gif ├── models.py ├── report.pdf ├── requirements.txt └── saved │ └── DDPG_exp │ ├── checkpoint_actor_solved.pth │ └── checkpoint_critic_solved.pth └── p3_collab_compet ├── DDPGAgents.py ├── OUNoise.py ├── README.md ├── ReplayBuffer.py ├── Tennis.ipynb ├── config.json ├── images └── tennis_gif.gif ├── report.pdf ├── requirements.txt ├── saved └── DDPGAgents_exp │ ├── checkpoint_actor_solved.pth │ └── checkpoint_critic_solved.pth └── utils.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/README.md -------------------------------------------------------------------------------- /p0_taxi-v2/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/README.md -------------------------------------------------------------------------------- /p0_taxi-v2/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/agent.py -------------------------------------------------------------------------------- /p0_taxi-v2/images/all_perf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/all_perf.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/expected_sarsa_algo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/expected_sarsa_algo.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/expected_sarsa_perf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/expected_sarsa_perf.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/expected_sarsa_update_rule.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/expected_sarsa_update_rule.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/sarsa_algo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/sarsa_algo.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/sarsa_perf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/sarsa_perf.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/sarsa_update_rule.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/sarsa_update_rule.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/sarsamax_algo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/sarsamax_algo.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/sarsamax_perf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/sarsamax_perf.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/sarsamax_update_rule.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/sarsamax_update_rule.png -------------------------------------------------------------------------------- /p0_taxi-v2/images/taxi-game.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/taxi-game.gif -------------------------------------------------------------------------------- /p0_taxi-v2/images/taxi_game_gif.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/images/taxi_game_gif.gif -------------------------------------------------------------------------------- /p0_taxi-v2/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/main.py -------------------------------------------------------------------------------- /p0_taxi-v2/monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p0_taxi-v2/monitor.py -------------------------------------------------------------------------------- /p1_navigation/Navigation.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/Navigation.ipynb -------------------------------------------------------------------------------- /p1_navigation/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/README.md -------------------------------------------------------------------------------- /p1_navigation/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/config.json -------------------------------------------------------------------------------- /p1_navigation/dqn_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/dqn_agent.py -------------------------------------------------------------------------------- /p1_navigation/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/main.py -------------------------------------------------------------------------------- /p1_navigation/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/model.py -------------------------------------------------------------------------------- /p1_navigation/report.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/report.pdf -------------------------------------------------------------------------------- /p1_navigation/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/requirements.txt -------------------------------------------------------------------------------- /p1_navigation/saved/DQN_exp/model_trained_solved.pth: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/saved/DQN_exp/model_trained_solved.pth -------------------------------------------------------------------------------- /p1_navigation/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p1_navigation/utils.py -------------------------------------------------------------------------------- /p2_continuous_control/Continuous_Control.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/Continuous_Control.ipynb -------------------------------------------------------------------------------- /p2_continuous_control/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/README.md -------------------------------------------------------------------------------- /p2_continuous_control/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/config.json -------------------------------------------------------------------------------- /p2_continuous_control/ddpg_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/ddpg_agent.py -------------------------------------------------------------------------------- /p2_continuous_control/images/reacher_gif.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/images/reacher_gif.gif -------------------------------------------------------------------------------- /p2_continuous_control/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/models.py -------------------------------------------------------------------------------- /p2_continuous_control/report.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/report.pdf -------------------------------------------------------------------------------- /p2_continuous_control/requirements.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /p2_continuous_control/saved/DDPG_exp/checkpoint_actor_solved.pth: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/saved/DDPG_exp/checkpoint_actor_solved.pth -------------------------------------------------------------------------------- /p2_continuous_control/saved/DDPG_exp/checkpoint_critic_solved.pth: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p2_continuous_control/saved/DDPG_exp/checkpoint_critic_solved.pth -------------------------------------------------------------------------------- /p3_collab_compet/DDPGAgents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/DDPGAgents.py -------------------------------------------------------------------------------- /p3_collab_compet/OUNoise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/OUNoise.py -------------------------------------------------------------------------------- /p3_collab_compet/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/README.md -------------------------------------------------------------------------------- /p3_collab_compet/ReplayBuffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/ReplayBuffer.py -------------------------------------------------------------------------------- /p3_collab_compet/Tennis.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/Tennis.ipynb -------------------------------------------------------------------------------- /p3_collab_compet/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/config.json -------------------------------------------------------------------------------- /p3_collab_compet/images/tennis_gif.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/images/tennis_gif.gif -------------------------------------------------------------------------------- /p3_collab_compet/report.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/report.pdf -------------------------------------------------------------------------------- /p3_collab_compet/requirements.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /p3_collab_compet/saved/DDPGAgents_exp/checkpoint_actor_solved.pth: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/saved/DDPGAgents_exp/checkpoint_actor_solved.pth -------------------------------------------------------------------------------- /p3_collab_compet/saved/DDPGAgents_exp/checkpoint_critic_solved.pth: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/saved/DDPGAgents_exp/checkpoint_critic_solved.pth -------------------------------------------------------------------------------- /p3_collab_compet/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vmelan/DRLND-udacity/HEAD/p3_collab_compet/utils.py --------------------------------------------------------------------------------