├── README.md ├── announcement.txt └── codes ├── Installation Guide.pptx ├── week01 ├── .ipynb_checkpoints │ ├── basic_gym-checkpoint.ipynb │ ├── basic_python-checkpoint.ipynb │ ├── basic_tensorflow-checkpoint.ipynb │ └── behavior_cloning-checkpoint.ipynb ├── CartPole-v1_expert_demo.pkl ├── MountainCarContinuous-v0_expert_demo.pkl ├── basic_gym.ipynb ├── basic_python.ipynb ├── basic_tensorflow.ipynb └── behavior_cloning.ipynb ├── week02 ├── .ipynb_checkpoints │ ├── policy_iteration-checkpoint.ipynb │ └── value_iteration-checkpoint.ipynb ├── policy_iteration.ipynb └── value_iteration.ipynb ├── week03 ├── SARSA.ipynb ├── custum_frozen_lake_env.py ├── monte_carlo_policy_iteration.ipynb └── q_learning.ipynb ├── week04 ├── basic_tensorflow.ipynb ├── deep_q_learning.ipynb ├── figs │ ├── graph_structure1.png │ ├── graph_structure2.png │ └── summary.PNG ├── pdd_q_learning.ipynb ├── prioritized_experience_replay.ipynb └── save_model │ ├── checkpoint │ ├── dqn_model.data-00000-of-00001 │ ├── dqn_model.index │ └── dqn_model.meta ├── week05 ├── .ipynb_checkpoints │ ├── REINFORCE-checkpoint.ipynb │ ├── REINFORCE_exercise-checkpoint.ipynb │ ├── proximal_policy_optimization-checkpoint.ipynb │ ├── proximal_policy_optimization_exercise-checkpoint.ipynb │ └── trust_region_policy_optimization-checkpoint.ipynb ├── REINFORCE.ipynb ├── REINFORCE_exercise.ipynb ├── proximal_policy_optimization.ipynb ├── proximal_policy_optimization_exercise.ipynb └── trust_region_policy_optimization.ipynb ├── week06 ├── deep_deterministic_policy_gradient.ipynb ├── path_consistency_learning.ipynb └── policy_optimization_with_gae.ipynb ├── week07 ├── Deep Q learning from Demonstrations.ipynb ├── Exploration Methods.ipynb └── Thompson Sampling.ipynb └── week08 ├── MountainCarContinuous-v0_expert_demo.pkl ├── custum_frozen_lake_env.py ├── generative_adversarial_imitation_learning.ipynb └── maximum_entropy_irl.ipynb /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/README.md -------------------------------------------------------------------------------- /announcement.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /codes/Installation Guide.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/Installation Guide.pptx -------------------------------------------------------------------------------- /codes/week01/.ipynb_checkpoints/basic_gym-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/.ipynb_checkpoints/basic_gym-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week01/.ipynb_checkpoints/basic_python-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/.ipynb_checkpoints/basic_python-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week01/.ipynb_checkpoints/basic_tensorflow-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/.ipynb_checkpoints/basic_tensorflow-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week01/.ipynb_checkpoints/behavior_cloning-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/.ipynb_checkpoints/behavior_cloning-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week01/CartPole-v1_expert_demo.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/CartPole-v1_expert_demo.pkl -------------------------------------------------------------------------------- /codes/week01/MountainCarContinuous-v0_expert_demo.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/MountainCarContinuous-v0_expert_demo.pkl -------------------------------------------------------------------------------- /codes/week01/basic_gym.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/basic_gym.ipynb -------------------------------------------------------------------------------- /codes/week01/basic_python.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/basic_python.ipynb -------------------------------------------------------------------------------- /codes/week01/basic_tensorflow.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/basic_tensorflow.ipynb -------------------------------------------------------------------------------- /codes/week01/behavior_cloning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week01/behavior_cloning.ipynb -------------------------------------------------------------------------------- /codes/week02/.ipynb_checkpoints/policy_iteration-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week02/.ipynb_checkpoints/policy_iteration-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week02/.ipynb_checkpoints/value_iteration-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week02/.ipynb_checkpoints/value_iteration-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week02/policy_iteration.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week02/policy_iteration.ipynb -------------------------------------------------------------------------------- /codes/week02/value_iteration.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week02/value_iteration.ipynb -------------------------------------------------------------------------------- /codes/week03/SARSA.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week03/SARSA.ipynb -------------------------------------------------------------------------------- /codes/week03/custum_frozen_lake_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week03/custum_frozen_lake_env.py -------------------------------------------------------------------------------- /codes/week03/monte_carlo_policy_iteration.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week03/monte_carlo_policy_iteration.ipynb -------------------------------------------------------------------------------- /codes/week03/q_learning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week03/q_learning.ipynb -------------------------------------------------------------------------------- /codes/week04/basic_tensorflow.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/basic_tensorflow.ipynb -------------------------------------------------------------------------------- /codes/week04/deep_q_learning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/deep_q_learning.ipynb -------------------------------------------------------------------------------- /codes/week04/figs/graph_structure1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/figs/graph_structure1.png -------------------------------------------------------------------------------- /codes/week04/figs/graph_structure2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/figs/graph_structure2.png -------------------------------------------------------------------------------- /codes/week04/figs/summary.PNG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/figs/summary.PNG -------------------------------------------------------------------------------- /codes/week04/pdd_q_learning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/pdd_q_learning.ipynb -------------------------------------------------------------------------------- /codes/week04/prioritized_experience_replay.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/prioritized_experience_replay.ipynb -------------------------------------------------------------------------------- /codes/week04/save_model/checkpoint: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/save_model/checkpoint -------------------------------------------------------------------------------- /codes/week04/save_model/dqn_model.data-00000-of-00001: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/save_model/dqn_model.data-00000-of-00001 -------------------------------------------------------------------------------- /codes/week04/save_model/dqn_model.index: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/save_model/dqn_model.index -------------------------------------------------------------------------------- /codes/week04/save_model/dqn_model.meta: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week04/save_model/dqn_model.meta -------------------------------------------------------------------------------- /codes/week05/.ipynb_checkpoints/REINFORCE-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/.ipynb_checkpoints/REINFORCE-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week05/.ipynb_checkpoints/REINFORCE_exercise-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/.ipynb_checkpoints/REINFORCE_exercise-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week05/.ipynb_checkpoints/proximal_policy_optimization-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/.ipynb_checkpoints/proximal_policy_optimization-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week05/.ipynb_checkpoints/proximal_policy_optimization_exercise-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/.ipynb_checkpoints/proximal_policy_optimization_exercise-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week05/.ipynb_checkpoints/trust_region_policy_optimization-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/.ipynb_checkpoints/trust_region_policy_optimization-checkpoint.ipynb -------------------------------------------------------------------------------- /codes/week05/REINFORCE.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/REINFORCE.ipynb -------------------------------------------------------------------------------- /codes/week05/REINFORCE_exercise.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/REINFORCE_exercise.ipynb -------------------------------------------------------------------------------- /codes/week05/proximal_policy_optimization.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/proximal_policy_optimization.ipynb -------------------------------------------------------------------------------- /codes/week05/proximal_policy_optimization_exercise.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/proximal_policy_optimization_exercise.ipynb -------------------------------------------------------------------------------- /codes/week05/trust_region_policy_optimization.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week05/trust_region_policy_optimization.ipynb -------------------------------------------------------------------------------- /codes/week06/deep_deterministic_policy_gradient.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week06/deep_deterministic_policy_gradient.ipynb -------------------------------------------------------------------------------- /codes/week06/path_consistency_learning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week06/path_consistency_learning.ipynb -------------------------------------------------------------------------------- /codes/week06/policy_optimization_with_gae.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week06/policy_optimization_with_gae.ipynb -------------------------------------------------------------------------------- /codes/week07/Deep Q learning from Demonstrations.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week07/Deep Q learning from Demonstrations.ipynb -------------------------------------------------------------------------------- /codes/week07/Exploration Methods.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week07/Exploration Methods.ipynb -------------------------------------------------------------------------------- /codes/week07/Thompson Sampling.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week07/Thompson Sampling.ipynb -------------------------------------------------------------------------------- /codes/week08/MountainCarContinuous-v0_expert_demo.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week08/MountainCarContinuous-v0_expert_demo.pkl -------------------------------------------------------------------------------- /codes/week08/custum_frozen_lake_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week08/custum_frozen_lake_env.py -------------------------------------------------------------------------------- /codes/week08/generative_adversarial_imitation_learning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week08/generative_adversarial_imitation_learning.ipynb -------------------------------------------------------------------------------- /codes/week08/maximum_entropy_irl.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rllab-snu/Deep-Reinforcement-Learning/HEAD/codes/week08/maximum_entropy_irl.ipynb --------------------------------------------------------------------------------