├── .gitignore ├── 1-grid-world ├── 1-policy-iteration │ ├── environment.py │ └── policy_iteration.py ├── 2-value-iteration │ ├── environment.py │ └── value_iteration.py ├── 3-monte-carlo │ ├── environment.py │ └── mc_agent.py ├── 4-sarsa │ ├── environment.py │ └── sarsa_agent.py ├── 5-q-learning │ ├── environment.py │ └── q_learning_agent.py └── img │ ├── circle.png │ ├── down.png │ ├── left.png │ ├── rectangle.png │ ├── right.png │ ├── triangle.png │ └── up.png ├── 2-cartpole ├── 1-dqn │ ├── memory.py │ ├── model.py │ ├── test.py │ └── train.py ├── 2-actor-critic │ ├── main.py │ ├── model.py │ ├── save_model │ │ └── ckpt_1157.pth │ ├── test.py │ └── train.py └── 3-multi-step │ ├── memory.py │ ├── model.py │ ├── test.py │ └── train.py ├── 3-atari └── 1-dqn │ ├── memory.py │ ├── model.py │ ├── test.py │ ├── train.py │ └── utils.py ├── LICENSE └── README.md /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/.gitignore -------------------------------------------------------------------------------- /1-grid-world/1-policy-iteration/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/1-policy-iteration/environment.py -------------------------------------------------------------------------------- /1-grid-world/1-policy-iteration/policy_iteration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/1-policy-iteration/policy_iteration.py -------------------------------------------------------------------------------- /1-grid-world/2-value-iteration/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/2-value-iteration/environment.py -------------------------------------------------------------------------------- /1-grid-world/2-value-iteration/value_iteration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/2-value-iteration/value_iteration.py -------------------------------------------------------------------------------- /1-grid-world/3-monte-carlo/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/3-monte-carlo/environment.py -------------------------------------------------------------------------------- /1-grid-world/3-monte-carlo/mc_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/3-monte-carlo/mc_agent.py -------------------------------------------------------------------------------- /1-grid-world/4-sarsa/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/4-sarsa/environment.py -------------------------------------------------------------------------------- /1-grid-world/4-sarsa/sarsa_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/4-sarsa/sarsa_agent.py -------------------------------------------------------------------------------- /1-grid-world/5-q-learning/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/5-q-learning/environment.py -------------------------------------------------------------------------------- /1-grid-world/5-q-learning/q_learning_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/5-q-learning/q_learning_agent.py -------------------------------------------------------------------------------- /1-grid-world/img/circle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/img/circle.png -------------------------------------------------------------------------------- /1-grid-world/img/down.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/img/down.png -------------------------------------------------------------------------------- /1-grid-world/img/left.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/img/left.png -------------------------------------------------------------------------------- /1-grid-world/img/rectangle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/img/rectangle.png -------------------------------------------------------------------------------- /1-grid-world/img/right.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/img/right.png -------------------------------------------------------------------------------- /1-grid-world/img/triangle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/img/triangle.png -------------------------------------------------------------------------------- /1-grid-world/img/up.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/1-grid-world/img/up.png -------------------------------------------------------------------------------- /2-cartpole/1-dqn/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/1-dqn/memory.py -------------------------------------------------------------------------------- /2-cartpole/1-dqn/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/1-dqn/model.py -------------------------------------------------------------------------------- /2-cartpole/1-dqn/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/1-dqn/test.py -------------------------------------------------------------------------------- /2-cartpole/1-dqn/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/1-dqn/train.py -------------------------------------------------------------------------------- /2-cartpole/2-actor-critic/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/2-actor-critic/main.py -------------------------------------------------------------------------------- /2-cartpole/2-actor-critic/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/2-actor-critic/model.py -------------------------------------------------------------------------------- /2-cartpole/2-actor-critic/save_model/ckpt_1157.pth: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/2-actor-critic/save_model/ckpt_1157.pth -------------------------------------------------------------------------------- /2-cartpole/2-actor-critic/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/2-actor-critic/test.py -------------------------------------------------------------------------------- /2-cartpole/2-actor-critic/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/2-actor-critic/train.py -------------------------------------------------------------------------------- /2-cartpole/3-multi-step/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/3-multi-step/memory.py -------------------------------------------------------------------------------- /2-cartpole/3-multi-step/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/3-multi-step/model.py -------------------------------------------------------------------------------- /2-cartpole/3-multi-step/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/3-multi-step/test.py -------------------------------------------------------------------------------- /2-cartpole/3-multi-step/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/2-cartpole/3-multi-step/train.py -------------------------------------------------------------------------------- /3-atari/1-dqn/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/3-atari/1-dqn/memory.py -------------------------------------------------------------------------------- /3-atari/1-dqn/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/3-atari/1-dqn/model.py -------------------------------------------------------------------------------- /3-atari/1-dqn/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/3-atari/1-dqn/test.py -------------------------------------------------------------------------------- /3-atari/1-dqn/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/3-atari/1-dqn/train.py -------------------------------------------------------------------------------- /3-atari/1-dqn/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/3-atari/1-dqn/utils.py -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/reinforcement-learning-kr/reinforcement-learning-pytorch/HEAD/README.md --------------------------------------------------------------------------------