├── .gitignore ├── .idea └── vcs.xml ├── Appendix └── Appendix.ipynb ├── Chapter 1 └── Ch1_Introduction.ipynb ├── Chapter 10 └── Ch10_book.ipynb ├── Chapter 2 └── Ch2_book.ipynb ├── Chapter 3 ├── Ch3_book.ipynb ├── GridBoard.py └── Gridworld.py ├── Chapter 4 └── Ch4_book.ipynb ├── Chapter 5 └── Ch5_book.ipynb ├── Chapter 6 ├── Ch6_book.ipynb ├── MNIST Genetic Algorithm.ipynb ├── String Genetic Algorithm.ipynb ├── buffer.py ├── main.py └── simulator.py ├── Chapter 7 └── Ch7_book.ipynb ├── Chapter 8 ├── Ch8_book.ipynb └── script_8.py ├── Chapter 9 ├── Ch9_book.ipynb └── MAgent │ └── build │ └── render │ └── README.txt ├── Environments ├── GridBoard.py └── Gridworld.py ├── Errata.md ├── Errata ├── Chapter 2.ipynb ├── Chapter 3.ipynb ├── Chapter 4.ipynb ├── Chapter 5.ipynb ├── GridBoard.py └── Gridworld.py ├── LICENSE ├── README.md ├── old_but_more_detailed ├── Cartpole A3C N step.ipynb ├── Cartpole A3C.ipynb ├── Ch10_Relational DRL.ipynb ├── Ch2_N Armed Bandits.ipynb ├── Ch3_DQN.ipynb ├── Ch3_Gridworld.ipynb ├── Ch3_Gridworld_exp.ipynb ├── Ch4_PolicyGradients.ipynb ├── Ch4_PolicyGradients_.ipynb ├── Ch6_Evolutionary.ipynb ├── Ch6_book_dev.ipynb ├── Ch7_DistDQN.ipynb └── Curiosity-Driven Exploration Super Mario.ipynb └── requirements.txt /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/.gitignore -------------------------------------------------------------------------------- /.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/.idea/vcs.xml -------------------------------------------------------------------------------- /Appendix/Appendix.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Appendix/Appendix.ipynb -------------------------------------------------------------------------------- /Chapter 1/Ch1_Introduction.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 1/Ch1_Introduction.ipynb -------------------------------------------------------------------------------- /Chapter 10/Ch10_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 10/Ch10_book.ipynb -------------------------------------------------------------------------------- /Chapter 2/Ch2_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 2/Ch2_book.ipynb -------------------------------------------------------------------------------- /Chapter 3/Ch3_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 3/Ch3_book.ipynb -------------------------------------------------------------------------------- /Chapter 3/GridBoard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 3/GridBoard.py -------------------------------------------------------------------------------- /Chapter 3/Gridworld.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 3/Gridworld.py -------------------------------------------------------------------------------- /Chapter 4/Ch4_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 4/Ch4_book.ipynb -------------------------------------------------------------------------------- /Chapter 5/Ch5_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 5/Ch5_book.ipynb -------------------------------------------------------------------------------- /Chapter 6/Ch6_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 6/Ch6_book.ipynb -------------------------------------------------------------------------------- /Chapter 6/MNIST Genetic Algorithm.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 6/MNIST Genetic Algorithm.ipynb -------------------------------------------------------------------------------- /Chapter 6/String Genetic Algorithm.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 6/String Genetic Algorithm.ipynb -------------------------------------------------------------------------------- /Chapter 6/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 6/buffer.py -------------------------------------------------------------------------------- /Chapter 6/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 6/main.py -------------------------------------------------------------------------------- /Chapter 6/simulator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 6/simulator.py -------------------------------------------------------------------------------- /Chapter 7/Ch7_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 7/Ch7_book.ipynb -------------------------------------------------------------------------------- /Chapter 8/Ch8_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 8/Ch8_book.ipynb -------------------------------------------------------------------------------- /Chapter 8/script_8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 8/script_8.py -------------------------------------------------------------------------------- /Chapter 9/Ch9_book.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 9/Ch9_book.ipynb -------------------------------------------------------------------------------- /Chapter 9/MAgent/build/render/README.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Chapter 9/MAgent/build/render/README.txt -------------------------------------------------------------------------------- /Environments/GridBoard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Environments/GridBoard.py -------------------------------------------------------------------------------- /Environments/Gridworld.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Environments/Gridworld.py -------------------------------------------------------------------------------- /Errata.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Errata.md -------------------------------------------------------------------------------- /Errata/Chapter 2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Errata/Chapter 2.ipynb -------------------------------------------------------------------------------- /Errata/Chapter 3.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Errata/Chapter 3.ipynb -------------------------------------------------------------------------------- /Errata/Chapter 4.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Errata/Chapter 4.ipynb -------------------------------------------------------------------------------- /Errata/Chapter 5.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Errata/Chapter 5.ipynb -------------------------------------------------------------------------------- /Errata/GridBoard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Errata/GridBoard.py -------------------------------------------------------------------------------- /Errata/Gridworld.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/Errata/Gridworld.py -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/README.md -------------------------------------------------------------------------------- /old_but_more_detailed/Cartpole A3C N step.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Cartpole A3C N step.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Cartpole A3C.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Cartpole A3C.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch10_Relational DRL.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch10_Relational DRL.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch2_N Armed Bandits.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch2_N Armed Bandits.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch3_DQN.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch3_DQN.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch3_Gridworld.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch3_Gridworld.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch3_Gridworld_exp.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch3_Gridworld_exp.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch4_PolicyGradients.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch4_PolicyGradients.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch4_PolicyGradients_.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch4_PolicyGradients_.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch6_Evolutionary.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch6_Evolutionary.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch6_book_dev.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch6_book_dev.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Ch7_DistDQN.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Ch7_DistDQN.ipynb -------------------------------------------------------------------------------- /old_but_more_detailed/Curiosity-Driven Exploration Super Mario.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/old_but_more_detailed/Curiosity-Driven Exploration Super Mario.ipynb -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DeepReinforcementLearning/DeepReinforcementLearningInAction/HEAD/requirements.txt --------------------------------------------------------------------------------