├── .idea ├── A-introduction-to-reinforcement-learning.iml ├── misc.xml ├── modules.xml ├── vcs.xml └── workspace.xml ├── README.md ├── RLF ├── DDPG.py ├── DQN.py ├── DQN.pyc ├── Dyna_Q.py ├── MC_ON-POLICY_RACETRACK.png ├── Q-LEARNING_RACETRACK.png ├── Q_A.md ├── SARSA_RACETRACK.png ├── SARSA_lambda_RACETRACK.png ├── TEST.py ├── dp.py ├── env.py ├── env.pyc ├── main.py ├── monte_carlo.py ├── monte_carlo.pyc ├── naive_Q_lambda_RACETRACK.png ├── result_analysis.py ├── result_analysis.pyc ├── td.py ├── td.pyc ├── td_lambda.py └── td_lambda.pyc ├── chapter4 ├── Jack’s_Car_Rental.py └── The_Gambler.py ├── chapter5 ├── Q_A.md ├── Racetrack.py ├── Racetrack_result_1.png ├── Racetrack_result_2.png └── tmp_data.txt ├── chapter6 ├── Q-LEARNING_RACETRACK.png ├── SARSA_RACETRACK.png └── td.py ├── chapter7 ├── SARSA_lambda_RACETRACK.png ├── naive_Q_lambda_RACETRACK.png └── td_lambda.py ├── chapter8 └── Dyna_Q.py └── papers ├── A3C.pdf ├── DDPG.pdf ├── DPG.pdf ├── DQN.pdf ├── DRL_simulated_Auto_Vehicle.pdf ├── TRPO.pdf ├── bookdraft2017june19.pdf └── crossing.pdf /.idea/A-introduction-to-reinforcement-learning.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/.idea/A-introduction-to-reinforcement-learning.iml -------------------------------------------------------------------------------- /.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/.idea/misc.xml -------------------------------------------------------------------------------- /.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/.idea/modules.xml -------------------------------------------------------------------------------- /.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/.idea/vcs.xml -------------------------------------------------------------------------------- /.idea/workspace.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/.idea/workspace.xml -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/README.md -------------------------------------------------------------------------------- /RLF/DDPG.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/DDPG.py -------------------------------------------------------------------------------- /RLF/DQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/DQN.py -------------------------------------------------------------------------------- /RLF/DQN.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/DQN.pyc -------------------------------------------------------------------------------- /RLF/Dyna_Q.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/Dyna_Q.py -------------------------------------------------------------------------------- /RLF/MC_ON-POLICY_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/MC_ON-POLICY_RACETRACK.png -------------------------------------------------------------------------------- /RLF/Q-LEARNING_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/Q-LEARNING_RACETRACK.png -------------------------------------------------------------------------------- /RLF/Q_A.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/Q_A.md -------------------------------------------------------------------------------- /RLF/SARSA_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/SARSA_RACETRACK.png -------------------------------------------------------------------------------- /RLF/SARSA_lambda_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/SARSA_lambda_RACETRACK.png -------------------------------------------------------------------------------- /RLF/TEST.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/TEST.py -------------------------------------------------------------------------------- /RLF/dp.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RLF/env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/env.py -------------------------------------------------------------------------------- /RLF/env.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/env.pyc -------------------------------------------------------------------------------- /RLF/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/main.py -------------------------------------------------------------------------------- /RLF/monte_carlo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/monte_carlo.py -------------------------------------------------------------------------------- /RLF/monte_carlo.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/monte_carlo.pyc -------------------------------------------------------------------------------- /RLF/naive_Q_lambda_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/naive_Q_lambda_RACETRACK.png -------------------------------------------------------------------------------- /RLF/result_analysis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/result_analysis.py -------------------------------------------------------------------------------- /RLF/result_analysis.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/result_analysis.pyc -------------------------------------------------------------------------------- /RLF/td.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/td.py -------------------------------------------------------------------------------- /RLF/td.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/td.pyc -------------------------------------------------------------------------------- /RLF/td_lambda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/td_lambda.py -------------------------------------------------------------------------------- /RLF/td_lambda.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/RLF/td_lambda.pyc -------------------------------------------------------------------------------- /chapter4/Jack’s_Car_Rental.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter4/Jack’s_Car_Rental.py -------------------------------------------------------------------------------- /chapter4/The_Gambler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter4/The_Gambler.py -------------------------------------------------------------------------------- /chapter5/Q_A.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter5/Q_A.md -------------------------------------------------------------------------------- /chapter5/Racetrack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter5/Racetrack.py -------------------------------------------------------------------------------- /chapter5/Racetrack_result_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter5/Racetrack_result_1.png -------------------------------------------------------------------------------- /chapter5/Racetrack_result_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter5/Racetrack_result_2.png -------------------------------------------------------------------------------- /chapter5/tmp_data.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /chapter6/Q-LEARNING_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter6/Q-LEARNING_RACETRACK.png -------------------------------------------------------------------------------- /chapter6/SARSA_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter6/SARSA_RACETRACK.png -------------------------------------------------------------------------------- /chapter6/td.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter6/td.py -------------------------------------------------------------------------------- /chapter7/SARSA_lambda_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter7/SARSA_lambda_RACETRACK.png -------------------------------------------------------------------------------- /chapter7/naive_Q_lambda_RACETRACK.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter7/naive_Q_lambda_RACETRACK.png -------------------------------------------------------------------------------- /chapter7/td_lambda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter7/td_lambda.py -------------------------------------------------------------------------------- /chapter8/Dyna_Q.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/chapter8/Dyna_Q.py -------------------------------------------------------------------------------- /papers/A3C.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/A3C.pdf -------------------------------------------------------------------------------- /papers/DDPG.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/DDPG.pdf -------------------------------------------------------------------------------- /papers/DPG.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/DPG.pdf -------------------------------------------------------------------------------- /papers/DQN.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/DQN.pdf -------------------------------------------------------------------------------- /papers/DRL_simulated_Auto_Vehicle.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/DRL_simulated_Auto_Vehicle.pdf -------------------------------------------------------------------------------- /papers/TRPO.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/TRPO.pdf -------------------------------------------------------------------------------- /papers/bookdraft2017june19.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/bookdraft2017june19.pdf -------------------------------------------------------------------------------- /papers/crossing.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xubo92/an-introduction-to-reinforcement-learning/HEAD/papers/crossing.pdf --------------------------------------------------------------------------------