├── .gitattributes ├── .idea ├── ReinforceLearning.iml ├── inspectionProfiles │ └── profiles_settings.xml ├── misc.xml ├── modules.xml ├── vcs.xml └── workspace.xml ├── .ipynb_checkpoints └── QTable-checkpoint.ipynb ├── Actor_Critic ├── AC_Pole.py └── AC_continue_Pendulum.py ├── DDPG └── DDPG.py ├── DQLearing ├── Brains │ ├── DQLearning.py │ ├── DQN.py │ ├── DQNTF2.py │ ├── DuelingDQN.py │ ├── Priority_DQN.py │ ├── RL_brain.py │ └── __pycache__ │ │ ├── DQN.cpython-36.pyc │ │ ├── DQN.cpython-37.pyc │ │ ├── DQNTF2.cpython-36.pyc │ │ ├── DQNTF2.cpython-37.pyc │ │ └── DuelingDQN.cpython-36.pyc ├── gym │ ├── CartPole.py │ ├── Mountain_Car.py │ ├── Pendulum.py │ ├── checkpoint │ ├── logs │ │ └── events.out.tfevents.1579495704.DESKTOP-JBV63R4 │ ├── tmp_model.data-00000-of-00001 │ └── tmp_model.index ├── logs │ ├── events.out.tfevents.1578211690.DESKTOP-JBV63R4 │ ├── events.out.tfevents.1578225153.DESKTOP-JBV63R4 │ ├── events.out.tfevents.1578226418.DESKTOP-JBV63R4 │ ├── events.out.tfevents.1578226429.DESKTOP-JBV63R4 │ └── events.out.tfevents.1578228234.DESKTOP-JBV63R4 ├── run_dqn.py └── tkinter │ ├── chessboard.py │ └── maze_env.py ├── PolicyGradient ├── Brain │ ├── PG.py │ └── PolicyGradient.py └── gym │ └── PGCartPole.py └── QTable ├── 五子棋 ├── chessboard.py ├── q_table1.csv ├── q_table2.csv └── train.py └── 走迷宫 ├── RL_brain.py ├── RunQTable.py ├── RunSarsaTable.py ├── SarsaLambda.py ├── SarsaLearning.py └── maze_env.py /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.gitattributes -------------------------------------------------------------------------------- /.idea/ReinforceLearning.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.idea/ReinforceLearning.iml -------------------------------------------------------------------------------- /.idea/inspectionProfiles/profiles_settings.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.idea/inspectionProfiles/profiles_settings.xml -------------------------------------------------------------------------------- /.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.idea/misc.xml -------------------------------------------------------------------------------- /.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.idea/modules.xml -------------------------------------------------------------------------------- /.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.idea/vcs.xml -------------------------------------------------------------------------------- /.idea/workspace.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.idea/workspace.xml -------------------------------------------------------------------------------- /.ipynb_checkpoints/QTable-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/.ipynb_checkpoints/QTable-checkpoint.ipynb -------------------------------------------------------------------------------- /Actor_Critic/AC_Pole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/Actor_Critic/AC_Pole.py -------------------------------------------------------------------------------- /Actor_Critic/AC_continue_Pendulum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/Actor_Critic/AC_continue_Pendulum.py -------------------------------------------------------------------------------- /DDPG/DDPG.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DDPG/DDPG.py -------------------------------------------------------------------------------- /DQLearing/Brains/DQLearning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/DQLearning.py -------------------------------------------------------------------------------- /DQLearing/Brains/DQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/DQN.py -------------------------------------------------------------------------------- /DQLearing/Brains/DQNTF2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/DQNTF2.py -------------------------------------------------------------------------------- /DQLearing/Brains/DuelingDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/DuelingDQN.py -------------------------------------------------------------------------------- /DQLearing/Brains/Priority_DQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/Priority_DQN.py -------------------------------------------------------------------------------- /DQLearing/Brains/RL_brain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/RL_brain.py -------------------------------------------------------------------------------- /DQLearing/Brains/__pycache__/DQN.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/__pycache__/DQN.cpython-36.pyc -------------------------------------------------------------------------------- /DQLearing/Brains/__pycache__/DQN.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/__pycache__/DQN.cpython-37.pyc -------------------------------------------------------------------------------- /DQLearing/Brains/__pycache__/DQNTF2.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/__pycache__/DQNTF2.cpython-36.pyc -------------------------------------------------------------------------------- /DQLearing/Brains/__pycache__/DQNTF2.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/__pycache__/DQNTF2.cpython-37.pyc -------------------------------------------------------------------------------- /DQLearing/Brains/__pycache__/DuelingDQN.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/Brains/__pycache__/DuelingDQN.cpython-36.pyc -------------------------------------------------------------------------------- /DQLearing/gym/CartPole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/gym/CartPole.py -------------------------------------------------------------------------------- /DQLearing/gym/Mountain_Car.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /DQLearing/gym/Pendulum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/gym/Pendulum.py -------------------------------------------------------------------------------- /DQLearing/gym/checkpoint: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/gym/checkpoint -------------------------------------------------------------------------------- /DQLearing/gym/logs/events.out.tfevents.1579495704.DESKTOP-JBV63R4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/gym/logs/events.out.tfevents.1579495704.DESKTOP-JBV63R4 -------------------------------------------------------------------------------- /DQLearing/gym/tmp_model.data-00000-of-00001: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/gym/tmp_model.data-00000-of-00001 -------------------------------------------------------------------------------- /DQLearing/gym/tmp_model.index: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/gym/tmp_model.index -------------------------------------------------------------------------------- /DQLearing/logs/events.out.tfevents.1578211690.DESKTOP-JBV63R4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/logs/events.out.tfevents.1578211690.DESKTOP-JBV63R4 -------------------------------------------------------------------------------- /DQLearing/logs/events.out.tfevents.1578225153.DESKTOP-JBV63R4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/logs/events.out.tfevents.1578225153.DESKTOP-JBV63R4 -------------------------------------------------------------------------------- /DQLearing/logs/events.out.tfevents.1578226418.DESKTOP-JBV63R4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/logs/events.out.tfevents.1578226418.DESKTOP-JBV63R4 -------------------------------------------------------------------------------- /DQLearing/logs/events.out.tfevents.1578226429.DESKTOP-JBV63R4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/logs/events.out.tfevents.1578226429.DESKTOP-JBV63R4 -------------------------------------------------------------------------------- /DQLearing/logs/events.out.tfevents.1578228234.DESKTOP-JBV63R4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/logs/events.out.tfevents.1578228234.DESKTOP-JBV63R4 -------------------------------------------------------------------------------- /DQLearing/run_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/run_dqn.py -------------------------------------------------------------------------------- /DQLearing/tkinter/chessboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/tkinter/chessboard.py -------------------------------------------------------------------------------- /DQLearing/tkinter/maze_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/DQLearing/tkinter/maze_env.py -------------------------------------------------------------------------------- /PolicyGradient/Brain/PG.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/PolicyGradient/Brain/PG.py -------------------------------------------------------------------------------- /PolicyGradient/Brain/PolicyGradient.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/PolicyGradient/Brain/PolicyGradient.py -------------------------------------------------------------------------------- /PolicyGradient/gym/PGCartPole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/PolicyGradient/gym/PGCartPole.py -------------------------------------------------------------------------------- /QTable/五子棋/chessboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/五子棋/chessboard.py -------------------------------------------------------------------------------- /QTable/五子棋/q_table1.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/五子棋/q_table1.csv -------------------------------------------------------------------------------- /QTable/五子棋/q_table2.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/五子棋/q_table2.csv -------------------------------------------------------------------------------- /QTable/五子棋/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/五子棋/train.py -------------------------------------------------------------------------------- /QTable/走迷宫/RL_brain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/走迷宫/RL_brain.py -------------------------------------------------------------------------------- /QTable/走迷宫/RunQTable.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/走迷宫/RunQTable.py -------------------------------------------------------------------------------- /QTable/走迷宫/RunSarsaTable.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/走迷宫/RunSarsaTable.py -------------------------------------------------------------------------------- /QTable/走迷宫/SarsaLambda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/走迷宫/SarsaLambda.py -------------------------------------------------------------------------------- /QTable/走迷宫/SarsaLearning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/走迷宫/SarsaLearning.py -------------------------------------------------------------------------------- /QTable/走迷宫/maze_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/belowthetree/ReinforceLearning/HEAD/QTable/走迷宫/maze_env.py --------------------------------------------------------------------------------