├── LICENSE ├── README.md ├── a3c ├── README.md ├── play.py ├── resources │ ├── average-scores.png │ └── sample-game.gif ├── sample-weights │ └── model-Breakout-v0-91750000.h5 └── train.py ├── q-learning-1-step ├── README.md ├── play.py ├── resources │ ├── after-12h-training.gif │ ├── after-18h-training.gif │ └── after-6h-training.gif ├── sample-weights │ ├── model-12h.h5 │ ├── model-18h.h5 │ └── model-6h.h5 └── train.py └── q-learning-n-step ├── README.md ├── play.py └── train.py /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/README.md -------------------------------------------------------------------------------- /a3c/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/a3c/README.md -------------------------------------------------------------------------------- /a3c/play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/a3c/play.py -------------------------------------------------------------------------------- /a3c/resources/average-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/a3c/resources/average-scores.png -------------------------------------------------------------------------------- /a3c/resources/sample-game.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/a3c/resources/sample-game.gif -------------------------------------------------------------------------------- /a3c/sample-weights/model-Breakout-v0-91750000.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/a3c/sample-weights/model-Breakout-v0-91750000.h5 -------------------------------------------------------------------------------- /a3c/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/a3c/train.py -------------------------------------------------------------------------------- /q-learning-1-step/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/README.md -------------------------------------------------------------------------------- /q-learning-1-step/play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/play.py -------------------------------------------------------------------------------- /q-learning-1-step/resources/after-12h-training.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/resources/after-12h-training.gif -------------------------------------------------------------------------------- /q-learning-1-step/resources/after-18h-training.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/resources/after-18h-training.gif -------------------------------------------------------------------------------- /q-learning-1-step/resources/after-6h-training.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/resources/after-6h-training.gif -------------------------------------------------------------------------------- /q-learning-1-step/sample-weights/model-12h.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/sample-weights/model-12h.h5 -------------------------------------------------------------------------------- /q-learning-1-step/sample-weights/model-18h.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/sample-weights/model-18h.h5 -------------------------------------------------------------------------------- /q-learning-1-step/sample-weights/model-6h.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/sample-weights/model-6h.h5 -------------------------------------------------------------------------------- /q-learning-1-step/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-1-step/train.py -------------------------------------------------------------------------------- /q-learning-n-step/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-n-step/README.md -------------------------------------------------------------------------------- /q-learning-n-step/play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-n-step/play.py -------------------------------------------------------------------------------- /q-learning-n-step/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Grzego/async-rl/HEAD/q-learning-n-step/train.py --------------------------------------------------------------------------------