├── .circleci └── config.yml ├── .gitignore ├── Pipfile ├── Pipfile.lock ├── README.md ├── debug_wrappers.py ├── env.py ├── images ├── Beamrider.gif ├── Breakout.gif ├── Pong.gif ├── Qbert.gif ├── SpaceInvaders.gif ├── actions.png ├── all_scores_graph.png ├── all_scores_paper.png ├── pong_scores_graph.png ├── pong_scores_paper.png ├── pong_scores_tb.png ├── preprocessing_play.gif ├── returns.png ├── step1.png ├── step2.png ├── step3.png ├── step4.png ├── step5.png ├── step6.png ├── step6_2.png └── train_batch.png ├── multi_scope_train_op.py ├── network.py ├── params.py ├── preprocessing.py ├── run_checkpoint.py ├── tests ├── multi_scope_train_op_test.py ├── network_test.py ├── preprocessing_play.py ├── preprocessing_test.py ├── shared_statistics_test.py ├── show_debug_data.py ├── train_test.py └── utils_test.py ├── train.py ├── utils.py ├── utils_tensorflow.py └── worker.py /.circleci/config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/.circleci/config.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/.gitignore -------------------------------------------------------------------------------- /Pipfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/Pipfile -------------------------------------------------------------------------------- /Pipfile.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/Pipfile.lock -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/README.md -------------------------------------------------------------------------------- /debug_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/debug_wrappers.py -------------------------------------------------------------------------------- /env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/env.py -------------------------------------------------------------------------------- /images/Beamrider.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/Beamrider.gif -------------------------------------------------------------------------------- /images/Breakout.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/Breakout.gif -------------------------------------------------------------------------------- /images/Pong.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/Pong.gif -------------------------------------------------------------------------------- /images/Qbert.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/Qbert.gif -------------------------------------------------------------------------------- /images/SpaceInvaders.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/SpaceInvaders.gif -------------------------------------------------------------------------------- /images/actions.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/actions.png -------------------------------------------------------------------------------- /images/all_scores_graph.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/all_scores_graph.png -------------------------------------------------------------------------------- /images/all_scores_paper.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/all_scores_paper.png -------------------------------------------------------------------------------- /images/pong_scores_graph.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/pong_scores_graph.png -------------------------------------------------------------------------------- /images/pong_scores_paper.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/pong_scores_paper.png -------------------------------------------------------------------------------- /images/pong_scores_tb.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/pong_scores_tb.png -------------------------------------------------------------------------------- /images/preprocessing_play.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/preprocessing_play.gif -------------------------------------------------------------------------------- /images/returns.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/returns.png -------------------------------------------------------------------------------- /images/step1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/step1.png -------------------------------------------------------------------------------- /images/step2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/step2.png -------------------------------------------------------------------------------- /images/step3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/step3.png -------------------------------------------------------------------------------- /images/step4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/step4.png -------------------------------------------------------------------------------- /images/step5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/step5.png -------------------------------------------------------------------------------- /images/step6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/step6.png -------------------------------------------------------------------------------- /images/step6_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/step6_2.png -------------------------------------------------------------------------------- /images/train_batch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/images/train_batch.png -------------------------------------------------------------------------------- /multi_scope_train_op.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/multi_scope_train_op.py -------------------------------------------------------------------------------- /network.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/network.py -------------------------------------------------------------------------------- /params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/params.py -------------------------------------------------------------------------------- /preprocessing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/preprocessing.py -------------------------------------------------------------------------------- /run_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/run_checkpoint.py -------------------------------------------------------------------------------- /tests/multi_scope_train_op_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/multi_scope_train_op_test.py -------------------------------------------------------------------------------- /tests/network_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/network_test.py -------------------------------------------------------------------------------- /tests/preprocessing_play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/preprocessing_play.py -------------------------------------------------------------------------------- /tests/preprocessing_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/preprocessing_test.py -------------------------------------------------------------------------------- /tests/shared_statistics_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/shared_statistics_test.py -------------------------------------------------------------------------------- /tests/show_debug_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/show_debug_data.py -------------------------------------------------------------------------------- /tests/train_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/train_test.py -------------------------------------------------------------------------------- /tests/utils_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/tests/utils_test.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/train.py -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/utils.py -------------------------------------------------------------------------------- /utils_tensorflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/utils_tensorflow.py -------------------------------------------------------------------------------- /worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrahtz/ocd-a3c/HEAD/worker.py --------------------------------------------------------------------------------