├── .gitignore ├── README.md ├── dqn ├── LICENSE ├── NeuralQLearner.lua ├── NeuralQLearnerB.lua ├── Rectifier.lua ├── Scale.lua ├── TransitionTable.lua ├── convnet.lua ├── convnet_atari3.lua ├── extract_data.lua ├── initenv.lua ├── msleep.c ├── net_downsample_2x_full_y.lua ├── nnutils.lua ├── plot_results.lua ├── test_2agent.lua ├── test_agent.lua ├── train_2agent.lua └── train_agent.lua ├── extract_data ├── install_dependencies.sh ├── plot_2results ├── plot_results ├── plots ├── Pong2Player.csv ├── Pong2Player0.csv ├── Pong2Player025.csv ├── Pong2Player025_average_reward.png ├── Pong2Player025_episode_counts.png ├── Pong2Player025_history_A.csv ├── Pong2Player025_history_B.csv ├── Pong2Player025_meanq.png ├── Pong2Player025_reward_counts.png ├── Pong2Player025_tderror.png ├── Pong2Player025_time.png ├── Pong2Player025p.csv ├── Pong2Player025p_average_reward.png ├── Pong2Player025p_episode_counts.png ├── Pong2Player025p_history_A.csv ├── Pong2Player025p_history_B.csv ├── Pong2Player025p_meanq.png ├── Pong2Player025p_reward_counts.png ├── Pong2Player025p_tderror.png ├── Pong2Player025p_time.png ├── Pong2Player05.csv ├── Pong2Player05_average_reward.png ├── Pong2Player05_episode_counts.png ├── Pong2Player05_history_A.csv ├── Pong2Player05_history_B.csv ├── Pong2Player05_meanq.png ├── Pong2Player05_reward_counts.png ├── Pong2Player05_tderror.png ├── Pong2Player05_time.png ├── Pong2Player05p.csv ├── Pong2Player05p_average_reward.png ├── Pong2Player05p_episode_counts.png ├── Pong2Player05p_history_A.csv ├── Pong2Player05p_history_B.csv ├── Pong2Player05p_meanq.png ├── Pong2Player05p_reward_counts.png ├── Pong2Player05p_tderror.png ├── Pong2Player05p_time.png ├── Pong2Player075.csv ├── Pong2Player075_average_reward.png ├── Pong2Player075_episode_counts.png ├── Pong2Player075_history_A.csv ├── Pong2Player075_history_B.csv ├── Pong2Player075_meanq.png ├── Pong2Player075_reward_counts.png ├── Pong2Player075_tderror.png ├── Pong2Player075_time.png ├── Pong2Player075p.csv ├── Pong2Player075p_average_reward.png ├── Pong2Player075p_episode_counts.png ├── Pong2Player075p_history_A.csv ├── Pong2Player075p_history_B.csv ├── Pong2Player075p_meanq.png ├── Pong2Player075p_reward_counts.png ├── Pong2Player075p_tderror.png ├── Pong2Player075p_time.png ├── Pong2Player0_average_reward.png ├── Pong2Player0_episode_counts.png ├── Pong2Player0_history_A.csv ├── Pong2Player0_history_B.csv ├── Pong2Player0_meanq.png ├── Pong2Player0_reward_counts.png ├── Pong2Player0_tderror.png ├── Pong2Player0_time.png ├── Pong2PlayerVS.csv ├── Pong2PlayerVS_average_reward.png ├── Pong2PlayerVS_episode_counts.png ├── Pong2PlayerVS_history_A.csv ├── Pong2PlayerVS_history_B.csv ├── Pong2PlayerVS_meanq.png ├── Pong2PlayerVS_reward_counts.png ├── Pong2PlayerVS_tderror.png ├── Pong2PlayerVS_time.png ├── Pong2Player_average_reward.png ├── Pong2Player_episode_counts.png ├── Pong2Player_history_A.csv ├── Pong2Player_history_B.csv ├── Pong2Player_meanq.png ├── Pong2Player_reward_counts.png ├── Pong2Player_tderror.png ├── Pong2Player_time.png ├── plot.py ├── plot_history.py ├── scatter.py ├── serving_time_history.png ├── serving_time_history_competitive.png ├── serving_time_history_cooperative.png ├── serving_time_per_point.png ├── serving_time_per_point_scatter.png ├── sidebounces_history.png ├── sidebounces_history_competitive.png ├── sidebounces_history_cooperative.png ├── sidebounces_per_point.png ├── sidebounces_per_point_scatter.png ├── stats.tex ├── table.py ├── wallbounces_history.png ├── wallbounces_history_competitive.png ├── wallbounces_history_cooperative.png ├── wallbounces_per_sidebounce.png └── wallbounces_per_sidebounce_scatter.png ├── roms ├── Pong2Player.bin ├── Pong2Player0.bin ├── Pong2Player025.bin ├── Pong2Player025p.bin ├── Pong2Player05.bin ├── Pong2Player05p.bin ├── Pong2Player075.bin ├── Pong2Player075p.bin ├── Pong2PlayerVS.bin ├── README ├── breakout.bin ├── breakout_2player.bin ├── pong.bin ├── surround.bin ├── wizard_of_wor.bin └── wizard_of_wor_2player.bin ├── run_cpu ├── run_gpu ├── run_gpu2 ├── run_gpu2_resume ├── test_cpu ├── test_gpu ├── test_gpu2 ├── test_gpu2_seeds ├── test_gpu2_versions └── test_schemes /.gitignore: -------------------------------------------------------------------------------- 1 | *~ 2 | torch 3 | dqn/*.t7 4 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/README.md -------------------------------------------------------------------------------- /dqn/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/LICENSE -------------------------------------------------------------------------------- /dqn/NeuralQLearner.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/NeuralQLearner.lua -------------------------------------------------------------------------------- /dqn/NeuralQLearnerB.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/NeuralQLearnerB.lua -------------------------------------------------------------------------------- /dqn/Rectifier.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/Rectifier.lua -------------------------------------------------------------------------------- /dqn/Scale.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/Scale.lua -------------------------------------------------------------------------------- /dqn/TransitionTable.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/TransitionTable.lua -------------------------------------------------------------------------------- /dqn/convnet.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/convnet.lua -------------------------------------------------------------------------------- /dqn/convnet_atari3.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/convnet_atari3.lua -------------------------------------------------------------------------------- /dqn/extract_data.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/extract_data.lua -------------------------------------------------------------------------------- /dqn/initenv.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/initenv.lua -------------------------------------------------------------------------------- /dqn/msleep.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/msleep.c -------------------------------------------------------------------------------- /dqn/net_downsample_2x_full_y.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/net_downsample_2x_full_y.lua -------------------------------------------------------------------------------- /dqn/nnutils.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/nnutils.lua -------------------------------------------------------------------------------- /dqn/plot_results.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/plot_results.lua -------------------------------------------------------------------------------- /dqn/test_2agent.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/test_2agent.lua -------------------------------------------------------------------------------- /dqn/test_agent.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/test_agent.lua -------------------------------------------------------------------------------- /dqn/train_2agent.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/train_2agent.lua -------------------------------------------------------------------------------- /dqn/train_agent.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/dqn/train_agent.lua -------------------------------------------------------------------------------- /extract_data: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/extract_data -------------------------------------------------------------------------------- /install_dependencies.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/install_dependencies.sh -------------------------------------------------------------------------------- /plot_2results: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plot_2results -------------------------------------------------------------------------------- /plot_results: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plot_results -------------------------------------------------------------------------------- /plots/Pong2Player.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player.csv -------------------------------------------------------------------------------- /plots/Pong2Player0.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0.csv -------------------------------------------------------------------------------- /plots/Pong2Player025.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025.csv -------------------------------------------------------------------------------- /plots/Pong2Player025_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player025_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player025_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player025_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player025_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player025_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player025_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player025_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025_time.png -------------------------------------------------------------------------------- /plots/Pong2Player025p.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p.csv -------------------------------------------------------------------------------- /plots/Pong2Player025p_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player025p_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player025p_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player025p_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player025p_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player025p_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player025p_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player025p_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player025p_time.png -------------------------------------------------------------------------------- /plots/Pong2Player05.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05.csv -------------------------------------------------------------------------------- /plots/Pong2Player05_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player05_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player05_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player05_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player05_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player05_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player05_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player05_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05_time.png -------------------------------------------------------------------------------- /plots/Pong2Player05p.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p.csv -------------------------------------------------------------------------------- /plots/Pong2Player05p_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player05p_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player05p_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player05p_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player05p_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player05p_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player05p_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player05p_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player05p_time.png -------------------------------------------------------------------------------- /plots/Pong2Player075.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075.csv -------------------------------------------------------------------------------- /plots/Pong2Player075_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player075_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player075_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player075_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player075_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player075_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player075_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player075_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075_time.png -------------------------------------------------------------------------------- /plots/Pong2Player075p.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p.csv -------------------------------------------------------------------------------- /plots/Pong2Player075p_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player075p_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player075p_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player075p_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player075p_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player075p_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player075p_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player075p_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player075p_time.png -------------------------------------------------------------------------------- /plots/Pong2Player0_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player0_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player0_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player0_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player0_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player0_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player0_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player0_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player0_time.png -------------------------------------------------------------------------------- /plots/Pong2PlayerVS.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS.csv -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_meanq.png -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_tderror.png -------------------------------------------------------------------------------- /plots/Pong2PlayerVS_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2PlayerVS_time.png -------------------------------------------------------------------------------- /plots/Pong2Player_average_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_average_reward.png -------------------------------------------------------------------------------- /plots/Pong2Player_episode_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_episode_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player_history_A.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_history_A.csv -------------------------------------------------------------------------------- /plots/Pong2Player_history_B.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_history_B.csv -------------------------------------------------------------------------------- /plots/Pong2Player_meanq.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_meanq.png -------------------------------------------------------------------------------- /plots/Pong2Player_reward_counts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_reward_counts.png -------------------------------------------------------------------------------- /plots/Pong2Player_tderror.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_tderror.png -------------------------------------------------------------------------------- /plots/Pong2Player_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/Pong2Player_time.png -------------------------------------------------------------------------------- /plots/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/plot.py -------------------------------------------------------------------------------- /plots/plot_history.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/plot_history.py -------------------------------------------------------------------------------- /plots/scatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/scatter.py -------------------------------------------------------------------------------- /plots/serving_time_history.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/serving_time_history.png -------------------------------------------------------------------------------- /plots/serving_time_history_competitive.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/serving_time_history_competitive.png -------------------------------------------------------------------------------- /plots/serving_time_history_cooperative.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/serving_time_history_cooperative.png -------------------------------------------------------------------------------- /plots/serving_time_per_point.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/serving_time_per_point.png -------------------------------------------------------------------------------- /plots/serving_time_per_point_scatter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/serving_time_per_point_scatter.png -------------------------------------------------------------------------------- /plots/sidebounces_history.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/sidebounces_history.png -------------------------------------------------------------------------------- /plots/sidebounces_history_competitive.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/sidebounces_history_competitive.png -------------------------------------------------------------------------------- /plots/sidebounces_history_cooperative.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/sidebounces_history_cooperative.png -------------------------------------------------------------------------------- /plots/sidebounces_per_point.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/sidebounces_per_point.png -------------------------------------------------------------------------------- /plots/sidebounces_per_point_scatter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/sidebounces_per_point_scatter.png -------------------------------------------------------------------------------- /plots/stats.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/stats.tex -------------------------------------------------------------------------------- /plots/table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/table.py -------------------------------------------------------------------------------- /plots/wallbounces_history.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/wallbounces_history.png -------------------------------------------------------------------------------- /plots/wallbounces_history_competitive.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/wallbounces_history_competitive.png -------------------------------------------------------------------------------- /plots/wallbounces_history_cooperative.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/wallbounces_history_cooperative.png -------------------------------------------------------------------------------- /plots/wallbounces_per_sidebounce.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/wallbounces_per_sidebounce.png -------------------------------------------------------------------------------- /plots/wallbounces_per_sidebounce_scatter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/plots/wallbounces_per_sidebounce_scatter.png -------------------------------------------------------------------------------- /roms/Pong2Player.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2Player0.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2Player025.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2Player025p.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2Player05.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2Player05p.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2Player075.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2Player075p.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/Pong2PlayerVS.bin: -------------------------------------------------------------------------------- 1 | pong.bin -------------------------------------------------------------------------------- /roms/README: -------------------------------------------------------------------------------- 1 | Rom files should be put in this directory 2 | -------------------------------------------------------------------------------- /roms/breakout.bin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/roms/breakout.bin -------------------------------------------------------------------------------- /roms/breakout_2player.bin: -------------------------------------------------------------------------------- 1 | breakout.bin -------------------------------------------------------------------------------- /roms/pong.bin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/roms/pong.bin -------------------------------------------------------------------------------- /roms/surround.bin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/roms/surround.bin -------------------------------------------------------------------------------- /roms/wizard_of_wor.bin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/roms/wizard_of_wor.bin -------------------------------------------------------------------------------- /roms/wizard_of_wor_2player.bin: -------------------------------------------------------------------------------- 1 | wizard_of_wor.bin -------------------------------------------------------------------------------- /run_cpu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/run_cpu -------------------------------------------------------------------------------- /run_gpu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/run_gpu -------------------------------------------------------------------------------- /run_gpu2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/run_gpu2 -------------------------------------------------------------------------------- /run_gpu2_resume: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/run_gpu2_resume -------------------------------------------------------------------------------- /test_cpu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/test_cpu -------------------------------------------------------------------------------- /test_gpu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/test_gpu -------------------------------------------------------------------------------- /test_gpu2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/test_gpu2 -------------------------------------------------------------------------------- /test_gpu2_seeds: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/test_gpu2_seeds -------------------------------------------------------------------------------- /test_gpu2_versions: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/test_gpu2_versions -------------------------------------------------------------------------------- /test_schemes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NeuroCSUT/DeepMind-Atari-Deep-Q-Learner-2Player/HEAD/test_schemes --------------------------------------------------------------------------------