├── .gitignore ├── LICENSE ├── README.md ├── algo ├── __init__.py ├── a2c_acktr.py ├── kfac.py ├── ppo.py └── sil.py ├── arguments.py ├── distributions.py ├── enjoy.py ├── envs ├── __init__.py ├── make_env.py └── pommerman.py ├── helpers ├── README.md ├── __init__.py ├── atari_wrappers.py ├── benchmarks.py ├── cg.py ├── cmd_util.py ├── console_util.py ├── filters.py ├── identity_env.py ├── logger.py ├── math_util.py ├── misc_util.py ├── monitor.py ├── results_plotter.py ├── retro_wrappers.py ├── running_mean_std.py ├── running_stat.py ├── segment_tree.py ├── tile_images.py └── vec_env │ ├── __init__.py │ ├── dummy_vec_env.py │ ├── shmem_vec_env.py │ ├── subproc_vec_env.py │ ├── test_vec_env.py │ ├── util.py │ ├── vec_frame_stack.py │ ├── vec_monitor.py │ └── vec_normalize.py ├── imgs ├── a2c_beamrider.png ├── a2c_breakout.png ├── a2c_qbert.png ├── a2c_seaquest.png ├── acktr_beamrider.png ├── acktr_breakout.png ├── acktr_qbert.png ├── acktr_seaquest.png ├── ppo_halfcheetah.png ├── ppo_hopper.png ├── ppo_reacher.png └── ppo_walker.png ├── main.py ├── models ├── __init__.py ├── factory.py ├── model_generic.py ├── model_pomm.py └── policy.py ├── replay_storage.py ├── requirements.txt ├── results └── training-conv4-FFA.jpg ├── rollout_storage.py ├── utils.py └── visualize.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/README.md -------------------------------------------------------------------------------- /algo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/algo/__init__.py -------------------------------------------------------------------------------- /algo/a2c_acktr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/algo/a2c_acktr.py -------------------------------------------------------------------------------- /algo/kfac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/algo/kfac.py -------------------------------------------------------------------------------- /algo/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/algo/ppo.py -------------------------------------------------------------------------------- /algo/sil.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/algo/sil.py -------------------------------------------------------------------------------- /arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/arguments.py -------------------------------------------------------------------------------- /distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/distributions.py -------------------------------------------------------------------------------- /enjoy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/enjoy.py -------------------------------------------------------------------------------- /envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/envs/__init__.py -------------------------------------------------------------------------------- /envs/make_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/envs/make_env.py -------------------------------------------------------------------------------- /envs/pommerman.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/envs/pommerman.py -------------------------------------------------------------------------------- /helpers/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/README.md -------------------------------------------------------------------------------- /helpers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /helpers/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/atari_wrappers.py -------------------------------------------------------------------------------- /helpers/benchmarks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/benchmarks.py -------------------------------------------------------------------------------- /helpers/cg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/cg.py -------------------------------------------------------------------------------- /helpers/cmd_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/cmd_util.py -------------------------------------------------------------------------------- /helpers/console_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/console_util.py -------------------------------------------------------------------------------- /helpers/filters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/filters.py -------------------------------------------------------------------------------- /helpers/identity_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/identity_env.py -------------------------------------------------------------------------------- /helpers/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/logger.py -------------------------------------------------------------------------------- /helpers/math_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/math_util.py -------------------------------------------------------------------------------- /helpers/misc_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/misc_util.py -------------------------------------------------------------------------------- /helpers/monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/monitor.py -------------------------------------------------------------------------------- /helpers/results_plotter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/results_plotter.py -------------------------------------------------------------------------------- /helpers/retro_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/retro_wrappers.py -------------------------------------------------------------------------------- /helpers/running_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/running_mean_std.py -------------------------------------------------------------------------------- /helpers/running_stat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/running_stat.py -------------------------------------------------------------------------------- /helpers/segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/segment_tree.py -------------------------------------------------------------------------------- /helpers/tile_images.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/tile_images.py -------------------------------------------------------------------------------- /helpers/vec_env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/__init__.py -------------------------------------------------------------------------------- /helpers/vec_env/dummy_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/dummy_vec_env.py -------------------------------------------------------------------------------- /helpers/vec_env/shmem_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/shmem_vec_env.py -------------------------------------------------------------------------------- /helpers/vec_env/subproc_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/subproc_vec_env.py -------------------------------------------------------------------------------- /helpers/vec_env/test_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/test_vec_env.py -------------------------------------------------------------------------------- /helpers/vec_env/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/util.py -------------------------------------------------------------------------------- /helpers/vec_env/vec_frame_stack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/vec_frame_stack.py -------------------------------------------------------------------------------- /helpers/vec_env/vec_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/vec_monitor.py -------------------------------------------------------------------------------- /helpers/vec_env/vec_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/helpers/vec_env/vec_normalize.py -------------------------------------------------------------------------------- /imgs/a2c_beamrider.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/a2c_beamrider.png -------------------------------------------------------------------------------- /imgs/a2c_breakout.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/a2c_breakout.png -------------------------------------------------------------------------------- /imgs/a2c_qbert.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/a2c_qbert.png -------------------------------------------------------------------------------- /imgs/a2c_seaquest.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/a2c_seaquest.png -------------------------------------------------------------------------------- /imgs/acktr_beamrider.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/acktr_beamrider.png -------------------------------------------------------------------------------- /imgs/acktr_breakout.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/acktr_breakout.png -------------------------------------------------------------------------------- /imgs/acktr_qbert.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/acktr_qbert.png -------------------------------------------------------------------------------- /imgs/acktr_seaquest.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/acktr_seaquest.png -------------------------------------------------------------------------------- /imgs/ppo_halfcheetah.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/ppo_halfcheetah.png -------------------------------------------------------------------------------- /imgs/ppo_hopper.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/ppo_hopper.png -------------------------------------------------------------------------------- /imgs/ppo_reacher.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/ppo_reacher.png -------------------------------------------------------------------------------- /imgs/ppo_walker.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/imgs/ppo_walker.png -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/main.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- 1 | from .factory import create_policy -------------------------------------------------------------------------------- /models/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/models/factory.py -------------------------------------------------------------------------------- /models/model_generic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/models/model_generic.py -------------------------------------------------------------------------------- /models/model_pomm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/models/model_pomm.py -------------------------------------------------------------------------------- /models/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/models/policy.py -------------------------------------------------------------------------------- /replay_storage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/replay_storage.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | gym 2 | matplotlib 3 | pybullet 4 | -------------------------------------------------------------------------------- /results/training-conv4-FFA.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/results/training-conv4-FFA.jpg -------------------------------------------------------------------------------- /rollout_storage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/rollout_storage.py -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/utils.py -------------------------------------------------------------------------------- /visualize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rwightman/pytorch-pommerman-rl/HEAD/visualize.py --------------------------------------------------------------------------------