├── .dockerignore ├── .gitattributes ├── .github └── workflows │ ├── docker.yml │ └── pythonpublish.yml ├── .gitignore ├── .travis.yml ├── Dockerfile ├── LICENSE ├── README.md ├── agnes ├── __init__.py ├── algos │ ├── __init__.py │ ├── a2c.py │ ├── base.py │ ├── configs │ │ ├── __init__.py │ │ ├── a2c_config.py │ │ └── ppo_config.py │ ├── ppo.py │ └── ppo_rnd.py ├── common │ ├── __init__.py │ ├── distributions.py │ ├── env_maker.py │ ├── envs_prep │ │ ├── __init__.py │ │ ├── atari_wrappers.py │ │ ├── dummy_vec_env.py │ │ ├── monitor.py │ │ ├── subproc_vec_env.py │ │ ├── tile_images.py │ │ ├── util.py │ │ ├── vec_env.py │ │ ├── vec_frame_stack.py │ │ ├── vec_normalize.py │ │ └── wrappers.py │ ├── init_weights.py │ ├── logger.py │ ├── make_nn.py │ ├── play.py │ ├── plotter.py │ ├── rnd_networks.py │ ├── running_mean_std.py │ ├── schedules.py │ └── tests │ │ ├── CNN_Discrete.py │ │ ├── MLP_Continuous.py │ │ ├── MLP_Discrete.py │ │ ├── MLP_Discrete_Competitive.py │ │ ├── MPI_MLP_Discrete.py │ │ ├── MPI_runner.py │ │ ├── RNN_Discrete.py │ │ └── __init__.py ├── nns │ ├── __init__.py │ ├── base.py │ ├── cnn.py │ ├── initializer.py │ ├── mlp.py │ └── rnn.py └── runners │ ├── __init__.py │ ├── base_runner.py │ ├── competitive_single.py │ ├── distributed_mpi.py │ └── single.py ├── examples ├── algo_example.py ├── atari_example.py ├── atari_rnn_example.py ├── classic_example.py ├── distributed │ ├── distributed_example.py │ └── distributed_example_supplementary.py ├── distributed_rnn │ ├── Breakout.pth │ ├── distributed_example.py │ └── distributed_example_supplementary.py ├── mujoco_example.py ├── mujoco_example_rnd.py ├── play.py ├── plot.py └── viz_attention.py ├── requirements.txt ├── results ├── Atari-BreakoutNoFrameskip-v4-PPO-10M │ ├── Breakout-LSTMCNN-Grad-Cam.gif │ ├── Breakout-LSTMCNN.gif │ ├── events.out.tfevents.1570824188.7d032cd4d92e.16828.0 │ └── reward_per_update.svg └── MuJoCo │ ├── Ant-v2_MLP │ └── PPO │ │ ├── 2020_01_24T10_49_13 │ │ ├── progress.csv │ │ └── tensorboard │ │ │ └── events.out.tfevents.1579862954.TRACY.30884.0 │ │ ├── 2020_01_24T16_28_28 │ │ ├── progress.csv │ │ └── tensorboard │ │ │ └── events.out.tfevents.1579883309.TRACY.32264.0 │ │ └── 2020_01_24T19_26_35 │ │ ├── progress.csv │ │ └── tensorboard │ │ └── events.out.tfevents.1579893997.TRACY.10460.0 │ └── reward_per_timestep.svg ├── setup.py ├── test.py └── version.py /.dockerignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/.dockerignore -------------------------------------------------------------------------------- /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/.gitattributes -------------------------------------------------------------------------------- /.github/workflows/docker.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/.github/workflows/docker.yml -------------------------------------------------------------------------------- /.github/workflows/pythonpublish.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/.github/workflows/pythonpublish.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/.gitignore -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/.travis.yml -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/Dockerfile -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/README.md -------------------------------------------------------------------------------- /agnes/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/__init__.py -------------------------------------------------------------------------------- /agnes/algos/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/algos/__init__.py -------------------------------------------------------------------------------- /agnes/algos/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/algos/a2c.py -------------------------------------------------------------------------------- /agnes/algos/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/algos/base.py -------------------------------------------------------------------------------- /agnes/algos/configs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /agnes/algos/configs/a2c_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/algos/configs/a2c_config.py -------------------------------------------------------------------------------- /agnes/algos/configs/ppo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/algos/configs/ppo_config.py -------------------------------------------------------------------------------- /agnes/algos/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/algos/ppo.py -------------------------------------------------------------------------------- /agnes/algos/ppo_rnd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/algos/ppo_rnd.py -------------------------------------------------------------------------------- /agnes/common/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/__init__.py -------------------------------------------------------------------------------- /agnes/common/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/distributions.py -------------------------------------------------------------------------------- /agnes/common/env_maker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/env_maker.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/__init__.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/atari_wrappers.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/dummy_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/dummy_vec_env.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/monitor.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/subproc_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/subproc_vec_env.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/tile_images.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/tile_images.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/util.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/vec_env.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/vec_frame_stack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/vec_frame_stack.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/vec_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/vec_normalize.py -------------------------------------------------------------------------------- /agnes/common/envs_prep/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/envs_prep/wrappers.py -------------------------------------------------------------------------------- /agnes/common/init_weights.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/init_weights.py -------------------------------------------------------------------------------- /agnes/common/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/logger.py -------------------------------------------------------------------------------- /agnes/common/make_nn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/make_nn.py -------------------------------------------------------------------------------- /agnes/common/play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/play.py -------------------------------------------------------------------------------- /agnes/common/plotter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/plotter.py -------------------------------------------------------------------------------- /agnes/common/rnd_networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/rnd_networks.py -------------------------------------------------------------------------------- /agnes/common/running_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/running_mean_std.py -------------------------------------------------------------------------------- /agnes/common/schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/schedules.py -------------------------------------------------------------------------------- /agnes/common/tests/CNN_Discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/CNN_Discrete.py -------------------------------------------------------------------------------- /agnes/common/tests/MLP_Continuous.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/MLP_Continuous.py -------------------------------------------------------------------------------- /agnes/common/tests/MLP_Discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/MLP_Discrete.py -------------------------------------------------------------------------------- /agnes/common/tests/MLP_Discrete_Competitive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/MLP_Discrete_Competitive.py -------------------------------------------------------------------------------- /agnes/common/tests/MPI_MLP_Discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/MPI_MLP_Discrete.py -------------------------------------------------------------------------------- /agnes/common/tests/MPI_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/MPI_runner.py -------------------------------------------------------------------------------- /agnes/common/tests/RNN_Discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/RNN_Discrete.py -------------------------------------------------------------------------------- /agnes/common/tests/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/common/tests/__init__.py -------------------------------------------------------------------------------- /agnes/nns/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/nns/__init__.py -------------------------------------------------------------------------------- /agnes/nns/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/nns/base.py -------------------------------------------------------------------------------- /agnes/nns/cnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/nns/cnn.py -------------------------------------------------------------------------------- /agnes/nns/initializer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/nns/initializer.py -------------------------------------------------------------------------------- /agnes/nns/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/nns/mlp.py -------------------------------------------------------------------------------- /agnes/nns/rnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/nns/rnn.py -------------------------------------------------------------------------------- /agnes/runners/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/runners/__init__.py -------------------------------------------------------------------------------- /agnes/runners/base_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/runners/base_runner.py -------------------------------------------------------------------------------- /agnes/runners/competitive_single.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/runners/competitive_single.py -------------------------------------------------------------------------------- /agnes/runners/distributed_mpi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/runners/distributed_mpi.py -------------------------------------------------------------------------------- /agnes/runners/single.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/agnes/runners/single.py -------------------------------------------------------------------------------- /examples/algo_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/algo_example.py -------------------------------------------------------------------------------- /examples/atari_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/atari_example.py -------------------------------------------------------------------------------- /examples/atari_rnn_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/atari_rnn_example.py -------------------------------------------------------------------------------- /examples/classic_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/classic_example.py -------------------------------------------------------------------------------- /examples/distributed/distributed_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/distributed/distributed_example.py -------------------------------------------------------------------------------- /examples/distributed/distributed_example_supplementary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/distributed/distributed_example_supplementary.py -------------------------------------------------------------------------------- /examples/distributed_rnn/Breakout.pth: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/distributed_rnn/Breakout.pth -------------------------------------------------------------------------------- /examples/distributed_rnn/distributed_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/distributed_rnn/distributed_example.py -------------------------------------------------------------------------------- /examples/distributed_rnn/distributed_example_supplementary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/distributed_rnn/distributed_example_supplementary.py -------------------------------------------------------------------------------- /examples/mujoco_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/mujoco_example.py -------------------------------------------------------------------------------- /examples/mujoco_example_rnd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/mujoco_example_rnd.py -------------------------------------------------------------------------------- /examples/play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/play.py -------------------------------------------------------------------------------- /examples/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/plot.py -------------------------------------------------------------------------------- /examples/viz_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/examples/viz_attention.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/requirements.txt -------------------------------------------------------------------------------- /results/Atari-BreakoutNoFrameskip-v4-PPO-10M/Breakout-LSTMCNN-Grad-Cam.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/Atari-BreakoutNoFrameskip-v4-PPO-10M/Breakout-LSTMCNN-Grad-Cam.gif -------------------------------------------------------------------------------- /results/Atari-BreakoutNoFrameskip-v4-PPO-10M/Breakout-LSTMCNN.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/Atari-BreakoutNoFrameskip-v4-PPO-10M/Breakout-LSTMCNN.gif -------------------------------------------------------------------------------- /results/Atari-BreakoutNoFrameskip-v4-PPO-10M/events.out.tfevents.1570824188.7d032cd4d92e.16828.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/Atari-BreakoutNoFrameskip-v4-PPO-10M/events.out.tfevents.1570824188.7d032cd4d92e.16828.0 -------------------------------------------------------------------------------- /results/Atari-BreakoutNoFrameskip-v4-PPO-10M/reward_per_update.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/Atari-BreakoutNoFrameskip-v4-PPO-10M/reward_per_update.svg -------------------------------------------------------------------------------- /results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T10_49_13/progress.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T10_49_13/progress.csv -------------------------------------------------------------------------------- /results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T10_49_13/tensorboard/events.out.tfevents.1579862954.TRACY.30884.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T10_49_13/tensorboard/events.out.tfevents.1579862954.TRACY.30884.0 -------------------------------------------------------------------------------- /results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T16_28_28/progress.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T16_28_28/progress.csv -------------------------------------------------------------------------------- /results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T16_28_28/tensorboard/events.out.tfevents.1579883309.TRACY.32264.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T16_28_28/tensorboard/events.out.tfevents.1579883309.TRACY.32264.0 -------------------------------------------------------------------------------- /results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T19_26_35/progress.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T19_26_35/progress.csv -------------------------------------------------------------------------------- /results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T19_26_35/tensorboard/events.out.tfevents.1579893997.TRACY.10460.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/MuJoCo/Ant-v2_MLP/PPO/2020_01_24T19_26_35/tensorboard/events.out.tfevents.1579893997.TRACY.10460.0 -------------------------------------------------------------------------------- /results/MuJoCo/reward_per_timestep.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/results/MuJoCo/reward_per_timestep.svg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/setup.py -------------------------------------------------------------------------------- /test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rotinov/AGNES/HEAD/test.py -------------------------------------------------------------------------------- /version.py: -------------------------------------------------------------------------------- 1 | version = '0.0.7.5' 2 | --------------------------------------------------------------------------------