├── .gitignore ├── .python-version ├── LICENSE ├── README.MD ├── gym_vec_api ├── ppo_multidiscrete.py └── ppo_multidiscrete_mask.py ├── invalid_action_masking ├── ppo_10x10.py ├── ppo_16x16.py ├── ppo_24x24.py ├── ppo_4x4.py ├── ppo_no_adj_10x10.py ├── ppo_no_adj_16x16.py ├── ppo_no_adj_24x24.py ├── ppo_no_adj_4x4.py ├── ppo_no_mask_10x10.py ├── ppo_no_mask_16x16.py ├── ppo_no_mask_24x24.py └── ppo_no_mask_4x4.py ├── plots ├── analysis.py ├── approx_kl.py ├── charts_episode_reward-MicrortsMining10x10F9-v0.pdf ├── charts_episode_reward-MicrortsMining16x16F9-v0.pdf ├── charts_episode_reward-MicrortsMining24x24F9-v0.pdf ├── charts_episode_reward-MicrortsMining4x4F9-v0.pdf ├── charts_episode_reward │ ├── all_df_cache.pkl │ ├── data │ │ ├── MicrortsMining10x10F9-v0.pkl │ │ ├── MicrortsMining16x16F9-v0.pkl │ │ ├── MicrortsMining24x24F9-v0.pkl │ │ └── MicrortsMining4x4F9-v0.pkl │ ├── envs_cache.pkl │ ├── exp_names_cache.pkl │ ├── legend.pdf │ ├── legend.svg │ └── plots │ │ ├── MicrortsMining10x10F9-v0.pdf │ │ ├── MicrortsMining10x10F9-v0.svg │ │ ├── MicrortsMining16x16F9-v0.pdf │ │ ├── MicrortsMining24x24F9-v0.pdf │ │ └── MicrortsMining4x4F9-v0.pdf ├── episode_reward.py ├── legend1.pdf ├── losses_approx_kl-MicrortsMining10x10F9-v0.pdf ├── losses_approx_kl-MicrortsMining16x16F9-v0.pdf ├── losses_approx_kl-MicrortsMining24x24F9-v0.pdf ├── losses_approx_kl-MicrortsMining4x4F9-v0.pdf └── losses_approx_kl │ ├── all_df_cache.pkl │ ├── data │ ├── MicrortsMining10x10F9-v0.pkl │ ├── MicrortsMining16x16F9-v0.pkl │ ├── MicrortsMining24x24F9-v0.pkl │ └── MicrortsMining4x4F9-v0.pkl │ ├── envs_cache.pkl │ ├── exp_names_cache.pkl │ ├── legend.pdf │ └── plots │ ├── MicrortsMining10x10F9-v0.pdf │ ├── MicrortsMining16x16F9-v0.pdf │ ├── MicrortsMining24x24F9-v0.pdf │ └── MicrortsMining4x4F9-v0.pdf ├── poetry.lock ├── ppo.py ├── pyproject.toml ├── requirements.txt └── test.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/.gitignore -------------------------------------------------------------------------------- /.python-version: -------------------------------------------------------------------------------- 1 | 3.9.5/envs/invalid-action-masking -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/LICENSE -------------------------------------------------------------------------------- /README.MD: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/README.MD -------------------------------------------------------------------------------- /gym_vec_api/ppo_multidiscrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/gym_vec_api/ppo_multidiscrete.py -------------------------------------------------------------------------------- /gym_vec_api/ppo_multidiscrete_mask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/gym_vec_api/ppo_multidiscrete_mask.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_10x10.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_10x10.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_16x16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_16x16.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_24x24.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_24x24.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_4x4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_4x4.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_adj_10x10.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_adj_10x10.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_adj_16x16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_adj_16x16.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_adj_24x24.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_adj_24x24.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_adj_4x4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_adj_4x4.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_mask_10x10.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_mask_10x10.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_mask_16x16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_mask_16x16.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_mask_24x24.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_mask_24x24.py -------------------------------------------------------------------------------- /invalid_action_masking/ppo_no_mask_4x4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/invalid_action_masking/ppo_no_mask_4x4.py -------------------------------------------------------------------------------- /plots/analysis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/analysis.py -------------------------------------------------------------------------------- /plots/approx_kl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/approx_kl.py -------------------------------------------------------------------------------- /plots/charts_episode_reward-MicrortsMining10x10F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward-MicrortsMining10x10F9-v0.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward-MicrortsMining16x16F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward-MicrortsMining16x16F9-v0.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward-MicrortsMining24x24F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward-MicrortsMining24x24F9-v0.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward-MicrortsMining4x4F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward-MicrortsMining4x4F9-v0.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward/all_df_cache.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/all_df_cache.pkl -------------------------------------------------------------------------------- /plots/charts_episode_reward/data/MicrortsMining10x10F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/data/MicrortsMining10x10F9-v0.pkl -------------------------------------------------------------------------------- /plots/charts_episode_reward/data/MicrortsMining16x16F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/data/MicrortsMining16x16F9-v0.pkl -------------------------------------------------------------------------------- /plots/charts_episode_reward/data/MicrortsMining24x24F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/data/MicrortsMining24x24F9-v0.pkl -------------------------------------------------------------------------------- /plots/charts_episode_reward/data/MicrortsMining4x4F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/data/MicrortsMining4x4F9-v0.pkl -------------------------------------------------------------------------------- /plots/charts_episode_reward/envs_cache.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/envs_cache.pkl -------------------------------------------------------------------------------- /plots/charts_episode_reward/exp_names_cache.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/exp_names_cache.pkl -------------------------------------------------------------------------------- /plots/charts_episode_reward/legend.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/legend.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward/legend.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/legend.svg -------------------------------------------------------------------------------- /plots/charts_episode_reward/plots/MicrortsMining10x10F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/plots/MicrortsMining10x10F9-v0.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward/plots/MicrortsMining10x10F9-v0.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/plots/MicrortsMining10x10F9-v0.svg -------------------------------------------------------------------------------- /plots/charts_episode_reward/plots/MicrortsMining16x16F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/plots/MicrortsMining16x16F9-v0.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward/plots/MicrortsMining24x24F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/plots/MicrortsMining24x24F9-v0.pdf -------------------------------------------------------------------------------- /plots/charts_episode_reward/plots/MicrortsMining4x4F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/charts_episode_reward/plots/MicrortsMining4x4F9-v0.pdf -------------------------------------------------------------------------------- /plots/episode_reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/episode_reward.py -------------------------------------------------------------------------------- /plots/legend1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/legend1.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl-MicrortsMining10x10F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl-MicrortsMining10x10F9-v0.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl-MicrortsMining16x16F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl-MicrortsMining16x16F9-v0.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl-MicrortsMining24x24F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl-MicrortsMining24x24F9-v0.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl-MicrortsMining4x4F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl-MicrortsMining4x4F9-v0.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl/all_df_cache.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/all_df_cache.pkl -------------------------------------------------------------------------------- /plots/losses_approx_kl/data/MicrortsMining10x10F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/data/MicrortsMining10x10F9-v0.pkl -------------------------------------------------------------------------------- /plots/losses_approx_kl/data/MicrortsMining16x16F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/data/MicrortsMining16x16F9-v0.pkl -------------------------------------------------------------------------------- /plots/losses_approx_kl/data/MicrortsMining24x24F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/data/MicrortsMining24x24F9-v0.pkl -------------------------------------------------------------------------------- /plots/losses_approx_kl/data/MicrortsMining4x4F9-v0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/data/MicrortsMining4x4F9-v0.pkl -------------------------------------------------------------------------------- /plots/losses_approx_kl/envs_cache.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/envs_cache.pkl -------------------------------------------------------------------------------- /plots/losses_approx_kl/exp_names_cache.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/exp_names_cache.pkl -------------------------------------------------------------------------------- /plots/losses_approx_kl/legend.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/legend.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl/plots/MicrortsMining10x10F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/plots/MicrortsMining10x10F9-v0.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl/plots/MicrortsMining16x16F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/plots/MicrortsMining16x16F9-v0.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl/plots/MicrortsMining24x24F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/plots/MicrortsMining24x24F9-v0.pdf -------------------------------------------------------------------------------- /plots/losses_approx_kl/plots/MicrortsMining4x4F9-v0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/plots/losses_approx_kl/plots/MicrortsMining4x4F9-v0.pdf -------------------------------------------------------------------------------- /poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/poetry.lock -------------------------------------------------------------------------------- /ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/ppo.py -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/requirements.txt -------------------------------------------------------------------------------- /test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vwxyzjn/invalid-action-masking/HEAD/test.py --------------------------------------------------------------------------------