├── .gitignore ├── LICENSE ├── README.md ├── classic_policies ├── Acrobot-v0.h5 ├── CartPole-v0.h5 ├── InvertedPendulum-v1.h5 └── MountainCar-v0.h5 ├── environments ├── __init__.py ├── __init__.pyc ├── rlgymenv.py └── rlgymenv.pyc ├── expert_policies ├── classic │ ├── Acrobot-v0.h5 │ ├── CartPole-v0.h5 │ ├── InvertedPendulum-v1.h5 │ └── MountainCar-v0.h5 └── modern │ ├── log_Ant-v1_0.h5 │ ├── log_HalfCheetah-v0_2.h5 │ ├── log_HalfCheetah-v1_2.h5 │ ├── log_Hopper-v0_3.h5 │ ├── log_Hopper-v1_4.h5 │ ├── log_Reacher-v1_4.h5 │ ├── log_Walker2d-v1_1.h5 │ ├── log_humanoid_1.h5 │ └── walker_eb5b2e_1.h5 ├── pipelines ├── im_classic_pipeline.yaml ├── im_humanoid_pipeline.yaml ├── im_pipeline.yaml └── im_regtest_pipeline.yaml ├── policyopt ├── __init__.py ├── gmmil.py ├── imitation.py ├── nn.py ├── optim.py ├── rl.py ├── thutil.py ├── tqdm.py └── util.py ├── results ├── classic_results.h5 ├── entreg_results.h5 ├── humanoid_results.h5 └── modern_results.h5 ├── scripts ├── __init__.py ├── check_progress.py ├── comparelog.py ├── evaluation.py ├── gen_classic_policies.py ├── im_pipeline.py ├── imitate_mj.py ├── media │ ├── README │ ├── print_env_info.py │ ├── print_env_randreturn.py │ └── video_mj.py ├── print_saved_returns.py ├── run_rl_mj.py ├── showlog.py └── vis_mj.py └── train.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/README.md -------------------------------------------------------------------------------- /classic_policies/Acrobot-v0.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/classic_policies/Acrobot-v0.h5 -------------------------------------------------------------------------------- /classic_policies/CartPole-v0.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/classic_policies/CartPole-v0.h5 -------------------------------------------------------------------------------- /classic_policies/InvertedPendulum-v1.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/classic_policies/InvertedPendulum-v1.h5 -------------------------------------------------------------------------------- /classic_policies/MountainCar-v0.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/classic_policies/MountainCar-v0.h5 -------------------------------------------------------------------------------- /environments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /environments/__init__.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/environments/__init__.pyc -------------------------------------------------------------------------------- /environments/rlgymenv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/environments/rlgymenv.py -------------------------------------------------------------------------------- /environments/rlgymenv.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/environments/rlgymenv.pyc -------------------------------------------------------------------------------- /expert_policies/classic/Acrobot-v0.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/classic/Acrobot-v0.h5 -------------------------------------------------------------------------------- /expert_policies/classic/CartPole-v0.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/classic/CartPole-v0.h5 -------------------------------------------------------------------------------- /expert_policies/classic/InvertedPendulum-v1.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/classic/InvertedPendulum-v1.h5 -------------------------------------------------------------------------------- /expert_policies/classic/MountainCar-v0.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/classic/MountainCar-v0.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_Ant-v1_0.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_Ant-v1_0.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_HalfCheetah-v0_2.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_HalfCheetah-v0_2.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_HalfCheetah-v1_2.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_HalfCheetah-v1_2.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_Hopper-v0_3.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_Hopper-v0_3.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_Hopper-v1_4.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_Hopper-v1_4.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_Reacher-v1_4.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_Reacher-v1_4.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_Walker2d-v1_1.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_Walker2d-v1_1.h5 -------------------------------------------------------------------------------- /expert_policies/modern/log_humanoid_1.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/log_humanoid_1.h5 -------------------------------------------------------------------------------- /expert_policies/modern/walker_eb5b2e_1.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/expert_policies/modern/walker_eb5b2e_1.h5 -------------------------------------------------------------------------------- /pipelines/im_classic_pipeline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/pipelines/im_classic_pipeline.yaml -------------------------------------------------------------------------------- /pipelines/im_humanoid_pipeline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/pipelines/im_humanoid_pipeline.yaml -------------------------------------------------------------------------------- /pipelines/im_pipeline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/pipelines/im_pipeline.yaml -------------------------------------------------------------------------------- /pipelines/im_regtest_pipeline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/pipelines/im_regtest_pipeline.yaml -------------------------------------------------------------------------------- /policyopt/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/__init__.py -------------------------------------------------------------------------------- /policyopt/gmmil.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/gmmil.py -------------------------------------------------------------------------------- /policyopt/imitation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/imitation.py -------------------------------------------------------------------------------- /policyopt/nn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/nn.py -------------------------------------------------------------------------------- /policyopt/optim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/optim.py -------------------------------------------------------------------------------- /policyopt/rl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/rl.py -------------------------------------------------------------------------------- /policyopt/thutil.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/thutil.py -------------------------------------------------------------------------------- /policyopt/tqdm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/tqdm.py -------------------------------------------------------------------------------- /policyopt/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/policyopt/util.py -------------------------------------------------------------------------------- /results/classic_results.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/results/classic_results.h5 -------------------------------------------------------------------------------- /results/entreg_results.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/results/entreg_results.h5 -------------------------------------------------------------------------------- /results/humanoid_results.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/results/humanoid_results.h5 -------------------------------------------------------------------------------- /results/modern_results.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/results/modern_results.h5 -------------------------------------------------------------------------------- /scripts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/check_progress.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/check_progress.py -------------------------------------------------------------------------------- /scripts/comparelog.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/comparelog.py -------------------------------------------------------------------------------- /scripts/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/evaluation.py -------------------------------------------------------------------------------- /scripts/gen_classic_policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/gen_classic_policies.py -------------------------------------------------------------------------------- /scripts/im_pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/im_pipeline.py -------------------------------------------------------------------------------- /scripts/imitate_mj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/imitate_mj.py -------------------------------------------------------------------------------- /scripts/media/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/media/README -------------------------------------------------------------------------------- /scripts/media/print_env_info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/media/print_env_info.py -------------------------------------------------------------------------------- /scripts/media/print_env_randreturn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/media/print_env_randreturn.py -------------------------------------------------------------------------------- /scripts/media/video_mj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/media/video_mj.py -------------------------------------------------------------------------------- /scripts/print_saved_returns.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/print_saved_returns.py -------------------------------------------------------------------------------- /scripts/run_rl_mj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/run_rl_mj.py -------------------------------------------------------------------------------- /scripts/showlog.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/showlog.py -------------------------------------------------------------------------------- /scripts/vis_mj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/scripts/vis_mj.py -------------------------------------------------------------------------------- /train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/KAIST-AILab/gmmil/HEAD/train.sh --------------------------------------------------------------------------------