├── .gitignore ├── LICENSE ├── README.md ├── _assets └── halfcheetahdir.gif ├── configs └── maml │ ├── 2d-navigation.yaml │ ├── ant-dir.yaml │ ├── ant-goal.yaml │ ├── ant-vel.yaml │ ├── bandit │ ├── bandit-k10-n10.yaml │ ├── bandit-k10-n100.yaml │ ├── bandit-k10-n500.yaml │ ├── bandit-k5-n10.yaml │ ├── bandit-k5-n100.yaml │ ├── bandit-k5-n500.yaml │ ├── bandit-k50-n10.yaml │ ├── bandit-k50-n100.yaml │ └── bandit-k50-n500.yaml │ ├── halfcheetah-dir.yaml │ └── halfcheetah-vel.yaml ├── maml_rl ├── __init__.py ├── baseline.py ├── envs │ ├── __init__.py │ ├── bandit.py │ ├── mdp.py │ ├── mujoco │ │ ├── __init__.py │ │ ├── ant.py │ │ └── half_cheetah.py │ ├── navigation.py │ └── utils │ │ ├── __init__.py │ │ ├── normalized_env.py │ │ ├── sync_vector_env.py │ │ └── wrappers.py ├── episode.py ├── metalearners │ ├── __init__.py │ ├── base.py │ └── maml_trpo.py ├── policies │ ├── __init__.py │ ├── categorical_mlp.py │ ├── normal_mlp.py │ └── policy.py ├── samplers │ ├── __init__.py │ ├── multi_task_sampler.py │ └── sampler.py ├── tests │ ├── __init__.py │ ├── samplers │ │ ├── __init__.py │ │ └── test_multi_task_sampler.py │ ├── test_episode.py │ └── utils │ │ ├── __init__.py │ │ └── test_torch_utils.py └── utils │ ├── __init__.py │ ├── helpers.py │ ├── optimization.py │ ├── reinforcement_learning.py │ └── torch_utils.py ├── requirements.txt ├── test.py └── train.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/README.md -------------------------------------------------------------------------------- /_assets/halfcheetahdir.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/_assets/halfcheetahdir.gif -------------------------------------------------------------------------------- /configs/maml/2d-navigation.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/2d-navigation.yaml -------------------------------------------------------------------------------- /configs/maml/ant-dir.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/ant-dir.yaml -------------------------------------------------------------------------------- /configs/maml/ant-goal.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/ant-goal.yaml -------------------------------------------------------------------------------- /configs/maml/ant-vel.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/ant-vel.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k10-n10.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k10-n10.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k10-n100.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k10-n100.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k10-n500.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k10-n500.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k5-n10.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k5-n10.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k5-n100.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k5-n100.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k5-n500.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k5-n500.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k50-n10.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k50-n10.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k50-n100.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k50-n100.yaml -------------------------------------------------------------------------------- /configs/maml/bandit/bandit-k50-n500.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/bandit/bandit-k50-n500.yaml -------------------------------------------------------------------------------- /configs/maml/halfcheetah-dir.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/halfcheetah-dir.yaml -------------------------------------------------------------------------------- /configs/maml/halfcheetah-vel.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/configs/maml/halfcheetah-vel.yaml -------------------------------------------------------------------------------- /maml_rl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /maml_rl/baseline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/baseline.py -------------------------------------------------------------------------------- /maml_rl/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/__init__.py -------------------------------------------------------------------------------- /maml_rl/envs/bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/bandit.py -------------------------------------------------------------------------------- /maml_rl/envs/mdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/mdp.py -------------------------------------------------------------------------------- /maml_rl/envs/mujoco/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /maml_rl/envs/mujoco/ant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/mujoco/ant.py -------------------------------------------------------------------------------- /maml_rl/envs/mujoco/half_cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/mujoco/half_cheetah.py -------------------------------------------------------------------------------- /maml_rl/envs/navigation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/navigation.py -------------------------------------------------------------------------------- /maml_rl/envs/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /maml_rl/envs/utils/normalized_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/utils/normalized_env.py -------------------------------------------------------------------------------- /maml_rl/envs/utils/sync_vector_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/utils/sync_vector_env.py -------------------------------------------------------------------------------- /maml_rl/envs/utils/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/envs/utils/wrappers.py -------------------------------------------------------------------------------- /maml_rl/episode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/episode.py -------------------------------------------------------------------------------- /maml_rl/metalearners/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/metalearners/__init__.py -------------------------------------------------------------------------------- /maml_rl/metalearners/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/metalearners/base.py -------------------------------------------------------------------------------- /maml_rl/metalearners/maml_trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/metalearners/maml_trpo.py -------------------------------------------------------------------------------- /maml_rl/policies/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/policies/__init__.py -------------------------------------------------------------------------------- /maml_rl/policies/categorical_mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/policies/categorical_mlp.py -------------------------------------------------------------------------------- /maml_rl/policies/normal_mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/policies/normal_mlp.py -------------------------------------------------------------------------------- /maml_rl/policies/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/policies/policy.py -------------------------------------------------------------------------------- /maml_rl/samplers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/samplers/__init__.py -------------------------------------------------------------------------------- /maml_rl/samplers/multi_task_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/samplers/multi_task_sampler.py -------------------------------------------------------------------------------- /maml_rl/samplers/sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/samplers/sampler.py -------------------------------------------------------------------------------- /maml_rl/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /maml_rl/tests/samplers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /maml_rl/tests/samplers/test_multi_task_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/tests/samplers/test_multi_task_sampler.py -------------------------------------------------------------------------------- /maml_rl/tests/test_episode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/tests/test_episode.py -------------------------------------------------------------------------------- /maml_rl/tests/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/tests/utils/__init__.py -------------------------------------------------------------------------------- /maml_rl/tests/utils/test_torch_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/tests/utils/test_torch_utils.py -------------------------------------------------------------------------------- /maml_rl/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /maml_rl/utils/helpers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/utils/helpers.py -------------------------------------------------------------------------------- /maml_rl/utils/optimization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/utils/optimization.py -------------------------------------------------------------------------------- /maml_rl/utils/reinforcement_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/utils/reinforcement_learning.py -------------------------------------------------------------------------------- /maml_rl/utils/torch_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/maml_rl/utils/torch_utils.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | torch>=1.3 2 | gym[mujoco]>=0.15 3 | tqdm>=4.0 4 | pyyaml>=5.1 -------------------------------------------------------------------------------- /test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/test.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tristandeleu/pytorch-maml-rl/HEAD/train.py --------------------------------------------------------------------------------