├── .gitignore ├── README.md ├── fig └── method.png ├── log └── directory_place_holder ├── meta_config ├── mt10 │ ├── modular_2_2_2_256_rand.json │ ├── modular_2_2_2_256_reweight.json │ ├── modular_2_2_2_256_reweight_rand.json │ ├── modular_4_4_2_128_reweight.json │ ├── modular_4_4_2_128_reweight_rand.json │ ├── mtmhsac.json │ ├── mtmhsac_rand.json │ ├── mtsac.json │ └── mtsac_rand.json └── mt50 │ ├── modular_2_2_2_256_reweight.json │ ├── modular_2_2_2_256_reweight_rand.json │ ├── modular_4_4_2_128_reweight.json │ ├── modular_4_4_2_128_reweight_rand.json │ ├── mtmhsac.json │ ├── mtmhsac_rand.json │ ├── mtsac.json │ └── mtsac_rand.json ├── metaworld_utils ├── __init__.py └── meta_env.py ├── starter ├── mt_para_mhmt_sac.py ├── mt_para_mtsac.py └── mt_para_mtsac_modular_gated_cas.py └── torchrl ├── __init__.py ├── algo ├── __init__.py ├── off_policy │ ├── __init__.py │ ├── mt_sac.py │ ├── mtmh_sac.py │ ├── off_rl_algo.py │ ├── sac.py │ ├── twin_sac.py │ └── twin_sac_q.py ├── rl_algo.py └── utils.py ├── collector ├── __init__.py ├── base.py ├── mt.py └── para │ ├── __init__.py │ ├── async_mt.py │ ├── base.py │ └── mt.py ├── env ├── __init__.py ├── base_wrapper.py ├── continuous_wrapper.py └── get_env.py ├── networks ├── __init__.py ├── base.py ├── init.py └── nets.py ├── policies ├── __init__.py ├── continuous_policy.py └── distribution.py ├── replay_buffers ├── __init__.py ├── base.py └── shared │ ├── __init__.py │ ├── base.py │ └── shmarray.py └── utils ├── __init__.py ├── args.py ├── logger.py └── plot_csv.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/README.md -------------------------------------------------------------------------------- /fig/method.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/fig/method.png -------------------------------------------------------------------------------- /log/directory_place_holder: -------------------------------------------------------------------------------- 1 | use empty file to add log into git -------------------------------------------------------------------------------- /meta_config/mt10/modular_2_2_2_256_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/modular_2_2_2_256_rand.json -------------------------------------------------------------------------------- /meta_config/mt10/modular_2_2_2_256_reweight.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/modular_2_2_2_256_reweight.json -------------------------------------------------------------------------------- /meta_config/mt10/modular_2_2_2_256_reweight_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/modular_2_2_2_256_reweight_rand.json -------------------------------------------------------------------------------- /meta_config/mt10/modular_4_4_2_128_reweight.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/modular_4_4_2_128_reweight.json -------------------------------------------------------------------------------- /meta_config/mt10/modular_4_4_2_128_reweight_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/modular_4_4_2_128_reweight_rand.json -------------------------------------------------------------------------------- /meta_config/mt10/mtmhsac.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/mtmhsac.json -------------------------------------------------------------------------------- /meta_config/mt10/mtmhsac_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/mtmhsac_rand.json -------------------------------------------------------------------------------- /meta_config/mt10/mtsac.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/mtsac.json -------------------------------------------------------------------------------- /meta_config/mt10/mtsac_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt10/mtsac_rand.json -------------------------------------------------------------------------------- /meta_config/mt50/modular_2_2_2_256_reweight.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/modular_2_2_2_256_reweight.json -------------------------------------------------------------------------------- /meta_config/mt50/modular_2_2_2_256_reweight_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/modular_2_2_2_256_reweight_rand.json -------------------------------------------------------------------------------- /meta_config/mt50/modular_4_4_2_128_reweight.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/modular_4_4_2_128_reweight.json -------------------------------------------------------------------------------- /meta_config/mt50/modular_4_4_2_128_reweight_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/modular_4_4_2_128_reweight_rand.json -------------------------------------------------------------------------------- /meta_config/mt50/mtmhsac.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/mtmhsac.json -------------------------------------------------------------------------------- /meta_config/mt50/mtmhsac_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/mtmhsac_rand.json -------------------------------------------------------------------------------- /meta_config/mt50/mtsac.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/mtsac.json -------------------------------------------------------------------------------- /meta_config/mt50/mtsac_rand.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/meta_config/mt50/mtsac_rand.json -------------------------------------------------------------------------------- /metaworld_utils/__init__.py: -------------------------------------------------------------------------------- 1 | from .meta_env import * -------------------------------------------------------------------------------- /metaworld_utils/meta_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/metaworld_utils/meta_env.py -------------------------------------------------------------------------------- /starter/mt_para_mhmt_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/starter/mt_para_mhmt_sac.py -------------------------------------------------------------------------------- /starter/mt_para_mtsac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/starter/mt_para_mtsac.py -------------------------------------------------------------------------------- /starter/mt_para_mtsac_modular_gated_cas.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/starter/mt_para_mtsac_modular_gated_cas.py -------------------------------------------------------------------------------- /torchrl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /torchrl/algo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/__init__.py -------------------------------------------------------------------------------- /torchrl/algo/off_policy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/off_policy/__init__.py -------------------------------------------------------------------------------- /torchrl/algo/off_policy/mt_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/off_policy/mt_sac.py -------------------------------------------------------------------------------- /torchrl/algo/off_policy/mtmh_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/off_policy/mtmh_sac.py -------------------------------------------------------------------------------- /torchrl/algo/off_policy/off_rl_algo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/off_policy/off_rl_algo.py -------------------------------------------------------------------------------- /torchrl/algo/off_policy/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/off_policy/sac.py -------------------------------------------------------------------------------- /torchrl/algo/off_policy/twin_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/off_policy/twin_sac.py -------------------------------------------------------------------------------- /torchrl/algo/off_policy/twin_sac_q.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/off_policy/twin_sac_q.py -------------------------------------------------------------------------------- /torchrl/algo/rl_algo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/rl_algo.py -------------------------------------------------------------------------------- /torchrl/algo/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/algo/utils.py -------------------------------------------------------------------------------- /torchrl/collector/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/collector/__init__.py -------------------------------------------------------------------------------- /torchrl/collector/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/collector/base.py -------------------------------------------------------------------------------- /torchrl/collector/mt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/collector/mt.py -------------------------------------------------------------------------------- /torchrl/collector/para/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/collector/para/__init__.py -------------------------------------------------------------------------------- /torchrl/collector/para/async_mt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/collector/para/async_mt.py -------------------------------------------------------------------------------- /torchrl/collector/para/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/collector/para/base.py -------------------------------------------------------------------------------- /torchrl/collector/para/mt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/collector/para/mt.py -------------------------------------------------------------------------------- /torchrl/env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/env/__init__.py -------------------------------------------------------------------------------- /torchrl/env/base_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/env/base_wrapper.py -------------------------------------------------------------------------------- /torchrl/env/continuous_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/env/continuous_wrapper.py -------------------------------------------------------------------------------- /torchrl/env/get_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/env/get_env.py -------------------------------------------------------------------------------- /torchrl/networks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/networks/__init__.py -------------------------------------------------------------------------------- /torchrl/networks/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/networks/base.py -------------------------------------------------------------------------------- /torchrl/networks/init.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/networks/init.py -------------------------------------------------------------------------------- /torchrl/networks/nets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/networks/nets.py -------------------------------------------------------------------------------- /torchrl/policies/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/policies/__init__.py -------------------------------------------------------------------------------- /torchrl/policies/continuous_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/policies/continuous_policy.py -------------------------------------------------------------------------------- /torchrl/policies/distribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/policies/distribution.py -------------------------------------------------------------------------------- /torchrl/replay_buffers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/replay_buffers/__init__.py -------------------------------------------------------------------------------- /torchrl/replay_buffers/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/replay_buffers/base.py -------------------------------------------------------------------------------- /torchrl/replay_buffers/shared/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/replay_buffers/shared/__init__.py -------------------------------------------------------------------------------- /torchrl/replay_buffers/shared/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/replay_buffers/shared/base.py -------------------------------------------------------------------------------- /torchrl/replay_buffers/shared/shmarray.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/replay_buffers/shared/shmarray.py -------------------------------------------------------------------------------- /torchrl/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/utils/__init__.py -------------------------------------------------------------------------------- /torchrl/utils/args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/utils/args.py -------------------------------------------------------------------------------- /torchrl/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/utils/logger.py -------------------------------------------------------------------------------- /torchrl/utils/plot_csv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RchalYang/Soft-Module/HEAD/torchrl/utils/plot_csv.py --------------------------------------------------------------------------------