├── .gitignore ├── .gitmodules ├── LICENSE ├── README.md ├── environment ├── gpu-env.yml └── requirements.txt ├── examples ├── __init__.py ├── config │ ├── __init__.py │ └── d4rl │ │ ├── base.py │ │ ├── base_mopo.py │ │ ├── halfcheetah_medium.py │ │ ├── halfcheetah_medium_expert.py │ │ ├── halfcheetah_mixed.py │ │ ├── halfcheetah_random.py │ │ ├── hopper_medium.py │ │ ├── hopper_medium_expert.py │ │ ├── hopper_mixed.py │ │ ├── hopper_random.py │ │ ├── walker2d_medium.py │ │ ├── walker2d_medium_expert.py │ │ ├── walker2d_mixed.py │ │ └── walker2d_random.py ├── development │ ├── __init__.py │ ├── base.py │ ├── main.py │ ├── simulate_policy.py │ ├── simulate_policy_with_state.py │ └── variants.py ├── instrument.py └── utils.py ├── mopo ├── __init__.py ├── algorithms │ ├── __init__.py │ └── mopo.py ├── env │ ├── __init__.py │ ├── ant.py │ └── humanoid.py ├── models │ ├── __init__.py │ ├── bnn.py │ ├── constructor.py │ ├── fake_env.py │ ├── fc.py │ └── utils.py ├── off_policy │ ├── __init__.py │ └── loader.py ├── parallel │ ├── __init__.py │ ├── parallel_env.py │ ├── parallel_hopper.py │ └── test.py ├── scripts │ ├── __init__.py │ ├── console_scripts.py │ └── train_model_offline.py ├── static │ ├── __init__.py │ ├── ant.py │ ├── antangle.py │ ├── halfcheetah.py │ ├── halfcheetahjump.py │ ├── halfcheetahvel.py │ ├── halfcheetahveljump.py │ ├── hopper.py │ ├── humanoid.py │ ├── pendulum.py │ ├── point2denv.py │ ├── point2dwallenv.py │ └── walker2d.py └── utils │ ├── __init__.py │ ├── filesystem.py │ ├── logging.py │ ├── visualization.py │ └── writer.py ├── plots └── .gitkeep ├── run.sh ├── setup.py └── softlearning ├── __init__.py ├── algorithms ├── __init__.py ├── rl_algorithm.py ├── sac.py ├── sql.py └── utils.py ├── distributions ├── __init__.py ├── real_nvp_flow.py └── squash_bijector.py ├── environments ├── __init__.py ├── adapters │ ├── __init__.py │ ├── gym_adapter.py │ └── softlearning_env.py ├── dm_control │ └── __init__.py ├── gym │ ├── __init__.py │ ├── mujoco │ │ ├── __init__.py │ │ ├── image_pusher_2d.py │ │ └── pusher_2d.py │ ├── multi_goal.py │ ├── robotics │ │ └── __init__.py │ └── wrappers │ │ ├── __init__.py │ │ └── normalize_action.py ├── helpers.py └── utils.py ├── misc ├── __init__.py ├── kernel.py ├── plotter.py └── utils.py ├── models ├── __init__.py ├── feedforward.py └── utils.py ├── policies ├── __init__.py ├── base_policy.py ├── gaussian_policy.py ├── uniform_policy.py └── utils.py ├── preprocessors ├── __init__.py ├── convnet.py └── utils.py ├── replay_pools ├── __init__.py ├── extra_policy_info_replay_pool.py ├── flexible_replay_pool.py ├── replay_pool.py ├── simple_replay_pool.py ├── trajectory_replay_pool.py ├── union_pool.py └── utils.py ├── samplers ├── __init__.py ├── base_sampler.py ├── dummy_sampler.py ├── explore_sampler.py ├── extra_policy_info_sampler.py ├── remote_sampler.py ├── simple_sampler.py └── utils.py ├── scripts ├── __init__.py └── console_scripts.py ├── softlearning.md ├── utils ├── keras.py └── numpy.py └── value_functions ├── __init__.py ├── utils.py ├── value_function.py └── vanilla.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/.gitmodules -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/README.md -------------------------------------------------------------------------------- /environment/gpu-env.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/environment/gpu-env.yml -------------------------------------------------------------------------------- /environment/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/environment/requirements.txt -------------------------------------------------------------------------------- /examples/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /examples/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/__init__.py -------------------------------------------------------------------------------- /examples/config/d4rl/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/base.py -------------------------------------------------------------------------------- /examples/config/d4rl/base_mopo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/base_mopo.py -------------------------------------------------------------------------------- /examples/config/d4rl/halfcheetah_medium.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/halfcheetah_medium.py -------------------------------------------------------------------------------- /examples/config/d4rl/halfcheetah_medium_expert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/halfcheetah_medium_expert.py -------------------------------------------------------------------------------- /examples/config/d4rl/halfcheetah_mixed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/halfcheetah_mixed.py -------------------------------------------------------------------------------- /examples/config/d4rl/halfcheetah_random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/halfcheetah_random.py -------------------------------------------------------------------------------- /examples/config/d4rl/hopper_medium.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/hopper_medium.py -------------------------------------------------------------------------------- /examples/config/d4rl/hopper_medium_expert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/hopper_medium_expert.py -------------------------------------------------------------------------------- /examples/config/d4rl/hopper_mixed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/hopper_mixed.py -------------------------------------------------------------------------------- /examples/config/d4rl/hopper_random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/hopper_random.py -------------------------------------------------------------------------------- /examples/config/d4rl/walker2d_medium.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/walker2d_medium.py -------------------------------------------------------------------------------- /examples/config/d4rl/walker2d_medium_expert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/walker2d_medium_expert.py -------------------------------------------------------------------------------- /examples/config/d4rl/walker2d_mixed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/walker2d_mixed.py -------------------------------------------------------------------------------- /examples/config/d4rl/walker2d_random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/config/d4rl/walker2d_random.py -------------------------------------------------------------------------------- /examples/development/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/development/__init__.py -------------------------------------------------------------------------------- /examples/development/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/development/base.py -------------------------------------------------------------------------------- /examples/development/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/development/main.py -------------------------------------------------------------------------------- /examples/development/simulate_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/development/simulate_policy.py -------------------------------------------------------------------------------- /examples/development/simulate_policy_with_state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/development/simulate_policy_with_state.py -------------------------------------------------------------------------------- /examples/development/variants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/development/variants.py -------------------------------------------------------------------------------- /examples/instrument.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/instrument.py -------------------------------------------------------------------------------- /examples/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/examples/utils.py -------------------------------------------------------------------------------- /mopo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mopo/algorithms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mopo/algorithms/mopo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/algorithms/mopo.py -------------------------------------------------------------------------------- /mopo/env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/env/__init__.py -------------------------------------------------------------------------------- /mopo/env/ant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/env/ant.py -------------------------------------------------------------------------------- /mopo/env/humanoid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/env/humanoid.py -------------------------------------------------------------------------------- /mopo/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mopo/models/bnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/models/bnn.py -------------------------------------------------------------------------------- /mopo/models/constructor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/models/constructor.py -------------------------------------------------------------------------------- /mopo/models/fake_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/models/fake_env.py -------------------------------------------------------------------------------- /mopo/models/fc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/models/fc.py -------------------------------------------------------------------------------- /mopo/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/models/utils.py -------------------------------------------------------------------------------- /mopo/off_policy/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mopo/off_policy/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/off_policy/loader.py -------------------------------------------------------------------------------- /mopo/parallel/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mopo/parallel/parallel_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/parallel/parallel_env.py -------------------------------------------------------------------------------- /mopo/parallel/parallel_hopper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/parallel/parallel_hopper.py -------------------------------------------------------------------------------- /mopo/parallel/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/parallel/test.py -------------------------------------------------------------------------------- /mopo/scripts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mopo/scripts/console_scripts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/scripts/console_scripts.py -------------------------------------------------------------------------------- /mopo/scripts/train_model_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/scripts/train_model_offline.py -------------------------------------------------------------------------------- /mopo/static/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/__init__.py -------------------------------------------------------------------------------- /mopo/static/ant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/ant.py -------------------------------------------------------------------------------- /mopo/static/antangle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/antangle.py -------------------------------------------------------------------------------- /mopo/static/halfcheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/halfcheetah.py -------------------------------------------------------------------------------- /mopo/static/halfcheetahjump.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/halfcheetahjump.py -------------------------------------------------------------------------------- /mopo/static/halfcheetahvel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/halfcheetahvel.py -------------------------------------------------------------------------------- /mopo/static/halfcheetahveljump.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/halfcheetahveljump.py -------------------------------------------------------------------------------- /mopo/static/hopper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/hopper.py -------------------------------------------------------------------------------- /mopo/static/humanoid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/humanoid.py -------------------------------------------------------------------------------- /mopo/static/pendulum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/pendulum.py -------------------------------------------------------------------------------- /mopo/static/point2denv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/point2denv.py -------------------------------------------------------------------------------- /mopo/static/point2dwallenv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/point2dwallenv.py -------------------------------------------------------------------------------- /mopo/static/walker2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/static/walker2d.py -------------------------------------------------------------------------------- /mopo/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/utils/__init__.py -------------------------------------------------------------------------------- /mopo/utils/filesystem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/utils/filesystem.py -------------------------------------------------------------------------------- /mopo/utils/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/utils/logging.py -------------------------------------------------------------------------------- /mopo/utils/visualization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/utils/visualization.py -------------------------------------------------------------------------------- /mopo/utils/writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/mopo/utils/writer.py -------------------------------------------------------------------------------- /plots/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/run.sh -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/setup.py -------------------------------------------------------------------------------- /softlearning/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/algorithms/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/algorithms/__init__.py -------------------------------------------------------------------------------- /softlearning/algorithms/rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/algorithms/rl_algorithm.py -------------------------------------------------------------------------------- /softlearning/algorithms/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/algorithms/sac.py -------------------------------------------------------------------------------- /softlearning/algorithms/sql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/algorithms/sql.py -------------------------------------------------------------------------------- /softlearning/algorithms/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/algorithms/utils.py -------------------------------------------------------------------------------- /softlearning/distributions/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/distributions/__init__.py -------------------------------------------------------------------------------- /softlearning/distributions/real_nvp_flow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/distributions/real_nvp_flow.py -------------------------------------------------------------------------------- /softlearning/distributions/squash_bijector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/distributions/squash_bijector.py -------------------------------------------------------------------------------- /softlearning/environments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/environments/adapters/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/adapters/__init__.py -------------------------------------------------------------------------------- /softlearning/environments/adapters/gym_adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/adapters/gym_adapter.py -------------------------------------------------------------------------------- /softlearning/environments/adapters/softlearning_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/adapters/softlearning_env.py -------------------------------------------------------------------------------- /softlearning/environments/dm_control/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/dm_control/__init__.py -------------------------------------------------------------------------------- /softlearning/environments/gym/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/gym/__init__.py -------------------------------------------------------------------------------- /softlearning/environments/gym/mujoco/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/environments/gym/mujoco/image_pusher_2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/gym/mujoco/image_pusher_2d.py -------------------------------------------------------------------------------- /softlearning/environments/gym/mujoco/pusher_2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/gym/mujoco/pusher_2d.py -------------------------------------------------------------------------------- /softlearning/environments/gym/multi_goal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/gym/multi_goal.py -------------------------------------------------------------------------------- /softlearning/environments/gym/robotics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/environments/gym/wrappers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/gym/wrappers/__init__.py -------------------------------------------------------------------------------- /softlearning/environments/gym/wrappers/normalize_action.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/gym/wrappers/normalize_action.py -------------------------------------------------------------------------------- /softlearning/environments/helpers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/helpers.py -------------------------------------------------------------------------------- /softlearning/environments/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/environments/utils.py -------------------------------------------------------------------------------- /softlearning/misc/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/misc/kernel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/misc/kernel.py -------------------------------------------------------------------------------- /softlearning/misc/plotter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/misc/plotter.py -------------------------------------------------------------------------------- /softlearning/misc/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/misc/utils.py -------------------------------------------------------------------------------- /softlearning/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/models/feedforward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/models/feedforward.py -------------------------------------------------------------------------------- /softlearning/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/models/utils.py -------------------------------------------------------------------------------- /softlearning/policies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/policies/base_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/policies/base_policy.py -------------------------------------------------------------------------------- /softlearning/policies/gaussian_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/policies/gaussian_policy.py -------------------------------------------------------------------------------- /softlearning/policies/uniform_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/policies/uniform_policy.py -------------------------------------------------------------------------------- /softlearning/policies/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/policies/utils.py -------------------------------------------------------------------------------- /softlearning/preprocessors/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/preprocessors/convnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/preprocessors/convnet.py -------------------------------------------------------------------------------- /softlearning/preprocessors/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/preprocessors/utils.py -------------------------------------------------------------------------------- /softlearning/replay_pools/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/__init__.py -------------------------------------------------------------------------------- /softlearning/replay_pools/extra_policy_info_replay_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/extra_policy_info_replay_pool.py -------------------------------------------------------------------------------- /softlearning/replay_pools/flexible_replay_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/flexible_replay_pool.py -------------------------------------------------------------------------------- /softlearning/replay_pools/replay_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/replay_pool.py -------------------------------------------------------------------------------- /softlearning/replay_pools/simple_replay_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/simple_replay_pool.py -------------------------------------------------------------------------------- /softlearning/replay_pools/trajectory_replay_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/trajectory_replay_pool.py -------------------------------------------------------------------------------- /softlearning/replay_pools/union_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/union_pool.py -------------------------------------------------------------------------------- /softlearning/replay_pools/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/replay_pools/utils.py -------------------------------------------------------------------------------- /softlearning/samplers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/__init__.py -------------------------------------------------------------------------------- /softlearning/samplers/base_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/base_sampler.py -------------------------------------------------------------------------------- /softlearning/samplers/dummy_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/dummy_sampler.py -------------------------------------------------------------------------------- /softlearning/samplers/explore_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/explore_sampler.py -------------------------------------------------------------------------------- /softlearning/samplers/extra_policy_info_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/extra_policy_info_sampler.py -------------------------------------------------------------------------------- /softlearning/samplers/remote_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/remote_sampler.py -------------------------------------------------------------------------------- /softlearning/samplers/simple_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/simple_sampler.py -------------------------------------------------------------------------------- /softlearning/samplers/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/samplers/utils.py -------------------------------------------------------------------------------- /softlearning/scripts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/scripts/console_scripts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/scripts/console_scripts.py -------------------------------------------------------------------------------- /softlearning/softlearning.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/softlearning.md -------------------------------------------------------------------------------- /softlearning/utils/keras.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/utils/keras.py -------------------------------------------------------------------------------- /softlearning/utils/numpy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/utils/numpy.py -------------------------------------------------------------------------------- /softlearning/value_functions/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /softlearning/value_functions/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/value_functions/utils.py -------------------------------------------------------------------------------- /softlearning/value_functions/value_function.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/value_functions/value_function.py -------------------------------------------------------------------------------- /softlearning/value_functions/vanilla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianheyu927/mopo/HEAD/softlearning/value_functions/vanilla.py --------------------------------------------------------------------------------