├── .gitignore ├── readme.md ├── requirements.txt ├── result └── slbo.png ├── setup.py └── slbo ├── __init__.py ├── algos ├── __init__.py ├── mbrl │ ├── __init__.py │ └── slbo.py └── mfrl │ ├── __init__.py │ ├── ppo.py │ └── trpo.py ├── configs ├── __init__.py ├── config.py ├── slbo_config.yaml └── trpo_config.yaml ├── envs ├── __init__.py ├── mujoco │ ├── __init__.py │ ├── gym │ │ ├── __init__.py │ │ ├── ant_env.py │ │ ├── half_cheetah_env.py │ │ ├── hopper_env.py │ │ ├── swimmer_env.py │ │ └── walker2d_env.py │ ├── mujoco_envs.py │ └── rllab │ │ ├── __init__.py │ │ ├── ant_env.py │ │ ├── half_cheetah_env.py │ │ ├── hopper_env.py │ │ ├── humanoid_env.py │ │ ├── mujoco_models │ │ ├── ant.xml │ │ ├── green_ball.xml │ │ ├── half_cheetah.xml │ │ ├── hill_ant_env.xml.mako │ │ ├── hill_half_cheetah_env.xml.mako │ │ ├── hill_hopper_env.xml.mako │ │ ├── hill_swimmer3d_env.xml.mako │ │ ├── hill_walker2d_env.xml.mako │ │ ├── hopper.xml │ │ ├── humanoid.xml │ │ ├── inverted_double_pendulum.xml │ │ ├── inverted_double_pendulum.xml.mako │ │ ├── point.xml │ │ ├── red_ball.xml │ │ ├── simple_humanoid.xml │ │ ├── swimmer.xml │ │ ├── swimmer3d.xml │ │ ├── utils.mako │ │ └── walker2d.xml │ │ ├── rllab_ant.xml │ │ ├── rllab_half_cheetah.xml │ │ ├── rllab_hopper.xml │ │ ├── rllab_simple_humanoid.xml │ │ ├── rllab_swimmer.xml │ │ ├── rllab_walker2d.xml │ │ ├── swimmer_env.py │ │ └── walker2d_env.py ├── virtual_env.py └── wrapped_envs.py ├── misc ├── __init__.py ├── distributions.py ├── logger.py ├── ou_noise.py ├── param.py └── utils.py ├── models ├── __init__.py ├── actor.py ├── actor_critic.py ├── actor_layer.py ├── critic.py ├── dynamics.py ├── initializer.py ├── normalizers.py └── utils.py ├── scripts ├── run_slbo.py └── run_trpo.py └── storages ├── __init__.py ├── off_policy_buffer.py └── on_policy_buffer.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/.gitignore -------------------------------------------------------------------------------- /readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/readme.md -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/requirements.txt -------------------------------------------------------------------------------- /result/slbo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/result/slbo.png -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/setup.py -------------------------------------------------------------------------------- /slbo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/algos/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/algos/__init__.py -------------------------------------------------------------------------------- /slbo/algos/mbrl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/algos/mbrl/slbo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/algos/mbrl/slbo.py -------------------------------------------------------------------------------- /slbo/algos/mfrl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/algos/mfrl/__init__.py -------------------------------------------------------------------------------- /slbo/algos/mfrl/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/algos/mfrl/ppo.py -------------------------------------------------------------------------------- /slbo/algos/mfrl/trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/algos/mfrl/trpo.py -------------------------------------------------------------------------------- /slbo/configs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/configs/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/configs/config.py -------------------------------------------------------------------------------- /slbo/configs/slbo_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/configs/slbo_config.yaml -------------------------------------------------------------------------------- /slbo/configs/trpo_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/configs/trpo_config.yaml -------------------------------------------------------------------------------- /slbo/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/__init__.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/envs/mujoco/gym/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/envs/mujoco/gym/ant_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/gym/ant_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/gym/half_cheetah_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/gym/half_cheetah_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/gym/hopper_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/gym/hopper_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/gym/swimmer_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/gym/swimmer_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/gym/walker2d_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/gym/walker2d_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/mujoco_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/mujoco_envs.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/ant_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/ant_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/half_cheetah_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/half_cheetah_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/hopper_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/hopper_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/humanoid_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/humanoid_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/ant.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/ant.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/green_ball.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/green_ball.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/half_cheetah.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/half_cheetah.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/hill_ant_env.xml.mako: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/hill_ant_env.xml.mako -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/hill_half_cheetah_env.xml.mako: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/hill_half_cheetah_env.xml.mako -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/hill_hopper_env.xml.mako: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/hill_hopper_env.xml.mako -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/hill_swimmer3d_env.xml.mako: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/hill_swimmer3d_env.xml.mako -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/hill_walker2d_env.xml.mako: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/hill_walker2d_env.xml.mako -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/hopper.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/hopper.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/humanoid.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/humanoid.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/inverted_double_pendulum.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/inverted_double_pendulum.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/inverted_double_pendulum.xml.mako: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/inverted_double_pendulum.xml.mako -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/point.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/point.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/red_ball.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/red_ball.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/simple_humanoid.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/simple_humanoid.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/swimmer.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/swimmer.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/swimmer3d.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/swimmer3d.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/utils.mako: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/utils.mako -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/mujoco_models/walker2d.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/mujoco_models/walker2d.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/rllab_ant.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/rllab_ant.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/rllab_half_cheetah.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/rllab_half_cheetah.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/rllab_hopper.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/rllab_hopper.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/rllab_simple_humanoid.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/rllab_simple_humanoid.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/rllab_swimmer.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/rllab_swimmer.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/rllab_walker2d.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/rllab_walker2d.xml -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/swimmer_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/swimmer_env.py -------------------------------------------------------------------------------- /slbo/envs/mujoco/rllab/walker2d_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/mujoco/rllab/walker2d_env.py -------------------------------------------------------------------------------- /slbo/envs/virtual_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/virtual_env.py -------------------------------------------------------------------------------- /slbo/envs/wrapped_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/envs/wrapped_envs.py -------------------------------------------------------------------------------- /slbo/misc/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/misc/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/misc/distributions.py -------------------------------------------------------------------------------- /slbo/misc/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/misc/logger.py -------------------------------------------------------------------------------- /slbo/misc/ou_noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/misc/ou_noise.py -------------------------------------------------------------------------------- /slbo/misc/param.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/misc/param.py -------------------------------------------------------------------------------- /slbo/misc/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/misc/utils.py -------------------------------------------------------------------------------- /slbo/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/__init__.py -------------------------------------------------------------------------------- /slbo/models/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/actor.py -------------------------------------------------------------------------------- /slbo/models/actor_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/actor_critic.py -------------------------------------------------------------------------------- /slbo/models/actor_layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/actor_layer.py -------------------------------------------------------------------------------- /slbo/models/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/critic.py -------------------------------------------------------------------------------- /slbo/models/dynamics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/dynamics.py -------------------------------------------------------------------------------- /slbo/models/initializer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/initializer.py -------------------------------------------------------------------------------- /slbo/models/normalizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/normalizers.py -------------------------------------------------------------------------------- /slbo/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/models/utils.py -------------------------------------------------------------------------------- /slbo/scripts/run_slbo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/scripts/run_slbo.py -------------------------------------------------------------------------------- /slbo/scripts/run_trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/scripts/run_trpo.py -------------------------------------------------------------------------------- /slbo/storages/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slbo/storages/off_policy_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/storages/off_policy_buffer.py -------------------------------------------------------------------------------- /slbo/storages/on_policy_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jiangsy/slbo_pytorch/HEAD/slbo/storages/on_policy_buffer.py --------------------------------------------------------------------------------