├── .gitignore ├── .python-version ├── LICENSE ├── README.md ├── README_RLKIT.md ├── docs ├── HER.md ├── RIG.md ├── SkewFit.md ├── TDMs.md ├── goal_based_envs.md └── images │ ├── FetchReach-v1_HER-TD3.png │ ├── SawyerReachXYZEnv-v0_HER-TD3.png │ ├── diayn_intrinsic_rewards.png │ ├── diayn_policy_loss.png │ ├── her_dqn.png │ ├── her_td3_sawyer_reacher.png │ ├── skewfit_door.png │ ├── skewfit_pickup.png │ └── skewfit_pusher.png ├── environment ├── docker │ ├── Dockerfile │ └── vendor │ │ ├── 10_nvidia.json │ │ ├── Xdummy │ │ └── Xdummy-entrypoint ├── linux-cpu-env.yml ├── linux-gpu-env.yml └── mac-env.yml ├── examples ├── ddpg.py ├── diayn.py ├── doodad │ ├── ec2_example.py │ └── gcp_example.py ├── dqn_and_double_dqn.py ├── her │ ├── her_dqn_gridworld.py │ ├── her_sac_gym_fetch_reach.py │ └── her_td3_multiworld_sawyer_reach.py ├── ppo.py ├── ppo_diayn.py ├── ppo_random.py ├── sac.py ├── sanity.py ├── skewfit │ ├── sawyer_door.py │ ├── sawyer_pickup.py │ └── sawyer_push.py └── td3.py ├── rlkit ├── __init__.py ├── core │ ├── __init__.py │ ├── batch_rl_algorithm.py │ ├── eval_util.py │ ├── logging.py │ ├── online_rl_algorithm.py │ ├── rl_algorithm.py │ ├── serializable.py │ ├── tabulate.py │ └── trainer.py ├── data_management │ ├── __init__.py │ ├── env_replay_buffer.py │ ├── normalizer.py │ ├── obs_dict_replay_buffer.py │ ├── online_vae_replay_buffer.py │ ├── path_builder.py │ ├── replay_buffer.py │ ├── shared_obs_dict_replay_buffer.py │ └── simple_replay_buffer.py ├── envs │ ├── ant.py │ ├── assets │ │ ├── low_gear_ratio_ant.xml │ │ └── reacher_7dof.xml │ ├── env_utils.py │ ├── goal_generation │ │ └── pickup_goal_dataset.py │ ├── mujoco_env.py │ ├── mujoco_image_env.py │ ├── vae_wrapper.py │ └── wrappers.py ├── exploration_strategies │ ├── __init__.py │ ├── base.py │ ├── epsilon_greedy.py │ ├── gaussian_and_epsilon_strategy.py │ ├── gaussian_strategy.py │ └── ou_strategy.py ├── launchers │ ├── __init__.py │ ├── conf.py │ ├── launcher_util.py │ └── skewfit_experiments.py ├── policies │ ├── __init__.py │ ├── argmax.py │ ├── base.py │ └── simple.py ├── pythonplusplus.py ├── samplers │ ├── __init__.py │ ├── data_collector │ │ ├── __init__.py │ │ ├── base.py │ │ ├── path_collector.py │ │ ├── step_collector.py │ │ └── vae_env.py │ ├── rollout_functions.py │ └── util.py ├── torch │ ├── __init__.py │ ├── conv_networks.py │ ├── core.py │ ├── data.py │ ├── data_management │ │ ├── __init__.py │ │ └── normalizer.py │ ├── ddpg │ │ ├── __init__.py │ │ └── ddpg.py │ ├── distributions.py │ ├── dqn │ │ ├── __init__.py │ │ ├── double_dqn.py │ │ └── dqn.py │ ├── h_diayn │ │ ├── h_diayn_rollout_functions.py │ │ ├── manager_ppo_env_replay_buffer.py │ │ └── manager_ppo_path_collector.py │ ├── her │ │ ├── __init__.py │ │ └── her.py │ ├── modules.py │ ├── networks.py │ ├── ppo │ │ ├── __init__.py │ │ ├── discrete_ppo.py │ │ ├── policies.py │ │ ├── ppo.py │ │ ├── ppo_env_replay_buffer.py │ │ ├── ppo_path_collector.py │ │ └── ppo_torch_batch_rl_algorithm.py │ ├── pytorch_util.py │ ├── sac │ │ ├── __init__.py │ │ ├── diayn │ │ │ ├── diayn.py │ │ │ ├── diayn_env_replay_buffer.py │ │ │ ├── diayn_path_collector.py │ │ │ ├── diayn_torch_online_rl_algorithm.py │ │ │ ├── policies.py │ │ │ └── random_policies.py │ │ ├── policies.py │ │ └── sac.py │ ├── skewfit │ │ ├── online_vae_algorithm.py │ │ └── video_gen.py │ ├── td3 │ │ ├── __init__.py │ │ └── td3.py │ ├── torch_rl_algorithm.py │ └── vae │ │ ├── conv_vae.py │ │ ├── vae_base.py │ │ ├── vae_schedules.py │ │ └── vae_trainer.py └── util │ ├── hyperparameter.py │ ├── io.py │ ├── ml_util.py │ └── video.py ├── scripts ├── run_experiment_from_doodad.py ├── run_goal_conditioned_policy.py ├── run_policy.py ├── run_policy_diayn.py ├── run_policy_h_diayn.py ├── run_policy_h_random_policy.py └── run_policy_ppo.py └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/.gitignore -------------------------------------------------------------------------------- /.python-version: -------------------------------------------------------------------------------- 1 | anaconda3-4.2.0/envs/rlkit 2 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/README.md -------------------------------------------------------------------------------- /README_RLKIT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/README_RLKIT.md -------------------------------------------------------------------------------- /docs/HER.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/HER.md -------------------------------------------------------------------------------- /docs/RIG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/RIG.md -------------------------------------------------------------------------------- /docs/SkewFit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/SkewFit.md -------------------------------------------------------------------------------- /docs/TDMs.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/TDMs.md -------------------------------------------------------------------------------- /docs/goal_based_envs.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/goal_based_envs.md -------------------------------------------------------------------------------- /docs/images/FetchReach-v1_HER-TD3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/FetchReach-v1_HER-TD3.png -------------------------------------------------------------------------------- /docs/images/SawyerReachXYZEnv-v0_HER-TD3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/SawyerReachXYZEnv-v0_HER-TD3.png -------------------------------------------------------------------------------- /docs/images/diayn_intrinsic_rewards.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/diayn_intrinsic_rewards.png -------------------------------------------------------------------------------- /docs/images/diayn_policy_loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/diayn_policy_loss.png -------------------------------------------------------------------------------- /docs/images/her_dqn.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/her_dqn.png -------------------------------------------------------------------------------- /docs/images/her_td3_sawyer_reacher.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/her_td3_sawyer_reacher.png -------------------------------------------------------------------------------- /docs/images/skewfit_door.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/skewfit_door.png -------------------------------------------------------------------------------- /docs/images/skewfit_pickup.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/skewfit_pickup.png -------------------------------------------------------------------------------- /docs/images/skewfit_pusher.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/docs/images/skewfit_pusher.png -------------------------------------------------------------------------------- /environment/docker/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/environment/docker/Dockerfile -------------------------------------------------------------------------------- /environment/docker/vendor/10_nvidia.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/environment/docker/vendor/10_nvidia.json -------------------------------------------------------------------------------- /environment/docker/vendor/Xdummy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/environment/docker/vendor/Xdummy -------------------------------------------------------------------------------- /environment/docker/vendor/Xdummy-entrypoint: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/environment/docker/vendor/Xdummy-entrypoint -------------------------------------------------------------------------------- /environment/linux-cpu-env.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/environment/linux-cpu-env.yml -------------------------------------------------------------------------------- /environment/linux-gpu-env.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/environment/linux-gpu-env.yml -------------------------------------------------------------------------------- /environment/mac-env.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/environment/mac-env.yml -------------------------------------------------------------------------------- /examples/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/ddpg.py -------------------------------------------------------------------------------- /examples/diayn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/diayn.py -------------------------------------------------------------------------------- /examples/doodad/ec2_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/doodad/ec2_example.py -------------------------------------------------------------------------------- /examples/doodad/gcp_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/doodad/gcp_example.py -------------------------------------------------------------------------------- /examples/dqn_and_double_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/dqn_and_double_dqn.py -------------------------------------------------------------------------------- /examples/her/her_dqn_gridworld.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/her/her_dqn_gridworld.py -------------------------------------------------------------------------------- /examples/her/her_sac_gym_fetch_reach.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/her/her_sac_gym_fetch_reach.py -------------------------------------------------------------------------------- /examples/her/her_td3_multiworld_sawyer_reach.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/her/her_td3_multiworld_sawyer_reach.py -------------------------------------------------------------------------------- /examples/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/ppo.py -------------------------------------------------------------------------------- /examples/ppo_diayn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/ppo_diayn.py -------------------------------------------------------------------------------- /examples/ppo_random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/ppo_random.py -------------------------------------------------------------------------------- /examples/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/sac.py -------------------------------------------------------------------------------- /examples/sanity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/sanity.py -------------------------------------------------------------------------------- /examples/skewfit/sawyer_door.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/skewfit/sawyer_door.py -------------------------------------------------------------------------------- /examples/skewfit/sawyer_pickup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/skewfit/sawyer_pickup.py -------------------------------------------------------------------------------- /examples/skewfit/sawyer_push.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/skewfit/sawyer_push.py -------------------------------------------------------------------------------- /examples/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/examples/td3.py -------------------------------------------------------------------------------- /rlkit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/core/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/__init__.py -------------------------------------------------------------------------------- /rlkit/core/batch_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/batch_rl_algorithm.py -------------------------------------------------------------------------------- /rlkit/core/eval_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/eval_util.py -------------------------------------------------------------------------------- /rlkit/core/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/logging.py -------------------------------------------------------------------------------- /rlkit/core/online_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/online_rl_algorithm.py -------------------------------------------------------------------------------- /rlkit/core/rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/rl_algorithm.py -------------------------------------------------------------------------------- /rlkit/core/serializable.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/serializable.py -------------------------------------------------------------------------------- /rlkit/core/tabulate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/tabulate.py -------------------------------------------------------------------------------- /rlkit/core/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/core/trainer.py -------------------------------------------------------------------------------- /rlkit/data_management/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/data_management/env_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/env_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/data_management/normalizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/normalizer.py -------------------------------------------------------------------------------- /rlkit/data_management/obs_dict_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/obs_dict_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/data_management/online_vae_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/online_vae_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/data_management/path_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/path_builder.py -------------------------------------------------------------------------------- /rlkit/data_management/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/replay_buffer.py -------------------------------------------------------------------------------- /rlkit/data_management/shared_obs_dict_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/shared_obs_dict_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/data_management/simple_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/data_management/simple_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/envs/ant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/ant.py -------------------------------------------------------------------------------- /rlkit/envs/assets/low_gear_ratio_ant.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/assets/low_gear_ratio_ant.xml -------------------------------------------------------------------------------- /rlkit/envs/assets/reacher_7dof.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/assets/reacher_7dof.xml -------------------------------------------------------------------------------- /rlkit/envs/env_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/env_utils.py -------------------------------------------------------------------------------- /rlkit/envs/goal_generation/pickup_goal_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/goal_generation/pickup_goal_dataset.py -------------------------------------------------------------------------------- /rlkit/envs/mujoco_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/mujoco_env.py -------------------------------------------------------------------------------- /rlkit/envs/mujoco_image_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/mujoco_image_env.py -------------------------------------------------------------------------------- /rlkit/envs/vae_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/vae_wrapper.py -------------------------------------------------------------------------------- /rlkit/envs/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/envs/wrappers.py -------------------------------------------------------------------------------- /rlkit/exploration_strategies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/exploration_strategies/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/exploration_strategies/base.py -------------------------------------------------------------------------------- /rlkit/exploration_strategies/epsilon_greedy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/exploration_strategies/epsilon_greedy.py -------------------------------------------------------------------------------- /rlkit/exploration_strategies/gaussian_and_epsilon_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/exploration_strategies/gaussian_and_epsilon_strategy.py -------------------------------------------------------------------------------- /rlkit/exploration_strategies/gaussian_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/exploration_strategies/gaussian_strategy.py -------------------------------------------------------------------------------- /rlkit/exploration_strategies/ou_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/exploration_strategies/ou_strategy.py -------------------------------------------------------------------------------- /rlkit/launchers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/launchers/__init__.py -------------------------------------------------------------------------------- /rlkit/launchers/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/launchers/conf.py -------------------------------------------------------------------------------- /rlkit/launchers/launcher_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/launchers/launcher_util.py -------------------------------------------------------------------------------- /rlkit/launchers/skewfit_experiments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/launchers/skewfit_experiments.py -------------------------------------------------------------------------------- /rlkit/policies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/policies/argmax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/policies/argmax.py -------------------------------------------------------------------------------- /rlkit/policies/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/policies/base.py -------------------------------------------------------------------------------- /rlkit/policies/simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/policies/simple.py -------------------------------------------------------------------------------- /rlkit/pythonplusplus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/pythonplusplus.py -------------------------------------------------------------------------------- /rlkit/samplers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/samplers/data_collector/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/samplers/data_collector/__init__.py -------------------------------------------------------------------------------- /rlkit/samplers/data_collector/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/samplers/data_collector/base.py -------------------------------------------------------------------------------- /rlkit/samplers/data_collector/path_collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/samplers/data_collector/path_collector.py -------------------------------------------------------------------------------- /rlkit/samplers/data_collector/step_collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/samplers/data_collector/step_collector.py -------------------------------------------------------------------------------- /rlkit/samplers/data_collector/vae_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/samplers/data_collector/vae_env.py -------------------------------------------------------------------------------- /rlkit/samplers/rollout_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/samplers/rollout_functions.py -------------------------------------------------------------------------------- /rlkit/samplers/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/samplers/util.py -------------------------------------------------------------------------------- /rlkit/torch/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/conv_networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/conv_networks.py -------------------------------------------------------------------------------- /rlkit/torch/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/core.py -------------------------------------------------------------------------------- /rlkit/torch/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/data.py -------------------------------------------------------------------------------- /rlkit/torch/data_management/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/data_management/normalizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/data_management/normalizer.py -------------------------------------------------------------------------------- /rlkit/torch/ddpg/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/ddpg/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/ddpg/ddpg.py -------------------------------------------------------------------------------- /rlkit/torch/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/distributions.py -------------------------------------------------------------------------------- /rlkit/torch/dqn/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/dqn/double_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/dqn/double_dqn.py -------------------------------------------------------------------------------- /rlkit/torch/dqn/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/dqn/dqn.py -------------------------------------------------------------------------------- /rlkit/torch/h_diayn/h_diayn_rollout_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/h_diayn/h_diayn_rollout_functions.py -------------------------------------------------------------------------------- /rlkit/torch/h_diayn/manager_ppo_env_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/h_diayn/manager_ppo_env_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/torch/h_diayn/manager_ppo_path_collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/h_diayn/manager_ppo_path_collector.py -------------------------------------------------------------------------------- /rlkit/torch/her/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/her/her.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/her/her.py -------------------------------------------------------------------------------- /rlkit/torch/modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/modules.py -------------------------------------------------------------------------------- /rlkit/torch/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/networks.py -------------------------------------------------------------------------------- /rlkit/torch/ppo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/ppo/discrete_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/ppo/discrete_ppo.py -------------------------------------------------------------------------------- /rlkit/torch/ppo/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/ppo/policies.py -------------------------------------------------------------------------------- /rlkit/torch/ppo/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/ppo/ppo.py -------------------------------------------------------------------------------- /rlkit/torch/ppo/ppo_env_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/ppo/ppo_env_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/torch/ppo/ppo_path_collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/ppo/ppo_path_collector.py -------------------------------------------------------------------------------- /rlkit/torch/ppo/ppo_torch_batch_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/ppo/ppo_torch_batch_rl_algorithm.py -------------------------------------------------------------------------------- /rlkit/torch/pytorch_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/pytorch_util.py -------------------------------------------------------------------------------- /rlkit/torch/sac/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/sac/diayn/diayn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/diayn/diayn.py -------------------------------------------------------------------------------- /rlkit/torch/sac/diayn/diayn_env_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/diayn/diayn_env_replay_buffer.py -------------------------------------------------------------------------------- /rlkit/torch/sac/diayn/diayn_path_collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/diayn/diayn_path_collector.py -------------------------------------------------------------------------------- /rlkit/torch/sac/diayn/diayn_torch_online_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/diayn/diayn_torch_online_rl_algorithm.py -------------------------------------------------------------------------------- /rlkit/torch/sac/diayn/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/diayn/policies.py -------------------------------------------------------------------------------- /rlkit/torch/sac/diayn/random_policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/diayn/random_policies.py -------------------------------------------------------------------------------- /rlkit/torch/sac/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/policies.py -------------------------------------------------------------------------------- /rlkit/torch/sac/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/sac/sac.py -------------------------------------------------------------------------------- /rlkit/torch/skewfit/online_vae_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/skewfit/online_vae_algorithm.py -------------------------------------------------------------------------------- /rlkit/torch/skewfit/video_gen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/skewfit/video_gen.py -------------------------------------------------------------------------------- /rlkit/torch/td3/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rlkit/torch/td3/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/td3/td3.py -------------------------------------------------------------------------------- /rlkit/torch/torch_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/torch_rl_algorithm.py -------------------------------------------------------------------------------- /rlkit/torch/vae/conv_vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/vae/conv_vae.py -------------------------------------------------------------------------------- /rlkit/torch/vae/vae_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/vae/vae_base.py -------------------------------------------------------------------------------- /rlkit/torch/vae/vae_schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/vae/vae_schedules.py -------------------------------------------------------------------------------- /rlkit/torch/vae/vae_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/torch/vae/vae_trainer.py -------------------------------------------------------------------------------- /rlkit/util/hyperparameter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/util/hyperparameter.py -------------------------------------------------------------------------------- /rlkit/util/io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/util/io.py -------------------------------------------------------------------------------- /rlkit/util/ml_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/util/ml_util.py -------------------------------------------------------------------------------- /rlkit/util/video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/rlkit/util/video.py -------------------------------------------------------------------------------- /scripts/run_experiment_from_doodad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/scripts/run_experiment_from_doodad.py -------------------------------------------------------------------------------- /scripts/run_goal_conditioned_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/scripts/run_goal_conditioned_policy.py -------------------------------------------------------------------------------- /scripts/run_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/scripts/run_policy.py -------------------------------------------------------------------------------- /scripts/run_policy_diayn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/scripts/run_policy_diayn.py -------------------------------------------------------------------------------- /scripts/run_policy_h_diayn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/scripts/run_policy_h_diayn.py -------------------------------------------------------------------------------- /scripts/run_policy_h_random_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/scripts/run_policy_h_random_policy.py -------------------------------------------------------------------------------- /scripts/run_policy_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/scripts/run_policy_ppo.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/johnlime/RlkitExtension/HEAD/setup.py --------------------------------------------------------------------------------