├── .github └── ISSUE_TEMPLATE │ ├── bug_report.md │ └── feature_request.md ├── .gitignore ├── Algorithms ├── __init__.py ├── body.py ├── dac_ppo │ ├── __init__.py │ ├── buffer.py │ ├── core.py │ ├── dac_ppo.py │ └── dac_ppo_config.json ├── ddpg │ ├── __init__.py │ ├── core.py │ ├── ddpg.py │ ├── ddpg_config.json │ └── replay_buffer.py ├── option_critic │ ├── __init__.py │ ├── buffer.py │ ├── core.py │ ├── oc_continuous.py │ ├── oc_discrete.py │ └── option_critic_config.json ├── ppo │ ├── __init__.py │ ├── core.py │ ├── gae_buffer.py │ ├── ppo.py │ └── ppo_config.json ├── td3 │ ├── __init__.py │ ├── core.py │ ├── replay_buffer.py │ ├── td3.py │ └── td3_config.json ├── trpo │ ├── __init__.py │ ├── core.py │ ├── gae_buffer.py │ ├── trpo.py │ └── trpo_config.json └── utils.py ├── Logger ├── __init__.py └── logger.py ├── Model_Weights ├── AntBulletEnv-v0 │ ├── comparison.png │ ├── dac_ppo │ │ └── dac_ppo_config.json │ ├── ddpg │ │ └── ddpg_config.json │ ├── option_critic │ │ └── option_critic_config.json │ ├── ppo │ │ └── ppo_config.json │ ├── td3 │ │ ├── recording.gif │ │ └── td3_config.json │ └── trpo │ │ └── trpo_config.json ├── CartPoleContinuousBulletEnv-v0 │ ├── comparison.png │ ├── dac_ppo │ │ └── dac_ppo_config.json │ ├── ddpg │ │ ├── ddpg_config.json │ │ └── recording.gif │ ├── option_critic │ │ └── option_critic_config.json │ ├── ppo │ │ └── ppo_config.json │ ├── td3 │ │ └── td3_config.json │ └── trpo │ │ └── trpo_config.json ├── HalfCheetahBulletEnv-v0 │ ├── comparison.png │ ├── dac_ppo │ │ └── dac_ppo_config.json │ ├── ddpg │ │ ├── ddpg_config.json │ │ └── recording.gif │ ├── option_critic │ │ └── option_critic_config.json │ ├── ppo │ │ └── ppo_config.json │ ├── td3 │ │ └── td3_config.json │ └── trpo │ │ └── trpo_config.json ├── HopperBulletEnv-v0 │ ├── comparison.png │ ├── dac_ppo │ │ └── dac_ppo_config.json │ ├── ddpg │ │ └── ddpg_config.json │ ├── option_critic │ │ └── option_critic_config.json │ ├── ppo │ │ └── ppo_config.json │ ├── td3 │ │ ├── recording.gif │ │ └── td3_config.json │ └── trpo │ │ └── trpo_config.json ├── close_box-vision-v0 │ ├── comparison.png │ ├── comparison_full.png │ ├── ddpg │ │ └── ddpg_config.json │ ├── oc_conv │ │ └── option_critic_config.json │ ├── oc_vae │ │ ├── option_critic_config.json │ │ └── recording.gif │ ├── ppo │ │ └── ppo_config.json │ └── trpo │ │ └── trpo_config.json ├── open_box-vision-v0 │ ├── close_box-vision-v0.png │ ├── comparison.png │ ├── comparison_full.png │ ├── ddpg │ │ └── ddpg_config.json │ ├── oc_conv │ │ ├── option_critic_config.json │ │ └── recording.gif │ ├── oc_vae │ │ ├── option_critic_config.json │ │ └── recording.gif │ ├── open_box-vision-v0.png │ ├── pick_up_cup-vision-v0.png │ ├── ppo │ │ └── ppo_config.json │ ├── scoop_with_spatula-vision-v0.png │ └── trpo │ │ └── trpo_config.json ├── pick_up_cup-vision-v0 │ ├── comparison.png │ ├── comparison_full.png │ ├── ddpg │ │ └── ddpg_config.json │ ├── oc_conv │ │ └── option_critic_config.json │ ├── oc_vae │ │ └── option_critic_config.json │ ├── ppo │ │ └── ppo_config.json │ └── trpo │ │ └── trpo_config.json └── scoop_with_spatula-vision-v0 │ ├── comparison.png │ ├── ddpg │ └── ddpg_config.json │ ├── oc_conv │ └── option_critic_config.json │ ├── oc_vae │ └── option_critic_config.json │ ├── ppo │ └── ppo_config.json │ └── trpo │ └── trpo_config.json ├── README.md ├── Stable_Baselines ├── __init__.py ├── monitor_training.py ├── plot_results.py ├── savebest_callback.py └── test.py ├── VAE ├── README.md ├── Wrappers │ ├── __init__.py │ ├── image_learning.py │ └── rlbench_wrapper.py ├── __init__.py ├── dataset │ ├── Dataset.py │ └── __init__.py ├── generate_data.py ├── logger.py ├── train_tasks.sh ├── train_vae.py └── vae.py ├── Wrappers ├── __init__.py ├── image_learning.py ├── normalize_observation.py ├── normalized_action.py ├── rlbench_wrapper.py └── serialize_env.py ├── plot_results.py ├── requirements.txt ├── test.py └── train.py /.github/ISSUE_TEMPLATE/bug_report.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/.github/ISSUE_TEMPLATE/bug_report.md -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/feature_request.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/.github/ISSUE_TEMPLATE/feature_request.md -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/.gitignore -------------------------------------------------------------------------------- /Algorithms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Algorithms/body.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/body.py -------------------------------------------------------------------------------- /Algorithms/dac_ppo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Algorithms/dac_ppo/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/dac_ppo/buffer.py -------------------------------------------------------------------------------- /Algorithms/dac_ppo/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/dac_ppo/core.py -------------------------------------------------------------------------------- /Algorithms/dac_ppo/dac_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/dac_ppo/dac_ppo.py -------------------------------------------------------------------------------- /Algorithms/dac_ppo/dac_ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/dac_ppo/dac_ppo_config.json -------------------------------------------------------------------------------- /Algorithms/ddpg/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Algorithms/ddpg/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ddpg/core.py -------------------------------------------------------------------------------- /Algorithms/ddpg/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ddpg/ddpg.py -------------------------------------------------------------------------------- /Algorithms/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Algorithms/ddpg/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ddpg/replay_buffer.py -------------------------------------------------------------------------------- /Algorithms/option_critic/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Algorithms/option_critic/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/option_critic/buffer.py -------------------------------------------------------------------------------- /Algorithms/option_critic/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/option_critic/core.py -------------------------------------------------------------------------------- /Algorithms/option_critic/oc_continuous.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/option_critic/oc_continuous.py -------------------------------------------------------------------------------- /Algorithms/option_critic/oc_discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/option_critic/oc_discrete.py -------------------------------------------------------------------------------- /Algorithms/option_critic/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/option_critic/option_critic_config.json -------------------------------------------------------------------------------- /Algorithms/ppo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Algorithms/ppo/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ppo/core.py -------------------------------------------------------------------------------- /Algorithms/ppo/gae_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ppo/gae_buffer.py -------------------------------------------------------------------------------- /Algorithms/ppo/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ppo/ppo.py -------------------------------------------------------------------------------- /Algorithms/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/ppo/ppo_config.json -------------------------------------------------------------------------------- /Algorithms/td3/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Algorithms/td3/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/td3/core.py -------------------------------------------------------------------------------- /Algorithms/td3/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/td3/replay_buffer.py -------------------------------------------------------------------------------- /Algorithms/td3/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/td3/td3.py -------------------------------------------------------------------------------- /Algorithms/td3/td3_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/td3/td3_config.json -------------------------------------------------------------------------------- /Algorithms/trpo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Algorithms/trpo/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/trpo/core.py -------------------------------------------------------------------------------- /Algorithms/trpo/gae_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/trpo/gae_buffer.py -------------------------------------------------------------------------------- /Algorithms/trpo/trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/trpo/trpo.py -------------------------------------------------------------------------------- /Algorithms/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/trpo/trpo_config.json -------------------------------------------------------------------------------- /Algorithms/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Algorithms/utils.py -------------------------------------------------------------------------------- /Logger/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Logger/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Logger/logger.py -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/dac_ppo/dac_ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/dac_ppo/dac_ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/option_critic/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/option_critic/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/td3/recording.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/td3/recording.gif -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/td3/td3_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/td3/td3_config.json -------------------------------------------------------------------------------- /Model_Weights/AntBulletEnv-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/AntBulletEnv-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/dac_ppo/dac_ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/dac_ppo/dac_ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/ddpg/recording.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/ddpg/recording.gif -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/option_critic/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/option_critic/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/td3/td3_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/td3/td3_config.json -------------------------------------------------------------------------------- /Model_Weights/CartPoleContinuousBulletEnv-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/CartPoleContinuousBulletEnv-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/dac_ppo/dac_ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/dac_ppo/dac_ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/ddpg/recording.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/ddpg/recording.gif -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/option_critic/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/option_critic/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/td3/td3_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/td3/td3_config.json -------------------------------------------------------------------------------- /Model_Weights/HalfCheetahBulletEnv-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HalfCheetahBulletEnv-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/dac_ppo/dac_ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/dac_ppo/dac_ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/option_critic/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/option_critic/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/td3/recording.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/td3/recording.gif -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/td3/td3_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/td3/td3_config.json -------------------------------------------------------------------------------- /Model_Weights/HopperBulletEnv-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/HopperBulletEnv-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/comparison_full.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/comparison_full.png -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/oc_conv/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/oc_conv/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/oc_vae/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/oc_vae/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/oc_vae/recording.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/oc_vae/recording.gif -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/close_box-vision-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/close_box-vision-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/close_box-vision-v0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/close_box-vision-v0.png -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/comparison_full.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/comparison_full.png -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/oc_conv/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/oc_conv/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/oc_conv/recording.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/oc_conv/recording.gif -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/oc_vae/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/oc_vae/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/oc_vae/recording.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/oc_vae/recording.gif -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/open_box-vision-v0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/open_box-vision-v0.png -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/pick_up_cup-vision-v0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/pick_up_cup-vision-v0.png -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/scoop_with_spatula-vision-v0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/scoop_with_spatula-vision-v0.png -------------------------------------------------------------------------------- /Model_Weights/open_box-vision-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/open_box-vision-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /Model_Weights/pick_up_cup-vision-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/pick_up_cup-vision-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/pick_up_cup-vision-v0/comparison_full.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/pick_up_cup-vision-v0/comparison_full.png -------------------------------------------------------------------------------- /Model_Weights/pick_up_cup-vision-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/pick_up_cup-vision-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/pick_up_cup-vision-v0/oc_conv/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/pick_up_cup-vision-v0/oc_conv/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/pick_up_cup-vision-v0/oc_vae/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/pick_up_cup-vision-v0/oc_vae/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/pick_up_cup-vision-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/pick_up_cup-vision-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/pick_up_cup-vision-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/pick_up_cup-vision-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /Model_Weights/scoop_with_spatula-vision-v0/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/scoop_with_spatula-vision-v0/comparison.png -------------------------------------------------------------------------------- /Model_Weights/scoop_with_spatula-vision-v0/ddpg/ddpg_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/scoop_with_spatula-vision-v0/ddpg/ddpg_config.json -------------------------------------------------------------------------------- /Model_Weights/scoop_with_spatula-vision-v0/oc_conv/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/scoop_with_spatula-vision-v0/oc_conv/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/scoop_with_spatula-vision-v0/oc_vae/option_critic_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/scoop_with_spatula-vision-v0/oc_vae/option_critic_config.json -------------------------------------------------------------------------------- /Model_Weights/scoop_with_spatula-vision-v0/ppo/ppo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/scoop_with_spatula-vision-v0/ppo/ppo_config.json -------------------------------------------------------------------------------- /Model_Weights/scoop_with_spatula-vision-v0/trpo/trpo_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Model_Weights/scoop_with_spatula-vision-v0/trpo/trpo_config.json -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/README.md -------------------------------------------------------------------------------- /Stable_Baselines/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Stable_Baselines/monitor_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Stable_Baselines/monitor_training.py -------------------------------------------------------------------------------- /Stable_Baselines/plot_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Stable_Baselines/plot_results.py -------------------------------------------------------------------------------- /Stable_Baselines/savebest_callback.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Stable_Baselines/savebest_callback.py -------------------------------------------------------------------------------- /Stable_Baselines/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Stable_Baselines/test.py -------------------------------------------------------------------------------- /VAE/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/README.md -------------------------------------------------------------------------------- /VAE/Wrappers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VAE/Wrappers/image_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/Wrappers/image_learning.py -------------------------------------------------------------------------------- /VAE/Wrappers/rlbench_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/Wrappers/rlbench_wrapper.py -------------------------------------------------------------------------------- /VAE/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VAE/dataset/Dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/dataset/Dataset.py -------------------------------------------------------------------------------- /VAE/dataset/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VAE/generate_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/generate_data.py -------------------------------------------------------------------------------- /VAE/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/logger.py -------------------------------------------------------------------------------- /VAE/train_tasks.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/train_tasks.sh -------------------------------------------------------------------------------- /VAE/train_vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/train_vae.py -------------------------------------------------------------------------------- /VAE/vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/VAE/vae.py -------------------------------------------------------------------------------- /Wrappers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Wrappers/image_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Wrappers/image_learning.py -------------------------------------------------------------------------------- /Wrappers/normalize_observation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Wrappers/normalize_observation.py -------------------------------------------------------------------------------- /Wrappers/normalized_action.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Wrappers/normalized_action.py -------------------------------------------------------------------------------- /Wrappers/rlbench_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Wrappers/rlbench_wrapper.py -------------------------------------------------------------------------------- /Wrappers/serialize_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/Wrappers/serialize_env.py -------------------------------------------------------------------------------- /plot_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/plot_results.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/requirements.txt -------------------------------------------------------------------------------- /test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/test.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jason-CKY/DeepRL-pytorch/HEAD/train.py --------------------------------------------------------------------------------