├── .gitignore ├── LICENSE ├── README.md ├── configs ├── diff_config.py ├── diff_pixels_config.py ├── drq_config.py ├── iql_config.py ├── opal_config.py ├── pixel_config.py ├── pixel_rm_config.py ├── pixel_rnd_config.py ├── rlpd_config.py ├── rlpd_pixels_config.py ├── rm_config.py ├── rnd_config.py ├── sac_config.py └── td_config.py ├── create_env.sh ├── get_hilp_agent.py ├── gym_lib.py ├── requirements.txt ├── run_opal.py ├── supe ├── __init__.py ├── agents │ ├── __init__.py │ ├── agent.py │ ├── diffusion.py │ ├── drq │ │ ├── __init__.py │ │ ├── augmentations.py │ │ ├── drq_learner.py │ │ ├── icvf.py │ │ ├── rm.py │ │ └── rnd.py │ ├── model.py │ ├── rm.py │ ├── rnd.py │ └── sac │ │ ├── __init__.py │ │ ├── sac_learner.py │ │ └── temperature.py ├── data │ ├── __init__.py │ ├── chunk_dataset.py │ ├── d4rl_datasets.py │ ├── dataset.py │ ├── gc_dataset.py │ ├── memory_efficient_replay_buffer.py │ ├── ogbench_dataset.py │ └── replay_buffer.py ├── distributions │ ├── __init__.py │ ├── tanh_normal.py │ └── tanh_transformed.py ├── evaluation.py ├── networks │ ├── __init__.py │ ├── encoders │ │ ├── __init__.py │ │ └── d4pg_encoder.py │ ├── ensemble.py │ ├── mlp.py │ ├── pixel_multiplexer.py │ └── state_action_value.py ├── pretraining │ ├── __init__.py │ ├── iql.py │ └── opal.py ├── types.py ├── utils.py ├── visualization │ ├── __init__.py │ ├── plot_rnd_reward.py │ └── visualize.py └── wrappers │ ├── __init__.py │ ├── mask_kitchen_goal.py │ ├── meta_env_wrapper.py │ ├── ogbench_wrapper.py │ ├── render_observation.py │ ├── single_precision.py │ ├── sparse_reward_wrapper.py │ ├── tanh_converter.py │ ├── universal_seed.py │ └── wandb_video.py ├── train_finetuning_explore.py ├── train_finetuning_explore_pixels.py ├── train_finetuning_supe.py ├── train_finetuning_supe_hilp.py ├── train_finetuning_supe_pixels.py └── train_finetuning_supe_pixels_hilp.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/README.md -------------------------------------------------------------------------------- /configs/diff_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/diff_config.py -------------------------------------------------------------------------------- /configs/diff_pixels_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/diff_pixels_config.py -------------------------------------------------------------------------------- /configs/drq_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/drq_config.py -------------------------------------------------------------------------------- /configs/iql_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/iql_config.py -------------------------------------------------------------------------------- /configs/opal_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/opal_config.py -------------------------------------------------------------------------------- /configs/pixel_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/pixel_config.py -------------------------------------------------------------------------------- /configs/pixel_rm_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/pixel_rm_config.py -------------------------------------------------------------------------------- /configs/pixel_rnd_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/pixel_rnd_config.py -------------------------------------------------------------------------------- /configs/rlpd_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/rlpd_config.py -------------------------------------------------------------------------------- /configs/rlpd_pixels_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/rlpd_pixels_config.py -------------------------------------------------------------------------------- /configs/rm_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/rm_config.py -------------------------------------------------------------------------------- /configs/rnd_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/rnd_config.py -------------------------------------------------------------------------------- /configs/sac_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/sac_config.py -------------------------------------------------------------------------------- /configs/td_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/configs/td_config.py -------------------------------------------------------------------------------- /create_env.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/create_env.sh -------------------------------------------------------------------------------- /get_hilp_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/get_hilp_agent.py -------------------------------------------------------------------------------- /gym_lib.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/gym_lib.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/requirements.txt -------------------------------------------------------------------------------- /run_opal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/run_opal.py -------------------------------------------------------------------------------- /supe/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /supe/agents/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/__init__.py -------------------------------------------------------------------------------- /supe/agents/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/agent.py -------------------------------------------------------------------------------- /supe/agents/diffusion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/diffusion.py -------------------------------------------------------------------------------- /supe/agents/drq/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/drq/__init__.py -------------------------------------------------------------------------------- /supe/agents/drq/augmentations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/drq/augmentations.py -------------------------------------------------------------------------------- /supe/agents/drq/drq_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/drq/drq_learner.py -------------------------------------------------------------------------------- /supe/agents/drq/icvf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/drq/icvf.py -------------------------------------------------------------------------------- /supe/agents/drq/rm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/drq/rm.py -------------------------------------------------------------------------------- /supe/agents/drq/rnd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/drq/rnd.py -------------------------------------------------------------------------------- /supe/agents/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/model.py -------------------------------------------------------------------------------- /supe/agents/rm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/rm.py -------------------------------------------------------------------------------- /supe/agents/rnd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/rnd.py -------------------------------------------------------------------------------- /supe/agents/sac/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /supe/agents/sac/sac_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/sac/sac_learner.py -------------------------------------------------------------------------------- /supe/agents/sac/temperature.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/agents/sac/temperature.py -------------------------------------------------------------------------------- /supe/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/__init__.py -------------------------------------------------------------------------------- /supe/data/chunk_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/chunk_dataset.py -------------------------------------------------------------------------------- /supe/data/d4rl_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/d4rl_datasets.py -------------------------------------------------------------------------------- /supe/data/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/dataset.py -------------------------------------------------------------------------------- /supe/data/gc_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/gc_dataset.py -------------------------------------------------------------------------------- /supe/data/memory_efficient_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/memory_efficient_replay_buffer.py -------------------------------------------------------------------------------- /supe/data/ogbench_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/ogbench_dataset.py -------------------------------------------------------------------------------- /supe/data/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/data/replay_buffer.py -------------------------------------------------------------------------------- /supe/distributions/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/distributions/__init__.py -------------------------------------------------------------------------------- /supe/distributions/tanh_normal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/distributions/tanh_normal.py -------------------------------------------------------------------------------- /supe/distributions/tanh_transformed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/distributions/tanh_transformed.py -------------------------------------------------------------------------------- /supe/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/evaluation.py -------------------------------------------------------------------------------- /supe/networks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/networks/__init__.py -------------------------------------------------------------------------------- /supe/networks/encoders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/networks/encoders/__init__.py -------------------------------------------------------------------------------- /supe/networks/encoders/d4pg_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/networks/encoders/d4pg_encoder.py -------------------------------------------------------------------------------- /supe/networks/ensemble.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/networks/ensemble.py -------------------------------------------------------------------------------- /supe/networks/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/networks/mlp.py -------------------------------------------------------------------------------- /supe/networks/pixel_multiplexer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/networks/pixel_multiplexer.py -------------------------------------------------------------------------------- /supe/networks/state_action_value.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/networks/state_action_value.py -------------------------------------------------------------------------------- /supe/pretraining/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /supe/pretraining/iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/pretraining/iql.py -------------------------------------------------------------------------------- /supe/pretraining/opal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/pretraining/opal.py -------------------------------------------------------------------------------- /supe/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/types.py -------------------------------------------------------------------------------- /supe/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/utils.py -------------------------------------------------------------------------------- /supe/visualization/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/visualization/__init__.py -------------------------------------------------------------------------------- /supe/visualization/plot_rnd_reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/visualization/plot_rnd_reward.py -------------------------------------------------------------------------------- /supe/visualization/visualize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/visualization/visualize.py -------------------------------------------------------------------------------- /supe/wrappers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/__init__.py -------------------------------------------------------------------------------- /supe/wrappers/mask_kitchen_goal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/mask_kitchen_goal.py -------------------------------------------------------------------------------- /supe/wrappers/meta_env_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/meta_env_wrapper.py -------------------------------------------------------------------------------- /supe/wrappers/ogbench_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/ogbench_wrapper.py -------------------------------------------------------------------------------- /supe/wrappers/render_observation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/render_observation.py -------------------------------------------------------------------------------- /supe/wrappers/single_precision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/single_precision.py -------------------------------------------------------------------------------- /supe/wrappers/sparse_reward_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/sparse_reward_wrapper.py -------------------------------------------------------------------------------- /supe/wrappers/tanh_converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/tanh_converter.py -------------------------------------------------------------------------------- /supe/wrappers/universal_seed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/universal_seed.py -------------------------------------------------------------------------------- /supe/wrappers/wandb_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/supe/wrappers/wandb_video.py -------------------------------------------------------------------------------- /train_finetuning_explore.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/train_finetuning_explore.py -------------------------------------------------------------------------------- /train_finetuning_explore_pixels.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/train_finetuning_explore_pixels.py -------------------------------------------------------------------------------- /train_finetuning_supe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/train_finetuning_supe.py -------------------------------------------------------------------------------- /train_finetuning_supe_hilp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/train_finetuning_supe_hilp.py -------------------------------------------------------------------------------- /train_finetuning_supe_pixels.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/train_finetuning_supe_pixels.py -------------------------------------------------------------------------------- /train_finetuning_supe_pixels_hilp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rail-berkeley/SUPE/HEAD/train_finetuning_supe_pixels_hilp.py --------------------------------------------------------------------------------