├── .circleci └── config.yml ├── .github ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md └── ISSUE_TEMPLATE.md ├── .gitignore ├── .pylintrc ├── .streamlit └── config.toml ├── LICENSE ├── README.md ├── controllable_agent ├── __init__.py ├── data │ └── mockpretrain │ │ ├── eval.csv │ │ ├── hip.log │ │ └── train.csv ├── executor.py ├── runner.py ├── test_executor.py └── test_url_benchmark.py ├── demo └── main.py ├── env.sh ├── mypy.ini ├── requirements.txt └── url_benchmark ├── LICENSE ├── README.md ├── __init__.py ├── agent ├── __init__.py ├── aps.py ├── ddpg.py ├── diayn.py ├── disagreement.py ├── disagreement.yaml ├── discrete_fb.py ├── discrete_sf.py ├── fb_ddpg.py ├── fb_modules.py ├── goal_sm.py ├── goal_td3.py ├── icm.py ├── icm.yaml ├── icm_apt.py ├── ind_apt.yaml ├── max_ent.py ├── new_aps.py ├── proto.py ├── rnd.py ├── sf.py ├── sf_svd.py ├── smm.py ├── smm.yaml ├── state_apt.yaml ├── test_agent.py └── uvf.py ├── anytrain.py ├── base_config.yaml ├── custom_dmc_tasks ├── __init__.py ├── cheetah.py ├── cheetah.xml ├── hopper.py ├── hopper.xml ├── jaco.py ├── point_mass_maze.py ├── point_mass_maze_multi_goal.xml ├── point_mass_maze_reach_bottom_left.xml ├── point_mass_maze_reach_bottom_right.xml ├── point_mass_maze_reach_top_left.xml ├── point_mass_maze_reach_top_right.xml ├── quadruped.py ├── quadruped.xml ├── walker.py └── walker.xml ├── d4rl_benchmark.py ├── dmc.py ├── dmc_benchmark.py ├── goals.py ├── gridworld ├── __init__.py └── env.py ├── hiplogs.py ├── in_memory_replay_buffer.py ├── logger.py ├── play_behaviors.py ├── pretrain.py ├── relabel_buffer.py ├── replay_buffer.py ├── test_dmc.py ├── test_goals.py ├── test_hiplogs.py ├── test_in_memory_replay_buffer.py ├── test_pretrain.py ├── test_replay_buffer.py ├── train_offline.py ├── train_online.py ├── utils.py └── video.py /.circleci/config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/.circleci/config.yml -------------------------------------------------------------------------------- /.github/CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/.github/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /.github/CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/.github/CONTRIBUTING.md -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/.github/ISSUE_TEMPLATE.md -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/.gitignore -------------------------------------------------------------------------------- /.pylintrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/.pylintrc -------------------------------------------------------------------------------- /.streamlit/config.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/.streamlit/config.toml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/README.md -------------------------------------------------------------------------------- /controllable_agent/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/__init__.py -------------------------------------------------------------------------------- /controllable_agent/data/mockpretrain/eval.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/data/mockpretrain/eval.csv -------------------------------------------------------------------------------- /controllable_agent/data/mockpretrain/hip.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/data/mockpretrain/hip.log -------------------------------------------------------------------------------- /controllable_agent/data/mockpretrain/train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/data/mockpretrain/train.csv -------------------------------------------------------------------------------- /controllable_agent/executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/executor.py -------------------------------------------------------------------------------- /controllable_agent/runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/runner.py -------------------------------------------------------------------------------- /controllable_agent/test_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/test_executor.py -------------------------------------------------------------------------------- /controllable_agent/test_url_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/controllable_agent/test_url_benchmark.py -------------------------------------------------------------------------------- /demo/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/demo/main.py -------------------------------------------------------------------------------- /env.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/env.sh -------------------------------------------------------------------------------- /mypy.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/mypy.ini -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/requirements.txt -------------------------------------------------------------------------------- /url_benchmark/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/LICENSE -------------------------------------------------------------------------------- /url_benchmark/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/README.md -------------------------------------------------------------------------------- /url_benchmark/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/__init__.py -------------------------------------------------------------------------------- /url_benchmark/agent/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/__init__.py -------------------------------------------------------------------------------- /url_benchmark/agent/aps.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/aps.py -------------------------------------------------------------------------------- /url_benchmark/agent/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/ddpg.py -------------------------------------------------------------------------------- /url_benchmark/agent/diayn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/diayn.py -------------------------------------------------------------------------------- /url_benchmark/agent/disagreement.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/disagreement.py -------------------------------------------------------------------------------- /url_benchmark/agent/disagreement.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/disagreement.yaml -------------------------------------------------------------------------------- /url_benchmark/agent/discrete_fb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/discrete_fb.py -------------------------------------------------------------------------------- /url_benchmark/agent/discrete_sf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/discrete_sf.py -------------------------------------------------------------------------------- /url_benchmark/agent/fb_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/fb_ddpg.py -------------------------------------------------------------------------------- /url_benchmark/agent/fb_modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/fb_modules.py -------------------------------------------------------------------------------- /url_benchmark/agent/goal_sm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/goal_sm.py -------------------------------------------------------------------------------- /url_benchmark/agent/goal_td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/goal_td3.py -------------------------------------------------------------------------------- /url_benchmark/agent/icm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/icm.py -------------------------------------------------------------------------------- /url_benchmark/agent/icm.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/icm.yaml -------------------------------------------------------------------------------- /url_benchmark/agent/icm_apt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/icm_apt.py -------------------------------------------------------------------------------- /url_benchmark/agent/ind_apt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/ind_apt.yaml -------------------------------------------------------------------------------- /url_benchmark/agent/max_ent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/max_ent.py -------------------------------------------------------------------------------- /url_benchmark/agent/new_aps.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/new_aps.py -------------------------------------------------------------------------------- /url_benchmark/agent/proto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/proto.py -------------------------------------------------------------------------------- /url_benchmark/agent/rnd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/rnd.py -------------------------------------------------------------------------------- /url_benchmark/agent/sf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/sf.py -------------------------------------------------------------------------------- /url_benchmark/agent/sf_svd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/sf_svd.py -------------------------------------------------------------------------------- /url_benchmark/agent/smm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/smm.py -------------------------------------------------------------------------------- /url_benchmark/agent/smm.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/smm.yaml -------------------------------------------------------------------------------- /url_benchmark/agent/state_apt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/state_apt.yaml -------------------------------------------------------------------------------- /url_benchmark/agent/test_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/test_agent.py -------------------------------------------------------------------------------- /url_benchmark/agent/uvf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/agent/uvf.py -------------------------------------------------------------------------------- /url_benchmark/anytrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/anytrain.py -------------------------------------------------------------------------------- /url_benchmark/base_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/base_config.yaml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/__init__.py -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/cheetah.py -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/cheetah.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/cheetah.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/hopper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/hopper.py -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/hopper.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/hopper.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/jaco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/jaco.py -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/point_mass_maze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/point_mass_maze.py -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/point_mass_maze_multi_goal.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/point_mass_maze_multi_goal.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/point_mass_maze_reach_bottom_left.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/point_mass_maze_reach_bottom_left.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/point_mass_maze_reach_bottom_right.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/point_mass_maze_reach_bottom_right.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/point_mass_maze_reach_top_left.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/point_mass_maze_reach_top_left.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/point_mass_maze_reach_top_right.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/point_mass_maze_reach_top_right.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/quadruped.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/quadruped.py -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/quadruped.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/quadruped.xml -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/walker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/walker.py -------------------------------------------------------------------------------- /url_benchmark/custom_dmc_tasks/walker.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/custom_dmc_tasks/walker.xml -------------------------------------------------------------------------------- /url_benchmark/d4rl_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/d4rl_benchmark.py -------------------------------------------------------------------------------- /url_benchmark/dmc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/dmc.py -------------------------------------------------------------------------------- /url_benchmark/dmc_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/dmc_benchmark.py -------------------------------------------------------------------------------- /url_benchmark/goals.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/goals.py -------------------------------------------------------------------------------- /url_benchmark/gridworld/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/gridworld/__init__.py -------------------------------------------------------------------------------- /url_benchmark/gridworld/env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/gridworld/env.py -------------------------------------------------------------------------------- /url_benchmark/hiplogs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/hiplogs.py -------------------------------------------------------------------------------- /url_benchmark/in_memory_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/in_memory_replay_buffer.py -------------------------------------------------------------------------------- /url_benchmark/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/logger.py -------------------------------------------------------------------------------- /url_benchmark/play_behaviors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/play_behaviors.py -------------------------------------------------------------------------------- /url_benchmark/pretrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/pretrain.py -------------------------------------------------------------------------------- /url_benchmark/relabel_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/relabel_buffer.py -------------------------------------------------------------------------------- /url_benchmark/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/replay_buffer.py -------------------------------------------------------------------------------- /url_benchmark/test_dmc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/test_dmc.py -------------------------------------------------------------------------------- /url_benchmark/test_goals.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/test_goals.py -------------------------------------------------------------------------------- /url_benchmark/test_hiplogs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/test_hiplogs.py -------------------------------------------------------------------------------- /url_benchmark/test_in_memory_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/test_in_memory_replay_buffer.py -------------------------------------------------------------------------------- /url_benchmark/test_pretrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/test_pretrain.py -------------------------------------------------------------------------------- /url_benchmark/test_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/test_replay_buffer.py -------------------------------------------------------------------------------- /url_benchmark/train_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/train_offline.py -------------------------------------------------------------------------------- /url_benchmark/train_online.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/train_online.py -------------------------------------------------------------------------------- /url_benchmark/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/utils.py -------------------------------------------------------------------------------- /url_benchmark/video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/facebookresearch/controllable_agent/HEAD/url_benchmark/video.py --------------------------------------------------------------------------------