├── .github └── workflows │ └── jekyll-gh-pages.yml ├── .gitignore ├── Gumbel_Regression.ipynb ├── README.md ├── docs ├── approach.png ├── bibtex.txt ├── compare.png ├── diagram.svg ├── extreme_q_learning.pdf ├── gumbel_regression.png ├── hopper_sac.gif ├── hopper_td3_2q.gif ├── hopper_xsac.gif ├── hopper_xtd3_2q.gif ├── icons │ ├── github-brands.svg:Zone.Identifier │ ├── github.svg │ ├── paper_icon.svg │ ├── video-solid.svg:Zone.Identifier │ ├── video.svg │ ├── youtube-brands.svg:Zone.Identifier │ └── youtube.svg ├── iframe.php ├── index.html ├── index_old.html ├── iql_franka.gif ├── js │ ├── analytics.js │ └── jsapi ├── neurips_2021_iq.txt ├── paper_thumb.png ├── poster.pdf ├── quad_td3.gif ├── quad_xtd3.gif ├── style.css ├── video.html ├── website_td3.png └── xql_franka.gif ├── offline ├── README.md ├── actor.py ├── common.py ├── configs │ ├── antmaze_config.py │ ├── antmaze_finetune_config.py │ ├── kitchen_config.py │ ├── mujoco_config.py │ └── mujoco_config_finetune.py ├── create_gif.py ├── critic.py ├── dataset_utils.py ├── evaluation.py ├── learner.py ├── policy.py ├── reproduce │ ├── androit │ │ └── androit_consistent.sh │ ├── antmaze │ │ ├── ant_consistent.sh │ │ ├── ant_large_diverse.sh │ │ ├── ant_large_play.sh │ │ ├── ant_medium_diverse.sh │ │ ├── ant_medium_play.sh │ │ ├── ant_umaze.sh │ │ └── ant_umaze_diverse.sh │ ├── franka │ │ ├── kitchen_complete.sh │ │ ├── kitchen_consistent.sh │ │ ├── kitchen_mixed.sh │ │ └── kitchen_partial.sh │ └── mujoco │ │ ├── halfcheetah_expert.sh │ │ ├── halfcheetah_medium.sh │ │ ├── halfcheetah_replay.sh │ │ ├── hopper_expert.sh │ │ ├── hopper_medium.sh │ │ ├── hopper_replay.sh │ │ ├── mujoco_consistent.sh │ │ ├── walker_expert.sh │ │ ├── walker_medium.sh │ │ └── walker_replay.sh ├── requirements.txt ├── requirements_exact.txt ├── test.py ├── train_finetune.py ├── train_offline.py ├── value_net.py └── wrappers │ ├── __init__.py │ ├── common.py │ ├── episode_monitor.py │ └── single_precision.py └── online ├── README.md ├── configs ├── sac_experiments.json ├── td3_1q_experiments.json ├── td3_2q_experiments.json ├── xsac.yaml └── xtd3.yaml ├── environment_cpu.yaml ├── environment_gpu.yaml ├── research ├── __init__.py ├── algs │ ├── __init__.py │ ├── base.py │ ├── gumbel_sac.py │ ├── gumbel_td3.py │ ├── sac.py │ └── td3.py ├── datasets │ ├── __init__.py │ └── replay_buffer.py ├── envs │ ├── __init__.py │ ├── dm_control.py │ └── empty.py ├── networks │ ├── __init__.py │ ├── base.py │ ├── common.py │ └── mlp.py ├── processors │ ├── __init__.py │ ├── base.py │ ├── normalization.py │ └── random_shifts_aug.py └── utils │ ├── config.py │ ├── evaluate.py │ ├── logger.py │ ├── schedules.py │ ├── trainer.py │ └── utils.py ├── scripts ├── create_random_dataset.py ├── plot.py ├── train.py └── visualize.py ├── setup.py ├── setup_shell.sh └── tools ├── cleanup.py ├── run_local.py ├── run_slurm.py └── utils.py /.github/workflows/jekyll-gh-pages.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/.github/workflows/jekyll-gh-pages.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/.gitignore -------------------------------------------------------------------------------- /Gumbel_Regression.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/Gumbel_Regression.ipynb -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/README.md -------------------------------------------------------------------------------- /docs/approach.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/approach.png -------------------------------------------------------------------------------- /docs/bibtex.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/bibtex.txt -------------------------------------------------------------------------------- /docs/compare.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/compare.png -------------------------------------------------------------------------------- /docs/diagram.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/diagram.svg -------------------------------------------------------------------------------- /docs/extreme_q_learning.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/extreme_q_learning.pdf -------------------------------------------------------------------------------- /docs/gumbel_regression.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/gumbel_regression.png -------------------------------------------------------------------------------- /docs/hopper_sac.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/hopper_sac.gif -------------------------------------------------------------------------------- /docs/hopper_td3_2q.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/hopper_td3_2q.gif -------------------------------------------------------------------------------- /docs/hopper_xsac.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/hopper_xsac.gif -------------------------------------------------------------------------------- /docs/hopper_xtd3_2q.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/hopper_xtd3_2q.gif -------------------------------------------------------------------------------- /docs/icons/github-brands.svg:Zone.Identifier: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/icons/github-brands.svg:Zone.Identifier -------------------------------------------------------------------------------- /docs/icons/github.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/icons/github.svg -------------------------------------------------------------------------------- /docs/icons/paper_icon.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/icons/paper_icon.svg -------------------------------------------------------------------------------- /docs/icons/video-solid.svg:Zone.Identifier: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/icons/video-solid.svg:Zone.Identifier -------------------------------------------------------------------------------- /docs/icons/video.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/icons/video.svg -------------------------------------------------------------------------------- /docs/icons/youtube-brands.svg:Zone.Identifier: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/icons/youtube-brands.svg:Zone.Identifier -------------------------------------------------------------------------------- /docs/icons/youtube.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/icons/youtube.svg -------------------------------------------------------------------------------- /docs/iframe.php: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/iframe.php -------------------------------------------------------------------------------- /docs/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/index.html -------------------------------------------------------------------------------- /docs/index_old.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/index_old.html -------------------------------------------------------------------------------- /docs/iql_franka.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/iql_franka.gif -------------------------------------------------------------------------------- /docs/js/analytics.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/js/analytics.js -------------------------------------------------------------------------------- /docs/js/jsapi: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/js/jsapi -------------------------------------------------------------------------------- /docs/neurips_2021_iq.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/neurips_2021_iq.txt -------------------------------------------------------------------------------- /docs/paper_thumb.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/paper_thumb.png -------------------------------------------------------------------------------- /docs/poster.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/poster.pdf -------------------------------------------------------------------------------- /docs/quad_td3.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/quad_td3.gif -------------------------------------------------------------------------------- /docs/quad_xtd3.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/quad_xtd3.gif -------------------------------------------------------------------------------- /docs/style.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/style.css -------------------------------------------------------------------------------- /docs/video.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/video.html -------------------------------------------------------------------------------- /docs/website_td3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/website_td3.png -------------------------------------------------------------------------------- /docs/xql_franka.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/docs/xql_franka.gif -------------------------------------------------------------------------------- /offline/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/README.md -------------------------------------------------------------------------------- /offline/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/actor.py -------------------------------------------------------------------------------- /offline/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/common.py -------------------------------------------------------------------------------- /offline/configs/antmaze_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/configs/antmaze_config.py -------------------------------------------------------------------------------- /offline/configs/antmaze_finetune_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/configs/antmaze_finetune_config.py -------------------------------------------------------------------------------- /offline/configs/kitchen_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/configs/kitchen_config.py -------------------------------------------------------------------------------- /offline/configs/mujoco_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/configs/mujoco_config.py -------------------------------------------------------------------------------- /offline/configs/mujoco_config_finetune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/configs/mujoco_config_finetune.py -------------------------------------------------------------------------------- /offline/create_gif.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/create_gif.py -------------------------------------------------------------------------------- /offline/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/critic.py -------------------------------------------------------------------------------- /offline/dataset_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/dataset_utils.py -------------------------------------------------------------------------------- /offline/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/evaluation.py -------------------------------------------------------------------------------- /offline/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/learner.py -------------------------------------------------------------------------------- /offline/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/policy.py -------------------------------------------------------------------------------- /offline/reproduce/androit/androit_consistent.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/androit/androit_consistent.sh -------------------------------------------------------------------------------- /offline/reproduce/antmaze/ant_consistent.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/antmaze/ant_consistent.sh -------------------------------------------------------------------------------- /offline/reproduce/antmaze/ant_large_diverse.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/antmaze/ant_large_diverse.sh -------------------------------------------------------------------------------- /offline/reproduce/antmaze/ant_large_play.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/antmaze/ant_large_play.sh -------------------------------------------------------------------------------- /offline/reproduce/antmaze/ant_medium_diverse.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/antmaze/ant_medium_diverse.sh -------------------------------------------------------------------------------- /offline/reproduce/antmaze/ant_medium_play.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/antmaze/ant_medium_play.sh -------------------------------------------------------------------------------- /offline/reproduce/antmaze/ant_umaze.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/antmaze/ant_umaze.sh -------------------------------------------------------------------------------- /offline/reproduce/antmaze/ant_umaze_diverse.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/antmaze/ant_umaze_diverse.sh -------------------------------------------------------------------------------- /offline/reproduce/franka/kitchen_complete.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/franka/kitchen_complete.sh -------------------------------------------------------------------------------- /offline/reproduce/franka/kitchen_consistent.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/franka/kitchen_consistent.sh -------------------------------------------------------------------------------- /offline/reproduce/franka/kitchen_mixed.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/franka/kitchen_mixed.sh -------------------------------------------------------------------------------- /offline/reproduce/franka/kitchen_partial.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/franka/kitchen_partial.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/halfcheetah_expert.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/halfcheetah_expert.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/halfcheetah_medium.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/halfcheetah_medium.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/halfcheetah_replay.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/halfcheetah_replay.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/hopper_expert.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/hopper_expert.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/hopper_medium.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/hopper_medium.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/hopper_replay.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/hopper_replay.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/mujoco_consistent.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/mujoco_consistent.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/walker_expert.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/walker_expert.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/walker_medium.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/walker_medium.sh -------------------------------------------------------------------------------- /offline/reproduce/mujoco/walker_replay.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/reproduce/mujoco/walker_replay.sh -------------------------------------------------------------------------------- /offline/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/requirements.txt -------------------------------------------------------------------------------- /offline/requirements_exact.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/requirements_exact.txt -------------------------------------------------------------------------------- /offline/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/test.py -------------------------------------------------------------------------------- /offline/train_finetune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/train_finetune.py -------------------------------------------------------------------------------- /offline/train_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/train_offline.py -------------------------------------------------------------------------------- /offline/value_net.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/value_net.py -------------------------------------------------------------------------------- /offline/wrappers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/wrappers/__init__.py -------------------------------------------------------------------------------- /offline/wrappers/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/wrappers/common.py -------------------------------------------------------------------------------- /offline/wrappers/episode_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/wrappers/episode_monitor.py -------------------------------------------------------------------------------- /offline/wrappers/single_precision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/offline/wrappers/single_precision.py -------------------------------------------------------------------------------- /online/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/README.md -------------------------------------------------------------------------------- /online/configs/sac_experiments.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/configs/sac_experiments.json -------------------------------------------------------------------------------- /online/configs/td3_1q_experiments.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/configs/td3_1q_experiments.json -------------------------------------------------------------------------------- /online/configs/td3_2q_experiments.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/configs/td3_2q_experiments.json -------------------------------------------------------------------------------- /online/configs/xsac.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/configs/xsac.yaml -------------------------------------------------------------------------------- /online/configs/xtd3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/configs/xtd3.yaml -------------------------------------------------------------------------------- /online/environment_cpu.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/environment_cpu.yaml -------------------------------------------------------------------------------- /online/environment_gpu.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/environment_gpu.yaml -------------------------------------------------------------------------------- /online/research/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/__init__.py -------------------------------------------------------------------------------- /online/research/algs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/algs/__init__.py -------------------------------------------------------------------------------- /online/research/algs/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/algs/base.py -------------------------------------------------------------------------------- /online/research/algs/gumbel_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/algs/gumbel_sac.py -------------------------------------------------------------------------------- /online/research/algs/gumbel_td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/algs/gumbel_td3.py -------------------------------------------------------------------------------- /online/research/algs/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/algs/sac.py -------------------------------------------------------------------------------- /online/research/algs/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/algs/td3.py -------------------------------------------------------------------------------- /online/research/datasets/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/datasets/__init__.py -------------------------------------------------------------------------------- /online/research/datasets/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/datasets/replay_buffer.py -------------------------------------------------------------------------------- /online/research/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/envs/__init__.py -------------------------------------------------------------------------------- /online/research/envs/dm_control.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/envs/dm_control.py -------------------------------------------------------------------------------- /online/research/envs/empty.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/envs/empty.py -------------------------------------------------------------------------------- /online/research/networks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/networks/__init__.py -------------------------------------------------------------------------------- /online/research/networks/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/networks/base.py -------------------------------------------------------------------------------- /online/research/networks/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/networks/common.py -------------------------------------------------------------------------------- /online/research/networks/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/networks/mlp.py -------------------------------------------------------------------------------- /online/research/processors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/processors/__init__.py -------------------------------------------------------------------------------- /online/research/processors/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/processors/base.py -------------------------------------------------------------------------------- /online/research/processors/normalization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/processors/normalization.py -------------------------------------------------------------------------------- /online/research/processors/random_shifts_aug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/processors/random_shifts_aug.py -------------------------------------------------------------------------------- /online/research/utils/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/utils/config.py -------------------------------------------------------------------------------- /online/research/utils/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/utils/evaluate.py -------------------------------------------------------------------------------- /online/research/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/utils/logger.py -------------------------------------------------------------------------------- /online/research/utils/schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/utils/schedules.py -------------------------------------------------------------------------------- /online/research/utils/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/utils/trainer.py -------------------------------------------------------------------------------- /online/research/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/research/utils/utils.py -------------------------------------------------------------------------------- /online/scripts/create_random_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/scripts/create_random_dataset.py -------------------------------------------------------------------------------- /online/scripts/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/scripts/plot.py -------------------------------------------------------------------------------- /online/scripts/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/scripts/train.py -------------------------------------------------------------------------------- /online/scripts/visualize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/scripts/visualize.py -------------------------------------------------------------------------------- /online/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/setup.py -------------------------------------------------------------------------------- /online/setup_shell.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/setup_shell.sh -------------------------------------------------------------------------------- /online/tools/cleanup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/tools/cleanup.py -------------------------------------------------------------------------------- /online/tools/run_local.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/tools/run_local.py -------------------------------------------------------------------------------- /online/tools/run_slurm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/tools/run_slurm.py -------------------------------------------------------------------------------- /online/tools/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Div-Infinity/XQL/HEAD/online/tools/utils.py --------------------------------------------------------------------------------