├── .gitignore ├── LICENSE ├── README.md ├── images └── overview.png ├── otr ├── __init__.py ├── agents │ ├── __init__.py │ ├── iql │ │ ├── __init__.py │ │ ├── learning.py │ │ └── networks.py │ └── otil │ │ ├── __init__.py │ │ ├── adder.py │ │ ├── builder.py │ │ ├── rewarder.py │ │ └── rewarder_test.py ├── configs │ ├── otr_iql_adroit.py │ ├── otr_iql_antmaze.py │ └── otr_iql_mujoco.py ├── dataset_utils.py ├── evaluation.py ├── experiment_utils.py ├── train_offline.py └── wandb_logger.py ├── patches └── mujoco_py.patch ├── pyproject.toml ├── requirements.txt └── requirements ├── base.in └── dev.in /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/README.md -------------------------------------------------------------------------------- /images/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/images/overview.png -------------------------------------------------------------------------------- /otr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /otr/agents/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /otr/agents/iql/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/iql/__init__.py -------------------------------------------------------------------------------- /otr/agents/iql/learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/iql/learning.py -------------------------------------------------------------------------------- /otr/agents/iql/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/iql/networks.py -------------------------------------------------------------------------------- /otr/agents/otil/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/otil/__init__.py -------------------------------------------------------------------------------- /otr/agents/otil/adder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/otil/adder.py -------------------------------------------------------------------------------- /otr/agents/otil/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/otil/builder.py -------------------------------------------------------------------------------- /otr/agents/otil/rewarder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/otil/rewarder.py -------------------------------------------------------------------------------- /otr/agents/otil/rewarder_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/agents/otil/rewarder_test.py -------------------------------------------------------------------------------- /otr/configs/otr_iql_adroit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/configs/otr_iql_adroit.py -------------------------------------------------------------------------------- /otr/configs/otr_iql_antmaze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/configs/otr_iql_antmaze.py -------------------------------------------------------------------------------- /otr/configs/otr_iql_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/configs/otr_iql_mujoco.py -------------------------------------------------------------------------------- /otr/dataset_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/dataset_utils.py -------------------------------------------------------------------------------- /otr/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/evaluation.py -------------------------------------------------------------------------------- /otr/experiment_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/experiment_utils.py -------------------------------------------------------------------------------- /otr/train_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/train_offline.py -------------------------------------------------------------------------------- /otr/wandb_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/otr/wandb_logger.py -------------------------------------------------------------------------------- /patches/mujoco_py.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/patches/mujoco_py.patch -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/requirements.txt -------------------------------------------------------------------------------- /requirements/base.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/requirements/base.in -------------------------------------------------------------------------------- /requirements/dev.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ethanluoyc/optimal_transport_reward/HEAD/requirements/dev.in --------------------------------------------------------------------------------