├── .gitattributes ├── .gitignore ├── LICENSE ├── README.md ├── download_data.sh ├── examples └── 01_LSIQ │ ├── 01_episode │ ├── launcher.py │ └── lsiq_experiments.py │ ├── 02_episode_5 │ ├── launcher.py │ └── lsiq_experiments.py │ ├── 03_episode_10 │ ├── launcher.py │ └── lsiq_experiments.py │ └── 04_episode_25 │ ├── launcher.py │ └── lsiq_experiments.py ├── img └── Divergence_Minimization.gif ├── imitation_lib ├── __init__.py ├── imitation │ ├── __init__.py │ ├── gail_TRPO.py │ ├── iq_sac.py │ ├── iqfo_orig.py │ ├── iqfo_sac.py │ ├── lsiq.py │ ├── lsiq_h.py │ ├── lsiq_hc.py │ ├── lsiqfo.py │ ├── lsiqfo_h.py │ ├── lsiqfo_hc.py │ ├── offline │ │ ├── __init__.py │ │ ├── behavioral_cloning.py │ │ ├── iq_offline.py │ │ ├── lsiq_offline.py │ │ └── lsiq_offline_dm.py │ ├── sqil_sac.py │ └── vail_TRPO.py └── utils │ ├── __init__.py │ ├── action_models.py │ ├── distributions.py │ ├── math.py │ ├── networks.py │ ├── preprocessor.py │ └── training.py └── setup.py /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/.gitattributes -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/README.md -------------------------------------------------------------------------------- /download_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/download_data.sh -------------------------------------------------------------------------------- /examples/01_LSIQ/01_episode/launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/01_episode/launcher.py -------------------------------------------------------------------------------- /examples/01_LSIQ/01_episode/lsiq_experiments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/01_episode/lsiq_experiments.py -------------------------------------------------------------------------------- /examples/01_LSIQ/02_episode_5/launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/02_episode_5/launcher.py -------------------------------------------------------------------------------- /examples/01_LSIQ/02_episode_5/lsiq_experiments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/02_episode_5/lsiq_experiments.py -------------------------------------------------------------------------------- /examples/01_LSIQ/03_episode_10/launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/03_episode_10/launcher.py -------------------------------------------------------------------------------- /examples/01_LSIQ/03_episode_10/lsiq_experiments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/03_episode_10/lsiq_experiments.py -------------------------------------------------------------------------------- /examples/01_LSIQ/04_episode_25/launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/04_episode_25/launcher.py -------------------------------------------------------------------------------- /examples/01_LSIQ/04_episode_25/lsiq_experiments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/examples/01_LSIQ/04_episode_25/lsiq_experiments.py -------------------------------------------------------------------------------- /img/Divergence_Minimization.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/img/Divergence_Minimization.gif -------------------------------------------------------------------------------- /imitation_lib/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /imitation_lib/imitation/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/__init__.py -------------------------------------------------------------------------------- /imitation_lib/imitation/gail_TRPO.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/gail_TRPO.py -------------------------------------------------------------------------------- /imitation_lib/imitation/iq_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/iq_sac.py -------------------------------------------------------------------------------- /imitation_lib/imitation/iqfo_orig.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/iqfo_orig.py -------------------------------------------------------------------------------- /imitation_lib/imitation/iqfo_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/iqfo_sac.py -------------------------------------------------------------------------------- /imitation_lib/imitation/lsiq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/lsiq.py -------------------------------------------------------------------------------- /imitation_lib/imitation/lsiq_h.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/lsiq_h.py -------------------------------------------------------------------------------- /imitation_lib/imitation/lsiq_hc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/lsiq_hc.py -------------------------------------------------------------------------------- /imitation_lib/imitation/lsiqfo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/lsiqfo.py -------------------------------------------------------------------------------- /imitation_lib/imitation/lsiqfo_h.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/lsiqfo_h.py -------------------------------------------------------------------------------- /imitation_lib/imitation/lsiqfo_hc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/lsiqfo_hc.py -------------------------------------------------------------------------------- /imitation_lib/imitation/offline/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/offline/__init__.py -------------------------------------------------------------------------------- /imitation_lib/imitation/offline/behavioral_cloning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/offline/behavioral_cloning.py -------------------------------------------------------------------------------- /imitation_lib/imitation/offline/iq_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/offline/iq_offline.py -------------------------------------------------------------------------------- /imitation_lib/imitation/offline/lsiq_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/offline/lsiq_offline.py -------------------------------------------------------------------------------- /imitation_lib/imitation/offline/lsiq_offline_dm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/offline/lsiq_offline_dm.py -------------------------------------------------------------------------------- /imitation_lib/imitation/sqil_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/sqil_sac.py -------------------------------------------------------------------------------- /imitation_lib/imitation/vail_TRPO.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/imitation/vail_TRPO.py -------------------------------------------------------------------------------- /imitation_lib/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/utils/__init__.py -------------------------------------------------------------------------------- /imitation_lib/utils/action_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/utils/action_models.py -------------------------------------------------------------------------------- /imitation_lib/utils/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/utils/distributions.py -------------------------------------------------------------------------------- /imitation_lib/utils/math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/utils/math.py -------------------------------------------------------------------------------- /imitation_lib/utils/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/utils/networks.py -------------------------------------------------------------------------------- /imitation_lib/utils/preprocessor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/utils/preprocessor.py -------------------------------------------------------------------------------- /imitation_lib/utils/training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/imitation_lib/utils/training.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/robfiras/ls-iq/HEAD/setup.py --------------------------------------------------------------------------------