├── LICENSE ├── README.md ├── ant_data_collect.py ├── ant_irl.py ├── ant_transfer_disabled.py ├── base.py ├── gaussian_mlp_inverse_policy.py └── inverse_rl ├── algos ├── batch_polopt.py ├── irl_batch_polopt.py ├── irl_npo.py ├── irl_trpo.py ├── npo.py ├── penalty_lbfgs_optimizer.py └── trpo.py ├── envs ├── __init__.py ├── ant_env.py ├── ant_maze.py ├── assets │ └── twod_maze.xml ├── dynamic_mjc │ ├── mjc_models.py │ └── model_builder.py ├── env_utils.py ├── point_maze_env.py ├── pusher_env.py ├── swimmer_env.py ├── twod_maze.py ├── twod_mjc_env.py ├── utils.py └── visual_pointmass.py ├── models ├── architectures.py ├── eairl.py ├── empowerment.py ├── fusion_manager.py ├── imitation_learning.py ├── qvar.py └── tf_util.py └── utils ├── __init__.py ├── general.py ├── hyper_sweep.py ├── hyperparametrized.py ├── log_utils.py └── math_utils.py /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/README.md -------------------------------------------------------------------------------- /ant_data_collect.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/ant_data_collect.py -------------------------------------------------------------------------------- /ant_irl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/ant_irl.py -------------------------------------------------------------------------------- /ant_transfer_disabled.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/ant_transfer_disabled.py -------------------------------------------------------------------------------- /base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/base.py -------------------------------------------------------------------------------- /gaussian_mlp_inverse_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/gaussian_mlp_inverse_policy.py -------------------------------------------------------------------------------- /inverse_rl/algos/batch_polopt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/algos/batch_polopt.py -------------------------------------------------------------------------------- /inverse_rl/algos/irl_batch_polopt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/algos/irl_batch_polopt.py -------------------------------------------------------------------------------- /inverse_rl/algos/irl_npo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/algos/irl_npo.py -------------------------------------------------------------------------------- /inverse_rl/algos/irl_trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/algos/irl_trpo.py -------------------------------------------------------------------------------- /inverse_rl/algos/npo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/algos/npo.py -------------------------------------------------------------------------------- /inverse_rl/algos/penalty_lbfgs_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/algos/penalty_lbfgs_optimizer.py -------------------------------------------------------------------------------- /inverse_rl/algos/trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/algos/trpo.py -------------------------------------------------------------------------------- /inverse_rl/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/__init__.py -------------------------------------------------------------------------------- /inverse_rl/envs/ant_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/ant_env.py -------------------------------------------------------------------------------- /inverse_rl/envs/ant_maze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/ant_maze.py -------------------------------------------------------------------------------- /inverse_rl/envs/assets/twod_maze.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/assets/twod_maze.xml -------------------------------------------------------------------------------- /inverse_rl/envs/dynamic_mjc/mjc_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/dynamic_mjc/mjc_models.py -------------------------------------------------------------------------------- /inverse_rl/envs/dynamic_mjc/model_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/dynamic_mjc/model_builder.py -------------------------------------------------------------------------------- /inverse_rl/envs/env_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/env_utils.py -------------------------------------------------------------------------------- /inverse_rl/envs/point_maze_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/point_maze_env.py -------------------------------------------------------------------------------- /inverse_rl/envs/pusher_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/pusher_env.py -------------------------------------------------------------------------------- /inverse_rl/envs/swimmer_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/swimmer_env.py -------------------------------------------------------------------------------- /inverse_rl/envs/twod_maze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/twod_maze.py -------------------------------------------------------------------------------- /inverse_rl/envs/twod_mjc_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/twod_mjc_env.py -------------------------------------------------------------------------------- /inverse_rl/envs/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/utils.py -------------------------------------------------------------------------------- /inverse_rl/envs/visual_pointmass.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/envs/visual_pointmass.py -------------------------------------------------------------------------------- /inverse_rl/models/architectures.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/models/architectures.py -------------------------------------------------------------------------------- /inverse_rl/models/eairl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/models/eairl.py -------------------------------------------------------------------------------- /inverse_rl/models/empowerment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/models/empowerment.py -------------------------------------------------------------------------------- /inverse_rl/models/fusion_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/models/fusion_manager.py -------------------------------------------------------------------------------- /inverse_rl/models/imitation_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/models/imitation_learning.py -------------------------------------------------------------------------------- /inverse_rl/models/qvar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/models/qvar.py -------------------------------------------------------------------------------- /inverse_rl/models/tf_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/models/tf_util.py -------------------------------------------------------------------------------- /inverse_rl/utils/__init__.py: -------------------------------------------------------------------------------- 1 | from inverse_rl.utils.general import * 2 | -------------------------------------------------------------------------------- /inverse_rl/utils/general.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/utils/general.py -------------------------------------------------------------------------------- /inverse_rl/utils/hyper_sweep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/utils/hyper_sweep.py -------------------------------------------------------------------------------- /inverse_rl/utils/hyperparametrized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/utils/hyperparametrized.py -------------------------------------------------------------------------------- /inverse_rl/utils/log_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/utils/log_utils.py -------------------------------------------------------------------------------- /inverse_rl/utils/math_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ahq1993/inverse_rl/HEAD/inverse_rl/utils/math_utils.py --------------------------------------------------------------------------------