├── .github └── workflows │ └── upload.yml ├── .gitignore ├── .pre-commit-config.yaml ├── LICENSE ├── README.md ├── assets └── banner.png ├── scripts ├── configs │ ├── bt_awac │ │ ├── adroit.yaml │ │ ├── gym.yaml │ │ ├── metaworld.yaml │ │ └── metaworld │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── bt_iql │ │ ├── adroit │ │ │ └── default.yaml │ │ ├── cliff │ │ │ └── default.yaml │ │ ├── gym │ │ │ └── default.yaml │ │ └── metaworld │ │ │ ├── default.yaml │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── cpl │ │ └── metaworld │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── cpl_kl │ │ └── metaworld │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── hpl │ │ ├── adroit.yaml │ │ ├── default.yaml │ │ ├── discrete │ │ │ ├── adroit.yaml │ │ │ ├── gym.yaml │ │ │ ├── metaworld.yaml │ │ │ └── mismatch │ │ │ │ ├── hopper-expert-medium.yaml │ │ │ │ ├── hopper-expert-replay.yaml │ │ │ │ ├── hopper-replay-expert.yaml │ │ │ │ ├── walker2d-expert-medium.yaml │ │ │ │ ├── walker2d-expert-replay.yaml │ │ │ │ └── walker2d-replay-expert.yaml │ │ ├── gym.yaml │ │ ├── metaworld.yaml │ │ ├── mismatch │ │ │ ├── bt_awac │ │ │ │ └── default.yaml │ │ │ ├── bt_iql │ │ │ │ ├── hopper-expert-medium.yaml │ │ │ │ ├── hopper-expert-replay.yaml │ │ │ │ ├── hopper-replay-expert.yaml │ │ │ │ ├── hopper-replay-medium.yaml │ │ │ │ ├── walker2d-expert-medium.yaml │ │ │ │ ├── walker2d-expert-replay.yaml │ │ │ │ ├── walker2d-replay-expert.yaml │ │ │ │ └── walker2d-replay-medium.yaml │ │ │ ├── hpl │ │ │ │ ├── hopper-expert-medium.yaml │ │ │ │ ├── hopper-expert-replay.yaml │ │ │ │ ├── hopper-replay-expert.yaml │ │ │ │ ├── hopper-replay-medium.yaml │ │ │ │ ├── walker2d-expert-medium.yaml │ │ │ │ ├── walker2d-expert-replay.yaml │ │ │ │ ├── walker2d-replay-expert.yaml │ │ │ │ └── walker2d-replay-medium.yaml │ │ │ ├── hpl_awac │ │ │ │ └── default.yaml │ │ │ ├── ipl_iql │ │ │ │ ├── hopper-expert-medium.yaml │ │ │ │ ├── hopper-expert-replay.yaml │ │ │ │ ├── hopper-replay-expert.yaml │ │ │ │ ├── hopper-replay-medium.yaml │ │ │ │ ├── walker2d-expert-medium.yaml │ │ │ │ ├── walker2d-expert-replay.yaml │ │ │ │ ├── walker2d-replay-expert.yaml │ │ │ │ └── walker2d-replay-medium.yaml │ │ │ └── pt_iql │ │ │ │ ├── hopper-expert-medium.yaml │ │ │ │ ├── hopper-expert-replay.yaml │ │ │ │ ├── hopper-replay-expert.yaml │ │ │ │ ├── hopper-replay-medium.yaml │ │ │ │ ├── walker2d-expert-medium.yaml │ │ │ │ ├── walker2d-expert-replay.yaml │ │ │ │ ├── walker2d-replay-expert.yaml │ │ │ │ └── walker2d-replay-medium.yaml │ │ ├── robomimic.yaml │ │ └── tuned │ │ │ ├── hopper-medium-expert-v2.yaml │ │ │ ├── hopper-medium-replay-v2.yaml │ │ │ ├── walker2d-medium-expert-v2.yaml │ │ │ └── walker2d-medium-replay-v2.yaml │ ├── hpl_awac │ │ └── discrete │ │ │ ├── adroit.yaml │ │ │ ├── gym.yaml │ │ │ └── metaworld.yaml │ ├── hpl_pomdp │ │ └── discrete │ │ │ └── gym.yaml │ ├── ipl_awac │ │ ├── adroit.yaml │ │ ├── gym.yaml │ │ ├── metaworld.yaml │ │ └── metaworld │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── ipl_iql │ │ ├── adroit │ │ │ └── default.yaml │ │ ├── gym │ │ │ └── default.yaml │ │ └── metaworld │ │ │ ├── default.yaml │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── mismatched_rpl │ │ └── default.yaml │ ├── oracle_awac │ │ └── metaworld │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── oracle_iql │ │ └── metaworld │ │ │ ├── state_dense.yaml │ │ │ └── state_sparse.yaml │ ├── pt_awac │ │ ├── adroit.yaml │ │ ├── gym.yaml │ │ └── metaworld.yaml │ ├── pt_iql │ │ ├── adroit.yaml │ │ ├── gym.yaml │ │ └── metaworld.yaml │ └── sft │ │ ├── adroit.yaml │ │ ├── gym.yaml │ │ ├── metaworld.yaml │ │ └── metaworld │ │ ├── state_dense.yaml │ │ └── state_sparse.yaml ├── generate_labeled_dataset.py ├── main.py └── rmb_main.py ├── setup.py └── wiserl ├── __init__.py ├── algorithm ├── __init__.py ├── base.py ├── bt │ ├── bt_awac.py │ └── bt_iql.py ├── cpl.py ├── cpl_kl.py ├── hpl │ ├── hpl.py │ ├── hpl_awac.py │ └── hpl_pomdp.py ├── ipl │ ├── ipl_awac.py │ └── ipl_iql.py ├── oracle_awac.py ├── oracle_iql.py ├── pt │ ├── pt_awac.py │ └── pt_iql.py ├── rpl │ └── rpl_iql.py └── sft.py ├── dataset ├── __init__.py ├── cliff_walking_dataset.py ├── d4rl_dataset.py ├── ipl_dataset.py ├── metaworld_dataset.py ├── metaworld_offline_dataset.py ├── mismatched_mujoco_dataset.py ├── replay_buffer.py └── robomimic_dataset.py ├── env ├── __init__.py ├── base.py ├── cliffwalking_env.py ├── metaworld_env.py ├── metaworld_env_bkp.py └── robomimic_env.py ├── eval ├── __init__.py ├── cliff.py ├── offline.py └── reward_model.py ├── module ├── __init__.py ├── actor.py ├── critic.py ├── encoder_decoder.py └── net │ ├── __init__.py │ ├── attention │ ├── __init__.py │ ├── base.py │ ├── dt.py │ ├── gpt2.py │ ├── positional_encoding.py │ ├── preference_transformer.py │ └── transformer.py │ ├── basic.py │ └── mlp.py ├── processor ├── __init__.py ├── base.py └── image_augmentation.py ├── trainer ├── offline_trainer.py └── rmb_offline_trainer.py └── utils ├── __init__.py ├── distributions.py ├── functional.py ├── misc.py ├── optim.py └── utils.py /.github/workflows/upload.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/.github/workflows/upload.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/.gitignore -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/README.md -------------------------------------------------------------------------------- /assets/banner.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/assets/banner.png -------------------------------------------------------------------------------- /scripts/configs/bt_awac/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_awac/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_awac/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_awac/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_awac/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_awac/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_awac/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_awac/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_awac/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_awac/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_iql/adroit/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_iql/adroit/default.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_iql/cliff/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_iql/cliff/default.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_iql/gym/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_iql/gym/default.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_iql/metaworld/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_iql/metaworld/default.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_iql/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_iql/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/bt_iql/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/bt_iql/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/cpl/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/cpl/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/cpl/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/cpl/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/cpl_kl/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/cpl_kl/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/cpl_kl/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/cpl_kl/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/default.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/mismatch/hopper-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/mismatch/hopper-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/mismatch/hopper-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/mismatch/hopper-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/mismatch/hopper-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/mismatch/hopper-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/mismatch/walker2d-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/mismatch/walker2d-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/mismatch/walker2d-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/mismatch/walker2d-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/discrete/mismatch/walker2d-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/discrete/mismatch/walker2d-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_awac/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_awac/default.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/hopper-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/hopper-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/hopper-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/hopper-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/hopper-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/hopper-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/hopper-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/hopper-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/walker2d-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/walker2d-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/walker2d-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/walker2d-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/walker2d-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/walker2d-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/bt_iql/walker2d-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/bt_iql/walker2d-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/hopper-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/hopper-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/hopper-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/hopper-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/hopper-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/hopper-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/hopper-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/hopper-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/walker2d-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/walker2d-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/walker2d-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/walker2d-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/walker2d-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/walker2d-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl/walker2d-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl/walker2d-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/hpl_awac/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/hpl_awac/default.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/hopper-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/hopper-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/hopper-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/hopper-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/hopper-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/hopper-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/hopper-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/hopper-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/walker2d-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/walker2d-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/walker2d-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/walker2d-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/walker2d-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/walker2d-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/ipl_iql/walker2d-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/ipl_iql/walker2d-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/hopper-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/hopper-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/hopper-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/hopper-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/hopper-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/hopper-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/hopper-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/hopper-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/walker2d-expert-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/walker2d-expert-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/walker2d-expert-replay.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/walker2d-expert-replay.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/walker2d-replay-expert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/walker2d-replay-expert.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/mismatch/pt_iql/walker2d-replay-medium.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/mismatch/pt_iql/walker2d-replay-medium.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/robomimic.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/robomimic.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/tuned/hopper-medium-expert-v2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/tuned/hopper-medium-expert-v2.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/tuned/hopper-medium-replay-v2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/tuned/hopper-medium-replay-v2.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/tuned/walker2d-medium-expert-v2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/tuned/walker2d-medium-expert-v2.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl/tuned/walker2d-medium-replay-v2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl/tuned/walker2d-medium-replay-v2.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl_awac/discrete/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl_awac/discrete/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl_awac/discrete/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl_awac/discrete/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl_awac/discrete/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl_awac/discrete/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/hpl_pomdp/discrete/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/hpl_pomdp/discrete/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_awac/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_awac/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_awac/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_awac/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_awac/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_awac/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_awac/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_awac/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_awac/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_awac/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_iql/adroit/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_iql/adroit/default.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_iql/gym/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_iql/gym/default.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_iql/metaworld/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_iql/metaworld/default.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_iql/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_iql/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/ipl_iql/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/ipl_iql/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/mismatched_rpl/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/mismatched_rpl/default.yaml -------------------------------------------------------------------------------- /scripts/configs/oracle_awac/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/oracle_awac/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/oracle_awac/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/oracle_awac/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/oracle_iql/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/oracle_iql/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/oracle_iql/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/oracle_iql/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/configs/pt_awac/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/pt_awac/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/pt_awac/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/pt_awac/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/pt_awac/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/pt_awac/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/pt_iql/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/pt_iql/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/pt_iql/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/pt_iql/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/pt_iql/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/pt_iql/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/sft/adroit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/sft/adroit.yaml -------------------------------------------------------------------------------- /scripts/configs/sft/gym.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/sft/gym.yaml -------------------------------------------------------------------------------- /scripts/configs/sft/metaworld.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/sft/metaworld.yaml -------------------------------------------------------------------------------- /scripts/configs/sft/metaworld/state_dense.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/sft/metaworld/state_dense.yaml -------------------------------------------------------------------------------- /scripts/configs/sft/metaworld/state_sparse.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/configs/sft/metaworld/state_sparse.yaml -------------------------------------------------------------------------------- /scripts/generate_labeled_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/generate_labeled_dataset.py -------------------------------------------------------------------------------- /scripts/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/main.py -------------------------------------------------------------------------------- /scripts/rmb_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/scripts/rmb_main.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/setup.py -------------------------------------------------------------------------------- /wiserl/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | __version__ = "0.0.2" 3 | -------------------------------------------------------------------------------- /wiserl/algorithm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/__init__.py -------------------------------------------------------------------------------- /wiserl/algorithm/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/base.py -------------------------------------------------------------------------------- /wiserl/algorithm/bt/bt_awac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/bt/bt_awac.py -------------------------------------------------------------------------------- /wiserl/algorithm/bt/bt_iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/bt/bt_iql.py -------------------------------------------------------------------------------- /wiserl/algorithm/cpl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/cpl.py -------------------------------------------------------------------------------- /wiserl/algorithm/cpl_kl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/cpl_kl.py -------------------------------------------------------------------------------- /wiserl/algorithm/hpl/hpl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/hpl/hpl.py -------------------------------------------------------------------------------- /wiserl/algorithm/hpl/hpl_awac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/hpl/hpl_awac.py -------------------------------------------------------------------------------- /wiserl/algorithm/hpl/hpl_pomdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/hpl/hpl_pomdp.py -------------------------------------------------------------------------------- /wiserl/algorithm/ipl/ipl_awac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/ipl/ipl_awac.py -------------------------------------------------------------------------------- /wiserl/algorithm/ipl/ipl_iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/ipl/ipl_iql.py -------------------------------------------------------------------------------- /wiserl/algorithm/oracle_awac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/oracle_awac.py -------------------------------------------------------------------------------- /wiserl/algorithm/oracle_iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/oracle_iql.py -------------------------------------------------------------------------------- /wiserl/algorithm/pt/pt_awac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/pt/pt_awac.py -------------------------------------------------------------------------------- /wiserl/algorithm/pt/pt_iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/pt/pt_iql.py -------------------------------------------------------------------------------- /wiserl/algorithm/rpl/rpl_iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/rpl/rpl_iql.py -------------------------------------------------------------------------------- /wiserl/algorithm/sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/algorithm/sft.py -------------------------------------------------------------------------------- /wiserl/dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/__init__.py -------------------------------------------------------------------------------- /wiserl/dataset/cliff_walking_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/cliff_walking_dataset.py -------------------------------------------------------------------------------- /wiserl/dataset/d4rl_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/d4rl_dataset.py -------------------------------------------------------------------------------- /wiserl/dataset/ipl_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/ipl_dataset.py -------------------------------------------------------------------------------- /wiserl/dataset/metaworld_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/metaworld_dataset.py -------------------------------------------------------------------------------- /wiserl/dataset/metaworld_offline_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/metaworld_offline_dataset.py -------------------------------------------------------------------------------- /wiserl/dataset/mismatched_mujoco_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/mismatched_mujoco_dataset.py -------------------------------------------------------------------------------- /wiserl/dataset/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/replay_buffer.py -------------------------------------------------------------------------------- /wiserl/dataset/robomimic_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/dataset/robomimic_dataset.py -------------------------------------------------------------------------------- /wiserl/env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/env/__init__.py -------------------------------------------------------------------------------- /wiserl/env/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/env/base.py -------------------------------------------------------------------------------- /wiserl/env/cliffwalking_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/env/cliffwalking_env.py -------------------------------------------------------------------------------- /wiserl/env/metaworld_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/env/metaworld_env.py -------------------------------------------------------------------------------- /wiserl/env/metaworld_env_bkp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/env/metaworld_env_bkp.py -------------------------------------------------------------------------------- /wiserl/env/robomimic_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/env/robomimic_env.py -------------------------------------------------------------------------------- /wiserl/eval/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/eval/__init__.py -------------------------------------------------------------------------------- /wiserl/eval/cliff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/eval/cliff.py -------------------------------------------------------------------------------- /wiserl/eval/offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/eval/offline.py -------------------------------------------------------------------------------- /wiserl/eval/reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/eval/reward_model.py -------------------------------------------------------------------------------- /wiserl/module/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/__init__.py -------------------------------------------------------------------------------- /wiserl/module/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/actor.py -------------------------------------------------------------------------------- /wiserl/module/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/critic.py -------------------------------------------------------------------------------- /wiserl/module/encoder_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/encoder_decoder.py -------------------------------------------------------------------------------- /wiserl/module/net/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /wiserl/module/net/attention/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /wiserl/module/net/attention/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/attention/base.py -------------------------------------------------------------------------------- /wiserl/module/net/attention/dt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/attention/dt.py -------------------------------------------------------------------------------- /wiserl/module/net/attention/gpt2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/attention/gpt2.py -------------------------------------------------------------------------------- /wiserl/module/net/attention/positional_encoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/attention/positional_encoding.py -------------------------------------------------------------------------------- /wiserl/module/net/attention/preference_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/attention/preference_transformer.py -------------------------------------------------------------------------------- /wiserl/module/net/attention/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/attention/transformer.py -------------------------------------------------------------------------------- /wiserl/module/net/basic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/basic.py -------------------------------------------------------------------------------- /wiserl/module/net/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/module/net/mlp.py -------------------------------------------------------------------------------- /wiserl/processor/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/processor/__init__.py -------------------------------------------------------------------------------- /wiserl/processor/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/processor/base.py -------------------------------------------------------------------------------- /wiserl/processor/image_augmentation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/processor/image_augmentation.py -------------------------------------------------------------------------------- /wiserl/trainer/offline_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/trainer/offline_trainer.py -------------------------------------------------------------------------------- /wiserl/trainer/rmb_offline_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/trainer/rmb_offline_trainer.py -------------------------------------------------------------------------------- /wiserl/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /wiserl/utils/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/utils/distributions.py -------------------------------------------------------------------------------- /wiserl/utils/functional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/utils/functional.py -------------------------------------------------------------------------------- /wiserl/utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/utils/misc.py -------------------------------------------------------------------------------- /wiserl/utils/optim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/utils/optim.py -------------------------------------------------------------------------------- /wiserl/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/typoverflow/WiseRL/HEAD/wiserl/utils/utils.py --------------------------------------------------------------------------------