├── .gitignore ├── .idea ├── .gitignore ├── OfflineRL.iml ├── inspectionProfiles │ └── profiles_settings.xml ├── modules.xml └── vcs.xml ├── LICENSE ├── README.md ├── d4rl_results ├── evaluate.ipynb ├── loader.py └── results.csv ├── environment.yml ├── environment_orig.yml ├── ex_01.py ├── ex_02.py ├── ex_03.py ├── ex_04.py ├── ex_05.py ├── ex_06.py ├── ex_101.py ├── ex_102.py ├── ex_103.py ├── ex_104.py ├── ex_105.py ├── ex_106.py └── source ├── agents ├── agent.py ├── bc.py ├── bcq.py ├── bve.py ├── cql.py ├── crr.py ├── dqn.py ├── mce.py ├── qrdqn.py ├── random.py └── rem.py ├── networks ├── actor.py └── critic.py ├── offline_ds_evaluation ├── datasets.py ├── evaluator.py ├── metrics_manager.py ├── networks.py ├── training.py └── utils.py ├── plotting ├── create_plots.py ├── join_csv_files.py ├── learning_curves.py ├── occupancy.ipynb ├── parallel_coordinates.py └── plot_ablations.py ├── train_offline.py ├── train_online.py └── utils ├── buffer.py ├── evaluation.py ├── utils.py └── wrappers.py /.gitignore: -------------------------------------------------------------------------------- 1 | /runs/ 2 | /data/ 3 | /results/ -------------------------------------------------------------------------------- /.idea/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/.idea/.gitignore -------------------------------------------------------------------------------- /.idea/OfflineRL.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/.idea/OfflineRL.iml -------------------------------------------------------------------------------- /.idea/inspectionProfiles/profiles_settings.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/.idea/inspectionProfiles/profiles_settings.xml -------------------------------------------------------------------------------- /.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/.idea/modules.xml -------------------------------------------------------------------------------- /.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/.idea/vcs.xml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/README.md -------------------------------------------------------------------------------- /d4rl_results/evaluate.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/d4rl_results/evaluate.ipynb -------------------------------------------------------------------------------- /d4rl_results/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/d4rl_results/loader.py -------------------------------------------------------------------------------- /d4rl_results/results.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/d4rl_results/results.csv -------------------------------------------------------------------------------- /environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/environment.yml -------------------------------------------------------------------------------- /environment_orig.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/environment_orig.yml -------------------------------------------------------------------------------- /ex_01.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_01.py -------------------------------------------------------------------------------- /ex_02.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_02.py -------------------------------------------------------------------------------- /ex_03.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_03.py -------------------------------------------------------------------------------- /ex_04.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_04.py -------------------------------------------------------------------------------- /ex_05.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_05.py -------------------------------------------------------------------------------- /ex_06.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_06.py -------------------------------------------------------------------------------- /ex_101.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_101.py -------------------------------------------------------------------------------- /ex_102.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_102.py -------------------------------------------------------------------------------- /ex_103.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_103.py -------------------------------------------------------------------------------- /ex_104.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_104.py -------------------------------------------------------------------------------- /ex_105.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_105.py -------------------------------------------------------------------------------- /ex_106.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/ex_106.py -------------------------------------------------------------------------------- /source/agents/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/agent.py -------------------------------------------------------------------------------- /source/agents/bc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/bc.py -------------------------------------------------------------------------------- /source/agents/bcq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/bcq.py -------------------------------------------------------------------------------- /source/agents/bve.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/bve.py -------------------------------------------------------------------------------- /source/agents/cql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/cql.py -------------------------------------------------------------------------------- /source/agents/crr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/crr.py -------------------------------------------------------------------------------- /source/agents/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/dqn.py -------------------------------------------------------------------------------- /source/agents/mce.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/mce.py -------------------------------------------------------------------------------- /source/agents/qrdqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/qrdqn.py -------------------------------------------------------------------------------- /source/agents/random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/random.py -------------------------------------------------------------------------------- /source/agents/rem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/agents/rem.py -------------------------------------------------------------------------------- /source/networks/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/networks/actor.py -------------------------------------------------------------------------------- /source/networks/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/networks/critic.py -------------------------------------------------------------------------------- /source/offline_ds_evaluation/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/offline_ds_evaluation/datasets.py -------------------------------------------------------------------------------- /source/offline_ds_evaluation/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/offline_ds_evaluation/evaluator.py -------------------------------------------------------------------------------- /source/offline_ds_evaluation/metrics_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/offline_ds_evaluation/metrics_manager.py -------------------------------------------------------------------------------- /source/offline_ds_evaluation/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/offline_ds_evaluation/networks.py -------------------------------------------------------------------------------- /source/offline_ds_evaluation/training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/offline_ds_evaluation/training.py -------------------------------------------------------------------------------- /source/offline_ds_evaluation/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/offline_ds_evaluation/utils.py -------------------------------------------------------------------------------- /source/plotting/create_plots.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/plotting/create_plots.py -------------------------------------------------------------------------------- /source/plotting/join_csv_files.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/plotting/join_csv_files.py -------------------------------------------------------------------------------- /source/plotting/learning_curves.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/plotting/learning_curves.py -------------------------------------------------------------------------------- /source/plotting/occupancy.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/plotting/occupancy.ipynb -------------------------------------------------------------------------------- /source/plotting/parallel_coordinates.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/plotting/parallel_coordinates.py -------------------------------------------------------------------------------- /source/plotting/plot_ablations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/plotting/plot_ablations.py -------------------------------------------------------------------------------- /source/train_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/train_offline.py -------------------------------------------------------------------------------- /source/train_online.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/train_online.py -------------------------------------------------------------------------------- /source/utils/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/utils/buffer.py -------------------------------------------------------------------------------- /source/utils/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/utils/evaluation.py -------------------------------------------------------------------------------- /source/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/utils/utils.py -------------------------------------------------------------------------------- /source/utils/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kschweig/OfflineRL/HEAD/source/utils/wrappers.py --------------------------------------------------------------------------------