├── .dockerignore ├── .github ├── ISSUE_TEMPLATE │ ├── bug_report.yml │ ├── custom_env.yml │ ├── documentation.yml │ ├── feature_request.yml │ └── question.yml ├── PULL_REQUEST_TEMPLATE.md └── workflows │ └── ci.yml ├── .gitignore ├── .readthedocs.yml ├── CITATION.bib ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── Dockerfile ├── LICENSE ├── Makefile ├── NOTICE ├── README.md ├── docs ├── Makefile ├── README.md ├── _static │ ├── css │ │ └── baselines_theme.css │ └── img │ │ ├── Tensorboard_example.png │ │ ├── breakout.gif │ │ ├── colab-badge.svg │ │ ├── colab.svg │ │ ├── logo.png │ │ ├── mistake.png │ │ ├── net_arch.png │ │ ├── sb3_loop.png │ │ ├── sb3_policy.png │ │ ├── split_graph.png │ │ └── try_it.png ├── common │ ├── atari_wrappers.rst │ ├── distributions.rst │ ├── env_checker.rst │ ├── env_util.rst │ ├── envs.rst │ ├── evaluation.rst │ ├── logger.rst │ ├── monitor.rst │ ├── noise.rst │ └── utils.rst ├── conda_env.yml ├── conf.py ├── guide │ ├── algos.rst │ ├── callbacks.rst │ ├── checking_nan.rst │ ├── custom_env.rst │ ├── custom_policy.rst │ ├── developer.rst │ ├── examples.rst │ ├── export.rst │ ├── imitation.rst │ ├── install.rst │ ├── integrations.rst │ ├── migration.rst │ ├── plotting.rst │ ├── quickstart.rst │ ├── rl.rst │ ├── rl_tips.rst │ ├── rl_zoo.rst │ ├── save_format.rst │ ├── sb3_contrib.rst │ ├── sbx.rst │ ├── tensorboard.rst │ └── vec_envs.rst ├── index.rst ├── make.bat ├── misc │ ├── changelog.rst │ └── projects.rst ├── modules │ ├── a2c.rst │ ├── base.rst │ ├── ddpg.rst │ ├── dqn.rst │ ├── her.rst │ ├── ppo.rst │ ├── sac.rst │ └── td3.rst └── spelling_wordlist.txt ├── pyproject.toml ├── scripts ├── build_docker.sh ├── run_docker_cpu.sh ├── run_docker_gpu.sh └── run_tests.sh ├── setup.py ├── stable_baselines3 ├── __init__.py ├── a2c │ ├── __init__.py │ ├── a2c.py │ └── policies.py ├── common │ ├── __init__.py │ ├── atari_wrappers.py │ ├── base_class.py │ ├── buffers.py │ ├── callbacks.py │ ├── distributions.py │ ├── env_checker.py │ ├── env_util.py │ ├── envs │ │ ├── __init__.py │ │ ├── bit_flipping_env.py │ │ ├── identity_env.py │ │ └── multi_input_envs.py │ ├── evaluation.py │ ├── logger.py │ ├── monitor.py │ ├── noise.py │ ├── off_policy_algorithm.py │ ├── on_policy_algorithm.py │ ├── policies.py │ ├── preprocessing.py │ ├── results_plotter.py │ ├── running_mean_std.py │ ├── save_util.py │ ├── sb2_compat │ │ ├── __init__.py │ │ └── rmsprop_tf_like.py │ ├── torch_layers.py │ ├── type_aliases.py │ ├── utils.py │ └── vec_env │ │ ├── __init__.py │ │ ├── base_vec_env.py │ │ ├── dummy_vec_env.py │ │ ├── patch_gym.py │ │ ├── stacked_observations.py │ │ ├── subproc_vec_env.py │ │ ├── util.py │ │ ├── vec_check_nan.py │ │ ├── vec_extract_dict_obs.py │ │ ├── vec_frame_stack.py │ │ ├── vec_monitor.py │ │ ├── vec_normalize.py │ │ ├── vec_transpose.py │ │ └── vec_video_recorder.py ├── ddpg │ ├── __init__.py │ ├── ddpg.py │ └── policies.py ├── dqn │ ├── __init__.py │ ├── dqn.py │ └── policies.py ├── her │ ├── __init__.py │ ├── goal_selection_strategy.py │ └── her_replay_buffer.py ├── ppo │ ├── __init__.py │ ├── policies.py │ └── ppo.py ├── py.typed ├── sac │ ├── __init__.py │ ├── policies.py │ └── sac.py ├── td3 │ ├── __init__.py │ ├── policies.py │ └── td3.py └── version.txt └── tests ├── __init__.py ├── test_buffers.py ├── test_callbacks.py ├── test_cnn.py ├── test_custom_policy.py ├── test_deterministic.py ├── test_dict_env.py ├── test_distributions.py ├── test_env_checker.py ├── test_envs.py ├── test_gae.py ├── test_her.py ├── test_identity.py ├── test_logger.py ├── test_monitor.py ├── test_n_step_replay.py ├── test_predict.py ├── test_preprocessing.py ├── test_run.py ├── test_save_load.py ├── test_sde.py ├── test_spaces.py ├── test_tensorboard.py ├── test_train_eval_mode.py ├── test_utils.py ├── test_vec_check_nan.py ├── test_vec_envs.py ├── test_vec_extract_dict_obs.py ├── test_vec_monitor.py ├── test_vec_normalize.py └── test_vec_stacked_obs.py /.dockerignore: -------------------------------------------------------------------------------- 1 | .gitignore -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/bug_report.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.github/ISSUE_TEMPLATE/bug_report.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/custom_env.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.github/ISSUE_TEMPLATE/custom_env.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/documentation.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.github/ISSUE_TEMPLATE/documentation.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/feature_request.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.github/ISSUE_TEMPLATE/feature_request.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/question.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.github/ISSUE_TEMPLATE/question.yml -------------------------------------------------------------------------------- /.github/PULL_REQUEST_TEMPLATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.github/PULL_REQUEST_TEMPLATE.md -------------------------------------------------------------------------------- /.github/workflows/ci.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.github/workflows/ci.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.gitignore -------------------------------------------------------------------------------- /.readthedocs.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/.readthedocs.yml -------------------------------------------------------------------------------- /CITATION.bib: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/CITATION.bib -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/Dockerfile -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/Makefile -------------------------------------------------------------------------------- /NOTICE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/NOTICE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/README.md -------------------------------------------------------------------------------- /docs/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/Makefile -------------------------------------------------------------------------------- /docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/README.md -------------------------------------------------------------------------------- /docs/_static/css/baselines_theme.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/css/baselines_theme.css -------------------------------------------------------------------------------- /docs/_static/img/Tensorboard_example.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/Tensorboard_example.png -------------------------------------------------------------------------------- /docs/_static/img/breakout.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/breakout.gif -------------------------------------------------------------------------------- /docs/_static/img/colab-badge.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/colab-badge.svg -------------------------------------------------------------------------------- /docs/_static/img/colab.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/colab.svg -------------------------------------------------------------------------------- /docs/_static/img/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/logo.png -------------------------------------------------------------------------------- /docs/_static/img/mistake.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/mistake.png -------------------------------------------------------------------------------- /docs/_static/img/net_arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/net_arch.png -------------------------------------------------------------------------------- /docs/_static/img/sb3_loop.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/sb3_loop.png -------------------------------------------------------------------------------- /docs/_static/img/sb3_policy.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/sb3_policy.png -------------------------------------------------------------------------------- /docs/_static/img/split_graph.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/split_graph.png -------------------------------------------------------------------------------- /docs/_static/img/try_it.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/_static/img/try_it.png -------------------------------------------------------------------------------- /docs/common/atari_wrappers.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/atari_wrappers.rst -------------------------------------------------------------------------------- /docs/common/distributions.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/distributions.rst -------------------------------------------------------------------------------- /docs/common/env_checker.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/env_checker.rst -------------------------------------------------------------------------------- /docs/common/env_util.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/env_util.rst -------------------------------------------------------------------------------- /docs/common/envs.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/envs.rst -------------------------------------------------------------------------------- /docs/common/evaluation.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/evaluation.rst -------------------------------------------------------------------------------- /docs/common/logger.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/logger.rst -------------------------------------------------------------------------------- /docs/common/monitor.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/monitor.rst -------------------------------------------------------------------------------- /docs/common/noise.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/noise.rst -------------------------------------------------------------------------------- /docs/common/utils.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/common/utils.rst -------------------------------------------------------------------------------- /docs/conda_env.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/conda_env.yml -------------------------------------------------------------------------------- /docs/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/conf.py -------------------------------------------------------------------------------- /docs/guide/algos.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/algos.rst -------------------------------------------------------------------------------- /docs/guide/callbacks.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/callbacks.rst -------------------------------------------------------------------------------- /docs/guide/checking_nan.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/checking_nan.rst -------------------------------------------------------------------------------- /docs/guide/custom_env.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/custom_env.rst -------------------------------------------------------------------------------- /docs/guide/custom_policy.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/custom_policy.rst -------------------------------------------------------------------------------- /docs/guide/developer.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/developer.rst -------------------------------------------------------------------------------- /docs/guide/examples.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/examples.rst -------------------------------------------------------------------------------- /docs/guide/export.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/export.rst -------------------------------------------------------------------------------- /docs/guide/imitation.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/imitation.rst -------------------------------------------------------------------------------- /docs/guide/install.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/install.rst -------------------------------------------------------------------------------- /docs/guide/integrations.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/integrations.rst -------------------------------------------------------------------------------- /docs/guide/migration.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/migration.rst -------------------------------------------------------------------------------- /docs/guide/plotting.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/plotting.rst -------------------------------------------------------------------------------- /docs/guide/quickstart.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/quickstart.rst -------------------------------------------------------------------------------- /docs/guide/rl.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/rl.rst -------------------------------------------------------------------------------- /docs/guide/rl_tips.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/rl_tips.rst -------------------------------------------------------------------------------- /docs/guide/rl_zoo.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/rl_zoo.rst -------------------------------------------------------------------------------- /docs/guide/save_format.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/save_format.rst -------------------------------------------------------------------------------- /docs/guide/sb3_contrib.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/sb3_contrib.rst -------------------------------------------------------------------------------- /docs/guide/sbx.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/sbx.rst -------------------------------------------------------------------------------- /docs/guide/tensorboard.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/tensorboard.rst -------------------------------------------------------------------------------- /docs/guide/vec_envs.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/guide/vec_envs.rst -------------------------------------------------------------------------------- /docs/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/index.rst -------------------------------------------------------------------------------- /docs/make.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/make.bat -------------------------------------------------------------------------------- /docs/misc/changelog.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/misc/changelog.rst -------------------------------------------------------------------------------- /docs/misc/projects.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/misc/projects.rst -------------------------------------------------------------------------------- /docs/modules/a2c.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/a2c.rst -------------------------------------------------------------------------------- /docs/modules/base.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/base.rst -------------------------------------------------------------------------------- /docs/modules/ddpg.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/ddpg.rst -------------------------------------------------------------------------------- /docs/modules/dqn.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/dqn.rst -------------------------------------------------------------------------------- /docs/modules/her.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/her.rst -------------------------------------------------------------------------------- /docs/modules/ppo.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/ppo.rst -------------------------------------------------------------------------------- /docs/modules/sac.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/sac.rst -------------------------------------------------------------------------------- /docs/modules/td3.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/modules/td3.rst -------------------------------------------------------------------------------- /docs/spelling_wordlist.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/docs/spelling_wordlist.txt -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/pyproject.toml -------------------------------------------------------------------------------- /scripts/build_docker.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/scripts/build_docker.sh -------------------------------------------------------------------------------- /scripts/run_docker_cpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/scripts/run_docker_cpu.sh -------------------------------------------------------------------------------- /scripts/run_docker_gpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/scripts/run_docker_gpu.sh -------------------------------------------------------------------------------- /scripts/run_tests.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/scripts/run_tests.sh -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/setup.py -------------------------------------------------------------------------------- /stable_baselines3/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/a2c/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/a2c/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/a2c/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/a2c/a2c.py -------------------------------------------------------------------------------- /stable_baselines3/a2c/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/a2c/policies.py -------------------------------------------------------------------------------- /stable_baselines3/common/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /stable_baselines3/common/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/atari_wrappers.py -------------------------------------------------------------------------------- /stable_baselines3/common/base_class.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/base_class.py -------------------------------------------------------------------------------- /stable_baselines3/common/buffers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/buffers.py -------------------------------------------------------------------------------- /stable_baselines3/common/callbacks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/callbacks.py -------------------------------------------------------------------------------- /stable_baselines3/common/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/distributions.py -------------------------------------------------------------------------------- /stable_baselines3/common/env_checker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/env_checker.py -------------------------------------------------------------------------------- /stable_baselines3/common/env_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/env_util.py -------------------------------------------------------------------------------- /stable_baselines3/common/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/envs/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/common/envs/bit_flipping_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/envs/bit_flipping_env.py -------------------------------------------------------------------------------- /stable_baselines3/common/envs/identity_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/envs/identity_env.py -------------------------------------------------------------------------------- /stable_baselines3/common/envs/multi_input_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/envs/multi_input_envs.py -------------------------------------------------------------------------------- /stable_baselines3/common/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/evaluation.py -------------------------------------------------------------------------------- /stable_baselines3/common/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/logger.py -------------------------------------------------------------------------------- /stable_baselines3/common/monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/monitor.py -------------------------------------------------------------------------------- /stable_baselines3/common/noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/noise.py -------------------------------------------------------------------------------- /stable_baselines3/common/off_policy_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/off_policy_algorithm.py -------------------------------------------------------------------------------- /stable_baselines3/common/on_policy_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/on_policy_algorithm.py -------------------------------------------------------------------------------- /stable_baselines3/common/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/policies.py -------------------------------------------------------------------------------- /stable_baselines3/common/preprocessing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/preprocessing.py -------------------------------------------------------------------------------- /stable_baselines3/common/results_plotter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/results_plotter.py -------------------------------------------------------------------------------- /stable_baselines3/common/running_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/running_mean_std.py -------------------------------------------------------------------------------- /stable_baselines3/common/save_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/save_util.py -------------------------------------------------------------------------------- /stable_baselines3/common/sb2_compat/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /stable_baselines3/common/sb2_compat/rmsprop_tf_like.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/sb2_compat/rmsprop_tf_like.py -------------------------------------------------------------------------------- /stable_baselines3/common/torch_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/torch_layers.py -------------------------------------------------------------------------------- /stable_baselines3/common/type_aliases.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/type_aliases.py -------------------------------------------------------------------------------- /stable_baselines3/common/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/utils.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/base_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/base_vec_env.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/dummy_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/dummy_vec_env.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/patch_gym.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/patch_gym.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/stacked_observations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/stacked_observations.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/subproc_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/subproc_vec_env.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/util.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/vec_check_nan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/vec_check_nan.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/vec_extract_dict_obs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/vec_extract_dict_obs.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/vec_frame_stack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/vec_frame_stack.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/vec_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/vec_monitor.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/vec_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/vec_normalize.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/vec_transpose.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/vec_transpose.py -------------------------------------------------------------------------------- /stable_baselines3/common/vec_env/vec_video_recorder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/common/vec_env/vec_video_recorder.py -------------------------------------------------------------------------------- /stable_baselines3/ddpg/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/ddpg/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/ddpg/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/ddpg/ddpg.py -------------------------------------------------------------------------------- /stable_baselines3/ddpg/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/ddpg/policies.py -------------------------------------------------------------------------------- /stable_baselines3/dqn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/dqn/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/dqn/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/dqn/dqn.py -------------------------------------------------------------------------------- /stable_baselines3/dqn/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/dqn/policies.py -------------------------------------------------------------------------------- /stable_baselines3/her/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/her/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/her/goal_selection_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/her/goal_selection_strategy.py -------------------------------------------------------------------------------- /stable_baselines3/her/her_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/her/her_replay_buffer.py -------------------------------------------------------------------------------- /stable_baselines3/ppo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/ppo/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/ppo/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/ppo/policies.py -------------------------------------------------------------------------------- /stable_baselines3/ppo/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/ppo/ppo.py -------------------------------------------------------------------------------- /stable_baselines3/py.typed: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /stable_baselines3/sac/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/sac/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/sac/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/sac/policies.py -------------------------------------------------------------------------------- /stable_baselines3/sac/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/sac/sac.py -------------------------------------------------------------------------------- /stable_baselines3/td3/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/td3/__init__.py -------------------------------------------------------------------------------- /stable_baselines3/td3/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/td3/policies.py -------------------------------------------------------------------------------- /stable_baselines3/td3/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/stable_baselines3/td3/td3.py -------------------------------------------------------------------------------- /stable_baselines3/version.txt: -------------------------------------------------------------------------------- 1 | 2.8.0a1 2 | -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/test_buffers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_buffers.py -------------------------------------------------------------------------------- /tests/test_callbacks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_callbacks.py -------------------------------------------------------------------------------- /tests/test_cnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_cnn.py -------------------------------------------------------------------------------- /tests/test_custom_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_custom_policy.py -------------------------------------------------------------------------------- /tests/test_deterministic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_deterministic.py -------------------------------------------------------------------------------- /tests/test_dict_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_dict_env.py -------------------------------------------------------------------------------- /tests/test_distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_distributions.py -------------------------------------------------------------------------------- /tests/test_env_checker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_env_checker.py -------------------------------------------------------------------------------- /tests/test_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_envs.py -------------------------------------------------------------------------------- /tests/test_gae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_gae.py -------------------------------------------------------------------------------- /tests/test_her.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_her.py -------------------------------------------------------------------------------- /tests/test_identity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_identity.py -------------------------------------------------------------------------------- /tests/test_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_logger.py -------------------------------------------------------------------------------- /tests/test_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_monitor.py -------------------------------------------------------------------------------- /tests/test_n_step_replay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_n_step_replay.py -------------------------------------------------------------------------------- /tests/test_predict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_predict.py -------------------------------------------------------------------------------- /tests/test_preprocessing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_preprocessing.py -------------------------------------------------------------------------------- /tests/test_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_run.py -------------------------------------------------------------------------------- /tests/test_save_load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_save_load.py -------------------------------------------------------------------------------- /tests/test_sde.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_sde.py -------------------------------------------------------------------------------- /tests/test_spaces.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_spaces.py -------------------------------------------------------------------------------- /tests/test_tensorboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_tensorboard.py -------------------------------------------------------------------------------- /tests/test_train_eval_mode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_train_eval_mode.py -------------------------------------------------------------------------------- /tests/test_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_utils.py -------------------------------------------------------------------------------- /tests/test_vec_check_nan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_vec_check_nan.py -------------------------------------------------------------------------------- /tests/test_vec_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_vec_envs.py -------------------------------------------------------------------------------- /tests/test_vec_extract_dict_obs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_vec_extract_dict_obs.py -------------------------------------------------------------------------------- /tests/test_vec_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_vec_monitor.py -------------------------------------------------------------------------------- /tests/test_vec_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_vec_normalize.py -------------------------------------------------------------------------------- /tests/test_vec_stacked_obs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/DLR-RM/stable-baselines3/HEAD/tests/test_vec_stacked_obs.py --------------------------------------------------------------------------------