├── .benchmark_pattern ├── .gitignore ├── .travis.yml ├── Dockerfile ├── LICENSE ├── README.md ├── baselines ├── __init__.py ├── a2c │ ├── README.md │ ├── __init__.py │ ├── a2c.py │ ├── runner.py │ └── utils.py ├── acer │ ├── README.md │ ├── __init__.py │ ├── acer.py │ ├── buffer.py │ ├── defaults.py │ ├── policies.py │ └── runner.py ├── acktr │ ├── README.md │ ├── __init__.py │ ├── acktr.py │ ├── defaults.py │ ├── kfac.py │ ├── kfac_utils.py │ └── utils.py ├── bench │ ├── __init__.py │ ├── benchmarks.py │ ├── monitor.py │ └── test_monitor.py ├── common │ ├── __init__.py │ ├── atari_wrappers.py │ ├── cg.py │ ├── cmd_util.py │ ├── console_util.py │ ├── dataset.py │ ├── distributions.py │ ├── input.py │ ├── math_util.py │ ├── misc_util.py │ ├── models.py │ ├── mpi_adam.py │ ├── mpi_adam_optimizer.py │ ├── mpi_fork.py │ ├── mpi_moments.py │ ├── mpi_running_mean_std.py │ ├── mpi_util.py │ ├── plot_util.py │ ├── policies.py │ ├── retro_wrappers.py │ ├── runners.py │ ├── running_mean_std.py │ ├── schedules.py │ ├── segment_tree.py │ ├── test_mpi_util.py │ ├── tests │ │ ├── __init__.py │ │ ├── envs │ │ │ ├── __init__.py │ │ │ ├── fixed_sequence_env.py │ │ │ ├── identity_env.py │ │ │ ├── identity_env_test.py │ │ │ └── mnist_env.py │ │ ├── test_cartpole.py │ │ ├── test_doc_examples.py │ │ ├── test_env_after_learn.py │ │ ├── test_fetchreach.py │ │ ├── test_fixed_sequence.py │ │ ├── test_identity.py │ │ ├── test_mnist.py │ │ ├── test_plot_util.py │ │ ├── test_schedules.py │ │ ├── test_segment_tree.py │ │ ├── test_serialization.py │ │ ├── test_tf_util.py │ │ ├── test_with_mpi.py │ │ └── util.py │ ├── tf_util.py │ ├── tile_images.py │ ├── vec_env │ │ ├── __init__.py │ │ ├── dummy_vec_env.py │ │ ├── shmem_vec_env.py │ │ ├── subproc_vec_env.py │ │ ├── test_vec_env.py │ │ ├── test_video_recorder.py │ │ ├── util.py │ │ ├── vec_env.py │ │ ├── vec_frame_stack.py │ │ ├── vec_monitor.py │ │ ├── vec_normalize.py │ │ ├── vec_remove_dict_obs.py │ │ └── vec_video_recorder.py │ └── wrappers.py ├── ddpg │ ├── README.md │ ├── __init__.py │ ├── ddpg.py │ ├── ddpg_learner.py │ ├── memory.py │ ├── models.py │ ├── noise.py │ └── test_smoke.py ├── deepq │ ├── README.md │ ├── __init__.py │ ├── build_graph.py │ ├── deepq.py │ ├── defaults.py │ ├── experiments │ │ ├── __init__.py │ │ ├── custom_cartpole.py │ │ ├── enjoy_cartpole.py │ │ ├── enjoy_mountaincar.py │ │ ├── enjoy_pong.py │ │ ├── train_cartpole.py │ │ ├── train_mountaincar.py │ │ └── train_pong.py │ ├── models.py │ ├── replay_buffer.py │ └── utils.py ├── gail │ ├── README.md │ ├── __init__.py │ ├── adversary.py │ ├── behavior_clone.py │ ├── dataset │ │ ├── __init__.py │ │ └── mujoco_dset.py │ ├── gail-eval.py │ ├── mlp_policy.py │ ├── result │ │ ├── HalfCheetah-normalized-deterministic-scores.png │ │ ├── HalfCheetah-normalized-stochastic-scores.png │ │ ├── HalfCheetah-unnormalized-deterministic-scores.png │ │ ├── HalfCheetah-unnormalized-stochastic-scores.png │ │ ├── Hopper-normalized-deterministic-scores.png │ │ ├── Hopper-normalized-stochastic-scores.png │ │ ├── Hopper-unnormalized-deterministic-scores.png │ │ ├── Hopper-unnormalized-stochastic-scores.png │ │ ├── Humanoid-normalized-deterministic-scores.png │ │ ├── Humanoid-normalized-stochastic-scores.png │ │ ├── Humanoid-unnormalized-deterministic-scores.png │ │ ├── Humanoid-unnormalized-stochastic-scores.png │ │ ├── HumanoidStandup-normalized-deterministic-scores.png │ │ ├── HumanoidStandup-normalized-stochastic-scores.png │ │ ├── HumanoidStandup-unnormalized-deterministic-scores.png │ │ ├── HumanoidStandup-unnormalized-stochastic-scores.png │ │ ├── Walker2d-normalized-deterministic-scores.png │ │ ├── Walker2d-normalized-stochastic-scores.png │ │ ├── Walker2d-unnormalized-deterministic-scores.png │ │ ├── Walker2d-unnormalized-stochastic-scores.png │ │ ├── gail-result.md │ │ ├── halfcheetah-training.png │ │ ├── hopper-training.png │ │ ├── humanoid-training.png │ │ ├── humanoidstandup-training.png │ │ └── walker2d-training.png │ ├── run_mujoco.py │ ├── statistics.py │ └── trpo_mpi.py ├── her │ ├── README.md │ ├── __init__.py │ ├── actor_critic.py │ ├── ddpg.py │ ├── experiment │ │ ├── __init__.py │ │ ├── config.py │ │ ├── data_generation │ │ │ └── fetch_data_generation.py │ │ ├── play.py │ │ └── plot.py │ ├── her.py │ ├── her_sampler.py │ ├── normalizer.py │ ├── replay_buffer.py │ ├── rollout.py │ └── util.py ├── logger.py ├── ppo1 │ ├── README.md │ ├── __init__.py │ ├── cnn_policy.py │ ├── mlp_policy.py │ ├── pposgd_simple.py │ ├── run_atari.py │ ├── run_humanoid.py │ ├── run_mujoco.py │ └── run_robotics.py ├── ppo2 │ ├── README.md │ ├── __init__.py │ ├── defaults.py │ ├── microbatched_model.py │ ├── model.py │ ├── ppo2.py │ ├── runner.py │ └── test_microbatches.py ├── results_plotter.py ├── run.py └── trpo_mpi │ ├── README.md │ ├── __init__.py │ ├── defaults.py │ └── trpo_mpi.py ├── benchmarks_atari10M.htm ├── benchmarks_mujoco1M.htm ├── data ├── cartpole.gif ├── fetchPickAndPlaceContrast.png └── logo.jpg ├── docs └── viz │ └── viz.ipynb ├── setup.cfg └── setup.py /.benchmark_pattern: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/.gitignore -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/.travis.yml -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/Dockerfile -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/README.md -------------------------------------------------------------------------------- /baselines/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/a2c/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/a2c/README.md -------------------------------------------------------------------------------- /baselines/a2c/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/a2c/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/a2c/a2c.py -------------------------------------------------------------------------------- /baselines/a2c/runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/a2c/runner.py -------------------------------------------------------------------------------- /baselines/a2c/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/a2c/utils.py -------------------------------------------------------------------------------- /baselines/acer/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acer/README.md -------------------------------------------------------------------------------- /baselines/acer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/acer/acer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acer/acer.py -------------------------------------------------------------------------------- /baselines/acer/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acer/buffer.py -------------------------------------------------------------------------------- /baselines/acer/defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acer/defaults.py -------------------------------------------------------------------------------- /baselines/acer/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acer/policies.py -------------------------------------------------------------------------------- /baselines/acer/runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acer/runner.py -------------------------------------------------------------------------------- /baselines/acktr/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acktr/README.md -------------------------------------------------------------------------------- /baselines/acktr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/acktr/acktr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acktr/acktr.py -------------------------------------------------------------------------------- /baselines/acktr/defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acktr/defaults.py -------------------------------------------------------------------------------- /baselines/acktr/kfac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acktr/kfac.py -------------------------------------------------------------------------------- /baselines/acktr/kfac_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acktr/kfac_utils.py -------------------------------------------------------------------------------- /baselines/acktr/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/acktr/utils.py -------------------------------------------------------------------------------- /baselines/bench/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/bench/__init__.py -------------------------------------------------------------------------------- /baselines/bench/benchmarks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/bench/benchmarks.py -------------------------------------------------------------------------------- /baselines/bench/monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/bench/monitor.py -------------------------------------------------------------------------------- /baselines/bench/test_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/bench/test_monitor.py -------------------------------------------------------------------------------- /baselines/common/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/__init__.py -------------------------------------------------------------------------------- /baselines/common/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/atari_wrappers.py -------------------------------------------------------------------------------- /baselines/common/cg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/cg.py -------------------------------------------------------------------------------- /baselines/common/cmd_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/cmd_util.py -------------------------------------------------------------------------------- /baselines/common/console_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/console_util.py -------------------------------------------------------------------------------- /baselines/common/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/dataset.py -------------------------------------------------------------------------------- /baselines/common/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/distributions.py -------------------------------------------------------------------------------- /baselines/common/input.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/input.py -------------------------------------------------------------------------------- /baselines/common/math_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/math_util.py -------------------------------------------------------------------------------- /baselines/common/misc_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/misc_util.py -------------------------------------------------------------------------------- /baselines/common/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/models.py -------------------------------------------------------------------------------- /baselines/common/mpi_adam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/mpi_adam.py -------------------------------------------------------------------------------- /baselines/common/mpi_adam_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/mpi_adam_optimizer.py -------------------------------------------------------------------------------- /baselines/common/mpi_fork.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/mpi_fork.py -------------------------------------------------------------------------------- /baselines/common/mpi_moments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/mpi_moments.py -------------------------------------------------------------------------------- /baselines/common/mpi_running_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/mpi_running_mean_std.py -------------------------------------------------------------------------------- /baselines/common/mpi_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/mpi_util.py -------------------------------------------------------------------------------- /baselines/common/plot_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/plot_util.py -------------------------------------------------------------------------------- /baselines/common/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/policies.py -------------------------------------------------------------------------------- /baselines/common/retro_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/retro_wrappers.py -------------------------------------------------------------------------------- /baselines/common/runners.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/runners.py -------------------------------------------------------------------------------- /baselines/common/running_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/running_mean_std.py -------------------------------------------------------------------------------- /baselines/common/schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/schedules.py -------------------------------------------------------------------------------- /baselines/common/segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/segment_tree.py -------------------------------------------------------------------------------- /baselines/common/test_mpi_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/test_mpi_util.py -------------------------------------------------------------------------------- /baselines/common/tests/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/__init__.py -------------------------------------------------------------------------------- /baselines/common/tests/envs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/common/tests/envs/fixed_sequence_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/envs/fixed_sequence_env.py -------------------------------------------------------------------------------- /baselines/common/tests/envs/identity_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/envs/identity_env.py -------------------------------------------------------------------------------- /baselines/common/tests/envs/identity_env_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/envs/identity_env_test.py -------------------------------------------------------------------------------- /baselines/common/tests/envs/mnist_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/envs/mnist_env.py -------------------------------------------------------------------------------- /baselines/common/tests/test_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_cartpole.py -------------------------------------------------------------------------------- /baselines/common/tests/test_doc_examples.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_doc_examples.py -------------------------------------------------------------------------------- /baselines/common/tests/test_env_after_learn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_env_after_learn.py -------------------------------------------------------------------------------- /baselines/common/tests/test_fetchreach.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_fetchreach.py -------------------------------------------------------------------------------- /baselines/common/tests/test_fixed_sequence.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_fixed_sequence.py -------------------------------------------------------------------------------- /baselines/common/tests/test_identity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_identity.py -------------------------------------------------------------------------------- /baselines/common/tests/test_mnist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_mnist.py -------------------------------------------------------------------------------- /baselines/common/tests/test_plot_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_plot_util.py -------------------------------------------------------------------------------- /baselines/common/tests/test_schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_schedules.py -------------------------------------------------------------------------------- /baselines/common/tests/test_segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_segment_tree.py -------------------------------------------------------------------------------- /baselines/common/tests/test_serialization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_serialization.py -------------------------------------------------------------------------------- /baselines/common/tests/test_tf_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_tf_util.py -------------------------------------------------------------------------------- /baselines/common/tests/test_with_mpi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/test_with_mpi.py -------------------------------------------------------------------------------- /baselines/common/tests/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tests/util.py -------------------------------------------------------------------------------- /baselines/common/tf_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tf_util.py -------------------------------------------------------------------------------- /baselines/common/tile_images.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/tile_images.py -------------------------------------------------------------------------------- /baselines/common/vec_env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/__init__.py -------------------------------------------------------------------------------- /baselines/common/vec_env/dummy_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/dummy_vec_env.py -------------------------------------------------------------------------------- /baselines/common/vec_env/shmem_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/shmem_vec_env.py -------------------------------------------------------------------------------- /baselines/common/vec_env/subproc_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/subproc_vec_env.py -------------------------------------------------------------------------------- /baselines/common/vec_env/test_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/test_vec_env.py -------------------------------------------------------------------------------- /baselines/common/vec_env/test_video_recorder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/test_video_recorder.py -------------------------------------------------------------------------------- /baselines/common/vec_env/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/util.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/vec_env.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_frame_stack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/vec_frame_stack.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/vec_monitor.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/vec_normalize.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_remove_dict_obs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/vec_remove_dict_obs.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_video_recorder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/vec_env/vec_video_recorder.py -------------------------------------------------------------------------------- /baselines/common/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/common/wrappers.py -------------------------------------------------------------------------------- /baselines/ddpg/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ddpg/README.md -------------------------------------------------------------------------------- /baselines/ddpg/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/ddpg/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ddpg/ddpg.py -------------------------------------------------------------------------------- /baselines/ddpg/ddpg_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ddpg/ddpg_learner.py -------------------------------------------------------------------------------- /baselines/ddpg/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ddpg/memory.py -------------------------------------------------------------------------------- /baselines/ddpg/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ddpg/models.py -------------------------------------------------------------------------------- /baselines/ddpg/noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ddpg/noise.py -------------------------------------------------------------------------------- /baselines/ddpg/test_smoke.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ddpg/test_smoke.py -------------------------------------------------------------------------------- /baselines/deepq/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/README.md -------------------------------------------------------------------------------- /baselines/deepq/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/__init__.py -------------------------------------------------------------------------------- /baselines/deepq/build_graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/build_graph.py -------------------------------------------------------------------------------- /baselines/deepq/deepq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/deepq.py -------------------------------------------------------------------------------- /baselines/deepq/defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/defaults.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/deepq/experiments/custom_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/experiments/custom_cartpole.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/enjoy_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/experiments/enjoy_cartpole.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/enjoy_mountaincar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/experiments/enjoy_mountaincar.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/enjoy_pong.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/experiments/enjoy_pong.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/train_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/experiments/train_cartpole.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/train_mountaincar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/experiments/train_mountaincar.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/train_pong.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/experiments/train_pong.py -------------------------------------------------------------------------------- /baselines/deepq/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/models.py -------------------------------------------------------------------------------- /baselines/deepq/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/replay_buffer.py -------------------------------------------------------------------------------- /baselines/deepq/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/deepq/utils.py -------------------------------------------------------------------------------- /baselines/gail/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/README.md -------------------------------------------------------------------------------- /baselines/gail/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/gail/adversary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/adversary.py -------------------------------------------------------------------------------- /baselines/gail/behavior_clone.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/behavior_clone.py -------------------------------------------------------------------------------- /baselines/gail/dataset/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/gail/dataset/mujoco_dset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/dataset/mujoco_dset.py -------------------------------------------------------------------------------- /baselines/gail/gail-eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/gail-eval.py -------------------------------------------------------------------------------- /baselines/gail/mlp_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/mlp_policy.py -------------------------------------------------------------------------------- /baselines/gail/result/HalfCheetah-normalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HalfCheetah-normalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/HalfCheetah-normalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HalfCheetah-normalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/HalfCheetah-unnormalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HalfCheetah-unnormalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/HalfCheetah-unnormalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HalfCheetah-unnormalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Hopper-normalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Hopper-normalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Hopper-normalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Hopper-normalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Hopper-unnormalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Hopper-unnormalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Hopper-unnormalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Hopper-unnormalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Humanoid-normalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Humanoid-normalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Humanoid-normalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Humanoid-normalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Humanoid-unnormalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Humanoid-unnormalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Humanoid-unnormalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Humanoid-unnormalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/HumanoidStandup-normalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HumanoidStandup-normalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/HumanoidStandup-normalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HumanoidStandup-normalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/HumanoidStandup-unnormalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HumanoidStandup-unnormalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/HumanoidStandup-unnormalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/HumanoidStandup-unnormalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Walker2d-normalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Walker2d-normalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Walker2d-normalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Walker2d-normalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Walker2d-unnormalized-deterministic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Walker2d-unnormalized-deterministic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/Walker2d-unnormalized-stochastic-scores.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/Walker2d-unnormalized-stochastic-scores.png -------------------------------------------------------------------------------- /baselines/gail/result/gail-result.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/gail-result.md -------------------------------------------------------------------------------- /baselines/gail/result/halfcheetah-training.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/halfcheetah-training.png -------------------------------------------------------------------------------- /baselines/gail/result/hopper-training.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/hopper-training.png -------------------------------------------------------------------------------- /baselines/gail/result/humanoid-training.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/humanoid-training.png -------------------------------------------------------------------------------- /baselines/gail/result/humanoidstandup-training.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/humanoidstandup-training.png -------------------------------------------------------------------------------- /baselines/gail/result/walker2d-training.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/result/walker2d-training.png -------------------------------------------------------------------------------- /baselines/gail/run_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/run_mujoco.py -------------------------------------------------------------------------------- /baselines/gail/statistics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/statistics.py -------------------------------------------------------------------------------- /baselines/gail/trpo_mpi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/gail/trpo_mpi.py -------------------------------------------------------------------------------- /baselines/her/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/README.md -------------------------------------------------------------------------------- /baselines/her/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/her/actor_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/actor_critic.py -------------------------------------------------------------------------------- /baselines/her/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/ddpg.py -------------------------------------------------------------------------------- /baselines/her/experiment/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/her/experiment/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/experiment/config.py -------------------------------------------------------------------------------- /baselines/her/experiment/data_generation/fetch_data_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/experiment/data_generation/fetch_data_generation.py -------------------------------------------------------------------------------- /baselines/her/experiment/play.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/experiment/play.py -------------------------------------------------------------------------------- /baselines/her/experiment/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/experiment/plot.py -------------------------------------------------------------------------------- /baselines/her/her.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/her.py -------------------------------------------------------------------------------- /baselines/her/her_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/her_sampler.py -------------------------------------------------------------------------------- /baselines/her/normalizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/normalizer.py -------------------------------------------------------------------------------- /baselines/her/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/replay_buffer.py -------------------------------------------------------------------------------- /baselines/her/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/rollout.py -------------------------------------------------------------------------------- /baselines/her/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/her/util.py -------------------------------------------------------------------------------- /baselines/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/logger.py -------------------------------------------------------------------------------- /baselines/ppo1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/README.md -------------------------------------------------------------------------------- /baselines/ppo1/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/ppo1/cnn_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/cnn_policy.py -------------------------------------------------------------------------------- /baselines/ppo1/mlp_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/mlp_policy.py -------------------------------------------------------------------------------- /baselines/ppo1/pposgd_simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/pposgd_simple.py -------------------------------------------------------------------------------- /baselines/ppo1/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/run_atari.py -------------------------------------------------------------------------------- /baselines/ppo1/run_humanoid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/run_humanoid.py -------------------------------------------------------------------------------- /baselines/ppo1/run_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/run_mujoco.py -------------------------------------------------------------------------------- /baselines/ppo1/run_robotics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo1/run_robotics.py -------------------------------------------------------------------------------- /baselines/ppo2/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo2/README.md -------------------------------------------------------------------------------- /baselines/ppo2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/ppo2/defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo2/defaults.py -------------------------------------------------------------------------------- /baselines/ppo2/microbatched_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo2/microbatched_model.py -------------------------------------------------------------------------------- /baselines/ppo2/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo2/model.py -------------------------------------------------------------------------------- /baselines/ppo2/ppo2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo2/ppo2.py -------------------------------------------------------------------------------- /baselines/ppo2/runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo2/runner.py -------------------------------------------------------------------------------- /baselines/ppo2/test_microbatches.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/ppo2/test_microbatches.py -------------------------------------------------------------------------------- /baselines/results_plotter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/results_plotter.py -------------------------------------------------------------------------------- /baselines/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/run.py -------------------------------------------------------------------------------- /baselines/trpo_mpi/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/trpo_mpi/README.md -------------------------------------------------------------------------------- /baselines/trpo_mpi/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/trpo_mpi/defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/trpo_mpi/defaults.py -------------------------------------------------------------------------------- /baselines/trpo_mpi/trpo_mpi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/baselines/trpo_mpi/trpo_mpi.py -------------------------------------------------------------------------------- /benchmarks_atari10M.htm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/benchmarks_atari10M.htm -------------------------------------------------------------------------------- /benchmarks_mujoco1M.htm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/benchmarks_mujoco1M.htm -------------------------------------------------------------------------------- /data/cartpole.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/data/cartpole.gif -------------------------------------------------------------------------------- /data/fetchPickAndPlaceContrast.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/data/fetchPickAndPlaceContrast.png -------------------------------------------------------------------------------- /data/logo.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/data/logo.jpg -------------------------------------------------------------------------------- /docs/viz/viz.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/docs/viz/viz.ipynb -------------------------------------------------------------------------------- /setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/setup.cfg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/openai/baselines/HEAD/setup.py --------------------------------------------------------------------------------