├── .gitignore ├── LICENSE ├── README.md ├── baselines ├── __init__.py ├── a2c │ ├── README.md │ ├── __init__.py │ ├── a2c.py │ ├── policies.py │ ├── run_atari.py │ └── utils.py ├── acer │ ├── README.md │ ├── __init__.py │ ├── acer_simple.py │ ├── buffer.py │ ├── policies.py │ └── run_atari.py ├── acktr │ ├── README.md │ ├── __init__.py │ ├── acktr_cont.py │ ├── acktr_disc.py │ ├── filters.py │ ├── kfac.py │ ├── kfac_utils.py │ ├── policies.py │ ├── run_atari.py │ ├── run_mujoco.py │ ├── running_stat.py │ ├── utils.py │ └── value_functions.py ├── bench │ ├── __init__.py │ ├── benchmarks.py │ └── monitor.py ├── common │ ├── __init__.py │ ├── atari_wrappers.py │ ├── atari_wrappers_deprecated.py │ ├── azure_utils.py │ ├── cg.py │ ├── console_util.py │ ├── dataset.py │ ├── distributions.py │ ├── math_util.py │ ├── misc_util.py │ ├── mpi_adam.py │ ├── mpi_fork.py │ ├── mpi_moments.py │ ├── mpi_running_mean_std.py │ ├── running_mean_std.py │ ├── schedules.py │ ├── segment_tree.py │ ├── tests │ │ ├── test_schedules.py │ │ ├── test_segment_tree.py │ │ └── test_tf_util.py │ ├── tf_util.py │ └── vec_env │ │ ├── __init__.py │ │ ├── dummy_vec_env.py │ │ ├── subproc_vec_env.py │ │ ├── vec_frame_stack.py │ │ └── vec_normalize.py ├── ddpg │ ├── README.md │ ├── __init__.py │ ├── ddpg.py │ ├── main.py │ ├── memory.py │ ├── models.py │ ├── noise.py │ ├── training.py │ └── util.py ├── deepq │ ├── README.md │ ├── __init__.py │ ├── build_graph.py │ ├── experiments │ │ ├── __init__.py │ │ ├── atari │ │ │ ├── __init__.py │ │ │ ├── download_model.py │ │ │ ├── enjoy.py │ │ │ ├── model.py │ │ │ ├── train.py │ │ │ └── wang2015_eval.py │ │ ├── custom_cartpole.py │ │ ├── enjoy_cartpole.py │ │ ├── enjoy_mountaincar.py │ │ ├── enjoy_pong.py │ │ ├── run_atari.py │ │ ├── train_cartpole.py │ │ └── train_mountaincar.py │ ├── models.py │ ├── replay_buffer.py │ └── simple.py ├── logger.py ├── ppo1 │ ├── README.md │ ├── __init__.py │ ├── cnn_policy.py │ ├── mlp_policy.py │ ├── pposgd_simple.py │ ├── run_atari.py │ └── run_mujoco.py ├── ppo2 │ ├── README.md │ ├── __init__.py │ ├── policies.py │ ├── ppo2.py │ ├── run_atari.py │ └── run_mujoco.py ├── rainbow │ ├── README.md │ ├── __init__.py │ ├── build_graph.py │ └── experiments │ │ ├── __init__.py │ │ └── atari │ │ ├── __init__.py │ │ ├── enjoy.py │ │ ├── model.py │ │ └── rainbow.py ├── results_plotter.py └── trpo_mpi │ ├── README.md │ ├── __init__.py │ ├── nosharing_cnn_policy.py │ ├── run_atari.py │ ├── run_mujoco.py │ └── trpo_mpi.py ├── data ├── cartpole.gif └── logo.jpg └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/README.md -------------------------------------------------------------------------------- /baselines/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/a2c/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/a2c/README.md -------------------------------------------------------------------------------- /baselines/a2c/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/a2c/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/a2c/a2c.py -------------------------------------------------------------------------------- /baselines/a2c/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/a2c/policies.py -------------------------------------------------------------------------------- /baselines/a2c/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/a2c/run_atari.py -------------------------------------------------------------------------------- /baselines/a2c/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/a2c/utils.py -------------------------------------------------------------------------------- /baselines/acer/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acer/README.md -------------------------------------------------------------------------------- /baselines/acer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/acer/acer_simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acer/acer_simple.py -------------------------------------------------------------------------------- /baselines/acer/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acer/buffer.py -------------------------------------------------------------------------------- /baselines/acer/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acer/policies.py -------------------------------------------------------------------------------- /baselines/acer/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acer/run_atari.py -------------------------------------------------------------------------------- /baselines/acktr/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/README.md -------------------------------------------------------------------------------- /baselines/acktr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/acktr/acktr_cont.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/acktr_cont.py -------------------------------------------------------------------------------- /baselines/acktr/acktr_disc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/acktr_disc.py -------------------------------------------------------------------------------- /baselines/acktr/filters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/filters.py -------------------------------------------------------------------------------- /baselines/acktr/kfac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/kfac.py -------------------------------------------------------------------------------- /baselines/acktr/kfac_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/kfac_utils.py -------------------------------------------------------------------------------- /baselines/acktr/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/policies.py -------------------------------------------------------------------------------- /baselines/acktr/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/run_atari.py -------------------------------------------------------------------------------- /baselines/acktr/run_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/run_mujoco.py -------------------------------------------------------------------------------- /baselines/acktr/running_stat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/running_stat.py -------------------------------------------------------------------------------- /baselines/acktr/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/utils.py -------------------------------------------------------------------------------- /baselines/acktr/value_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/acktr/value_functions.py -------------------------------------------------------------------------------- /baselines/bench/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/bench/__init__.py -------------------------------------------------------------------------------- /baselines/bench/benchmarks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/bench/benchmarks.py -------------------------------------------------------------------------------- /baselines/bench/monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/bench/monitor.py -------------------------------------------------------------------------------- /baselines/common/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/__init__.py -------------------------------------------------------------------------------- /baselines/common/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/atari_wrappers.py -------------------------------------------------------------------------------- /baselines/common/atari_wrappers_deprecated.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/atari_wrappers_deprecated.py -------------------------------------------------------------------------------- /baselines/common/azure_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/azure_utils.py -------------------------------------------------------------------------------- /baselines/common/cg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/cg.py -------------------------------------------------------------------------------- /baselines/common/console_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/console_util.py -------------------------------------------------------------------------------- /baselines/common/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/dataset.py -------------------------------------------------------------------------------- /baselines/common/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/distributions.py -------------------------------------------------------------------------------- /baselines/common/math_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/math_util.py -------------------------------------------------------------------------------- /baselines/common/misc_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/misc_util.py -------------------------------------------------------------------------------- /baselines/common/mpi_adam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/mpi_adam.py -------------------------------------------------------------------------------- /baselines/common/mpi_fork.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/mpi_fork.py -------------------------------------------------------------------------------- /baselines/common/mpi_moments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/mpi_moments.py -------------------------------------------------------------------------------- /baselines/common/mpi_running_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/mpi_running_mean_std.py -------------------------------------------------------------------------------- /baselines/common/running_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/running_mean_std.py -------------------------------------------------------------------------------- /baselines/common/schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/schedules.py -------------------------------------------------------------------------------- /baselines/common/segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/segment_tree.py -------------------------------------------------------------------------------- /baselines/common/tests/test_schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/tests/test_schedules.py -------------------------------------------------------------------------------- /baselines/common/tests/test_segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/tests/test_segment_tree.py -------------------------------------------------------------------------------- /baselines/common/tests/test_tf_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/tests/test_tf_util.py -------------------------------------------------------------------------------- /baselines/common/tf_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/tf_util.py -------------------------------------------------------------------------------- /baselines/common/vec_env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/vec_env/__init__.py -------------------------------------------------------------------------------- /baselines/common/vec_env/dummy_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/vec_env/dummy_vec_env.py -------------------------------------------------------------------------------- /baselines/common/vec_env/subproc_vec_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/vec_env/subproc_vec_env.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_frame_stack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/vec_env/vec_frame_stack.py -------------------------------------------------------------------------------- /baselines/common/vec_env/vec_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/common/vec_env/vec_normalize.py -------------------------------------------------------------------------------- /baselines/ddpg/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/README.md -------------------------------------------------------------------------------- /baselines/ddpg/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/ddpg/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/ddpg.py -------------------------------------------------------------------------------- /baselines/ddpg/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/main.py -------------------------------------------------------------------------------- /baselines/ddpg/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/memory.py -------------------------------------------------------------------------------- /baselines/ddpg/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/models.py -------------------------------------------------------------------------------- /baselines/ddpg/noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/noise.py -------------------------------------------------------------------------------- /baselines/ddpg/training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/training.py -------------------------------------------------------------------------------- /baselines/ddpg/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ddpg/util.py -------------------------------------------------------------------------------- /baselines/deepq/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/README.md -------------------------------------------------------------------------------- /baselines/deepq/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/__init__.py -------------------------------------------------------------------------------- /baselines/deepq/build_graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/build_graph.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/deepq/experiments/atari/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/deepq/experiments/atari/download_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/atari/download_model.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/atari/enjoy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/atari/enjoy.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/atari/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/atari/model.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/atari/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/atari/train.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/atari/wang2015_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/atari/wang2015_eval.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/custom_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/custom_cartpole.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/enjoy_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/enjoy_cartpole.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/enjoy_mountaincar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/enjoy_mountaincar.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/enjoy_pong.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/enjoy_pong.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/run_atari.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/train_cartpole.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/train_cartpole.py -------------------------------------------------------------------------------- /baselines/deepq/experiments/train_mountaincar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/experiments/train_mountaincar.py -------------------------------------------------------------------------------- /baselines/deepq/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/models.py -------------------------------------------------------------------------------- /baselines/deepq/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/replay_buffer.py -------------------------------------------------------------------------------- /baselines/deepq/simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/deepq/simple.py -------------------------------------------------------------------------------- /baselines/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/logger.py -------------------------------------------------------------------------------- /baselines/ppo1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo1/README.md -------------------------------------------------------------------------------- /baselines/ppo1/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/ppo1/cnn_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo1/cnn_policy.py -------------------------------------------------------------------------------- /baselines/ppo1/mlp_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo1/mlp_policy.py -------------------------------------------------------------------------------- /baselines/ppo1/pposgd_simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo1/pposgd_simple.py -------------------------------------------------------------------------------- /baselines/ppo1/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo1/run_atari.py -------------------------------------------------------------------------------- /baselines/ppo1/run_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo1/run_mujoco.py -------------------------------------------------------------------------------- /baselines/ppo2/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo2/README.md -------------------------------------------------------------------------------- /baselines/ppo2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/ppo2/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo2/policies.py -------------------------------------------------------------------------------- /baselines/ppo2/ppo2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo2/ppo2.py -------------------------------------------------------------------------------- /baselines/ppo2/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo2/run_atari.py -------------------------------------------------------------------------------- /baselines/ppo2/run_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/ppo2/run_mujoco.py -------------------------------------------------------------------------------- /baselines/rainbow/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/rainbow/README.md -------------------------------------------------------------------------------- /baselines/rainbow/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/rainbow/__init__.py -------------------------------------------------------------------------------- /baselines/rainbow/build_graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/rainbow/build_graph.py -------------------------------------------------------------------------------- /baselines/rainbow/experiments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/rainbow/experiments/atari/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/rainbow/experiments/atari/enjoy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/rainbow/experiments/atari/enjoy.py -------------------------------------------------------------------------------- /baselines/rainbow/experiments/atari/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/rainbow/experiments/atari/model.py -------------------------------------------------------------------------------- /baselines/rainbow/experiments/atari/rainbow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/rainbow/experiments/atari/rainbow.py -------------------------------------------------------------------------------- /baselines/results_plotter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/results_plotter.py -------------------------------------------------------------------------------- /baselines/trpo_mpi/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/trpo_mpi/README.md -------------------------------------------------------------------------------- /baselines/trpo_mpi/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /baselines/trpo_mpi/nosharing_cnn_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/trpo_mpi/nosharing_cnn_policy.py -------------------------------------------------------------------------------- /baselines/trpo_mpi/run_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/trpo_mpi/run_atari.py -------------------------------------------------------------------------------- /baselines/trpo_mpi/run_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/trpo_mpi/run_mujoco.py -------------------------------------------------------------------------------- /baselines/trpo_mpi/trpo_mpi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/baselines/trpo_mpi/trpo_mpi.py -------------------------------------------------------------------------------- /data/cartpole.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/data/cartpole.gif -------------------------------------------------------------------------------- /data/logo.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/data/logo.jpg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cxxgtxy/deeprl-baselines/HEAD/setup.py --------------------------------------------------------------------------------