├── .github └── ISSUE_TEMPLATE │ ├── bug_report.md │ └── feature_request.md ├── .gitignore ├── LICENSE ├── PPO ├── pytorch │ ├── ppo_pong_pytorch.py │ └── ppo_pytorch.py └── tensorflow 2 │ ├── ppo_pong_tensorflow.py │ └── ppo_tensorflow.py ├── PPO_RND ├── pytorch │ ├── ppo_rnd_frozen_notslippery_pytorch.py │ └── ppo_rnd_pytorch.py └── tensorflow 2 │ ├── ppo_frozenlake_notslippery_tensorflow.py │ └── ppo_rnd_tensorflow.py ├── PPO_continous ├── pytorch │ └── ppo_continous_pytorch.py └── tensorflow │ ├── ppo_continous_bipedal_tensorflow.py │ └── ppo_continous_tensorflow.py ├── README.md └── Result ├── bipedal.gif ├── lunarlander.gif ├── lunarlander_ppo.png ├── pendulum.gif ├── pong.gif └── ppo_pendulum_tf2.png /.github/ISSUE_TEMPLATE/bug_report.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/.github/ISSUE_TEMPLATE/bug_report.md -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/feature_request.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/.github/ISSUE_TEMPLATE/feature_request.md -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/LICENSE -------------------------------------------------------------------------------- /PPO/pytorch/ppo_pong_pytorch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO/pytorch/ppo_pong_pytorch.py -------------------------------------------------------------------------------- /PPO/pytorch/ppo_pytorch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO/pytorch/ppo_pytorch.py -------------------------------------------------------------------------------- /PPO/tensorflow 2/ppo_pong_tensorflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO/tensorflow 2/ppo_pong_tensorflow.py -------------------------------------------------------------------------------- /PPO/tensorflow 2/ppo_tensorflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO/tensorflow 2/ppo_tensorflow.py -------------------------------------------------------------------------------- /PPO_RND/pytorch/ppo_rnd_frozen_notslippery_pytorch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO_RND/pytorch/ppo_rnd_frozen_notslippery_pytorch.py -------------------------------------------------------------------------------- /PPO_RND/pytorch/ppo_rnd_pytorch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO_RND/pytorch/ppo_rnd_pytorch.py -------------------------------------------------------------------------------- /PPO_RND/tensorflow 2/ppo_frozenlake_notslippery_tensorflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO_RND/tensorflow 2/ppo_frozenlake_notslippery_tensorflow.py -------------------------------------------------------------------------------- /PPO_RND/tensorflow 2/ppo_rnd_tensorflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO_RND/tensorflow 2/ppo_rnd_tensorflow.py -------------------------------------------------------------------------------- /PPO_continous/pytorch/ppo_continous_pytorch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO_continous/pytorch/ppo_continous_pytorch.py -------------------------------------------------------------------------------- /PPO_continous/tensorflow/ppo_continous_bipedal_tensorflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO_continous/tensorflow/ppo_continous_bipedal_tensorflow.py -------------------------------------------------------------------------------- /PPO_continous/tensorflow/ppo_continous_tensorflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/PPO_continous/tensorflow/ppo_continous_tensorflow.py -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/README.md -------------------------------------------------------------------------------- /Result/bipedal.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/Result/bipedal.gif -------------------------------------------------------------------------------- /Result/lunarlander.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/Result/lunarlander.gif -------------------------------------------------------------------------------- /Result/lunarlander_ppo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/Result/lunarlander_ppo.png -------------------------------------------------------------------------------- /Result/pendulum.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/Result/pendulum.gif -------------------------------------------------------------------------------- /Result/pong.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/Result/pong.gif -------------------------------------------------------------------------------- /Result/ppo_pendulum_tf2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wisnunugroho21/reinforcement_learning_ppo_rnd/HEAD/Result/ppo_pendulum_tf2.png --------------------------------------------------------------------------------