├── .all-contributorsrc ├── .flake8 ├── .github ├── CODEOWNERS └── workflows │ └── python-publish.yaml ├── .gitignore ├── .isort.cfg ├── .pre-commit-config.yaml ├── .pylintrc ├── Dockerfile ├── Jenkinsfile ├── LICENSE.md ├── MANIFEST.in ├── Makefile ├── README.md ├── configs ├── lunarlander_continuous_v2 │ ├── __init__.py │ ├── a2c.yaml │ ├── bc_ddpg.yaml │ ├── bc_sac.yaml │ ├── ddpg.yaml │ ├── ddpgfd.yaml │ ├── gail_ppo.yaml │ ├── ppo.yaml │ ├── sac.yaml │ ├── sacfd.yaml │ └── td3.yaml ├── lunarlander_v2 │ ├── __init__.py │ ├── acer.yaml │ ├── distillation_dqn.yaml │ ├── dqfd.yaml │ ├── dqn.yaml │ ├── ppo.yaml │ └── r2d1.yaml ├── pong_no_frameskip_v4 │ ├── __init__.py │ ├── apex_dqn.yaml │ ├── distillation_dqn.yaml │ ├── dqn.yaml │ ├── dqn_resnet.yaml │ ├── ppo.yaml │ └── r2d1.yaml └── reacher_v2 │ ├── __init__.py │ ├── bc_ddpg.yaml │ ├── bc_sac.yaml │ ├── ddpg.yaml │ ├── sac.yaml │ └── td3.yaml ├── data ├── lunarlander_continuous_demo.pkl ├── lunarlander_discrete_demo.pkl └── reacher_demo.pkl ├── mypy.ini ├── requirements-dev.txt ├── requirements.txt ├── rl_algorithms ├── __init__.py ├── a2c │ ├── __init__.py │ ├── agent.py │ └── learner.py ├── acer │ ├── __init__.py │ ├── agent.py │ ├── buffer.py │ └── learner.py ├── bc │ ├── __init__.py │ ├── ddpg_agent.py │ ├── ddpg_learner.py │ ├── her.py │ ├── sac_agent.py │ └── sac_learner.py ├── common │ ├── __init__.py │ ├── abstract │ │ ├── __init__.py │ │ ├── agent.py │ │ ├── architecture.py │ │ ├── buffer.py │ │ ├── distributed_logger.py │ │ ├── distributed_worker.py │ │ ├── her.py │ │ ├── learner.py │ │ └── reward_fn.py │ ├── apex │ │ ├── __init__.py │ │ ├── architecture.py │ │ ├── learner.py │ │ └── worker.py │ ├── buffer │ │ ├── __init__.py │ │ ├── distillation_buffer.py │ │ ├── gail_buffer.py │ │ ├── replay_buffer.py │ │ ├── segment_tree.py │ │ └── wrapper.py │ ├── env │ │ ├── __init__.py │ │ ├── atari_wrappers.py │ │ ├── multiprocessing_env.py │ │ ├── normalizers.py │ │ └── utils.py │ ├── grad_cam.py │ ├── helper_functions.py │ ├── networks │ │ ├── __init__.py │ │ ├── backbones │ │ │ ├── __init__.py │ │ │ ├── cnn.py │ │ │ └── resnet.py │ │ ├── brain.py │ │ └── heads.py │ ├── noise.py │ └── saliency_map.py ├── ddpg │ ├── __init__.py │ ├── agent.py │ └── learner.py ├── distillation │ ├── README.md │ ├── __init__.py │ └── dqn_agent.py ├── dqn │ ├── __init__.py │ ├── agent.py │ ├── distributed_logger.py │ ├── distributed_worker.py │ ├── learner.py │ ├── linear.py │ ├── losses.py │ └── networks.py ├── fd │ ├── __init__.py │ ├── ddpg_agent.py │ ├── ddpg_learner.py │ ├── dqn_agent.py │ ├── dqn_learner.py │ ├── sac_agent.py │ └── sac_learner.py ├── gail │ ├── __init__.py │ ├── agent.py │ ├── learner.py │ ├── networks.py │ └── utils.py ├── ppo │ ├── __init__.py │ ├── agent.py │ ├── learner.py │ └── utils.py ├── recurrent │ ├── __init__.py │ ├── dqn_agent.py │ ├── learner.py │ ├── losses.py │ └── utils.py ├── registry.py ├── sac │ ├── __init__.py │ ├── agent.py │ └── learner.py ├── td3 │ ├── __init__.py │ ├── agent.py │ └── learner.py ├── utils │ ├── __init__.py │ ├── config.py │ └── registry.py └── version ├── run_lunarlander_continuous_v2.py ├── run_lunarlander_v2.py ├── run_pong_no_frameskip_v4.py ├── run_reacher_v2.py ├── setup.py ├── tests ├── buffer │ ├── test_distillation_buffer.py │ ├── test_prioritized_buffer.py │ └── test_uniform_buffer.py ├── integration │ ├── test_run_agent.py │ ├── test_run_apex.py │ └── test_run_distillation_agent.py ├── test_cnn_cfg.py ├── test_config_registry.py └── test_helper_funcion.py └── tools ├── check_version.sh ├── run_descrete_env.sh ├── run_lunarlander_continuous_v2.sh ├── run_reacher_v2.sh └── run_test.sh /.all-contributorsrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.all-contributorsrc -------------------------------------------------------------------------------- /.flake8: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.flake8 -------------------------------------------------------------------------------- /.github/CODEOWNERS: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.github/CODEOWNERS -------------------------------------------------------------------------------- /.github/workflows/python-publish.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.github/workflows/python-publish.yaml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.gitignore -------------------------------------------------------------------------------- /.isort.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.isort.cfg -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /.pylintrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/.pylintrc -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/Dockerfile -------------------------------------------------------------------------------- /Jenkinsfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/Jenkinsfile -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/LICENSE.md -------------------------------------------------------------------------------- /MANIFEST.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/MANIFEST.in -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/README.md -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/a2c.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/a2c.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/bc_ddpg.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/bc_ddpg.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/bc_sac.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/bc_sac.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/ddpg.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/ddpg.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/ddpgfd.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/ddpgfd.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/gail_ppo.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/gail_ppo.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/ppo.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/ppo.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/sac.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/sac.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/sacfd.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/sacfd.yaml -------------------------------------------------------------------------------- /configs/lunarlander_continuous_v2/td3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_continuous_v2/td3.yaml -------------------------------------------------------------------------------- /configs/lunarlander_v2/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /configs/lunarlander_v2/acer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_v2/acer.yaml -------------------------------------------------------------------------------- /configs/lunarlander_v2/distillation_dqn.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_v2/distillation_dqn.yaml -------------------------------------------------------------------------------- /configs/lunarlander_v2/dqfd.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_v2/dqfd.yaml -------------------------------------------------------------------------------- /configs/lunarlander_v2/dqn.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_v2/dqn.yaml -------------------------------------------------------------------------------- /configs/lunarlander_v2/ppo.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_v2/ppo.yaml -------------------------------------------------------------------------------- /configs/lunarlander_v2/r2d1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/lunarlander_v2/r2d1.yaml -------------------------------------------------------------------------------- /configs/pong_no_frameskip_v4/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /configs/pong_no_frameskip_v4/apex_dqn.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/pong_no_frameskip_v4/apex_dqn.yaml -------------------------------------------------------------------------------- /configs/pong_no_frameskip_v4/distillation_dqn.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/pong_no_frameskip_v4/distillation_dqn.yaml -------------------------------------------------------------------------------- /configs/pong_no_frameskip_v4/dqn.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/pong_no_frameskip_v4/dqn.yaml -------------------------------------------------------------------------------- /configs/pong_no_frameskip_v4/dqn_resnet.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/pong_no_frameskip_v4/dqn_resnet.yaml -------------------------------------------------------------------------------- /configs/pong_no_frameskip_v4/ppo.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/pong_no_frameskip_v4/ppo.yaml -------------------------------------------------------------------------------- /configs/pong_no_frameskip_v4/r2d1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/pong_no_frameskip_v4/r2d1.yaml -------------------------------------------------------------------------------- /configs/reacher_v2/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /configs/reacher_v2/bc_ddpg.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/reacher_v2/bc_ddpg.yaml -------------------------------------------------------------------------------- /configs/reacher_v2/bc_sac.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/reacher_v2/bc_sac.yaml -------------------------------------------------------------------------------- /configs/reacher_v2/ddpg.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/reacher_v2/ddpg.yaml -------------------------------------------------------------------------------- /configs/reacher_v2/sac.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/reacher_v2/sac.yaml -------------------------------------------------------------------------------- /configs/reacher_v2/td3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/configs/reacher_v2/td3.yaml -------------------------------------------------------------------------------- /data/lunarlander_continuous_demo.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/data/lunarlander_continuous_demo.pkl -------------------------------------------------------------------------------- /data/lunarlander_discrete_demo.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/data/lunarlander_discrete_demo.pkl -------------------------------------------------------------------------------- /data/reacher_demo.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/data/reacher_demo.pkl -------------------------------------------------------------------------------- /mypy.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/mypy.ini -------------------------------------------------------------------------------- /requirements-dev.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/requirements-dev.txt -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/requirements.txt -------------------------------------------------------------------------------- /rl_algorithms/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/__init__.py -------------------------------------------------------------------------------- /rl_algorithms/a2c/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/a2c/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/a2c/agent.py -------------------------------------------------------------------------------- /rl_algorithms/a2c/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/a2c/learner.py -------------------------------------------------------------------------------- /rl_algorithms/acer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rl_algorithms/acer/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/acer/agent.py -------------------------------------------------------------------------------- /rl_algorithms/acer/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/acer/buffer.py -------------------------------------------------------------------------------- /rl_algorithms/acer/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/acer/learner.py -------------------------------------------------------------------------------- /rl_algorithms/bc/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/bc/ddpg_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/bc/ddpg_agent.py -------------------------------------------------------------------------------- /rl_algorithms/bc/ddpg_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/bc/ddpg_learner.py -------------------------------------------------------------------------------- /rl_algorithms/bc/her.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/bc/her.py -------------------------------------------------------------------------------- /rl_algorithms/bc/sac_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/bc/sac_agent.py -------------------------------------------------------------------------------- /rl_algorithms/bc/sac_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/bc/sac_learner.py -------------------------------------------------------------------------------- /rl_algorithms/common/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/agent.py -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/architecture.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/architecture.py -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/buffer.py -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/distributed_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/distributed_logger.py -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/distributed_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/distributed_worker.py -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/her.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/her.py -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/learner.py -------------------------------------------------------------------------------- /rl_algorithms/common/abstract/reward_fn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/abstract/reward_fn.py -------------------------------------------------------------------------------- /rl_algorithms/common/apex/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rl_algorithms/common/apex/architecture.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/apex/architecture.py -------------------------------------------------------------------------------- /rl_algorithms/common/apex/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/apex/learner.py -------------------------------------------------------------------------------- /rl_algorithms/common/apex/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/apex/worker.py -------------------------------------------------------------------------------- /rl_algorithms/common/buffer/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/common/buffer/distillation_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/buffer/distillation_buffer.py -------------------------------------------------------------------------------- /rl_algorithms/common/buffer/gail_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/buffer/gail_buffer.py -------------------------------------------------------------------------------- /rl_algorithms/common/buffer/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/buffer/replay_buffer.py -------------------------------------------------------------------------------- /rl_algorithms/common/buffer/segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/buffer/segment_tree.py -------------------------------------------------------------------------------- /rl_algorithms/common/buffer/wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/buffer/wrapper.py -------------------------------------------------------------------------------- /rl_algorithms/common/env/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/common/env/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/env/atari_wrappers.py -------------------------------------------------------------------------------- /rl_algorithms/common/env/multiprocessing_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/env/multiprocessing_env.py -------------------------------------------------------------------------------- /rl_algorithms/common/env/normalizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/env/normalizers.py -------------------------------------------------------------------------------- /rl_algorithms/common/env/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/env/utils.py -------------------------------------------------------------------------------- /rl_algorithms/common/grad_cam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/grad_cam.py -------------------------------------------------------------------------------- /rl_algorithms/common/helper_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/helper_functions.py -------------------------------------------------------------------------------- /rl_algorithms/common/networks/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/common/networks/backbones/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/networks/backbones/__init__.py -------------------------------------------------------------------------------- /rl_algorithms/common/networks/backbones/cnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/networks/backbones/cnn.py -------------------------------------------------------------------------------- /rl_algorithms/common/networks/backbones/resnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/networks/backbones/resnet.py -------------------------------------------------------------------------------- /rl_algorithms/common/networks/brain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/networks/brain.py -------------------------------------------------------------------------------- /rl_algorithms/common/networks/heads.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/networks/heads.py -------------------------------------------------------------------------------- /rl_algorithms/common/noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/noise.py -------------------------------------------------------------------------------- /rl_algorithms/common/saliency_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/common/saliency_map.py -------------------------------------------------------------------------------- /rl_algorithms/ddpg/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/ddpg/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/ddpg/agent.py -------------------------------------------------------------------------------- /rl_algorithms/ddpg/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/ddpg/learner.py -------------------------------------------------------------------------------- /rl_algorithms/distillation/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/distillation/README.md -------------------------------------------------------------------------------- /rl_algorithms/distillation/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/distillation/dqn_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/distillation/dqn_agent.py -------------------------------------------------------------------------------- /rl_algorithms/dqn/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/dqn/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/dqn/agent.py -------------------------------------------------------------------------------- /rl_algorithms/dqn/distributed_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/dqn/distributed_logger.py -------------------------------------------------------------------------------- /rl_algorithms/dqn/distributed_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/dqn/distributed_worker.py -------------------------------------------------------------------------------- /rl_algorithms/dqn/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/dqn/learner.py -------------------------------------------------------------------------------- /rl_algorithms/dqn/linear.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/dqn/linear.py -------------------------------------------------------------------------------- /rl_algorithms/dqn/losses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/dqn/losses.py -------------------------------------------------------------------------------- /rl_algorithms/dqn/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/dqn/networks.py -------------------------------------------------------------------------------- /rl_algorithms/fd/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/fd/ddpg_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/fd/ddpg_agent.py -------------------------------------------------------------------------------- /rl_algorithms/fd/ddpg_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/fd/ddpg_learner.py -------------------------------------------------------------------------------- /rl_algorithms/fd/dqn_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/fd/dqn_agent.py -------------------------------------------------------------------------------- /rl_algorithms/fd/dqn_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/fd/dqn_learner.py -------------------------------------------------------------------------------- /rl_algorithms/fd/sac_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/fd/sac_agent.py -------------------------------------------------------------------------------- /rl_algorithms/fd/sac_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/fd/sac_learner.py -------------------------------------------------------------------------------- /rl_algorithms/gail/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/gail/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/gail/agent.py -------------------------------------------------------------------------------- /rl_algorithms/gail/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/gail/learner.py -------------------------------------------------------------------------------- /rl_algorithms/gail/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/gail/networks.py -------------------------------------------------------------------------------- /rl_algorithms/gail/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/gail/utils.py -------------------------------------------------------------------------------- /rl_algorithms/ppo/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/ppo/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/ppo/agent.py -------------------------------------------------------------------------------- /rl_algorithms/ppo/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/ppo/learner.py -------------------------------------------------------------------------------- /rl_algorithms/ppo/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/ppo/utils.py -------------------------------------------------------------------------------- /rl_algorithms/recurrent/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/recurrent/dqn_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/recurrent/dqn_agent.py -------------------------------------------------------------------------------- /rl_algorithms/recurrent/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/recurrent/learner.py -------------------------------------------------------------------------------- /rl_algorithms/recurrent/losses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/recurrent/losses.py -------------------------------------------------------------------------------- /rl_algorithms/recurrent/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/recurrent/utils.py -------------------------------------------------------------------------------- /rl_algorithms/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/registry.py -------------------------------------------------------------------------------- /rl_algorithms/sac/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/sac/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/sac/agent.py -------------------------------------------------------------------------------- /rl_algorithms/sac/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/sac/learner.py -------------------------------------------------------------------------------- /rl_algorithms/td3/__init__.py: -------------------------------------------------------------------------------- 1 | """Empty.""" 2 | -------------------------------------------------------------------------------- /rl_algorithms/td3/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/td3/agent.py -------------------------------------------------------------------------------- /rl_algorithms/td3/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/td3/learner.py -------------------------------------------------------------------------------- /rl_algorithms/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/utils/__init__.py -------------------------------------------------------------------------------- /rl_algorithms/utils/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/utils/config.py -------------------------------------------------------------------------------- /rl_algorithms/utils/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/rl_algorithms/utils/registry.py -------------------------------------------------------------------------------- /rl_algorithms/version: -------------------------------------------------------------------------------- 1 | 1.2.0 -------------------------------------------------------------------------------- /run_lunarlander_continuous_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/run_lunarlander_continuous_v2.py -------------------------------------------------------------------------------- /run_lunarlander_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/run_lunarlander_v2.py -------------------------------------------------------------------------------- /run_pong_no_frameskip_v4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/run_pong_no_frameskip_v4.py -------------------------------------------------------------------------------- /run_reacher_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/run_reacher_v2.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/setup.py -------------------------------------------------------------------------------- /tests/buffer/test_distillation_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/buffer/test_distillation_buffer.py -------------------------------------------------------------------------------- /tests/buffer/test_prioritized_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/buffer/test_prioritized_buffer.py -------------------------------------------------------------------------------- /tests/buffer/test_uniform_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/buffer/test_uniform_buffer.py -------------------------------------------------------------------------------- /tests/integration/test_run_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/integration/test_run_agent.py -------------------------------------------------------------------------------- /tests/integration/test_run_apex.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/integration/test_run_apex.py -------------------------------------------------------------------------------- /tests/integration/test_run_distillation_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/integration/test_run_distillation_agent.py -------------------------------------------------------------------------------- /tests/test_cnn_cfg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/test_cnn_cfg.py -------------------------------------------------------------------------------- /tests/test_config_registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/test_config_registry.py -------------------------------------------------------------------------------- /tests/test_helper_funcion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tests/test_helper_funcion.py -------------------------------------------------------------------------------- /tools/check_version.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tools/check_version.sh -------------------------------------------------------------------------------- /tools/run_descrete_env.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tools/run_descrete_env.sh -------------------------------------------------------------------------------- /tools/run_lunarlander_continuous_v2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tools/run_lunarlander_continuous_v2.sh -------------------------------------------------------------------------------- /tools/run_reacher_v2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tools/run_reacher_v2.sh -------------------------------------------------------------------------------- /tools/run_test.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/medipixel/rl_algorithms/HEAD/tools/run_test.sh --------------------------------------------------------------------------------