├── .codecov.yml ├── .coveragerc ├── .github ├── .mergify.yml └── workflows │ ├── cancel.yml │ ├── codecov.yml │ ├── lint-check.yml │ ├── stale.yml │ ├── test_linux.yml │ ├── test_macos.yml │ └── test_windows.yml ├── .gitignore ├── .isort.cfg ├── .lgtm.yml ├── .pre-commit-config.yaml ├── .pyup.yml ├── .scripts ├── unix_cpu_build.sh └── windows_cpu_build.ps1 ├── .travis.yml ├── AUTHORS.rst ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── GETTING_STARTED.md ├── INSTALL.md ├── LICENSE ├── README.md ├── contrib └── placeholder ├── docs ├── Makefile ├── make.bat ├── requirements.txt └── source │ ├── RL │ ├── background │ │ ├── index.rst │ │ ├── supervised_basic.rst │ │ └── unsupervised_basic.rst │ └── introduction │ │ └── index.rst │ ├── api │ ├── agents │ │ ├── genrl.agents.bandits.contextual.rst │ │ ├── genrl.agents.bandits.multiarmed.rst │ │ ├── genrl.agents.classical.qlearning.rst │ │ ├── genrl.agents.classical.sarsa.rst │ │ ├── genrl.agents.deep.a2c.rst │ │ ├── genrl.agents.deep.base.rst │ │ ├── genrl.agents.deep.ddpg.rst │ │ ├── genrl.agents.deep.dqn.rst │ │ ├── genrl.agents.deep.ppo1.rst │ │ ├── genrl.agents.deep.sac.rst │ │ ├── genrl.agents.deep.td3.rst │ │ ├── genrl.agents.deep.vpg.rst │ │ └── index.rst │ ├── common │ │ ├── bandit.rst │ │ ├── classical.rst │ │ └── index.rst │ ├── core │ │ └── index.rst │ ├── environments │ │ ├── genrl.environments.rst │ │ ├── genrl.environments.vec_env.rst │ │ └── index.rst │ ├── trainers │ │ └── index.rst │ └── utils │ │ └── index.rst │ ├── assets │ └── images │ │ ├── genrl.png │ │ └── genrl_cropped.png │ ├── conf.py │ ├── index.rst │ └── usage │ ├── about │ ├── about.rst │ └── index.rst │ ├── getting_started.md │ ├── install.md │ └── tutorials │ ├── Classical │ ├── Q_Learning.rst │ ├── Sarsa.rst │ └── index.rst │ ├── Deep │ ├── A2C.rst │ ├── Background.rst │ ├── Categorical_DQN.rst │ ├── DDPG.rst │ ├── DQN.rst │ ├── Double_DQN.rst │ ├── Dueling_DQN.rst │ ├── NoisyNet_DQN.rst │ ├── PPO.rst │ ├── Prioritized_DQN.rst │ ├── SAC.rst │ ├── TD3.rst │ ├── VPG.rst │ ├── index.rst │ └── static │ │ └── Categorical_DQN.png │ ├── Saving and loading.rst │ ├── Using A2C.md │ ├── Using Custom Policies.md │ ├── Using shared parameters in actor critic agents.rst │ ├── bandit │ ├── adding_data_bandit.rst │ ├── adding_dcb_agent.rst │ ├── bandit_overview.rst │ ├── bayesian.rst │ ├── bootstrap.rst │ ├── contextual_overview.rst │ ├── gradients.rst │ ├── index.rst │ ├── linpos.rst │ ├── noise.rst │ ├── thompson_sampling.rst │ ├── ucb.rst │ └── variational.rst │ ├── index.rst │ └── using_vpg.md ├── environment.yml ├── examples ├── Bandit_demo.ipynb ├── DQN_demo.ipynb ├── bandit.py ├── deep.py ├── deep_cb.py ├── genetic_rl.py ├── genetic_rl_q_learning.py ├── hyperparameters │ ├── known_parameters │ │ └── placeholder │ └── optuna │ │ ├── A2C-CartPole-v0-ep100.db │ │ ├── a2c_cartpole-v0.py │ │ ├── read.py │ │ └── td3_pendulum-v0.py ├── run_cb.py └── sample.py ├── genrl ├── __init__.py ├── agents │ ├── __init__.py │ ├── bandits │ │ ├── __init__.py │ │ ├── contextual │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── bootstrap_neural.py │ │ │ ├── common │ │ │ │ ├── __init__.py │ │ │ │ ├── base_model.py │ │ │ │ ├── bayesian.py │ │ │ │ ├── neural.py │ │ │ │ └── transition.py │ │ │ ├── fixed.py │ │ │ ├── linpos.py │ │ │ ├── neural_greedy.py │ │ │ ├── neural_linpos.py │ │ │ ├── neural_noise_sampling.py │ │ │ └── variational.py │ │ └── multiarmed │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── bayesian.py │ │ │ ├── bernoulli_mab.py │ │ │ ├── epsgreedy.py │ │ │ ├── gaussian_mab.py │ │ │ ├── gradient.py │ │ │ ├── thompson.py │ │ │ └── ucb.py │ ├── classical │ │ ├── __init__.py │ │ ├── qlearning │ │ │ ├── __init__.py │ │ │ └── qlearning.py │ │ ├── sarsa │ │ │ ├── __init__.py │ │ │ └── sarsa.py │ │ └── valueiteration │ │ │ ├── __init__.py │ │ │ └── valueiteration.py │ └── deep │ │ ├── __init__.py │ │ ├── a2c │ │ ├── __init__.py │ │ └── a2c.py │ │ ├── base │ │ ├── __init__.py │ │ ├── base.py │ │ ├── offpolicy.py │ │ └── onpolicy.py │ │ ├── ddpg │ │ ├── __init__.py │ │ └── ddpg.py │ │ ├── dqn │ │ ├── __init__.py │ │ ├── base.py │ │ ├── categorical.py │ │ ├── double.py │ │ ├── dueling.py │ │ ├── noisy.py │ │ ├── prioritized.py │ │ └── utils.py │ │ ├── ppo1 │ │ ├── __init__.py │ │ └── ppo1.py │ │ ├── sac │ │ ├── __init__.py │ │ └── sac.py │ │ ├── td3 │ │ ├── __init__.py │ │ └── td3.py │ │ └── vpg │ │ ├── __init__.py │ │ └── vpg.py ├── core │ ├── __init__.py │ ├── actor_critic.py │ ├── bandit.py │ ├── base.py │ ├── buffers.py │ ├── noise.py │ ├── policies.py │ ├── rollout_storage.py │ └── values.py ├── environments │ ├── __init__.py │ ├── action_wrappers.py │ ├── atari_preprocessing.py │ ├── atari_wrappers.py │ ├── base_wrapper.py │ ├── frame_stack.py │ ├── gym_wrapper.py │ ├── suite.py │ ├── time_limit.py │ ├── torch.py │ └── vec_env │ │ ├── __init__.py │ │ ├── monitor.py │ │ ├── normalize.py │ │ ├── utils.py │ │ ├── vector_envs.py │ │ └── wrappers.py ├── evolutionary │ ├── __init__.py │ ├── genetic_hyperparam.py │ └── utils.py ├── trainers │ ├── __init__.py │ ├── bandit.py │ ├── base.py │ ├── classical.py │ ├── offpolicy.py │ └── onpolicy.py └── utils │ ├── __init__.py │ ├── data_bandits │ ├── __init__.py │ ├── adult_bandit.py │ ├── base.py │ ├── census_bandit.py │ ├── covertype_bandit.py │ ├── magic_bandit.py │ ├── mushroom_bandit.py │ ├── statlog_bandit.py │ └── utils.py │ ├── discount.py │ ├── logger.py │ ├── models.py │ └── utils.py ├── requirements.txt ├── setup.cfg ├── setup.py └── tests ├── __init__.py ├── test_agents ├── __init__.py ├── test_bandit │ ├── __init__.py │ ├── test_cb_agents.py │ ├── test_data_bandits.py │ ├── test_mab_agents.py │ ├── test_multi_armed_bandits.py │ └── utils.py ├── test_classical │ ├── __init__.py │ └── test_agents.py └── test_deep │ ├── __init__.py │ ├── test_a2c.py │ ├── test_custom.py │ ├── test_ddpg.py │ ├── test_dqn.py │ ├── test_dqn_cnn.py │ ├── test_ppo1.py │ ├── test_sac.py │ ├── test_td3.py │ └── test_vpg.py ├── test_core └── __init__.py ├── test_environments ├── __init__.py ├── test_atari_wrappers.py ├── test_vecenv.py └── test_wrappers.py ├── test_trainers ├── __init__.py ├── test_bandit_trainer.py ├── test_classical_trainer.py └── test_deep_trainer.py └── test_utils ├── __init__.py ├── test_logger.py ├── test_models.py └── test_utils.py /.codecov.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.codecov.yml -------------------------------------------------------------------------------- /.coveragerc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.coveragerc -------------------------------------------------------------------------------- /.github/.mergify.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/.mergify.yml -------------------------------------------------------------------------------- /.github/workflows/cancel.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/workflows/cancel.yml -------------------------------------------------------------------------------- /.github/workflows/codecov.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/workflows/codecov.yml -------------------------------------------------------------------------------- /.github/workflows/lint-check.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/workflows/lint-check.yml -------------------------------------------------------------------------------- /.github/workflows/stale.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/workflows/stale.yml -------------------------------------------------------------------------------- /.github/workflows/test_linux.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/workflows/test_linux.yml -------------------------------------------------------------------------------- /.github/workflows/test_macos.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/workflows/test_macos.yml -------------------------------------------------------------------------------- /.github/workflows/test_windows.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.github/workflows/test_windows.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.gitignore -------------------------------------------------------------------------------- /.isort.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.isort.cfg -------------------------------------------------------------------------------- /.lgtm.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.lgtm.yml -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /.pyup.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.pyup.yml -------------------------------------------------------------------------------- /.scripts/unix_cpu_build.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.scripts/unix_cpu_build.sh -------------------------------------------------------------------------------- /.scripts/windows_cpu_build.ps1: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.scripts/windows_cpu_build.ps1 -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/.travis.yml -------------------------------------------------------------------------------- /AUTHORS.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/AUTHORS.rst -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /GETTING_STARTED.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/GETTING_STARTED.md -------------------------------------------------------------------------------- /INSTALL.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/INSTALL.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/README.md -------------------------------------------------------------------------------- /contrib/placeholder: -------------------------------------------------------------------------------- 1 | placeholder 2 | -------------------------------------------------------------------------------- /docs/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/Makefile -------------------------------------------------------------------------------- /docs/make.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/make.bat -------------------------------------------------------------------------------- /docs/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/requirements.txt -------------------------------------------------------------------------------- /docs/source/RL/background/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/RL/background/index.rst -------------------------------------------------------------------------------- /docs/source/RL/background/supervised_basic.rst: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /docs/source/RL/background/unsupervised_basic.rst: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /docs/source/RL/introduction/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/RL/introduction/index.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.bandits.contextual.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.bandits.contextual.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.bandits.multiarmed.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.bandits.multiarmed.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.classical.qlearning.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.classical.qlearning.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.classical.sarsa.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.classical.sarsa.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.a2c.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.a2c.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.base.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.base.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.ddpg.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.ddpg.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.dqn.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.dqn.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.ppo1.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.ppo1.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.sac.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.sac.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.td3.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.td3.rst -------------------------------------------------------------------------------- /docs/source/api/agents/genrl.agents.deep.vpg.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/genrl.agents.deep.vpg.rst -------------------------------------------------------------------------------- /docs/source/api/agents/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/agents/index.rst -------------------------------------------------------------------------------- /docs/source/api/common/bandit.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/common/bandit.rst -------------------------------------------------------------------------------- /docs/source/api/common/classical.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/common/classical.rst -------------------------------------------------------------------------------- /docs/source/api/common/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/common/index.rst -------------------------------------------------------------------------------- /docs/source/api/core/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/core/index.rst -------------------------------------------------------------------------------- /docs/source/api/environments/genrl.environments.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/environments/genrl.environments.rst -------------------------------------------------------------------------------- /docs/source/api/environments/genrl.environments.vec_env.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/environments/genrl.environments.vec_env.rst -------------------------------------------------------------------------------- /docs/source/api/environments/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/environments/index.rst -------------------------------------------------------------------------------- /docs/source/api/trainers/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/trainers/index.rst -------------------------------------------------------------------------------- /docs/source/api/utils/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/api/utils/index.rst -------------------------------------------------------------------------------- /docs/source/assets/images/genrl.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/assets/images/genrl.png -------------------------------------------------------------------------------- /docs/source/assets/images/genrl_cropped.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/assets/images/genrl_cropped.png -------------------------------------------------------------------------------- /docs/source/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/conf.py -------------------------------------------------------------------------------- /docs/source/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/index.rst -------------------------------------------------------------------------------- /docs/source/usage/about/about.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/about/about.rst -------------------------------------------------------------------------------- /docs/source/usage/about/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/about/index.rst -------------------------------------------------------------------------------- /docs/source/usage/getting_started.md: -------------------------------------------------------------------------------- 1 | ../../../GETTING_STARTED.md -------------------------------------------------------------------------------- /docs/source/usage/install.md: -------------------------------------------------------------------------------- 1 | ../../../INSTALL.md -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Classical/Q_Learning.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Classical/Q_Learning.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Classical/Sarsa.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Classical/Sarsa.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Classical/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Classical/index.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/A2C.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/A2C.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/Background.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/Background.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/Categorical_DQN.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/Categorical_DQN.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/DDPG.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/DDPG.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/DQN.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/DQN.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/Double_DQN.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/Double_DQN.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/Dueling_DQN.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/Dueling_DQN.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/NoisyNet_DQN.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/NoisyNet_DQN.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/PPO.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/PPO.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/Prioritized_DQN.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/Prioritized_DQN.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/SAC.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/SAC.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/TD3.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/TD3.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/VPG.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/VPG.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/index.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Deep/static/Categorical_DQN.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Deep/static/Categorical_DQN.png -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Saving and loading.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Saving and loading.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Using A2C.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Using A2C.md -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Using Custom Policies.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Using Custom Policies.md -------------------------------------------------------------------------------- /docs/source/usage/tutorials/Using shared parameters in actor critic agents.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/Using shared parameters in actor critic agents.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/adding_data_bandit.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/adding_data_bandit.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/adding_dcb_agent.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/adding_dcb_agent.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/bandit_overview.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/bandit_overview.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/bayesian.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/bayesian.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/bootstrap.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/bootstrap.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/contextual_overview.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/contextual_overview.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/gradients.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/gradients.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/index.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/linpos.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/linpos.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/noise.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/noise.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/thompson_sampling.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/thompson_sampling.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/ucb.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/ucb.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/bandit/variational.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/bandit/variational.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/index.rst -------------------------------------------------------------------------------- /docs/source/usage/tutorials/using_vpg.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/docs/source/usage/tutorials/using_vpg.md -------------------------------------------------------------------------------- /environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/environment.yml -------------------------------------------------------------------------------- /examples/Bandit_demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/Bandit_demo.ipynb -------------------------------------------------------------------------------- /examples/DQN_demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/DQN_demo.ipynb -------------------------------------------------------------------------------- /examples/bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/bandit.py -------------------------------------------------------------------------------- /examples/deep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/deep.py -------------------------------------------------------------------------------- /examples/deep_cb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/deep_cb.py -------------------------------------------------------------------------------- /examples/genetic_rl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/genetic_rl.py -------------------------------------------------------------------------------- /examples/genetic_rl_q_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/genetic_rl_q_learning.py -------------------------------------------------------------------------------- /examples/hyperparameters/known_parameters/placeholder: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /examples/hyperparameters/optuna/A2C-CartPole-v0-ep100.db: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/hyperparameters/optuna/A2C-CartPole-v0-ep100.db -------------------------------------------------------------------------------- /examples/hyperparameters/optuna/a2c_cartpole-v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/hyperparameters/optuna/a2c_cartpole-v0.py -------------------------------------------------------------------------------- /examples/hyperparameters/optuna/read.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/hyperparameters/optuna/read.py -------------------------------------------------------------------------------- /examples/hyperparameters/optuna/td3_pendulum-v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/hyperparameters/optuna/td3_pendulum-v0.py -------------------------------------------------------------------------------- /examples/run_cb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/examples/run_cb.py -------------------------------------------------------------------------------- /examples/sample.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/__init__.py -------------------------------------------------------------------------------- /genrl/agents/bandits/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/base.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/bootstrap_neural.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/bootstrap_neural.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/common/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/common/__init__.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/common/base_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/common/base_model.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/common/bayesian.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/common/bayesian.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/common/neural.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/common/neural.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/common/transition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/common/transition.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/fixed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/fixed.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/linpos.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/linpos.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/neural_greedy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/neural_greedy.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/neural_linpos.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/neural_linpos.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/neural_noise_sampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/neural_noise_sampling.py -------------------------------------------------------------------------------- /genrl/agents/bandits/contextual/variational.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/contextual/variational.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/base.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/bayesian.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/bayesian.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/bernoulli_mab.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/bernoulli_mab.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/epsgreedy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/epsgreedy.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/gaussian_mab.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/gaussian_mab.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/gradient.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/gradient.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/thompson.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/thompson.py -------------------------------------------------------------------------------- /genrl/agents/bandits/multiarmed/ucb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/bandits/multiarmed/ucb.py -------------------------------------------------------------------------------- /genrl/agents/classical/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/classical/qlearning/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/classical/qlearning/qlearning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/classical/qlearning/qlearning.py -------------------------------------------------------------------------------- /genrl/agents/classical/sarsa/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/classical/sarsa/sarsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/classical/sarsa/sarsa.py -------------------------------------------------------------------------------- /genrl/agents/classical/valueiteration/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/classical/valueiteration/valueiteration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/classical/valueiteration/valueiteration.py -------------------------------------------------------------------------------- /genrl/agents/deep/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/a2c/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/a2c/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/a2c/a2c.py -------------------------------------------------------------------------------- /genrl/agents/deep/base/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/base/__init__.py -------------------------------------------------------------------------------- /genrl/agents/deep/base/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/base/base.py -------------------------------------------------------------------------------- /genrl/agents/deep/base/offpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/base/offpolicy.py -------------------------------------------------------------------------------- /genrl/agents/deep/base/onpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/base/onpolicy.py -------------------------------------------------------------------------------- /genrl/agents/deep/ddpg/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/ddpg/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/ddpg/ddpg.py -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/dqn/base.py -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/categorical.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/dqn/categorical.py -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/double.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/dqn/double.py -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/dueling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/dqn/dueling.py -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/noisy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/dqn/noisy.py -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/prioritized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/dqn/prioritized.py -------------------------------------------------------------------------------- /genrl/agents/deep/dqn/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/dqn/utils.py -------------------------------------------------------------------------------- /genrl/agents/deep/ppo1/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/ppo1/ppo1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/ppo1/ppo1.py -------------------------------------------------------------------------------- /genrl/agents/deep/sac/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/sac/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/sac/sac.py -------------------------------------------------------------------------------- /genrl/agents/deep/td3/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/td3/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/td3/td3.py -------------------------------------------------------------------------------- /genrl/agents/deep/vpg/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /genrl/agents/deep/vpg/vpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/agents/deep/vpg/vpg.py -------------------------------------------------------------------------------- /genrl/core/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/__init__.py -------------------------------------------------------------------------------- /genrl/core/actor_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/actor_critic.py -------------------------------------------------------------------------------- /genrl/core/bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/bandit.py -------------------------------------------------------------------------------- /genrl/core/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/base.py -------------------------------------------------------------------------------- /genrl/core/buffers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/buffers.py -------------------------------------------------------------------------------- /genrl/core/noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/noise.py -------------------------------------------------------------------------------- /genrl/core/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/policies.py -------------------------------------------------------------------------------- /genrl/core/rollout_storage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/rollout_storage.py -------------------------------------------------------------------------------- /genrl/core/values.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/core/values.py -------------------------------------------------------------------------------- /genrl/environments/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/__init__.py -------------------------------------------------------------------------------- /genrl/environments/action_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/action_wrappers.py -------------------------------------------------------------------------------- /genrl/environments/atari_preprocessing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/atari_preprocessing.py -------------------------------------------------------------------------------- /genrl/environments/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/atari_wrappers.py -------------------------------------------------------------------------------- /genrl/environments/base_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/base_wrapper.py -------------------------------------------------------------------------------- /genrl/environments/frame_stack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/frame_stack.py -------------------------------------------------------------------------------- /genrl/environments/gym_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/gym_wrapper.py -------------------------------------------------------------------------------- /genrl/environments/suite.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/suite.py -------------------------------------------------------------------------------- /genrl/environments/time_limit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/time_limit.py -------------------------------------------------------------------------------- /genrl/environments/torch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/torch.py -------------------------------------------------------------------------------- /genrl/environments/vec_env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/vec_env/__init__.py -------------------------------------------------------------------------------- /genrl/environments/vec_env/monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/vec_env/monitor.py -------------------------------------------------------------------------------- /genrl/environments/vec_env/normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/vec_env/normalize.py -------------------------------------------------------------------------------- /genrl/environments/vec_env/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/vec_env/utils.py -------------------------------------------------------------------------------- /genrl/environments/vec_env/vector_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/vec_env/vector_envs.py -------------------------------------------------------------------------------- /genrl/environments/vec_env/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/environments/vec_env/wrappers.py -------------------------------------------------------------------------------- /genrl/evolutionary/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/evolutionary/__init__.py -------------------------------------------------------------------------------- /genrl/evolutionary/genetic_hyperparam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/evolutionary/genetic_hyperparam.py -------------------------------------------------------------------------------- /genrl/evolutionary/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/evolutionary/utils.py -------------------------------------------------------------------------------- /genrl/trainers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/trainers/__init__.py -------------------------------------------------------------------------------- /genrl/trainers/bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/trainers/bandit.py -------------------------------------------------------------------------------- /genrl/trainers/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/trainers/base.py -------------------------------------------------------------------------------- /genrl/trainers/classical.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/trainers/classical.py -------------------------------------------------------------------------------- /genrl/trainers/offpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/trainers/offpolicy.py -------------------------------------------------------------------------------- /genrl/trainers/onpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/trainers/onpolicy.py -------------------------------------------------------------------------------- /genrl/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/__init__.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/__init__.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/adult_bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/adult_bandit.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/base.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/census_bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/census_bandit.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/covertype_bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/covertype_bandit.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/magic_bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/magic_bandit.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/mushroom_bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/mushroom_bandit.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/statlog_bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/statlog_bandit.py -------------------------------------------------------------------------------- /genrl/utils/data_bandits/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/data_bandits/utils.py -------------------------------------------------------------------------------- /genrl/utils/discount.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/discount.py -------------------------------------------------------------------------------- /genrl/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/logger.py -------------------------------------------------------------------------------- /genrl/utils/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/models.py -------------------------------------------------------------------------------- /genrl/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/genrl/utils/utils.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/requirements.txt -------------------------------------------------------------------------------- /setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/setup.cfg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/setup.py -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/test_agents/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/test_agents/test_bandit/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_bandit/__init__.py -------------------------------------------------------------------------------- /tests/test_agents/test_bandit/test_cb_agents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_bandit/test_cb_agents.py -------------------------------------------------------------------------------- /tests/test_agents/test_bandit/test_data_bandits.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_bandit/test_data_bandits.py -------------------------------------------------------------------------------- /tests/test_agents/test_bandit/test_mab_agents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_bandit/test_mab_agents.py -------------------------------------------------------------------------------- /tests/test_agents/test_bandit/test_multi_armed_bandits.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_bandit/test_multi_armed_bandits.py -------------------------------------------------------------------------------- /tests/test_agents/test_bandit/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_bandit/utils.py -------------------------------------------------------------------------------- /tests/test_agents/test_classical/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_classical/__init__.py -------------------------------------------------------------------------------- /tests/test_agents/test_classical/test_agents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_classical/test_agents.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/__init__.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_a2c.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_custom.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_custom.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_ddpg.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_dqn.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_dqn_cnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_dqn_cnn.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_ppo1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_ppo1.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_sac.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_td3.py -------------------------------------------------------------------------------- /tests/test_agents/test_deep/test_vpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_agents/test_deep/test_vpg.py -------------------------------------------------------------------------------- /tests/test_core/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/test_environments/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_environments/__init__.py -------------------------------------------------------------------------------- /tests/test_environments/test_atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_environments/test_atari_wrappers.py -------------------------------------------------------------------------------- /tests/test_environments/test_vecenv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_environments/test_vecenv.py -------------------------------------------------------------------------------- /tests/test_environments/test_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_environments/test_wrappers.py -------------------------------------------------------------------------------- /tests/test_trainers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_trainers/__init__.py -------------------------------------------------------------------------------- /tests/test_trainers/test_bandit_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_trainers/test_bandit_trainer.py -------------------------------------------------------------------------------- /tests/test_trainers/test_classical_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_trainers/test_classical_trainer.py -------------------------------------------------------------------------------- /tests/test_trainers/test_deep_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_trainers/test_deep_trainer.py -------------------------------------------------------------------------------- /tests/test_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_utils/__init__.py -------------------------------------------------------------------------------- /tests/test_utils/test_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_utils/test_logger.py -------------------------------------------------------------------------------- /tests/test_utils/test_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_utils/test_models.py -------------------------------------------------------------------------------- /tests/test_utils/test_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/SforAiDl/genrl/HEAD/tests/test_utils/test_utils.py --------------------------------------------------------------------------------