├── .github ├── ISSUE_TEMPLATE.md └── workflows │ └── poetry-package.yml ├── .gitignore ├── .idea ├── .gitignore ├── inspectionProfiles │ ├── Project_Default.xml │ └── profiles_settings.xml ├── misc.xml ├── modules.xml ├── raylab.iml └── vcs.xml ├── .pre-commit-config.yaml ├── AUTHORS.rst ├── CONTRIBUTING.rst ├── LICENSE ├── Makefile ├── README.rst ├── docs ├── Makefile ├── authors.rst ├── conf.py ├── contributing.rst ├── history.rst ├── index.rst ├── installation.rst ├── make.bat ├── readme.rst └── usage.rst ├── examples ├── ACKTR │ ├── cheetah_defaults.py │ ├── mujoco_cheetah_kfac_vs_ekfac.py │ └── pybullet_reacher.py ├── MAGE │ └── pusher.py ├── MAPO │ └── swingup.py ├── MBPO │ └── swingup.py ├── NAF │ ├── cheetah_defaults.py │ ├── exploration_experiment.py │ └── reacher_defaults.py ├── PG │ ├── cartpole_defaults.py │ └── navigation_defaults.py ├── SAC │ ├── cheetah.py │ ├── mountaincar_continuous.py │ ├── reacher_defaults.py │ ├── swingup.py │ └── walker2d.py ├── SOP │ ├── cheetah.py │ ├── hopper.py │ ├── industrial_benchmark.py │ ├── swingup.py │ ├── walker.py │ └── walker2d.py ├── SVG(1) │ ├── cheetah_defaults.py │ ├── ib_defaults.py │ ├── invpendulum_defaults.py │ ├── navigation_defaults.py │ ├── reacher_defaults.py │ └── realnvp_vs_gaussian_reacher.py ├── SVG(inf) │ ├── cartpole_defaults.py │ ├── cheetah_defaults.py │ ├── navigation_defaults.py │ └── reacher_defaults.py ├── SoftSVG │ ├── cheetah_defaults.py │ ├── nfmbrl_reacher.py │ ├── reacher_defaults.py │ └── swingup.py ├── TD3 │ └── cheetah.py └── TRPO │ ├── cartpole_defaults.py │ ├── cheetah_defaults.py │ ├── gaussian_cheetah.py │ ├── gaussian_swingup.py │ ├── pybullet_walker.py │ ├── real_nvp_cheetah.py │ ├── real_nvp_swimmer.py │ ├── tang_2018_cheetah.py │ ├── tang_2018_hopper.py │ └── tang_2018_lander.py ├── poetry.lock ├── pylintrc ├── pyproject.toml ├── raylab ├── __init__.py ├── agents │ ├── __init__.py │ ├── acktr │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py │ ├── mage │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py │ ├── mbpo │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py │ ├── model_based.py │ ├── naf │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py │ ├── off_policy.py │ ├── registry.py │ ├── sac │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py │ ├── sop │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py │ ├── svg │ │ ├── __init__.py │ │ ├── inf │ │ │ ├── __init__.py │ │ │ ├── policy.py │ │ │ └── trainer.py │ │ ├── one │ │ │ ├── __init__.py │ │ │ ├── policy.py │ │ │ └── trainer.py │ │ ├── policy.py │ │ └── soft │ │ │ ├── __init__.py │ │ │ ├── policy.py │ │ │ └── trainer.py │ ├── td3 │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py │ ├── trainer.py │ └── trpo │ │ ├── __init__.py │ │ ├── policy.py │ │ └── trainer.py ├── cli │ ├── __init__.py │ ├── best_checkpoint.py │ ├── episode_dashboard.py │ ├── evaluate_checkpoint.py │ ├── experiment.py │ ├── experiment_dashboard.py │ ├── info.py │ ├── module_dashboard.py │ ├── utils.py │ └── viz.py ├── envs │ ├── __init__.py │ ├── environments │ │ ├── __init__.py │ │ ├── cartpole_stateless.py │ │ ├── hvac.py │ │ ├── navigation.py │ │ └── reservoir.py │ ├── registry.py │ ├── rewards.py │ ├── termination.py │ ├── utils.py │ └── wrappers │ │ ├── __init__.py │ │ ├── correlated_irrelevant.py │ │ ├── gaussian_random_walks.py │ │ ├── linear_redundant.py │ │ ├── mixins.py │ │ ├── nonlinear_redundant.py │ │ ├── random_irrelevant.py │ │ ├── single_precision.py │ │ ├── time_aware_env.py │ │ └── utils.py ├── execution │ ├── __init__.py │ └── warmup.py ├── logger │ ├── __init__.py │ ├── progress_json_logger.py │ └── torch_tensorboard_logger.py ├── options.py ├── policy │ ├── __init__.py │ ├── action_dist.py │ ├── compat.py │ ├── kl_coeff_mixin.py │ ├── losses │ │ ├── __init__.py │ │ ├── abstract.py │ │ ├── dyna.py │ │ ├── isfv_iteration.py │ │ ├── mage.py │ │ ├── maximum_entropy.py │ │ ├── mixins.py │ │ ├── mle.py │ │ ├── policy_gradient.py │ │ ├── q_learning.py │ │ ├── svg.py │ │ └── utils.py │ ├── model_based │ │ ├── __init__.py │ │ ├── envfn.py │ │ ├── lightning.py │ │ ├── policy.py │ │ └── sampling.py │ ├── modules │ │ ├── __init__.py │ │ ├── base.py │ │ ├── ddpg.py │ │ ├── mage.py │ │ ├── mb_ddpg.py │ │ ├── mb_sac.py │ │ ├── naf.py │ │ ├── registry.py │ │ ├── sac.py │ │ ├── sop.py │ │ ├── svg.py │ │ ├── td3.py │ │ └── trpo.py │ ├── off_policy.py │ ├── optimizer_collection.py │ ├── stats.py │ └── torch_policy.py ├── tune │ ├── __init__.py │ └── registry.py └── utils │ ├── __init__.py │ ├── adaptive_kl.py │ ├── checkpoints.py │ ├── debug.py │ ├── dictionaries.py │ ├── dynamic_import.py │ ├── exp_data.py │ ├── explained_variance.py │ ├── exploration │ ├── __init__.py │ ├── base.py │ ├── gaussian_noise.py │ ├── parameter_noise.py │ ├── random_uniform.py │ └── stochastic_actor.py │ ├── lightning.py │ ├── param_noise.py │ ├── replay_buffer.py │ ├── timer.py │ └── types.py ├── scripts ├── debug_stochastic_module.py ├── rollout.py ├── timeit_script_module.py └── train.py ├── tests ├── __init__.py ├── conftest.py ├── mock_env.py ├── pylintrc └── raylab │ ├── __init__.py │ ├── agents │ ├── __init__.py │ ├── conftest.py │ ├── mage │ │ ├── __init__.py │ │ ├── test_policy.py │ │ └── test_trainer.py │ ├── mbpo │ │ ├── __init__.py │ │ └── test_policy.py │ ├── naf │ │ ├── __init__.py │ │ └── test_policy.py │ ├── sop │ │ ├── __init__.py │ │ └── test_policy.py │ ├── test_off_policy.py │ ├── test_registry.py │ └── test_trainer.py │ ├── cli │ ├── __init__.py │ └── test_cli.py │ ├── conftest.py │ ├── envs │ ├── __init__.py │ ├── environments │ │ ├── __init__.py │ │ ├── test_cartpole_swingup.py │ │ ├── test_hvac.py │ │ ├── test_navigation.py │ │ └── test_reservoir.py │ ├── test_basic.py │ ├── test_rewards.py │ ├── test_termination.py │ └── wrappers │ │ ├── __init__.py │ │ ├── conftest.py │ │ ├── test_correlated_irrelevant.py │ │ ├── test_gaussian_random_walks.py │ │ ├── test_linear_redundant.py │ │ ├── test_nonlinear_redundant.py │ │ └── test_random_irrelevant.py │ ├── policy │ ├── __init__.py │ ├── conftest.py │ ├── losses │ │ ├── __init__.py │ │ ├── conftest.py │ │ ├── test_dyna.py │ │ ├── test_isfv_iteration.py │ │ ├── test_mage.py │ │ ├── test_maximum_entropy.py │ │ ├── test_mle.py │ │ ├── test_policy_gradient.py │ │ ├── test_q_learning.py │ │ └── test_svg.py │ ├── model_based │ │ ├── __init__.py │ │ ├── conftest.py │ │ ├── test_envfn.py │ │ ├── test_lightning.py │ │ ├── test_policy.py │ │ └── test_sampling.py │ ├── modules │ │ ├── __init__.py │ │ ├── conftest.py │ │ ├── test_ddpg.py │ │ ├── test_naf.py │ │ ├── test_sac.py │ │ ├── test_svg.py │ │ └── test_trpo.py │ └── test_optimizer_collection.py │ ├── test_options.py │ └── utils │ ├── __init__.py │ ├── test_exp_data.py │ └── test_replay.py └── tox.ini /.github/ISSUE_TEMPLATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.github/ISSUE_TEMPLATE.md -------------------------------------------------------------------------------- /.github/workflows/poetry-package.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.github/workflows/poetry-package.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.gitignore -------------------------------------------------------------------------------- /.idea/.gitignore: -------------------------------------------------------------------------------- 1 | # Default ignored files 2 | /shelf/ 3 | /workspace.xml 4 | -------------------------------------------------------------------------------- /.idea/inspectionProfiles/Project_Default.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.idea/inspectionProfiles/Project_Default.xml -------------------------------------------------------------------------------- /.idea/inspectionProfiles/profiles_settings.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.idea/inspectionProfiles/profiles_settings.xml -------------------------------------------------------------------------------- /.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.idea/misc.xml -------------------------------------------------------------------------------- /.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.idea/modules.xml -------------------------------------------------------------------------------- /.idea/raylab.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.idea/raylab.iml -------------------------------------------------------------------------------- /.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.idea/vcs.xml -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /AUTHORS.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/AUTHORS.rst -------------------------------------------------------------------------------- /CONTRIBUTING.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/CONTRIBUTING.rst -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/Makefile -------------------------------------------------------------------------------- /README.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/README.rst -------------------------------------------------------------------------------- /docs/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/docs/Makefile -------------------------------------------------------------------------------- /docs/authors.rst: -------------------------------------------------------------------------------- 1 | .. include:: ../AUTHORS.rst 2 | -------------------------------------------------------------------------------- /docs/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/docs/conf.py -------------------------------------------------------------------------------- /docs/contributing.rst: -------------------------------------------------------------------------------- 1 | .. include:: ../CONTRIBUTING.rst 2 | -------------------------------------------------------------------------------- /docs/history.rst: -------------------------------------------------------------------------------- 1 | .. include:: ../HISTORY.rst 2 | -------------------------------------------------------------------------------- /docs/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/docs/index.rst -------------------------------------------------------------------------------- /docs/installation.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/docs/installation.rst -------------------------------------------------------------------------------- /docs/make.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/docs/make.bat -------------------------------------------------------------------------------- /docs/readme.rst: -------------------------------------------------------------------------------- 1 | .. include:: ../README.rst 2 | -------------------------------------------------------------------------------- /docs/usage.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/docs/usage.rst -------------------------------------------------------------------------------- /examples/ACKTR/cheetah_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/ACKTR/cheetah_defaults.py -------------------------------------------------------------------------------- /examples/ACKTR/mujoco_cheetah_kfac_vs_ekfac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/ACKTR/mujoco_cheetah_kfac_vs_ekfac.py -------------------------------------------------------------------------------- /examples/ACKTR/pybullet_reacher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/ACKTR/pybullet_reacher.py -------------------------------------------------------------------------------- /examples/MAGE/pusher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/MAGE/pusher.py -------------------------------------------------------------------------------- /examples/MAPO/swingup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/MAPO/swingup.py -------------------------------------------------------------------------------- /examples/MBPO/swingup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/MBPO/swingup.py -------------------------------------------------------------------------------- /examples/NAF/cheetah_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/NAF/cheetah_defaults.py -------------------------------------------------------------------------------- /examples/NAF/exploration_experiment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/NAF/exploration_experiment.py -------------------------------------------------------------------------------- /examples/NAF/reacher_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/NAF/reacher_defaults.py -------------------------------------------------------------------------------- /examples/PG/cartpole_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/PG/cartpole_defaults.py -------------------------------------------------------------------------------- /examples/PG/navigation_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/PG/navigation_defaults.py -------------------------------------------------------------------------------- /examples/SAC/cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SAC/cheetah.py -------------------------------------------------------------------------------- /examples/SAC/mountaincar_continuous.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SAC/mountaincar_continuous.py -------------------------------------------------------------------------------- /examples/SAC/reacher_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SAC/reacher_defaults.py -------------------------------------------------------------------------------- /examples/SAC/swingup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SAC/swingup.py -------------------------------------------------------------------------------- /examples/SAC/walker2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SAC/walker2d.py -------------------------------------------------------------------------------- /examples/SOP/cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SOP/cheetah.py -------------------------------------------------------------------------------- /examples/SOP/hopper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SOP/hopper.py -------------------------------------------------------------------------------- /examples/SOP/industrial_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SOP/industrial_benchmark.py -------------------------------------------------------------------------------- /examples/SOP/swingup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SOP/swingup.py -------------------------------------------------------------------------------- /examples/SOP/walker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SOP/walker.py -------------------------------------------------------------------------------- /examples/SOP/walker2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SOP/walker2d.py -------------------------------------------------------------------------------- /examples/SVG(1)/cheetah_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(1)/cheetah_defaults.py -------------------------------------------------------------------------------- /examples/SVG(1)/ib_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(1)/ib_defaults.py -------------------------------------------------------------------------------- /examples/SVG(1)/invpendulum_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(1)/invpendulum_defaults.py -------------------------------------------------------------------------------- /examples/SVG(1)/navigation_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(1)/navigation_defaults.py -------------------------------------------------------------------------------- /examples/SVG(1)/reacher_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(1)/reacher_defaults.py -------------------------------------------------------------------------------- /examples/SVG(1)/realnvp_vs_gaussian_reacher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(1)/realnvp_vs_gaussian_reacher.py -------------------------------------------------------------------------------- /examples/SVG(inf)/cartpole_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(inf)/cartpole_defaults.py -------------------------------------------------------------------------------- /examples/SVG(inf)/cheetah_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(inf)/cheetah_defaults.py -------------------------------------------------------------------------------- /examples/SVG(inf)/navigation_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(inf)/navigation_defaults.py -------------------------------------------------------------------------------- /examples/SVG(inf)/reacher_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SVG(inf)/reacher_defaults.py -------------------------------------------------------------------------------- /examples/SoftSVG/cheetah_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SoftSVG/cheetah_defaults.py -------------------------------------------------------------------------------- /examples/SoftSVG/nfmbrl_reacher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SoftSVG/nfmbrl_reacher.py -------------------------------------------------------------------------------- /examples/SoftSVG/reacher_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SoftSVG/reacher_defaults.py -------------------------------------------------------------------------------- /examples/SoftSVG/swingup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/SoftSVG/swingup.py -------------------------------------------------------------------------------- /examples/TD3/cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TD3/cheetah.py -------------------------------------------------------------------------------- /examples/TRPO/cartpole_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/cartpole_defaults.py -------------------------------------------------------------------------------- /examples/TRPO/cheetah_defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/cheetah_defaults.py -------------------------------------------------------------------------------- /examples/TRPO/gaussian_cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/gaussian_cheetah.py -------------------------------------------------------------------------------- /examples/TRPO/gaussian_swingup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/gaussian_swingup.py -------------------------------------------------------------------------------- /examples/TRPO/pybullet_walker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/pybullet_walker.py -------------------------------------------------------------------------------- /examples/TRPO/real_nvp_cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/real_nvp_cheetah.py -------------------------------------------------------------------------------- /examples/TRPO/real_nvp_swimmer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/real_nvp_swimmer.py -------------------------------------------------------------------------------- /examples/TRPO/tang_2018_cheetah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/tang_2018_cheetah.py -------------------------------------------------------------------------------- /examples/TRPO/tang_2018_hopper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/tang_2018_hopper.py -------------------------------------------------------------------------------- /examples/TRPO/tang_2018_lander.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/examples/TRPO/tang_2018_lander.py -------------------------------------------------------------------------------- /poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/poetry.lock -------------------------------------------------------------------------------- /pylintrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/pylintrc -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/pyproject.toml -------------------------------------------------------------------------------- /raylab/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/__init__.py -------------------------------------------------------------------------------- /raylab/agents/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/__init__.py -------------------------------------------------------------------------------- /raylab/agents/acktr/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/acktr/__init__.py -------------------------------------------------------------------------------- /raylab/agents/acktr/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/acktr/policy.py -------------------------------------------------------------------------------- /raylab/agents/acktr/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/acktr/trainer.py -------------------------------------------------------------------------------- /raylab/agents/mage/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/mage/__init__.py -------------------------------------------------------------------------------- /raylab/agents/mage/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/mage/policy.py -------------------------------------------------------------------------------- /raylab/agents/mage/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/mage/trainer.py -------------------------------------------------------------------------------- /raylab/agents/mbpo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/mbpo/__init__.py -------------------------------------------------------------------------------- /raylab/agents/mbpo/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/mbpo/policy.py -------------------------------------------------------------------------------- /raylab/agents/mbpo/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/mbpo/trainer.py -------------------------------------------------------------------------------- /raylab/agents/model_based.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/model_based.py -------------------------------------------------------------------------------- /raylab/agents/naf/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/naf/__init__.py -------------------------------------------------------------------------------- /raylab/agents/naf/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/naf/policy.py -------------------------------------------------------------------------------- /raylab/agents/naf/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/naf/trainer.py -------------------------------------------------------------------------------- /raylab/agents/off_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/off_policy.py -------------------------------------------------------------------------------- /raylab/agents/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/registry.py -------------------------------------------------------------------------------- /raylab/agents/sac/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/sac/__init__.py -------------------------------------------------------------------------------- /raylab/agents/sac/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/sac/policy.py -------------------------------------------------------------------------------- /raylab/agents/sac/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/sac/trainer.py -------------------------------------------------------------------------------- /raylab/agents/sop/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/sop/__init__.py -------------------------------------------------------------------------------- /raylab/agents/sop/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/sop/policy.py -------------------------------------------------------------------------------- /raylab/agents/sop/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/sop/trainer.py -------------------------------------------------------------------------------- /raylab/agents/svg/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/__init__.py -------------------------------------------------------------------------------- /raylab/agents/svg/inf/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/inf/__init__.py -------------------------------------------------------------------------------- /raylab/agents/svg/inf/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/inf/policy.py -------------------------------------------------------------------------------- /raylab/agents/svg/inf/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/inf/trainer.py -------------------------------------------------------------------------------- /raylab/agents/svg/one/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/one/__init__.py -------------------------------------------------------------------------------- /raylab/agents/svg/one/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/one/policy.py -------------------------------------------------------------------------------- /raylab/agents/svg/one/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/one/trainer.py -------------------------------------------------------------------------------- /raylab/agents/svg/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/policy.py -------------------------------------------------------------------------------- /raylab/agents/svg/soft/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/soft/__init__.py -------------------------------------------------------------------------------- /raylab/agents/svg/soft/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/soft/policy.py -------------------------------------------------------------------------------- /raylab/agents/svg/soft/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/svg/soft/trainer.py -------------------------------------------------------------------------------- /raylab/agents/td3/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/td3/__init__.py -------------------------------------------------------------------------------- /raylab/agents/td3/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/td3/policy.py -------------------------------------------------------------------------------- /raylab/agents/td3/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/td3/trainer.py -------------------------------------------------------------------------------- /raylab/agents/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/trainer.py -------------------------------------------------------------------------------- /raylab/agents/trpo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/trpo/__init__.py -------------------------------------------------------------------------------- /raylab/agents/trpo/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/trpo/policy.py -------------------------------------------------------------------------------- /raylab/agents/trpo/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/agents/trpo/trainer.py -------------------------------------------------------------------------------- /raylab/cli/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/__init__.py -------------------------------------------------------------------------------- /raylab/cli/best_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/best_checkpoint.py -------------------------------------------------------------------------------- /raylab/cli/episode_dashboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/episode_dashboard.py -------------------------------------------------------------------------------- /raylab/cli/evaluate_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/evaluate_checkpoint.py -------------------------------------------------------------------------------- /raylab/cli/experiment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/experiment.py -------------------------------------------------------------------------------- /raylab/cli/experiment_dashboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/experiment_dashboard.py -------------------------------------------------------------------------------- /raylab/cli/info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/info.py -------------------------------------------------------------------------------- /raylab/cli/module_dashboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/module_dashboard.py -------------------------------------------------------------------------------- /raylab/cli/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/utils.py -------------------------------------------------------------------------------- /raylab/cli/viz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/cli/viz.py -------------------------------------------------------------------------------- /raylab/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/__init__.py -------------------------------------------------------------------------------- /raylab/envs/environments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /raylab/envs/environments/cartpole_stateless.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/environments/cartpole_stateless.py -------------------------------------------------------------------------------- /raylab/envs/environments/hvac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/environments/hvac.py -------------------------------------------------------------------------------- /raylab/envs/environments/navigation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/environments/navigation.py -------------------------------------------------------------------------------- /raylab/envs/environments/reservoir.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/environments/reservoir.py -------------------------------------------------------------------------------- /raylab/envs/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/registry.py -------------------------------------------------------------------------------- /raylab/envs/rewards.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/rewards.py -------------------------------------------------------------------------------- /raylab/envs/termination.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/termination.py -------------------------------------------------------------------------------- /raylab/envs/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/utils.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/__init__.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/correlated_irrelevant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/correlated_irrelevant.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/gaussian_random_walks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/gaussian_random_walks.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/linear_redundant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/linear_redundant.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/mixins.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/mixins.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/nonlinear_redundant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/nonlinear_redundant.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/random_irrelevant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/random_irrelevant.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/single_precision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/single_precision.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/time_aware_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/time_aware_env.py -------------------------------------------------------------------------------- /raylab/envs/wrappers/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/envs/wrappers/utils.py -------------------------------------------------------------------------------- /raylab/execution/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/execution/__init__.py -------------------------------------------------------------------------------- /raylab/execution/warmup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/execution/warmup.py -------------------------------------------------------------------------------- /raylab/logger/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/logger/__init__.py -------------------------------------------------------------------------------- /raylab/logger/progress_json_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/logger/progress_json_logger.py -------------------------------------------------------------------------------- /raylab/logger/torch_tensorboard_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/logger/torch_tensorboard_logger.py -------------------------------------------------------------------------------- /raylab/options.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/options.py -------------------------------------------------------------------------------- /raylab/policy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/__init__.py -------------------------------------------------------------------------------- /raylab/policy/action_dist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/action_dist.py -------------------------------------------------------------------------------- /raylab/policy/compat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/compat.py -------------------------------------------------------------------------------- /raylab/policy/kl_coeff_mixin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/kl_coeff_mixin.py -------------------------------------------------------------------------------- /raylab/policy/losses/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/__init__.py -------------------------------------------------------------------------------- /raylab/policy/losses/abstract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/abstract.py -------------------------------------------------------------------------------- /raylab/policy/losses/dyna.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/dyna.py -------------------------------------------------------------------------------- /raylab/policy/losses/isfv_iteration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/isfv_iteration.py -------------------------------------------------------------------------------- /raylab/policy/losses/mage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/mage.py -------------------------------------------------------------------------------- /raylab/policy/losses/maximum_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/maximum_entropy.py -------------------------------------------------------------------------------- /raylab/policy/losses/mixins.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/mixins.py -------------------------------------------------------------------------------- /raylab/policy/losses/mle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/mle.py -------------------------------------------------------------------------------- /raylab/policy/losses/policy_gradient.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/policy_gradient.py -------------------------------------------------------------------------------- /raylab/policy/losses/q_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/q_learning.py -------------------------------------------------------------------------------- /raylab/policy/losses/svg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/svg.py -------------------------------------------------------------------------------- /raylab/policy/losses/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/losses/utils.py -------------------------------------------------------------------------------- /raylab/policy/model_based/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/model_based/__init__.py -------------------------------------------------------------------------------- /raylab/policy/model_based/envfn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/model_based/envfn.py -------------------------------------------------------------------------------- /raylab/policy/model_based/lightning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/model_based/lightning.py -------------------------------------------------------------------------------- /raylab/policy/model_based/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/model_based/policy.py -------------------------------------------------------------------------------- /raylab/policy/model_based/sampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/model_based/sampling.py -------------------------------------------------------------------------------- /raylab/policy/modules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/__init__.py -------------------------------------------------------------------------------- /raylab/policy/modules/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/base.py -------------------------------------------------------------------------------- /raylab/policy/modules/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/ddpg.py -------------------------------------------------------------------------------- /raylab/policy/modules/mage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/mage.py -------------------------------------------------------------------------------- /raylab/policy/modules/mb_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/mb_ddpg.py -------------------------------------------------------------------------------- /raylab/policy/modules/mb_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/mb_sac.py -------------------------------------------------------------------------------- /raylab/policy/modules/naf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/naf.py -------------------------------------------------------------------------------- /raylab/policy/modules/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/registry.py -------------------------------------------------------------------------------- /raylab/policy/modules/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/sac.py -------------------------------------------------------------------------------- /raylab/policy/modules/sop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/sop.py -------------------------------------------------------------------------------- /raylab/policy/modules/svg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/svg.py -------------------------------------------------------------------------------- /raylab/policy/modules/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/td3.py -------------------------------------------------------------------------------- /raylab/policy/modules/trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/modules/trpo.py -------------------------------------------------------------------------------- /raylab/policy/off_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/off_policy.py -------------------------------------------------------------------------------- /raylab/policy/optimizer_collection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/optimizer_collection.py -------------------------------------------------------------------------------- /raylab/policy/stats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/stats.py -------------------------------------------------------------------------------- /raylab/policy/torch_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/policy/torch_policy.py -------------------------------------------------------------------------------- /raylab/tune/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /raylab/tune/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/tune/registry.py -------------------------------------------------------------------------------- /raylab/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /raylab/utils/adaptive_kl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/adaptive_kl.py -------------------------------------------------------------------------------- /raylab/utils/checkpoints.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/checkpoints.py -------------------------------------------------------------------------------- /raylab/utils/debug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/debug.py -------------------------------------------------------------------------------- /raylab/utils/dictionaries.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/dictionaries.py -------------------------------------------------------------------------------- /raylab/utils/dynamic_import.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/dynamic_import.py -------------------------------------------------------------------------------- /raylab/utils/exp_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/exp_data.py -------------------------------------------------------------------------------- /raylab/utils/explained_variance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/explained_variance.py -------------------------------------------------------------------------------- /raylab/utils/exploration/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/exploration/__init__.py -------------------------------------------------------------------------------- /raylab/utils/exploration/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/exploration/base.py -------------------------------------------------------------------------------- /raylab/utils/exploration/gaussian_noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/exploration/gaussian_noise.py -------------------------------------------------------------------------------- /raylab/utils/exploration/parameter_noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/exploration/parameter_noise.py -------------------------------------------------------------------------------- /raylab/utils/exploration/random_uniform.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/exploration/random_uniform.py -------------------------------------------------------------------------------- /raylab/utils/exploration/stochastic_actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/exploration/stochastic_actor.py -------------------------------------------------------------------------------- /raylab/utils/lightning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/lightning.py -------------------------------------------------------------------------------- /raylab/utils/param_noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/param_noise.py -------------------------------------------------------------------------------- /raylab/utils/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/replay_buffer.py -------------------------------------------------------------------------------- /raylab/utils/timer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/timer.py -------------------------------------------------------------------------------- /raylab/utils/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/raylab/utils/types.py -------------------------------------------------------------------------------- /scripts/debug_stochastic_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/scripts/debug_stochastic_module.py -------------------------------------------------------------------------------- /scripts/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/scripts/rollout.py -------------------------------------------------------------------------------- /scripts/timeit_script_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/scripts/timeit_script_module.py -------------------------------------------------------------------------------- /scripts/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/scripts/train.py -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/conftest.py -------------------------------------------------------------------------------- /tests/mock_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/mock_env.py -------------------------------------------------------------------------------- /tests/pylintrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/pylintrc -------------------------------------------------------------------------------- /tests/raylab/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/agents/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/agents/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/conftest.py -------------------------------------------------------------------------------- /tests/raylab/agents/mage/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/agents/mage/test_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/mage/test_policy.py -------------------------------------------------------------------------------- /tests/raylab/agents/mage/test_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/mage/test_trainer.py -------------------------------------------------------------------------------- /tests/raylab/agents/mbpo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/agents/mbpo/test_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/mbpo/test_policy.py -------------------------------------------------------------------------------- /tests/raylab/agents/naf/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/agents/naf/test_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/naf/test_policy.py -------------------------------------------------------------------------------- /tests/raylab/agents/sop/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/agents/sop/test_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/sop/test_policy.py -------------------------------------------------------------------------------- /tests/raylab/agents/test_off_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/test_off_policy.py -------------------------------------------------------------------------------- /tests/raylab/agents/test_registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/test_registry.py -------------------------------------------------------------------------------- /tests/raylab/agents/test_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/agents/test_trainer.py -------------------------------------------------------------------------------- /tests/raylab/cli/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/cli/test_cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/cli/test_cli.py -------------------------------------------------------------------------------- /tests/raylab/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/conftest.py -------------------------------------------------------------------------------- /tests/raylab/envs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/envs/environments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/envs/environments/test_cartpole_swingup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/environments/test_cartpole_swingup.py -------------------------------------------------------------------------------- /tests/raylab/envs/environments/test_hvac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/environments/test_hvac.py -------------------------------------------------------------------------------- /tests/raylab/envs/environments/test_navigation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/environments/test_navigation.py -------------------------------------------------------------------------------- /tests/raylab/envs/environments/test_reservoir.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/environments/test_reservoir.py -------------------------------------------------------------------------------- /tests/raylab/envs/test_basic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/test_basic.py -------------------------------------------------------------------------------- /tests/raylab/envs/test_rewards.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/test_rewards.py -------------------------------------------------------------------------------- /tests/raylab/envs/test_termination.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/test_termination.py -------------------------------------------------------------------------------- /tests/raylab/envs/wrappers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/envs/wrappers/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/wrappers/conftest.py -------------------------------------------------------------------------------- /tests/raylab/envs/wrappers/test_correlated_irrelevant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/wrappers/test_correlated_irrelevant.py -------------------------------------------------------------------------------- /tests/raylab/envs/wrappers/test_gaussian_random_walks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/wrappers/test_gaussian_random_walks.py -------------------------------------------------------------------------------- /tests/raylab/envs/wrappers/test_linear_redundant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/wrappers/test_linear_redundant.py -------------------------------------------------------------------------------- /tests/raylab/envs/wrappers/test_nonlinear_redundant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/wrappers/test_nonlinear_redundant.py -------------------------------------------------------------------------------- /tests/raylab/envs/wrappers/test_random_irrelevant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/envs/wrappers/test_random_irrelevant.py -------------------------------------------------------------------------------- /tests/raylab/policy/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/policy/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/conftest.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/policy/losses/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/conftest.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_dyna.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_dyna.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_isfv_iteration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_isfv_iteration.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_mage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_mage.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_maximum_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_maximum_entropy.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_mle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_mle.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_policy_gradient.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_policy_gradient.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_q_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_q_learning.py -------------------------------------------------------------------------------- /tests/raylab/policy/losses/test_svg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/losses/test_svg.py -------------------------------------------------------------------------------- /tests/raylab/policy/model_based/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/policy/model_based/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/model_based/conftest.py -------------------------------------------------------------------------------- /tests/raylab/policy/model_based/test_envfn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/model_based/test_envfn.py -------------------------------------------------------------------------------- /tests/raylab/policy/model_based/test_lightning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/model_based/test_lightning.py -------------------------------------------------------------------------------- /tests/raylab/policy/model_based/test_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/model_based/test_policy.py -------------------------------------------------------------------------------- /tests/raylab/policy/model_based/test_sampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/model_based/test_sampling.py -------------------------------------------------------------------------------- /tests/raylab/policy/modules/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/policy/modules/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/modules/conftest.py -------------------------------------------------------------------------------- /tests/raylab/policy/modules/test_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/modules/test_ddpg.py -------------------------------------------------------------------------------- /tests/raylab/policy/modules/test_naf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/modules/test_naf.py -------------------------------------------------------------------------------- /tests/raylab/policy/modules/test_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/modules/test_sac.py -------------------------------------------------------------------------------- /tests/raylab/policy/modules/test_svg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/modules/test_svg.py -------------------------------------------------------------------------------- /tests/raylab/policy/modules/test_trpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/modules/test_trpo.py -------------------------------------------------------------------------------- /tests/raylab/policy/test_optimizer_collection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/policy/test_optimizer_collection.py -------------------------------------------------------------------------------- /tests/raylab/test_options.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/test_options.py -------------------------------------------------------------------------------- /tests/raylab/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/raylab/utils/test_exp_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/utils/test_exp_data.py -------------------------------------------------------------------------------- /tests/raylab/utils/test_replay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tests/raylab/utils/test_replay.py -------------------------------------------------------------------------------- /tox.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/0xangelo/raylab/HEAD/tox.ini --------------------------------------------------------------------------------