├── .gitignore ├── LICENSE ├── README.md ├── examples ├── atari │ ├── apex.py │ └── sac_discrete.py └── mujoco │ └── sac.py ├── requirements.txt ├── rltorch ├── __init__.py ├── agent │ ├── __init__.py │ ├── apex │ │ ├── __init__.py │ │ ├── actor.py │ │ ├── base.py │ │ └── learner.py │ ├── base.py │ ├── sac │ │ ├── __init__.py │ │ ├── actor.py │ │ ├── base.py │ │ └── learner.py │ ├── sac_discrete │ │ ├── __init__.py │ │ ├── actor.py │ │ ├── base.py │ │ └── learner.py │ └── utils.py ├── distributed │ ├── __init__.py │ └── run.py ├── env │ ├── __init__.py │ └── atari_wrappers.py ├── memory │ ├── __init__.py │ ├── base.py │ ├── dummy.py │ ├── multi_step.py │ └── prioritized.py ├── network │ ├── __init__.py │ ├── base.py │ └── builder.py ├── policy │ ├── __init__.py │ ├── categorical.py │ └── gaussian.py └── q_function │ ├── __init__.py │ ├── continuous.py │ └── discrete.py └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/README.md -------------------------------------------------------------------------------- /examples/atari/apex.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/examples/atari/apex.py -------------------------------------------------------------------------------- /examples/atari/sac_discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/examples/atari/sac_discrete.py -------------------------------------------------------------------------------- /examples/mujoco/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/examples/mujoco/sac.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | numpy 2 | torch 3 | gym 4 | -------------------------------------------------------------------------------- /rltorch/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/__init__.py -------------------------------------------------------------------------------- /rltorch/agent/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/__init__.py -------------------------------------------------------------------------------- /rltorch/agent/apex/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/apex/__init__.py -------------------------------------------------------------------------------- /rltorch/agent/apex/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/apex/actor.py -------------------------------------------------------------------------------- /rltorch/agent/apex/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/apex/base.py -------------------------------------------------------------------------------- /rltorch/agent/apex/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/apex/learner.py -------------------------------------------------------------------------------- /rltorch/agent/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/base.py -------------------------------------------------------------------------------- /rltorch/agent/sac/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac/__init__.py -------------------------------------------------------------------------------- /rltorch/agent/sac/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac/actor.py -------------------------------------------------------------------------------- /rltorch/agent/sac/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac/base.py -------------------------------------------------------------------------------- /rltorch/agent/sac/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac/learner.py -------------------------------------------------------------------------------- /rltorch/agent/sac_discrete/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac_discrete/__init__.py -------------------------------------------------------------------------------- /rltorch/agent/sac_discrete/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac_discrete/actor.py -------------------------------------------------------------------------------- /rltorch/agent/sac_discrete/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac_discrete/base.py -------------------------------------------------------------------------------- /rltorch/agent/sac_discrete/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/sac_discrete/learner.py -------------------------------------------------------------------------------- /rltorch/agent/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/agent/utils.py -------------------------------------------------------------------------------- /rltorch/distributed/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/distributed/__init__.py -------------------------------------------------------------------------------- /rltorch/distributed/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/distributed/run.py -------------------------------------------------------------------------------- /rltorch/env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/env/__init__.py -------------------------------------------------------------------------------- /rltorch/env/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/env/atari_wrappers.py -------------------------------------------------------------------------------- /rltorch/memory/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/memory/__init__.py -------------------------------------------------------------------------------- /rltorch/memory/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/memory/base.py -------------------------------------------------------------------------------- /rltorch/memory/dummy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/memory/dummy.py -------------------------------------------------------------------------------- /rltorch/memory/multi_step.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/memory/multi_step.py -------------------------------------------------------------------------------- /rltorch/memory/prioritized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/memory/prioritized.py -------------------------------------------------------------------------------- /rltorch/network/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/network/__init__.py -------------------------------------------------------------------------------- /rltorch/network/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/network/base.py -------------------------------------------------------------------------------- /rltorch/network/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/network/builder.py -------------------------------------------------------------------------------- /rltorch/policy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/policy/__init__.py -------------------------------------------------------------------------------- /rltorch/policy/categorical.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/policy/categorical.py -------------------------------------------------------------------------------- /rltorch/policy/gaussian.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/policy/gaussian.py -------------------------------------------------------------------------------- /rltorch/q_function/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/q_function/__init__.py -------------------------------------------------------------------------------- /rltorch/q_function/continuous.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/q_function/continuous.py -------------------------------------------------------------------------------- /rltorch/q_function/discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/rltorch/q_function/discrete.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/toshikwa/rltorch/HEAD/setup.py --------------------------------------------------------------------------------