├── README.md ├── dl ├── __init__.py ├── dqn │ ├── README.md │ ├── __init__.py │ ├── demo.py │ ├── dqn.py │ └── exec.py ├── imgs │ ├── dqn_loss.png │ └── dqn_reward.png └── utils │ ├── __init__.py │ ├── memory.py │ └── wrapper.py └── predl ├── __init__.py ├── base.py ├── function_approximation ├── Q-learning.py ├── __init__.py ├── fa_base.py └── sarsa.py ├── policy_gradient ├── REINFORCE.py ├── REINFORCE_baseline.py ├── __init__.py ├── actor_critic.py └── pg_base.py └── table ├── DynaQ.py ├── NstepSarsa.py ├── Q-learning.py ├── __init__.py ├── sarsa.py ├── sarsa_lambda.py └── table_base.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/README.md -------------------------------------------------------------------------------- /dl/__init__.py: -------------------------------------------------------------------------------- 1 | from .utils import make_atari, Memory, Transition -------------------------------------------------------------------------------- /dl/dqn/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/dqn/README.md -------------------------------------------------------------------------------- /dl/dqn/__init__.py: -------------------------------------------------------------------------------- 1 | from .dqn import Agent, Trainer, DQN 2 | -------------------------------------------------------------------------------- /dl/dqn/demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/dqn/demo.py -------------------------------------------------------------------------------- /dl/dqn/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/dqn/dqn.py -------------------------------------------------------------------------------- /dl/dqn/exec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/dqn/exec.py -------------------------------------------------------------------------------- /dl/imgs/dqn_loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/imgs/dqn_loss.png -------------------------------------------------------------------------------- /dl/imgs/dqn_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/imgs/dqn_reward.png -------------------------------------------------------------------------------- /dl/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/utils/__init__.py -------------------------------------------------------------------------------- /dl/utils/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/utils/memory.py -------------------------------------------------------------------------------- /dl/utils/wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/dl/utils/wrapper.py -------------------------------------------------------------------------------- /predl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/__init__.py -------------------------------------------------------------------------------- /predl/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/base.py -------------------------------------------------------------------------------- /predl/function_approximation/Q-learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/function_approximation/Q-learning.py -------------------------------------------------------------------------------- /predl/function_approximation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /predl/function_approximation/fa_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/function_approximation/fa_base.py -------------------------------------------------------------------------------- /predl/function_approximation/sarsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/function_approximation/sarsa.py -------------------------------------------------------------------------------- /predl/policy_gradient/REINFORCE.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/policy_gradient/REINFORCE.py -------------------------------------------------------------------------------- /predl/policy_gradient/REINFORCE_baseline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/policy_gradient/REINFORCE_baseline.py -------------------------------------------------------------------------------- /predl/policy_gradient/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /predl/policy_gradient/actor_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/policy_gradient/actor_critic.py -------------------------------------------------------------------------------- /predl/policy_gradient/pg_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/policy_gradient/pg_base.py -------------------------------------------------------------------------------- /predl/table/DynaQ.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/table/DynaQ.py -------------------------------------------------------------------------------- /predl/table/NstepSarsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/table/NstepSarsa.py -------------------------------------------------------------------------------- /predl/table/Q-learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/table/Q-learning.py -------------------------------------------------------------------------------- /predl/table/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /predl/table/sarsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/table/sarsa.py -------------------------------------------------------------------------------- /predl/table/sarsa_lambda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/table/sarsa_lambda.py -------------------------------------------------------------------------------- /predl/table/table_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/moskomule/pytorch.rl.learning/HEAD/predl/table/table_base.py --------------------------------------------------------------------------------