├── 2019 ├── code │ ├── 00-gym.ipynb │ ├── 01-genetics.ipynb │ ├── 02-cem.ipynb │ ├── 03-tabular.ipynb │ ├── 04-dqn.ipynb │ ├── __init__.py │ ├── mdp.py │ ├── mdp_get_action_value.py │ └── qlearning.py ├── slides │ ├── 01-genetics.pdf │ ├── 02-cem.pdf │ ├── 03-tabular.pdf │ └── 04-dqn.pdf └── solutions │ ├── 00-gym.ipynb │ ├── 01-genetics.ipynb │ ├── 02-cem.ipynb │ ├── 03-tabular.ipynb │ ├── 04-dqn.ipynb │ ├── __init__.py │ ├── mdp.py │ ├── mdp_get_action_value.py │ └── qlearning.py ├── 2020 ├── code │ ├── DDPG.ipynb │ ├── DQN.ipynb │ ├── RecSimDemo.ipynb │ ├── RecSysDemo.ipynb │ └── recsim_exp │ │ ├── __init__.py │ │ ├── ddpg.py │ │ └── wolpertinger.py ├── presets │ └── wolpertinger_scheme.png └── requirements.txt ├── .gitignore ├── LICENSE └── README.md /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/.gitignore -------------------------------------------------------------------------------- /2019/code/00-gym.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/00-gym.ipynb -------------------------------------------------------------------------------- /2019/code/01-genetics.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/01-genetics.ipynb -------------------------------------------------------------------------------- /2019/code/02-cem.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/02-cem.ipynb -------------------------------------------------------------------------------- /2019/code/03-tabular.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/03-tabular.ipynb -------------------------------------------------------------------------------- /2019/code/04-dqn.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/04-dqn.ipynb -------------------------------------------------------------------------------- /2019/code/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /2019/code/mdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/mdp.py -------------------------------------------------------------------------------- /2019/code/mdp_get_action_value.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/mdp_get_action_value.py -------------------------------------------------------------------------------- /2019/code/qlearning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/code/qlearning.py -------------------------------------------------------------------------------- /2019/slides/01-genetics.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/slides/01-genetics.pdf -------------------------------------------------------------------------------- /2019/slides/02-cem.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/slides/02-cem.pdf -------------------------------------------------------------------------------- /2019/slides/03-tabular.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/slides/03-tabular.pdf -------------------------------------------------------------------------------- /2019/slides/04-dqn.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/slides/04-dqn.pdf -------------------------------------------------------------------------------- /2019/solutions/00-gym.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/00-gym.ipynb -------------------------------------------------------------------------------- /2019/solutions/01-genetics.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/01-genetics.ipynb -------------------------------------------------------------------------------- /2019/solutions/02-cem.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/02-cem.ipynb -------------------------------------------------------------------------------- /2019/solutions/03-tabular.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/03-tabular.ipynb -------------------------------------------------------------------------------- /2019/solutions/04-dqn.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/04-dqn.ipynb -------------------------------------------------------------------------------- /2019/solutions/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /2019/solutions/mdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/mdp.py -------------------------------------------------------------------------------- /2019/solutions/mdp_get_action_value.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/mdp_get_action_value.py -------------------------------------------------------------------------------- /2019/solutions/qlearning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2019/solutions/qlearning.py -------------------------------------------------------------------------------- /2020/code/DDPG.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/code/DDPG.ipynb -------------------------------------------------------------------------------- /2020/code/DQN.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/code/DQN.ipynb -------------------------------------------------------------------------------- /2020/code/RecSimDemo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/code/RecSimDemo.ipynb -------------------------------------------------------------------------------- /2020/code/RecSysDemo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/code/RecSysDemo.ipynb -------------------------------------------------------------------------------- /2020/code/recsim_exp/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/code/recsim_exp/__init__.py -------------------------------------------------------------------------------- /2020/code/recsim_exp/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/code/recsim_exp/ddpg.py -------------------------------------------------------------------------------- /2020/code/recsim_exp/wolpertinger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/code/recsim_exp/wolpertinger.py -------------------------------------------------------------------------------- /2020/presets/wolpertinger_scheme.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/presets/wolpertinger_scheme.png -------------------------------------------------------------------------------- /2020/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/2020/requirements.txt -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Scitator/RL-intro/HEAD/README.md --------------------------------------------------------------------------------