├── LinUCB.ipynb ├── LinUCBVI.ipynb ├── NeuralUCB.ipynb ├── NeuralUCBVI.ipynb ├── Neural_Exploration_slides__MVA_RL_.pdf ├── README.md ├── figures ├── linucb_cosine.pdf ├── linucb_linear.pdf ├── linucb_quad.pdf ├── linucbvi_cosine.pdf ├── linucbvi_cosine_policy.pdf ├── linucbvi_linear.pdf ├── linucbvi_linear_policy.pdf ├── linucbvi_quad.pdf ├── linucbvi_quad_policy.pdf ├── neural_ucb_cosine.pdf ├── neural_ucb_linear.pdf ├── neural_ucb_quad.pdf ├── neural_ucbvi_cosine.pdf ├── neural_ucbvi_cosine_policy.pdf ├── neural_ucbvi_linear.pdf ├── neural_ucbvi_linear_policy.pdf ├── neural_ucbvi_quad.pdf └── neural_ucbvi_quad_policy.pdf └── neural_exploration ├── __init__.py ├── bandit.py ├── linucb.py ├── linucbvi.py ├── mdp.py ├── neuralucb.py ├── neuralucbvi.py ├── ucb.py ├── ucbvi.py └── utils.py /LinUCB.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/LinUCB.ipynb -------------------------------------------------------------------------------- /LinUCBVI.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/LinUCBVI.ipynb -------------------------------------------------------------------------------- /NeuralUCB.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/NeuralUCB.ipynb -------------------------------------------------------------------------------- /NeuralUCBVI.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/NeuralUCBVI.ipynb -------------------------------------------------------------------------------- /Neural_Exploration_slides__MVA_RL_.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/Neural_Exploration_slides__MVA_RL_.pdf -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/README.md -------------------------------------------------------------------------------- /figures/linucb_cosine.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucb_cosine.pdf -------------------------------------------------------------------------------- /figures/linucb_linear.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucb_linear.pdf -------------------------------------------------------------------------------- /figures/linucb_quad.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucb_quad.pdf -------------------------------------------------------------------------------- /figures/linucbvi_cosine.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucbvi_cosine.pdf -------------------------------------------------------------------------------- /figures/linucbvi_cosine_policy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucbvi_cosine_policy.pdf -------------------------------------------------------------------------------- /figures/linucbvi_linear.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucbvi_linear.pdf -------------------------------------------------------------------------------- /figures/linucbvi_linear_policy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucbvi_linear_policy.pdf -------------------------------------------------------------------------------- /figures/linucbvi_quad.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucbvi_quad.pdf -------------------------------------------------------------------------------- /figures/linucbvi_quad_policy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/linucbvi_quad_policy.pdf -------------------------------------------------------------------------------- /figures/neural_ucb_cosine.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucb_cosine.pdf -------------------------------------------------------------------------------- /figures/neural_ucb_linear.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucb_linear.pdf -------------------------------------------------------------------------------- /figures/neural_ucb_quad.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucb_quad.pdf -------------------------------------------------------------------------------- /figures/neural_ucbvi_cosine.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucbvi_cosine.pdf -------------------------------------------------------------------------------- /figures/neural_ucbvi_cosine_policy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucbvi_cosine_policy.pdf -------------------------------------------------------------------------------- /figures/neural_ucbvi_linear.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucbvi_linear.pdf -------------------------------------------------------------------------------- /figures/neural_ucbvi_linear_policy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucbvi_linear_policy.pdf -------------------------------------------------------------------------------- /figures/neural_ucbvi_quad.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucbvi_quad.pdf -------------------------------------------------------------------------------- /figures/neural_ucbvi_quad_policy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/figures/neural_ucbvi_quad_policy.pdf -------------------------------------------------------------------------------- /neural_exploration/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/__init__.py -------------------------------------------------------------------------------- /neural_exploration/bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/bandit.py -------------------------------------------------------------------------------- /neural_exploration/linucb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/linucb.py -------------------------------------------------------------------------------- /neural_exploration/linucbvi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/linucbvi.py -------------------------------------------------------------------------------- /neural_exploration/mdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/mdp.py -------------------------------------------------------------------------------- /neural_exploration/neuralucb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/neuralucb.py -------------------------------------------------------------------------------- /neural_exploration/neuralucbvi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/neuralucbvi.py -------------------------------------------------------------------------------- /neural_exploration/ucb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/ucb.py -------------------------------------------------------------------------------- /neural_exploration/ucbvi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/ucbvi.py -------------------------------------------------------------------------------- /neural_exploration/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sauxpa/neural_exploration/HEAD/neural_exploration/utils.py --------------------------------------------------------------------------------