├── .gitignore ├── LICENSE ├── hw1 ├── README.md ├── demo.bash ├── experts │ ├── RoboschoolAnt-v1.py │ ├── RoboschoolHalfCheetah-v1.py │ ├── RoboschoolHopper-v1.py │ ├── RoboschoolHumanoid-v1.py │ ├── RoboschoolReacher-v1.py │ └── RoboschoolWalker2d-v1.py └── run_expert.py ├── hw2 ├── hw2_final.pdf ├── logz.py ├── plot.py └── train_pg.py ├── hw3 ├── README ├── atari_wrappers.py ├── dqn.py ├── dqn_utils.py ├── run_dqn_atari.py └── run_dqn_ram.py ├── hw4 ├── README ├── cheetah_env.py ├── controllers.py ├── cost_functions.py ├── dynamics.py ├── logz.py ├── main.py └── plot.py ├── sp17_hw2 ├── HW2.ipynb ├── discrete_env.py └── frozen_lake.py └── sp17_hw4 ├── README.md ├── logz.py ├── main.py └── plot_learning_curves.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/LICENSE -------------------------------------------------------------------------------- /hw1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/README.md -------------------------------------------------------------------------------- /hw1/demo.bash: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/demo.bash -------------------------------------------------------------------------------- /hw1/experts/RoboschoolAnt-v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/experts/RoboschoolAnt-v1.py -------------------------------------------------------------------------------- /hw1/experts/RoboschoolHalfCheetah-v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/experts/RoboschoolHalfCheetah-v1.py -------------------------------------------------------------------------------- /hw1/experts/RoboschoolHopper-v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/experts/RoboschoolHopper-v1.py -------------------------------------------------------------------------------- /hw1/experts/RoboschoolHumanoid-v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/experts/RoboschoolHumanoid-v1.py -------------------------------------------------------------------------------- /hw1/experts/RoboschoolReacher-v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/experts/RoboschoolReacher-v1.py -------------------------------------------------------------------------------- /hw1/experts/RoboschoolWalker2d-v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/experts/RoboschoolWalker2d-v1.py -------------------------------------------------------------------------------- /hw1/run_expert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw1/run_expert.py -------------------------------------------------------------------------------- /hw2/hw2_final.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw2/hw2_final.pdf -------------------------------------------------------------------------------- /hw2/logz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw2/logz.py -------------------------------------------------------------------------------- /hw2/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw2/plot.py -------------------------------------------------------------------------------- /hw2/train_pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw2/train_pg.py -------------------------------------------------------------------------------- /hw3/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw3/README -------------------------------------------------------------------------------- /hw3/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw3/atari_wrappers.py -------------------------------------------------------------------------------- /hw3/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw3/dqn.py -------------------------------------------------------------------------------- /hw3/dqn_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw3/dqn_utils.py -------------------------------------------------------------------------------- /hw3/run_dqn_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw3/run_dqn_atari.py -------------------------------------------------------------------------------- /hw3/run_dqn_ram.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw3/run_dqn_ram.py -------------------------------------------------------------------------------- /hw4/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/README -------------------------------------------------------------------------------- /hw4/cheetah_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/cheetah_env.py -------------------------------------------------------------------------------- /hw4/controllers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/controllers.py -------------------------------------------------------------------------------- /hw4/cost_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/cost_functions.py -------------------------------------------------------------------------------- /hw4/dynamics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/dynamics.py -------------------------------------------------------------------------------- /hw4/logz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/logz.py -------------------------------------------------------------------------------- /hw4/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/main.py -------------------------------------------------------------------------------- /hw4/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/hw4/plot.py -------------------------------------------------------------------------------- /sp17_hw2/HW2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/sp17_hw2/HW2.ipynb -------------------------------------------------------------------------------- /sp17_hw2/discrete_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/sp17_hw2/discrete_env.py -------------------------------------------------------------------------------- /sp17_hw2/frozen_lake.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/sp17_hw2/frozen_lake.py -------------------------------------------------------------------------------- /sp17_hw4/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/sp17_hw4/README.md -------------------------------------------------------------------------------- /sp17_hw4/logz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/sp17_hw4/logz.py -------------------------------------------------------------------------------- /sp17_hw4/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/sp17_hw4/main.py -------------------------------------------------------------------------------- /sp17_hw4/plot_learning_curves.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EbTech/CS294/HEAD/sp17_hw4/plot_learning_curves.py --------------------------------------------------------------------------------