├── .gitignore ├── LICENSE ├── README.md ├── hw1 ├── .DS_Store ├── DAgger.bash ├── DAgger.py ├── HW1.pdf ├── README.md ├── demo.bash ├── experts │ ├── Ant-v1.pkl │ ├── HalfCheetah-v1.pkl │ ├── Hopper-v1.pkl │ ├── Humanoid-v1.pkl │ ├── Reacher-v1.pkl │ └── Walker2d-v1.pkl ├── load_policy.py ├── model.py ├── run_expert.py └── tf_util.py ├── hw2 ├── HW2.pdf ├── TestNoteBook.ipynb ├── hw2_final.pdf ├── logz.py ├── plot.py └── train_pg.py ├── hw3 ├── HW3.pdf ├── README ├── Testing.ipynb ├── atari_wrappers.py ├── dqn.py ├── dqn_utils.py ├── run_dqn_atari.py └── run_dqn_ram.py ├── hw4 ├── HW4.pdf ├── Testing.ipynb ├── cheetah_env.py ├── controllers.py ├── cost_functions.py ├── data │ ├── mb_mpc_HalfCheetah-v1_25-06-2018_14-51-34 │ │ └── log.txt │ ├── mb_mpc_HalfCheetah-v1_25-06-2018_15-01-46 │ │ └── log.txt │ ├── mb_mpc_HalfCheetah-v1_25-06-2018_15-22-28 │ │ └── log.txt │ ├── mb_mpc_HalfCheetah-v1_25-06-2018_15-23-41 │ │ └── log.txt │ └── mb_mpc_HalfCheetah-v1_25-06-2018_15-28-11 │ │ └── log.txt ├── dynamics.py ├── logz.py ├── main.py └── plot.py └── sp17_hw ├── hw1 ├── README.md ├── demo.bash ├── experts │ ├── Ant-v1.pkl │ ├── HalfCheetah-v1.pkl │ ├── Hopper-v1.pkl │ ├── Humanoid-v1.pkl │ ├── Reacher-v1.pkl │ └── Walker2d-v1.pkl ├── load_policy.py ├── run_expert.py └── tf_util.py ├── hw2 ├── HW2.ipynb ├── discrete_env.py └── frozen_lake.py ├── hw3 ├── README ├── atari_wrappers.py ├── dqn.py ├── dqn_utils.py ├── run_dqn_atari.py └── run_dqn_ram.py └── hw4 ├── homework.md ├── logz.py ├── main.py └── plot_learning_curves.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/README.md -------------------------------------------------------------------------------- /hw1/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/.DS_Store -------------------------------------------------------------------------------- /hw1/DAgger.bash: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/DAgger.bash -------------------------------------------------------------------------------- /hw1/DAgger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/DAgger.py -------------------------------------------------------------------------------- /hw1/HW1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/HW1.pdf -------------------------------------------------------------------------------- /hw1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/README.md -------------------------------------------------------------------------------- /hw1/demo.bash: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/demo.bash -------------------------------------------------------------------------------- /hw1/experts/Ant-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/experts/Ant-v1.pkl -------------------------------------------------------------------------------- /hw1/experts/HalfCheetah-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/experts/HalfCheetah-v1.pkl -------------------------------------------------------------------------------- /hw1/experts/Hopper-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/experts/Hopper-v1.pkl -------------------------------------------------------------------------------- /hw1/experts/Humanoid-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/experts/Humanoid-v1.pkl -------------------------------------------------------------------------------- /hw1/experts/Reacher-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/experts/Reacher-v1.pkl -------------------------------------------------------------------------------- /hw1/experts/Walker2d-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/experts/Walker2d-v1.pkl -------------------------------------------------------------------------------- /hw1/load_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/load_policy.py -------------------------------------------------------------------------------- /hw1/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/model.py -------------------------------------------------------------------------------- /hw1/run_expert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/run_expert.py -------------------------------------------------------------------------------- /hw1/tf_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw1/tf_util.py -------------------------------------------------------------------------------- /hw2/HW2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw2/HW2.pdf -------------------------------------------------------------------------------- /hw2/TestNoteBook.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw2/TestNoteBook.ipynb -------------------------------------------------------------------------------- /hw2/hw2_final.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw2/hw2_final.pdf -------------------------------------------------------------------------------- /hw2/logz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw2/logz.py -------------------------------------------------------------------------------- /hw2/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw2/plot.py -------------------------------------------------------------------------------- /hw2/train_pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw2/train_pg.py -------------------------------------------------------------------------------- /hw3/HW3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/HW3.pdf -------------------------------------------------------------------------------- /hw3/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/README -------------------------------------------------------------------------------- /hw3/Testing.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/Testing.ipynb -------------------------------------------------------------------------------- /hw3/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/atari_wrappers.py -------------------------------------------------------------------------------- /hw3/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/dqn.py -------------------------------------------------------------------------------- /hw3/dqn_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/dqn_utils.py -------------------------------------------------------------------------------- /hw3/run_dqn_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/run_dqn_atari.py -------------------------------------------------------------------------------- /hw3/run_dqn_ram.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw3/run_dqn_ram.py -------------------------------------------------------------------------------- /hw4/HW4.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/HW4.pdf -------------------------------------------------------------------------------- /hw4/Testing.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/Testing.ipynb -------------------------------------------------------------------------------- /hw4/cheetah_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/cheetah_env.py -------------------------------------------------------------------------------- /hw4/controllers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/controllers.py -------------------------------------------------------------------------------- /hw4/cost_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/cost_functions.py -------------------------------------------------------------------------------- /hw4/data/mb_mpc_HalfCheetah-v1_25-06-2018_14-51-34/log.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /hw4/data/mb_mpc_HalfCheetah-v1_25-06-2018_15-01-46/log.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /hw4/data/mb_mpc_HalfCheetah-v1_25-06-2018_15-22-28/log.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /hw4/data/mb_mpc_HalfCheetah-v1_25-06-2018_15-23-41/log.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /hw4/data/mb_mpc_HalfCheetah-v1_25-06-2018_15-28-11/log.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /hw4/dynamics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/dynamics.py -------------------------------------------------------------------------------- /hw4/logz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/logz.py -------------------------------------------------------------------------------- /hw4/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/main.py -------------------------------------------------------------------------------- /hw4/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/hw4/plot.py -------------------------------------------------------------------------------- /sp17_hw/hw1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/README.md -------------------------------------------------------------------------------- /sp17_hw/hw1/demo.bash: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/demo.bash -------------------------------------------------------------------------------- /sp17_hw/hw1/experts/Ant-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/experts/Ant-v1.pkl -------------------------------------------------------------------------------- /sp17_hw/hw1/experts/HalfCheetah-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/experts/HalfCheetah-v1.pkl -------------------------------------------------------------------------------- /sp17_hw/hw1/experts/Hopper-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/experts/Hopper-v1.pkl -------------------------------------------------------------------------------- /sp17_hw/hw1/experts/Humanoid-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/experts/Humanoid-v1.pkl -------------------------------------------------------------------------------- /sp17_hw/hw1/experts/Reacher-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/experts/Reacher-v1.pkl -------------------------------------------------------------------------------- /sp17_hw/hw1/experts/Walker2d-v1.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/experts/Walker2d-v1.pkl -------------------------------------------------------------------------------- /sp17_hw/hw1/load_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/load_policy.py -------------------------------------------------------------------------------- /sp17_hw/hw1/run_expert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/run_expert.py -------------------------------------------------------------------------------- /sp17_hw/hw1/tf_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw1/tf_util.py -------------------------------------------------------------------------------- /sp17_hw/hw2/HW2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw2/HW2.ipynb -------------------------------------------------------------------------------- /sp17_hw/hw2/discrete_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw2/discrete_env.py -------------------------------------------------------------------------------- /sp17_hw/hw2/frozen_lake.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw2/frozen_lake.py -------------------------------------------------------------------------------- /sp17_hw/hw3/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw3/README -------------------------------------------------------------------------------- /sp17_hw/hw3/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw3/atari_wrappers.py -------------------------------------------------------------------------------- /sp17_hw/hw3/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw3/dqn.py -------------------------------------------------------------------------------- /sp17_hw/hw3/dqn_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw3/dqn_utils.py -------------------------------------------------------------------------------- /sp17_hw/hw3/run_dqn_atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw3/run_dqn_atari.py -------------------------------------------------------------------------------- /sp17_hw/hw3/run_dqn_ram.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw3/run_dqn_ram.py -------------------------------------------------------------------------------- /sp17_hw/hw4/homework.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw4/homework.md -------------------------------------------------------------------------------- /sp17_hw/hw4/logz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw4/logz.py -------------------------------------------------------------------------------- /sp17_hw/hw4/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw4/main.py -------------------------------------------------------------------------------- /sp17_hw/hw4/plot_learning_curves.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/louaaron/CS294_homework/HEAD/sp17_hw/hw4/plot_learning_curves.py --------------------------------------------------------------------------------