├── .gitignore ├── LICENSE.md ├── README.md ├── src ├── base.jl ├── envs │ ├── atari_mdp.jl │ ├── classiccontrol_mdp.jl │ └── toytext_mdp.jl ├── policies │ ├── crossentropy_policy.jl │ ├── deep_crossentropy_policy.jl │ ├── dqn_policy.jl │ ├── evolution_policy.jl │ └── value_table_policy.jl └── solvers │ ├── crossentropy_policy_solver.jl │ ├── deep_crossentropy_policy_solver.jl │ ├── dqn_policy_solver.jl │ ├── ev_sarsa_policy_solver.jl │ ├── evolution_policy_solver.jl │ ├── sarsa_policy_solver.jl │ └── value_table_policy_solver.jl ├── week_0.jl ├── week_1.jl ├── week_1_2.jl ├── week_2.jl ├── week_3.jl ├── week_3_2.jl └── week_4.jl /.gitignore: -------------------------------------------------------------------------------- 1 | 2 | test.jl 3 | weights -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/LICENSE.md -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/README.md -------------------------------------------------------------------------------- /src/base.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/base.jl -------------------------------------------------------------------------------- /src/envs/atari_mdp.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/envs/atari_mdp.jl -------------------------------------------------------------------------------- /src/envs/classiccontrol_mdp.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/envs/classiccontrol_mdp.jl -------------------------------------------------------------------------------- /src/envs/toytext_mdp.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/envs/toytext_mdp.jl -------------------------------------------------------------------------------- /src/policies/crossentropy_policy.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/policies/crossentropy_policy.jl -------------------------------------------------------------------------------- /src/policies/deep_crossentropy_policy.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/policies/deep_crossentropy_policy.jl -------------------------------------------------------------------------------- /src/policies/dqn_policy.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/policies/dqn_policy.jl -------------------------------------------------------------------------------- /src/policies/evolution_policy.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/policies/evolution_policy.jl -------------------------------------------------------------------------------- /src/policies/value_table_policy.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/policies/value_table_policy.jl -------------------------------------------------------------------------------- /src/solvers/crossentropy_policy_solver.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/solvers/crossentropy_policy_solver.jl -------------------------------------------------------------------------------- /src/solvers/deep_crossentropy_policy_solver.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/solvers/deep_crossentropy_policy_solver.jl -------------------------------------------------------------------------------- /src/solvers/dqn_policy_solver.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/solvers/dqn_policy_solver.jl -------------------------------------------------------------------------------- /src/solvers/ev_sarsa_policy_solver.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/solvers/ev_sarsa_policy_solver.jl -------------------------------------------------------------------------------- /src/solvers/evolution_policy_solver.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/solvers/evolution_policy_solver.jl -------------------------------------------------------------------------------- /src/solvers/sarsa_policy_solver.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/solvers/sarsa_policy_solver.jl -------------------------------------------------------------------------------- /src/solvers/value_table_policy_solver.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/src/solvers/value_table_policy_solver.jl -------------------------------------------------------------------------------- /week_0.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/week_0.jl -------------------------------------------------------------------------------- /week_1.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/week_1.jl -------------------------------------------------------------------------------- /week_1_2.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/week_1_2.jl -------------------------------------------------------------------------------- /week_2.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/week_2.jl -------------------------------------------------------------------------------- /week_3.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/week_3.jl -------------------------------------------------------------------------------- /week_3_2.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/week_3_2.jl -------------------------------------------------------------------------------- /week_4.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dmitrijsc/practical-rl/HEAD/week_4.jl --------------------------------------------------------------------------------