├── .gitignore ├── .gitmodules ├── .travis.yml ├── CMakeLists.txt ├── LICENSE ├── README.md ├── examples ├── cartpole-pg.sh ├── cartpole-random.sh ├── cartpole-td.sh ├── pendulum-pg.sh ├── run.lua └── sweep.sh ├── src ├── agent │ ├── baseAgent.lua │ ├── init.lua │ ├── learningUpdate │ │ ├── init.lua │ │ ├── noLearning.lua │ │ ├── reinforce.lua │ │ ├── tdLambda.lua │ │ └── util.lua │ ├── model │ │ ├── init.lua │ │ ├── mlp.lua │ │ ├── noModel.lua │ │ ├── qFunction.lua │ │ └── tilecoding.lua │ └── policy │ │ ├── actionSamplers.lua │ │ ├── egreedy.lua │ │ ├── init.lua │ │ ├── random.lua │ │ └── stochasticModelPolicy.lua ├── experiment.lua ├── init.lua ├── perf.lua └── util.lua ├── test ├── test-gym.lua └── test.lua └── twrl-scm-1.rockspec /.gitignore: -------------------------------------------------------------------------------- 1 | *logs* 2 | build/* 3 | .DS_Store 4 | venv/ 5 | examples/test* 6 | *.pyc 7 | __pycache__/ -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/.gitmodules -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/.travis.yml -------------------------------------------------------------------------------- /CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/CMakeLists.txt -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/README.md -------------------------------------------------------------------------------- /examples/cartpole-pg.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/examples/cartpole-pg.sh -------------------------------------------------------------------------------- /examples/cartpole-random.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/examples/cartpole-random.sh -------------------------------------------------------------------------------- /examples/cartpole-td.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/examples/cartpole-td.sh -------------------------------------------------------------------------------- /examples/pendulum-pg.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/examples/pendulum-pg.sh -------------------------------------------------------------------------------- /examples/run.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/examples/run.lua -------------------------------------------------------------------------------- /examples/sweep.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/examples/sweep.sh -------------------------------------------------------------------------------- /src/agent/baseAgent.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/baseAgent.lua -------------------------------------------------------------------------------- /src/agent/init.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/init.lua -------------------------------------------------------------------------------- /src/agent/learningUpdate/init.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/learningUpdate/init.lua -------------------------------------------------------------------------------- /src/agent/learningUpdate/noLearning.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/learningUpdate/noLearning.lua -------------------------------------------------------------------------------- /src/agent/learningUpdate/reinforce.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/learningUpdate/reinforce.lua -------------------------------------------------------------------------------- /src/agent/learningUpdate/tdLambda.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/learningUpdate/tdLambda.lua -------------------------------------------------------------------------------- /src/agent/learningUpdate/util.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/learningUpdate/util.lua -------------------------------------------------------------------------------- /src/agent/model/init.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/model/init.lua -------------------------------------------------------------------------------- /src/agent/model/mlp.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/model/mlp.lua -------------------------------------------------------------------------------- /src/agent/model/noModel.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/model/noModel.lua -------------------------------------------------------------------------------- /src/agent/model/qFunction.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/model/qFunction.lua -------------------------------------------------------------------------------- /src/agent/model/tilecoding.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/model/tilecoding.lua -------------------------------------------------------------------------------- /src/agent/policy/actionSamplers.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/policy/actionSamplers.lua -------------------------------------------------------------------------------- /src/agent/policy/egreedy.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/policy/egreedy.lua -------------------------------------------------------------------------------- /src/agent/policy/init.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/policy/init.lua -------------------------------------------------------------------------------- /src/agent/policy/random.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/policy/random.lua -------------------------------------------------------------------------------- /src/agent/policy/stochasticModelPolicy.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/agent/policy/stochasticModelPolicy.lua -------------------------------------------------------------------------------- /src/experiment.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/experiment.lua -------------------------------------------------------------------------------- /src/init.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/init.lua -------------------------------------------------------------------------------- /src/perf.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/perf.lua -------------------------------------------------------------------------------- /src/util.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/src/util.lua -------------------------------------------------------------------------------- /test/test-gym.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/test/test-gym.lua -------------------------------------------------------------------------------- /test/test.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/test/test.lua -------------------------------------------------------------------------------- /twrl-scm-1.rockspec: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/twitter-archive/torch-twrl/HEAD/twrl-scm-1.rockspec --------------------------------------------------------------------------------