├── .gitignore ├── README.md ├── example_configs ├── common-ac.yaml ├── dt.yaml ├── iql.yaml ├── mbpo.yaml ├── ppo.yaml ├── redq.yaml ├── sac.yaml ├── sop.yaml └── td3.yaml ├── force ├── __init__.py ├── alg │ ├── __init__.py │ ├── actor_critic.py │ ├── agent.py │ ├── iql.py │ ├── mbpo.py │ ├── ppo.py │ ├── redq.py │ ├── sac.py │ ├── sop.py │ └── td3.py ├── config.py ├── data │ ├── __init__.py │ ├── base.py │ ├── circular.py │ ├── hdf5.py │ └── transition_buffer.py ├── defaults.py ├── distributions.py ├── env │ ├── __init__.py │ ├── base.py │ └── mujoco │ │ ├── __init__.py │ │ ├── ant_mod.py │ │ ├── humanoid_mod.py │ │ └── termination_functions.py ├── experiment │ ├── __init__.py │ ├── base.py │ ├── epochal.py │ └── rl.py ├── log.py ├── nn │ ├── __init__.py │ ├── layers.py │ ├── loss.py │ ├── models │ │ ├── __init__.py │ │ ├── decision_transformer.py │ │ ├── gaussian_dynamics_ensemble.py │ │ ├── mlp.py │ │ ├── transformer.py │ │ ├── value_functions.py │ │ └── vision.py │ ├── module.py │ ├── normalization.py │ ├── optim.py │ ├── shape.py │ └── util.py ├── parallel │ ├── __init__.py │ ├── jobs.py │ └── minibatcher.py ├── policies.py ├── sampling │ ├── __init__.py │ ├── rollout.py │ └── runner.py ├── schedules.py ├── scripts │ └── rollout.py ├── types.py ├── util.py └── workflow │ ├── __init__.py │ ├── filter.py │ ├── launch.py │ ├── result_server.py │ └── slurm.py ├── requirements.txt ├── scripts ├── train.py └── train_dt.py └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/README.md -------------------------------------------------------------------------------- /example_configs/common-ac.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/common-ac.yaml -------------------------------------------------------------------------------- /example_configs/dt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/dt.yaml -------------------------------------------------------------------------------- /example_configs/iql.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/iql.yaml -------------------------------------------------------------------------------- /example_configs/mbpo.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/mbpo.yaml -------------------------------------------------------------------------------- /example_configs/ppo.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/ppo.yaml -------------------------------------------------------------------------------- /example_configs/redq.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/redq.yaml -------------------------------------------------------------------------------- /example_configs/sac.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/sac.yaml -------------------------------------------------------------------------------- /example_configs/sop.yaml: -------------------------------------------------------------------------------- 1 | agent: 2 | _tag: SOP -------------------------------------------------------------------------------- /example_configs/td3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/example_configs/td3.yaml -------------------------------------------------------------------------------- /force/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /force/alg/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/__init__.py -------------------------------------------------------------------------------- /force/alg/actor_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/actor_critic.py -------------------------------------------------------------------------------- /force/alg/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/agent.py -------------------------------------------------------------------------------- /force/alg/iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/iql.py -------------------------------------------------------------------------------- /force/alg/mbpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/mbpo.py -------------------------------------------------------------------------------- /force/alg/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/ppo.py -------------------------------------------------------------------------------- /force/alg/redq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/redq.py -------------------------------------------------------------------------------- /force/alg/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/sac.py -------------------------------------------------------------------------------- /force/alg/sop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/sop.py -------------------------------------------------------------------------------- /force/alg/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/alg/td3.py -------------------------------------------------------------------------------- /force/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/config.py -------------------------------------------------------------------------------- /force/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/data/__init__.py -------------------------------------------------------------------------------- /force/data/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/data/base.py -------------------------------------------------------------------------------- /force/data/circular.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/data/circular.py -------------------------------------------------------------------------------- /force/data/hdf5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/data/hdf5.py -------------------------------------------------------------------------------- /force/data/transition_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/data/transition_buffer.py -------------------------------------------------------------------------------- /force/defaults.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/defaults.py -------------------------------------------------------------------------------- /force/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/distributions.py -------------------------------------------------------------------------------- /force/env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/env/__init__.py -------------------------------------------------------------------------------- /force/env/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/env/base.py -------------------------------------------------------------------------------- /force/env/mujoco/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/env/mujoco/__init__.py -------------------------------------------------------------------------------- /force/env/mujoco/ant_mod.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/env/mujoco/ant_mod.py -------------------------------------------------------------------------------- /force/env/mujoco/humanoid_mod.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/env/mujoco/humanoid_mod.py -------------------------------------------------------------------------------- /force/env/mujoco/termination_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/env/mujoco/termination_functions.py -------------------------------------------------------------------------------- /force/experiment/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/experiment/__init__.py -------------------------------------------------------------------------------- /force/experiment/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/experiment/base.py -------------------------------------------------------------------------------- /force/experiment/epochal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/experiment/epochal.py -------------------------------------------------------------------------------- /force/experiment/rl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/experiment/rl.py -------------------------------------------------------------------------------- /force/log.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/log.py -------------------------------------------------------------------------------- /force/nn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/__init__.py -------------------------------------------------------------------------------- /force/nn/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/layers.py -------------------------------------------------------------------------------- /force/nn/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/loss.py -------------------------------------------------------------------------------- /force/nn/models/__init__.py: -------------------------------------------------------------------------------- 1 | from .mlp import MLP -------------------------------------------------------------------------------- /force/nn/models/decision_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/models/decision_transformer.py -------------------------------------------------------------------------------- /force/nn/models/gaussian_dynamics_ensemble.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/models/gaussian_dynamics_ensemble.py -------------------------------------------------------------------------------- /force/nn/models/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/models/mlp.py -------------------------------------------------------------------------------- /force/nn/models/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/models/transformer.py -------------------------------------------------------------------------------- /force/nn/models/value_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/models/value_functions.py -------------------------------------------------------------------------------- /force/nn/models/vision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/models/vision.py -------------------------------------------------------------------------------- /force/nn/module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/module.py -------------------------------------------------------------------------------- /force/nn/normalization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/normalization.py -------------------------------------------------------------------------------- /force/nn/optim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/optim.py -------------------------------------------------------------------------------- /force/nn/shape.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/shape.py -------------------------------------------------------------------------------- /force/nn/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/nn/util.py -------------------------------------------------------------------------------- /force/parallel/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /force/parallel/jobs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/parallel/jobs.py -------------------------------------------------------------------------------- /force/parallel/minibatcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/parallel/minibatcher.py -------------------------------------------------------------------------------- /force/policies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/policies.py -------------------------------------------------------------------------------- /force/sampling/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/sampling/__init__.py -------------------------------------------------------------------------------- /force/sampling/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/sampling/rollout.py -------------------------------------------------------------------------------- /force/sampling/runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/sampling/runner.py -------------------------------------------------------------------------------- /force/schedules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/schedules.py -------------------------------------------------------------------------------- /force/scripts/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/scripts/rollout.py -------------------------------------------------------------------------------- /force/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/types.py -------------------------------------------------------------------------------- /force/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/util.py -------------------------------------------------------------------------------- /force/workflow/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /force/workflow/filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/workflow/filter.py -------------------------------------------------------------------------------- /force/workflow/launch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/workflow/launch.py -------------------------------------------------------------------------------- /force/workflow/result_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/workflow/result_server.py -------------------------------------------------------------------------------- /force/workflow/slurm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/force/workflow/slurm.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/scripts/train.py -------------------------------------------------------------------------------- /scripts/train_dt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/scripts/train_dt.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/gwthomas/force/HEAD/setup.py --------------------------------------------------------------------------------