├── .gitignore ├── LICENSE ├── README.md ├── data ├── collect_data.py ├── stats.py └── utils.py ├── gpu_requirements.txt ├── instructrl ├── __init__.py ├── data.py ├── envs │ ├── __init__.py │ ├── custom.py │ ├── rlbench.py │ └── rollout.py ├── instructrl_main.py ├── local_run.py ├── model.py ├── models │ ├── m3ae │ │ ├── __init__.py │ │ ├── jax_utils.py │ │ ├── model.py │ │ └── utils.py │ └── openai │ │ ├── __init__.py │ │ ├── download.py │ │ ├── layers.py │ │ ├── model.py │ │ └── tokenizer.py └── utils.py ├── jobs ├── eval.sh ├── tpu_control.sh └── train.sh ├── pictures └── model.jpg └── scripts ├── coppeliasim.sh ├── ssh_copy.sh ├── ssh_launch.sh ├── ssh_stop.sh ├── ssh_vm_setup.sh └── tpu_vm_setup.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/README.md -------------------------------------------------------------------------------- /data/collect_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/data/collect_data.py -------------------------------------------------------------------------------- /data/stats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/data/stats.py -------------------------------------------------------------------------------- /data/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/data/utils.py -------------------------------------------------------------------------------- /gpu_requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/gpu_requirements.txt -------------------------------------------------------------------------------- /instructrl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /instructrl/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/data.py -------------------------------------------------------------------------------- /instructrl/envs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /instructrl/envs/custom.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/envs/custom.py -------------------------------------------------------------------------------- /instructrl/envs/rlbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/envs/rlbench.py -------------------------------------------------------------------------------- /instructrl/envs/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/envs/rollout.py -------------------------------------------------------------------------------- /instructrl/instructrl_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/instructrl_main.py -------------------------------------------------------------------------------- /instructrl/local_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/local_run.py -------------------------------------------------------------------------------- /instructrl/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/model.py -------------------------------------------------------------------------------- /instructrl/models/m3ae/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /instructrl/models/m3ae/jax_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/models/m3ae/jax_utils.py -------------------------------------------------------------------------------- /instructrl/models/m3ae/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/models/m3ae/model.py -------------------------------------------------------------------------------- /instructrl/models/m3ae/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/models/m3ae/utils.py -------------------------------------------------------------------------------- /instructrl/models/openai/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /instructrl/models/openai/download.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/models/openai/download.py -------------------------------------------------------------------------------- /instructrl/models/openai/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/models/openai/layers.py -------------------------------------------------------------------------------- /instructrl/models/openai/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/models/openai/model.py -------------------------------------------------------------------------------- /instructrl/models/openai/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/models/openai/tokenizer.py -------------------------------------------------------------------------------- /instructrl/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/instructrl/utils.py -------------------------------------------------------------------------------- /jobs/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/jobs/eval.sh -------------------------------------------------------------------------------- /jobs/tpu_control.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/jobs/tpu_control.sh -------------------------------------------------------------------------------- /jobs/train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/jobs/train.sh -------------------------------------------------------------------------------- /pictures/model.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/pictures/model.jpg -------------------------------------------------------------------------------- /scripts/coppeliasim.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/scripts/coppeliasim.sh -------------------------------------------------------------------------------- /scripts/ssh_copy.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/scripts/ssh_copy.sh -------------------------------------------------------------------------------- /scripts/ssh_launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/scripts/ssh_launch.sh -------------------------------------------------------------------------------- /scripts/ssh_stop.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/scripts/ssh_stop.sh -------------------------------------------------------------------------------- /scripts/ssh_vm_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/scripts/ssh_vm_setup.sh -------------------------------------------------------------------------------- /scripts/tpu_vm_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/haoliuhl/instructrl/HEAD/scripts/tpu_vm_setup.sh --------------------------------------------------------------------------------