├── .gitignore ├── LICENSE ├── MUJOCO_LOG.TXT ├── README.md ├── RL_algorithms ├── Torch │ ├── .DS_Store │ ├── DDPG │ │ └── DDPG_ENV │ │ │ ├── core.py │ │ │ ├── ddpg.py │ │ │ ├── logger │ │ │ ├── events.out.tfevents.1658931832.Tosins-MacBook-Air.local.42757.0 │ │ │ ├── events.out.tfevents.1658931911.Tosins-MacBook-Air.local.42851.0 │ │ │ ├── events.out.tfevents.1658931934.Tosins-MacBook-Air.local.42904.0 │ │ │ ├── events.out.tfevents.1658932019.Tosins-MacBook-Air.local.42965.0 │ │ │ ├── events.out.tfevents.1658932066.Tosins-MacBook-Air.local.43009.0 │ │ │ ├── events.out.tfevents.1658932179.Tosins-MacBook-Air.local.43178.0 │ │ │ ├── events.out.tfevents.1658932723.Tosins-MacBook-Air.local.43565.0 │ │ │ └── events.out.tfevents.1658932834.Tosins-MacBook-Air.local.43628.0 │ │ │ ├── memory.py │ │ │ └── training_log_csv │ │ │ ├── Avg Reward (1).svg │ │ │ └── run-.-tag-Avg Reward (1).csv │ ├── MAPPO │ │ ├── LICENSE │ │ ├── README.md │ │ ├── environment.yaml │ │ ├── onpolicy │ │ │ ├── __init__.py │ │ │ ├── algorithms │ │ │ │ ├── __init__.py │ │ │ │ ├── happo │ │ │ │ │ ├── happo_trainer.py │ │ │ │ │ └── policy.py │ │ │ │ ├── hatrpo │ │ │ │ │ ├── hatrpo_trainer.py │ │ │ │ │ └── policy.py │ │ │ │ ├── mat │ │ │ │ │ ├── algorithm │ │ │ │ │ │ ├── ma_transformer.py │ │ │ │ │ │ └── transformer_policy.py │ │ │ │ │ └── mat_trainer.py │ │ │ │ ├── r_mappo │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── algorithm │ │ │ │ │ │ ├── actor.py │ │ │ │ │ │ ├── rMAPPOPolicy.py │ │ │ │ │ │ └── r_actor_critic.py │ │ │ │ │ └── r_mappo.py │ │ │ │ └── utils │ │ │ │ │ ├── act.py │ │ │ │ │ ├── cnn.py │ │ │ │ │ ├── distributions.py │ │ │ │ │ ├── mlp.py │ │ │ │ │ ├── popart.py │ │ │ │ │ ├── popart_hatrpo.py │ │ │ │ │ ├── rnn.py │ │ │ │ │ ├── transformer_act.py │ │ │ │ │ └── util.py │ │ │ ├── config.py │ │ │ ├── envs │ │ │ │ ├── __init__.py │ │ │ │ ├── env_wrappers.py │ │ │ │ ├── football │ │ │ │ │ ├── .DS_Store │ │ │ │ │ └── Football_Env.py │ │ │ │ ├── hanabi │ │ │ │ │ ├── CMakeLists.txt │ │ │ │ │ ├── Hanabi_Env.py │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── clean_all.sh │ │ │ │ │ ├── hanabi_lib │ │ │ │ │ │ ├── CMakeLists.txt │ │ │ │ │ │ ├── canonical_encoders.cc │ │ │ │ │ │ ├── canonical_encoders.h │ │ │ │ │ │ ├── hanabi_card.cc │ │ │ │ │ │ ├── hanabi_card.h │ │ │ │ │ │ ├── hanabi_game.cc │ │ │ │ │ │ ├── hanabi_game.h │ │ │ │ │ │ ├── hanabi_hand.cc │ │ │ │ │ │ ├── hanabi_hand.h │ │ │ │ │ │ ├── hanabi_history_item.cc │ │ │ │ │ │ ├── hanabi_history_item.h │ │ │ │ │ │ ├── hanabi_move.cc │ │ │ │ │ │ ├── hanabi_move.h │ │ │ │ │ │ ├── hanabi_observation.cc │ │ │ │ │ │ ├── hanabi_observation.h │ │ │ │ │ │ ├── hanabi_state.cc │ │ │ │ │ │ ├── hanabi_state.h │ │ │ │ │ │ ├── observation_encoder.h │ │ │ │ │ │ ├── util.cc │ │ │ │ │ │ └── util.h │ │ │ │ │ ├── pyhanabi.cc │ │ │ │ │ ├── pyhanabi.h │ │ │ │ │ └── pyhanabi.py │ │ │ │ ├── mpe │ │ │ │ │ ├── MPE_env.py │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── core.py │ │ │ │ │ ├── environment.py │ │ │ │ │ ├── multi_discrete.py │ │ │ │ │ ├── rendering.py │ │ │ │ │ ├── scenario.py │ │ │ │ │ └── scenarios │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ ├── simple_adversary.py │ │ │ │ │ │ ├── simple_attack.py │ │ │ │ │ │ ├── simple_crypto.py │ │ │ │ │ │ ├── simple_crypto_display.py │ │ │ │ │ │ ├── simple_push.py │ │ │ │ │ │ ├── simple_reference.py │ │ │ │ │ │ ├── simple_speaker_listener.py │ │ │ │ │ │ ├── simple_spread.py │ │ │ │ │ │ ├── simple_tag.py │ │ │ │ │ │ └── simple_world_comm.py │ │ │ │ ├── spacerobot │ │ │ │ │ ├── SpaceRobotBaseRot_env.py │ │ │ │ │ ├── SpaceRobotDualArmWithRot_env.py │ │ │ │ │ └── SpaceRobotFourArm_env.py │ │ │ │ └── starcraft2 │ │ │ │ │ ├── SMACv2.py │ │ │ │ │ ├── SMACv2_modified.py │ │ │ │ │ ├── StarCraft2_Env.py │ │ │ │ │ ├── StarCraft2v2 │ │ │ │ │ ├── distributions.py │ │ │ │ │ ├── starcraft2.py │ │ │ │ │ └── wrapper.py │ │ │ │ │ ├── multiagentenv.py │ │ │ │ │ └── smac_maps.py │ │ │ ├── runner │ │ │ │ ├── separated │ │ │ │ │ ├── base_runner.py │ │ │ │ │ ├── mpe_runner.py │ │ │ │ │ ├── smac_runner.py │ │ │ │ │ └── spacerobot_runner.py │ │ │ │ └── shared │ │ │ │ │ ├── base_runner.py │ │ │ │ │ ├── football_runner.py │ │ │ │ │ ├── hanabi_runner_forward.py │ │ │ │ │ ├── mpe_runner.py │ │ │ │ │ └── smac_runner.py │ │ │ ├── scripts │ │ │ │ ├── __init__.py │ │ │ │ ├── eval │ │ │ │ │ └── eval_hanabi.py │ │ │ │ ├── eval_hanabi_forward.sh │ │ │ │ ├── render │ │ │ │ │ ├── render_football.py │ │ │ │ │ └── render_mpe.py │ │ │ │ ├── render_football.sh │ │ │ │ ├── render_mpe.sh │ │ │ │ ├── train │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── train_football.py │ │ │ │ │ ├── train_hanabi_forward.py │ │ │ │ │ ├── train_mpe.py │ │ │ │ │ ├── train_smac.py │ │ │ │ │ └── train_spacerobot.py │ │ │ │ ├── train_football_scripts │ │ │ │ │ ├── train_football_3v1.sh │ │ │ │ │ ├── train_football_ca_easy.sh │ │ │ │ │ ├── train_football_ca_hard.sh │ │ │ │ │ ├── train_football_corner.sh │ │ │ │ │ ├── train_football_rp.sh │ │ │ │ │ └── train_football_rps.sh │ │ │ │ ├── train_hanabi_forward.sh │ │ │ │ ├── train_mpe_scripts │ │ │ │ │ ├── train_mpe_comm.sh │ │ │ │ │ ├── train_mpe_reference.sh │ │ │ │ │ └── train_mpe_spread.sh │ │ │ │ ├── train_other_algo │ │ │ │ │ ├── train_happo.sh │ │ │ │ │ ├── train_hatrpo.sh │ │ │ │ │ ├── train_mat.sh │ │ │ │ │ └── train_mat_dec.sh │ │ │ │ ├── train_smac_scripts │ │ │ │ │ ├── train_smac_10m_vs_11m.sh │ │ │ │ │ ├── train_smac_1c3s5z.sh │ │ │ │ │ ├── train_smac_25m.sh │ │ │ │ │ ├── train_smac_27m_vs_30m.sh │ │ │ │ │ ├── train_smac_2c_vs_64zg.sh │ │ │ │ │ ├── train_smac_2m_vs_1z.sh │ │ │ │ │ ├── train_smac_2s_vs_1sc.sh │ │ │ │ │ ├── train_smac_3m.sh │ │ │ │ │ ├── train_smac_3s5z.sh │ │ │ │ │ ├── train_smac_3s5z_vs_3s6z.sh │ │ │ │ │ ├── train_smac_3s_vs_3z.sh │ │ │ │ │ ├── train_smac_3s_vs_4z.sh │ │ │ │ │ ├── train_smac_3s_vs_5z.sh │ │ │ │ │ ├── train_smac_5m_vs_6m.sh │ │ │ │ │ ├── train_smac_6h_vs_8z.sh │ │ │ │ │ ├── train_smac_8m.sh │ │ │ │ │ ├── train_smac_8m_vs_9m.sh │ │ │ │ │ ├── train_smac_MMM.sh │ │ │ │ │ ├── train_smac_MMM2.sh │ │ │ │ │ ├── train_smac_bane_vs_bane.sh │ │ │ │ │ ├── train_smac_baneling.sh │ │ │ │ │ └── train_smac_corridor.sh │ │ │ │ ├── train_smacv2_scripts │ │ │ │ │ ├── train_protoss_10v10.sh │ │ │ │ │ ├── train_protoss_10v11.sh │ │ │ │ │ ├── train_protoss_20v20.sh │ │ │ │ │ ├── train_protoss_20v23.sh │ │ │ │ │ ├── train_protoss_5v5.sh │ │ │ │ │ ├── train_terran_10v10.sh │ │ │ │ │ ├── train_terran_10v11.sh │ │ │ │ │ ├── train_terran_20v20.sh │ │ │ │ │ ├── train_terran_20v23.sh │ │ │ │ │ ├── train_terran_5v5.sh │ │ │ │ │ ├── train_zerg_10v10.sh │ │ │ │ │ ├── train_zerg_10v11.sh │ │ │ │ │ ├── train_zerg_20v20.sh │ │ │ │ │ ├── train_zerg_20v23.sh │ │ │ │ │ └── train_zerg_5v5.sh │ │ │ │ ├── train_spacerobot.sh │ │ │ │ ├── train_spacerobot_4arm.sh │ │ │ │ └── train_spacerobot_one_agent.sh │ │ │ └── utils │ │ │ │ ├── __init__.py │ │ │ │ ├── multi_discrete.py │ │ │ │ ├── separated_buffer.py │ │ │ │ ├── shared_buffer.py │ │ │ │ ├── util.py │ │ │ │ └── valuenorm.py │ │ ├── requirements.txt │ │ └── setup.py │ ├── PPO │ │ ├── Continious │ │ │ ├── PPO │ │ │ │ ├── __init__.py │ │ │ │ ├── actor.py │ │ │ │ ├── agent.py │ │ │ │ ├── critic.py │ │ │ │ ├── main.py │ │ │ │ ├── memory.py │ │ │ │ ├── models │ │ │ │ │ ├── space_robot_actor.pt │ │ │ │ │ └── space_robot_critic.pt │ │ │ │ ├── plots │ │ │ │ │ └── space_robot_performance.png │ │ │ │ └── utils.py │ │ │ ├── PPO_Two_heads │ │ │ │ ├── __init__.py │ │ │ │ ├── actor.py │ │ │ │ ├── agent.py │ │ │ │ ├── critic.py │ │ │ │ ├── main.py │ │ │ │ ├── memory.py │ │ │ │ ├── models │ │ │ │ │ ├── space_robot_actor.pt │ │ │ │ │ └── space_robot_critic.pt │ │ │ │ ├── plots │ │ │ │ │ └── space_robot_performance.png │ │ │ │ └── utils.py │ │ │ └── __init__.py │ │ ├── Discrete │ │ │ ├── PPO │ │ │ │ ├── __init__.py │ │ │ │ ├── actor.py │ │ │ │ ├── agent.py │ │ │ │ ├── critic.py │ │ │ │ ├── main.py │ │ │ │ ├── memory.py │ │ │ │ ├── models │ │ │ │ │ ├── space_robot_actor.pt │ │ │ │ │ └── space_robot_critic.pt │ │ │ │ ├── plots │ │ │ │ │ └── space_robot_performance.png │ │ │ │ ├── training_log │ │ │ │ └── utils.py │ │ │ └── PPOImage │ │ │ │ ├── __init__.py │ │ │ │ ├── actor.py │ │ │ │ ├── agent.py │ │ │ │ ├── critic.py │ │ │ │ ├── main.py │ │ │ │ ├── memory.py │ │ │ │ ├── models │ │ │ │ ├── .space_robot_actor.pt.icloud │ │ │ │ └── .space_robot_critic.pt.icloud │ │ │ │ ├── plots │ │ │ │ └── space_robot_performance.png │ │ │ │ └── utils.py │ │ ├── PPO_test.py │ │ ├── PPO_test_2.py │ │ ├── __init__.py │ │ └── test_ppo.py │ ├── SAC │ │ ├── SAC_ENV │ │ │ ├── core.py │ │ │ ├── logger │ │ │ │ ├── events.out.tfevents.1658847118.Tosins-Air.19214.0 │ │ │ │ ├── events.out.tfevents.1658847140.Tosins-Air.19431.0 │ │ │ │ ├── events.out.tfevents.1658847454.Tosins-Air.19535.0 │ │ │ │ ├── events.out.tfevents.1658847513.Tosins-Air.19931.0 │ │ │ │ ├── events.out.tfevents.1658847612.Tosins-Air.19979.0 │ │ │ │ ├── events.out.tfevents.1658847918.Tosins-Air.20089.0 │ │ │ │ ├── events.out.tfevents.1658848049.Tosins-Air.20232.0 │ │ │ │ ├── events.out.tfevents.1658848339.Tosins-Air.20384.0 │ │ │ │ ├── events.out.tfevents.1658848364.Tosins-Air.20423.0 │ │ │ │ ├── events.out.tfevents.1658848673.Tosins-Air.20649.0 │ │ │ │ ├── events.out.tfevents.1658848831.Tosins-Air.20793.0 │ │ │ │ ├── events.out.tfevents.1658849191.Tosins-Air.20924.0 │ │ │ │ ├── events.out.tfevents.1658849218.Tosins-Air.20984.0 │ │ │ │ ├── events.out.tfevents.1658849777.Tosins-Air.21229.0 │ │ │ │ ├── events.out.tfevents.1658849785.Tosins-Air.21269.0 │ │ │ │ ├── events.out.tfevents.1658849885.Tosins-Air.21429.0 │ │ │ │ ├── events.out.tfevents.1658849941.Tosins-Air.21521.0 │ │ │ │ └── events.out.tfevents.1658850278.Tosins-Air.21678.0 │ │ │ ├── memory.py │ │ │ ├── sac.py │ │ │ └── training_log_csv │ │ │ │ ├── run-.-tag-Avg Reward.csv │ │ │ │ └── run-.-tag-Loss_Pi.csv │ │ └── __init__.py │ ├── __init__.py │ └── result │ │ ├── actor_agent0.pt │ │ ├── actor_agent1.pt │ │ ├── actor_agent2.pt │ │ ├── actor_agent3.pt │ │ ├── actor_agent4.pt │ │ └── actor_agent5.pt ├── __init__.py └── utils │ └── mpi_tools.py ├── Simulation.jpg ├── SpaceRobotEnv ├── .DS_Store ├── __init__.py ├── assets │ ├── .DS_Store │ ├── common │ │ ├── __init__.py │ │ ├── materials.xml │ │ ├── skybox.xml │ │ └── visual.xml │ └── spacerobot │ │ ├── arm_v3.xml │ │ ├── arm_v31.xml │ │ ├── arm_v32.xml │ │ ├── arm_v33.xml │ │ ├── asset.xml │ │ ├── one_arm.xml │ │ ├── sensor.xml │ │ ├── spacerobot_cost.xml │ │ ├── spacerobot_dualarm.xml │ │ ├── spacerobot_fourarm.xml │ │ ├── spacerobot_image.xml │ │ ├── spacerobot_show.xml │ │ ├── spacerobot_state.xml │ │ ├── stls │ │ ├── R10.stl │ │ ├── cube.stl │ │ ├── v_base.stl │ │ ├── v_forearm.stl │ │ ├── v_shoulder.stl │ │ ├── v_upperarm.stl │ │ ├── v_wrist1.stl │ │ ├── v_wrist2.stl │ │ └── v_wrist3.stl │ │ └── subgoal.xml ├── envs │ ├── SpaceRobotBaseRot.py │ ├── SpaceRobotCost.py │ ├── SpaceRobotDualArm.py │ ├── SpaceRobotDualArmWithRot.py │ ├── SpaceRobotFourArm.py │ ├── SpaceRobotImage.py │ ├── SpaceRobotPointCloud.py │ ├── SpaceRobotReorientation.py │ ├── SpaceRobotState.py │ └── __init__.py └── images │ ├── Simulation.jpg │ ├── ccc.png │ ├── iros.gif │ ├── ral.gif │ └── robot.png ├── render ├── base_reorien │ ├── fig0.jpg │ ├── fig10.jpg │ ├── fig100.jpg │ ├── fig150.jpg │ ├── fig20.jpg │ ├── fig30.jpg │ ├── fig5.jpg │ ├── fig50.jpg │ └── render_base_rot.mp4 ├── fig.jpg ├── fig1.jpg ├── fig2.jpg ├── mixed_goal │ ├── fig0.jpg │ ├── fig10.jpg │ ├── fig100.jpg │ ├── fig150.jpg │ ├── fig199.jpg │ ├── fig20.jpg │ ├── fig30.jpg │ ├── fig50.jpg │ └── render_mix3.mp4 ├── render_4arm_comp.gif ├── render_base_rot_comp.gif ├── render_mix_dual_stage_comp.gif ├── save1.png └── traj_planning │ ├── fig0.jpg │ ├── fig10.jpg │ ├── fig100.jpg │ ├── fig150.jpg │ ├── fig20.jpg │ ├── fig40.jpg │ ├── fig50.jpg │ ├── render_4arm.gif │ ├── render_4arm.mp4 │ └── sim1.png ├── requirements.txt ├── setup.py └── test_env.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/LICENSE -------------------------------------------------------------------------------- /MUJOCO_LOG.TXT: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/MUJOCO_LOG.TXT -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/README.md -------------------------------------------------------------------------------- /RL_algorithms/Torch/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/.DS_Store -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/core.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/ddpg.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658931832.Tosins-MacBook-Air.local.42757.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658931832.Tosins-MacBook-Air.local.42757.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658931911.Tosins-MacBook-Air.local.42851.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658931911.Tosins-MacBook-Air.local.42851.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658931934.Tosins-MacBook-Air.local.42904.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658931934.Tosins-MacBook-Air.local.42904.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932019.Tosins-MacBook-Air.local.42965.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932019.Tosins-MacBook-Air.local.42965.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932066.Tosins-MacBook-Air.local.43009.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932066.Tosins-MacBook-Air.local.43009.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932179.Tosins-MacBook-Air.local.43178.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932179.Tosins-MacBook-Air.local.43178.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932723.Tosins-MacBook-Air.local.43565.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932723.Tosins-MacBook-Air.local.43565.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932834.Tosins-MacBook-Air.local.43628.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/logger/events.out.tfevents.1658932834.Tosins-MacBook-Air.local.43628.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/memory.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/training_log_csv/Avg Reward (1).svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/training_log_csv/Avg Reward (1).svg -------------------------------------------------------------------------------- /RL_algorithms/Torch/DDPG/DDPG_ENV/training_log_csv/run-.-tag-Avg Reward (1).csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/DDPG/DDPG_ENV/training_log_csv/run-.-tag-Avg Reward (1).csv -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/LICENSE -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/README.md -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/environment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/environment.yaml -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/__init__.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/happo/happo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/happo/happo_trainer.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/happo/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/happo/policy.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/hatrpo/hatrpo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/hatrpo/hatrpo_trainer.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/hatrpo/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/hatrpo/policy.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/mat/algorithm/ma_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/mat/algorithm/ma_transformer.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/mat/algorithm/transformer_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/mat/algorithm/transformer_policy.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/mat/mat_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/mat/mat_trainer.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/algorithm/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/algorithm/actor.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/algorithm/rMAPPOPolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/algorithm/rMAPPOPolicy.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/algorithm/r_actor_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/algorithm/r_actor_critic.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/r_mappo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/r_mappo/r_mappo.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/act.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/act.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/cnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/cnn.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/distributions.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/mlp.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/popart.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/popart.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/popart_hatrpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/popart_hatrpo.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/rnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/rnn.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/transformer_act.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/transformer_act.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/algorithms/utils/util.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/config.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/__init__.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/env_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/env_wrappers.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/football/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/football/.DS_Store -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/football/Football_Env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/football/Football_Env.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/CMakeLists.txt -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/Hanabi_Env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/Hanabi_Env.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/__init__.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/clean_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/clean_all.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/CMakeLists.txt -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/canonical_encoders.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/canonical_encoders.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/canonical_encoders.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/canonical_encoders.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_card.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_card.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_card.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_card.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_game.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_game.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_game.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_game.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_hand.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_hand.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_hand.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_hand.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_history_item.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_history_item.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_history_item.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_history_item.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_move.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_move.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_move.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_move.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_observation.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_observation.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_observation.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_observation.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_state.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_state.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_state.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/hanabi_state.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/observation_encoder.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/observation_encoder.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/util.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/util.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/util.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/hanabi_lib/util.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/pyhanabi.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/pyhanabi.cc -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/pyhanabi.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/pyhanabi.h -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/pyhanabi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/hanabi/pyhanabi.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/MPE_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/MPE_env.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/core.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/environment.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/multi_discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/multi_discrete.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/rendering.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/rendering.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenario.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenario.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/__init__.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_adversary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_adversary.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_attack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_attack.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_crypto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_crypto.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_crypto_display.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_crypto_display.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_push.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_push.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_reference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_reference.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_speaker_listener.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_speaker_listener.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_spread.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_spread.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_tag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_tag.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_world_comm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/mpe/scenarios/simple_world_comm.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/spacerobot/SpaceRobotBaseRot_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/spacerobot/SpaceRobotBaseRot_env.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/spacerobot/SpaceRobotDualArmWithRot_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/spacerobot/SpaceRobotDualArmWithRot_env.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/spacerobot/SpaceRobotFourArm_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/spacerobot/SpaceRobotFourArm_env.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/SMACv2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/SMACv2.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/SMACv2_modified.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/SMACv2_modified.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2_Env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2_Env.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2v2/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2v2/distributions.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2v2/starcraft2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2v2/starcraft2.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2v2/wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/StarCraft2v2/wrapper.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/multiagentenv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/multiagentenv.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/smac_maps.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/envs/starcraft2/smac_maps.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/base_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/base_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/mpe_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/mpe_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/smac_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/smac_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/spacerobot_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/separated/spacerobot_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/base_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/base_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/football_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/football_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/hanabi_runner_forward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/hanabi_runner_forward.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/mpe_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/mpe_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/smac_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/runner/shared/smac_runner.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/eval/eval_hanabi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/eval/eval_hanabi.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/eval_hanabi_forward.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/eval_hanabi_forward.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/render/render_football.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/render/render_football.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/render/render_mpe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/render/render_mpe.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/render_football.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/render_football.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/render_mpe.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/render_mpe.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_football.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_football.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_hanabi_forward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_hanabi_forward.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_mpe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_mpe.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_smac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_smac.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_spacerobot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train/train_spacerobot.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_3v1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_3v1.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_ca_easy.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_ca_easy.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_ca_hard.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_ca_hard.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_corner.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_corner.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_rp.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_rp.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_rps.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_football_scripts/train_football_rps.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_hanabi_forward.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_hanabi_forward.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_mpe_scripts/train_mpe_comm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_mpe_scripts/train_mpe_comm.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_mpe_scripts/train_mpe_reference.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_mpe_scripts/train_mpe_reference.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_mpe_scripts/train_mpe_spread.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_mpe_scripts/train_mpe_spread.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_happo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_happo.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_hatrpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_hatrpo.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_mat.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_mat.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_mat_dec.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_other_algo/train_mat_dec.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_10m_vs_11m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_10m_vs_11m.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_1c3s5z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_1c3s5z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_25m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_25m.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_27m_vs_30m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_27m_vs_30m.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_2c_vs_64zg.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_2c_vs_64zg.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_2m_vs_1z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_2m_vs_1z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_2s_vs_1sc.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_2s_vs_1sc.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3m.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s5z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s5z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s5z_vs_3s6z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s5z_vs_3s6z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s_vs_3z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s_vs_3z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s_vs_4z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s_vs_4z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s_vs_5z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_3s_vs_5z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_5m_vs_6m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_5m_vs_6m.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_6h_vs_8z.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_6h_vs_8z.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_8m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_8m.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_8m_vs_9m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_8m_vs_9m.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_MMM.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_MMM.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_MMM2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_MMM2.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_bane_vs_bane.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_bane_vs_bane.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_baneling.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_baneling.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_corridor.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smac_scripts/train_smac_corridor.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_10v10.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_10v10.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_10v11.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_10v11.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_20v20.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_20v20.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_20v23.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_20v23.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_5v5.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_protoss_5v5.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_10v10.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_10v10.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_10v11.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_10v11.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_20v20.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_20v20.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_20v23.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_20v23.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_5v5.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_terran_5v5.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_10v10.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_10v10.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_10v11.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_10v11.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_20v20.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_20v20.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_20v23.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_20v23.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_5v5.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_smacv2_scripts/train_zerg_5v5.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_spacerobot.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_spacerobot.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_spacerobot_4arm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_spacerobot_4arm.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_spacerobot_one_agent.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/scripts/train_spacerobot_one_agent.sh -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/utils/multi_discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/utils/multi_discrete.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/utils/separated_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/utils/separated_buffer.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/utils/shared_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/utils/shared_buffer.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/utils/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/utils/util.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/onpolicy/utils/valuenorm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/onpolicy/utils/valuenorm.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/requirements.txt -------------------------------------------------------------------------------- /RL_algorithms/Torch/MAPPO/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/MAPPO/setup.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/actor.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/agent.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/critic.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/main.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/memory.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/models/space_robot_actor.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/models/space_robot_actor.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/models/space_robot_critic.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/models/space_robot_critic.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/plots/space_robot_performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/plots/space_robot_performance.png -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO/utils.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/actor.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/agent.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/critic.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/main.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/memory.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/models/space_robot_actor.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/models/space_robot_actor.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/models/space_robot_critic.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/models/space_robot_critic.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/plots/space_robot_performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/plots/space_robot_performance.png -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Continious/PPO_Two_heads/utils.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Continious/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/actor.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/agent.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/critic.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/main.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/memory.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/models/space_robot_actor.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/models/space_robot_actor.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/models/space_robot_critic.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/models/space_robot_critic.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/plots/space_robot_performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/plots/space_robot_performance.png -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/training_log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/training_log -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPO/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPO/utils.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/actor.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/agent.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/critic.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/main.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/memory.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/models/.space_robot_actor.pt.icloud: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/models/.space_robot_actor.pt.icloud -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/models/.space_robot_critic.pt.icloud: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/models/.space_robot_critic.pt.icloud -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/plots/space_robot_performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/plots/space_robot_performance.png -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/Discrete/PPOImage/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/Discrete/PPOImage/utils.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/PPO_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/PPO_test.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/PPO_test_2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/PPO_test_2.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/PPO/test_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/PPO/test_ppo.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/core.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847118.Tosins-Air.19214.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847118.Tosins-Air.19214.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847140.Tosins-Air.19431.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847140.Tosins-Air.19431.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847454.Tosins-Air.19535.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847454.Tosins-Air.19535.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847513.Tosins-Air.19931.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847513.Tosins-Air.19931.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847612.Tosins-Air.19979.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847612.Tosins-Air.19979.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847918.Tosins-Air.20089.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658847918.Tosins-Air.20089.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848049.Tosins-Air.20232.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848049.Tosins-Air.20232.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848339.Tosins-Air.20384.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848339.Tosins-Air.20384.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848364.Tosins-Air.20423.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848364.Tosins-Air.20423.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848673.Tosins-Air.20649.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848673.Tosins-Air.20649.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848831.Tosins-Air.20793.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658848831.Tosins-Air.20793.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849191.Tosins-Air.20924.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849191.Tosins-Air.20924.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849218.Tosins-Air.20984.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849218.Tosins-Air.20984.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849777.Tosins-Air.21229.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849777.Tosins-Air.21229.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849785.Tosins-Air.21269.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849785.Tosins-Air.21269.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849885.Tosins-Air.21429.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849885.Tosins-Air.21429.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849941.Tosins-Air.21521.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658849941.Tosins-Air.21521.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658850278.Tosins-Air.21678.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/logger/events.out.tfevents.1658850278.Tosins-Air.21678.0 -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/memory.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/sac.py -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/training_log_csv/run-.-tag-Avg Reward.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/training_log_csv/run-.-tag-Avg Reward.csv -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/SAC_ENV/training_log_csv/run-.-tag-Loss_Pi.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/SAC/SAC_ENV/training_log_csv/run-.-tag-Loss_Pi.csv -------------------------------------------------------------------------------- /RL_algorithms/Torch/SAC/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/Torch/result/actor_agent0.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/result/actor_agent0.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/result/actor_agent1.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/result/actor_agent1.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/result/actor_agent2.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/result/actor_agent2.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/result/actor_agent3.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/result/actor_agent3.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/result/actor_agent4.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/result/actor_agent4.pt -------------------------------------------------------------------------------- /RL_algorithms/Torch/result/actor_agent5.pt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/Torch/result/actor_agent5.pt -------------------------------------------------------------------------------- /RL_algorithms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /RL_algorithms/utils/mpi_tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/RL_algorithms/utils/mpi_tools.py -------------------------------------------------------------------------------- /Simulation.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/Simulation.jpg -------------------------------------------------------------------------------- /SpaceRobotEnv/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/.DS_Store -------------------------------------------------------------------------------- /SpaceRobotEnv/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/__init__.py -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/.DS_Store -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/common/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/common/__init__.py -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/common/materials.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/common/materials.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/common/skybox.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/common/skybox.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/common/visual.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/common/visual.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/arm_v3.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/arm_v3.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/arm_v31.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/arm_v31.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/arm_v32.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/arm_v32.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/arm_v33.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/arm_v33.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/asset.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/asset.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/one_arm.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/one_arm.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/sensor.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/sensor.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/spacerobot_cost.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/spacerobot_cost.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/spacerobot_dualarm.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/spacerobot_dualarm.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/spacerobot_fourarm.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/spacerobot_fourarm.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/spacerobot_image.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/spacerobot_image.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/spacerobot_show.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/spacerobot_show.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/spacerobot_state.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/spacerobot_state.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/R10.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/R10.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/cube.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/cube.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/v_base.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/v_base.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/v_forearm.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/v_forearm.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/v_shoulder.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/v_shoulder.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/v_upperarm.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/v_upperarm.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/v_wrist1.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/v_wrist1.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/v_wrist2.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/v_wrist2.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/stls/v_wrist3.stl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/stls/v_wrist3.stl -------------------------------------------------------------------------------- /SpaceRobotEnv/assets/spacerobot/subgoal.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/assets/spacerobot/subgoal.xml -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotBaseRot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotBaseRot.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotCost.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotCost.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotDualArm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotDualArm.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotDualArmWithRot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotDualArmWithRot.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotFourArm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotFourArm.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotImage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotImage.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotPointCloud.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotPointCloud.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotReorientation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotReorientation.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/SpaceRobotState.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/SpaceRobotState.py -------------------------------------------------------------------------------- /SpaceRobotEnv/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/envs/__init__.py -------------------------------------------------------------------------------- /SpaceRobotEnv/images/Simulation.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/images/Simulation.jpg -------------------------------------------------------------------------------- /SpaceRobotEnv/images/ccc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/images/ccc.png -------------------------------------------------------------------------------- /SpaceRobotEnv/images/iros.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/images/iros.gif -------------------------------------------------------------------------------- /SpaceRobotEnv/images/ral.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/images/ral.gif -------------------------------------------------------------------------------- /SpaceRobotEnv/images/robot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/SpaceRobotEnv/images/robot.png -------------------------------------------------------------------------------- /render/base_reorien/fig0.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig0.jpg -------------------------------------------------------------------------------- /render/base_reorien/fig10.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig10.jpg -------------------------------------------------------------------------------- /render/base_reorien/fig100.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig100.jpg -------------------------------------------------------------------------------- /render/base_reorien/fig150.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig150.jpg -------------------------------------------------------------------------------- /render/base_reorien/fig20.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig20.jpg -------------------------------------------------------------------------------- /render/base_reorien/fig30.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig30.jpg -------------------------------------------------------------------------------- /render/base_reorien/fig5.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig5.jpg -------------------------------------------------------------------------------- /render/base_reorien/fig50.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/fig50.jpg -------------------------------------------------------------------------------- /render/base_reorien/render_base_rot.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/base_reorien/render_base_rot.mp4 -------------------------------------------------------------------------------- /render/fig.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/fig.jpg -------------------------------------------------------------------------------- /render/fig1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/fig1.jpg -------------------------------------------------------------------------------- /render/fig2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/fig2.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig0.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig0.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig10.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig10.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig100.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig100.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig150.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig150.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig199.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig199.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig20.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig20.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig30.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig30.jpg -------------------------------------------------------------------------------- /render/mixed_goal/fig50.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/fig50.jpg -------------------------------------------------------------------------------- /render/mixed_goal/render_mix3.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/mixed_goal/render_mix3.mp4 -------------------------------------------------------------------------------- /render/render_4arm_comp.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/render_4arm_comp.gif -------------------------------------------------------------------------------- /render/render_base_rot_comp.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/render_base_rot_comp.gif -------------------------------------------------------------------------------- /render/render_mix_dual_stage_comp.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/render_mix_dual_stage_comp.gif -------------------------------------------------------------------------------- /render/save1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/save1.png -------------------------------------------------------------------------------- /render/traj_planning/fig0.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/fig0.jpg -------------------------------------------------------------------------------- /render/traj_planning/fig10.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/fig10.jpg -------------------------------------------------------------------------------- /render/traj_planning/fig100.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/fig100.jpg -------------------------------------------------------------------------------- /render/traj_planning/fig150.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/fig150.jpg -------------------------------------------------------------------------------- /render/traj_planning/fig20.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/fig20.jpg -------------------------------------------------------------------------------- /render/traj_planning/fig40.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/fig40.jpg -------------------------------------------------------------------------------- /render/traj_planning/fig50.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/fig50.jpg -------------------------------------------------------------------------------- /render/traj_planning/render_4arm.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/render_4arm.gif -------------------------------------------------------------------------------- /render/traj_planning/render_4arm.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/render_4arm.mp4 -------------------------------------------------------------------------------- /render/traj_planning/sim1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/render/traj_planning/sim1.png -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/requirements.txt -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/setup.py -------------------------------------------------------------------------------- /test_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Tsinghua-Space-Robot-Learning-Group/SpaceOctopus/HEAD/test_env.py --------------------------------------------------------------------------------