├── .gitignore ├── LICENSE ├── README.md ├── experiments ├── buttons │ ├── buttons_rm_agent_1.txt │ ├── buttons_rm_agent_2.txt │ ├── buttons_rm_agent_3.txt │ └── team_buttons_rm.txt └── gridworld_many_agent_rendezvous │ ├── 10_agent_rendezvous_rm.txt │ ├── 2_agent_rendezvous_rm.txt │ ├── 3_agent_rendezvous_rm.txt │ ├── 4_agent_rendezvous_rm.txt │ ├── 5_agent_rendezvous_rm.txt │ ├── 6_agent_rendezvous_rm.txt │ ├── 7_agent_rendezvous_rm.txt │ ├── 8_agent_rendezvous_rm.txt │ ├── 9_agent_rendezvous_rm.txt │ ├── coordination_experiment_agent1.txt │ ├── coordination_experiment_agent10.txt │ ├── coordination_experiment_agent2.txt │ ├── coordination_experiment_agent3.txt │ ├── coordination_experiment_agent4.txt │ ├── coordination_experiment_agent5.txt │ ├── coordination_experiment_agent6.txt │ ├── coordination_experiment_agent7.txt │ ├── coordination_experiment_agent8.txt │ └── coordination_experiment_agent9.txt └── src ├── Agent ├── agent.py ├── centralized_agent.py ├── ihrl_agent.py └── iqAgent.py ├── Environments ├── coop_buttons │ ├── buttons_env.py │ └── multi_agent_buttons_env.py └── rendezvous │ ├── gridworld_env.py │ └── multi_agent_gridworld_env.py ├── buttons_config.py ├── experiments ├── dqprm.py ├── iql.py ├── run_centralized_coordination_experiment.py └── run_ihrl_experiment.py ├── rendezvous_config.py ├── reward_machines └── sparse_reward_machine.py ├── run.py └── tester ├── learning_params.py ├── tester.py └── tester_params.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/README.md -------------------------------------------------------------------------------- /experiments/buttons/buttons_rm_agent_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/buttons/buttons_rm_agent_1.txt -------------------------------------------------------------------------------- /experiments/buttons/buttons_rm_agent_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/buttons/buttons_rm_agent_2.txt -------------------------------------------------------------------------------- /experiments/buttons/buttons_rm_agent_3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/buttons/buttons_rm_agent_3.txt -------------------------------------------------------------------------------- /experiments/buttons/team_buttons_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/buttons/team_buttons_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/10_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/10_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/2_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/2_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/3_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/3_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/4_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/4_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/5_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/5_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/6_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/6_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/7_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/7_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/8_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/8_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/9_agent_rendezvous_rm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/9_agent_rendezvous_rm.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent1.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent10.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent10.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent2.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent3.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent4.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent5.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent5.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent6.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent6.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent7.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent7.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent8.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent8.txt -------------------------------------------------------------------------------- /experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent9.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/experiments/gridworld_many_agent_rendezvous/coordination_experiment_agent9.txt -------------------------------------------------------------------------------- /src/Agent/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Agent/agent.py -------------------------------------------------------------------------------- /src/Agent/centralized_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Agent/centralized_agent.py -------------------------------------------------------------------------------- /src/Agent/ihrl_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Agent/ihrl_agent.py -------------------------------------------------------------------------------- /src/Agent/iqAgent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Agent/iqAgent.py -------------------------------------------------------------------------------- /src/Environments/coop_buttons/buttons_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Environments/coop_buttons/buttons_env.py -------------------------------------------------------------------------------- /src/Environments/coop_buttons/multi_agent_buttons_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Environments/coop_buttons/multi_agent_buttons_env.py -------------------------------------------------------------------------------- /src/Environments/rendezvous/gridworld_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Environments/rendezvous/gridworld_env.py -------------------------------------------------------------------------------- /src/Environments/rendezvous/multi_agent_gridworld_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/Environments/rendezvous/multi_agent_gridworld_env.py -------------------------------------------------------------------------------- /src/buttons_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/buttons_config.py -------------------------------------------------------------------------------- /src/experiments/dqprm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/experiments/dqprm.py -------------------------------------------------------------------------------- /src/experiments/iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/experiments/iql.py -------------------------------------------------------------------------------- /src/experiments/run_centralized_coordination_experiment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/experiments/run_centralized_coordination_experiment.py -------------------------------------------------------------------------------- /src/experiments/run_ihrl_experiment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/experiments/run_ihrl_experiment.py -------------------------------------------------------------------------------- /src/rendezvous_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/rendezvous_config.py -------------------------------------------------------------------------------- /src/reward_machines/sparse_reward_machine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/reward_machines/sparse_reward_machine.py -------------------------------------------------------------------------------- /src/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/run.py -------------------------------------------------------------------------------- /src/tester/learning_params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/tester/learning_params.py -------------------------------------------------------------------------------- /src/tester/tester.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/tester/tester.py -------------------------------------------------------------------------------- /src/tester/tester_params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cyrusneary/rm-cooperative-marl/HEAD/src/tester/tester_params.py --------------------------------------------------------------------------------