├── .coveragerc ├── .flake8 ├── .github ├── ISSUE_TEMPLATE │ └── custom.md ├── PULL_REQUEST_TEMPLATE.md └── workflows │ ├── algo_test.yml │ ├── badge.yml │ ├── deploy.yml │ ├── doc.yml │ ├── envpool_test.yml │ ├── platform_test.yml │ ├── release.yml │ ├── release_conda.yml │ ├── style.yml │ └── unit_test.yml ├── .gitignore ├── .style.yapf ├── CHANGELOG ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── LICENSE ├── Makefile ├── README.md ├── SECURITY.md ├── assets └── wechat.jpeg ├── cloc.sh ├── codecov.yml ├── conda ├── conda_build_config.yaml └── meta.yaml ├── ding ├── __init__.py ├── bonus │ ├── __init__.py │ ├── a2c.py │ ├── c51.py │ ├── common.py │ ├── config.py │ ├── ddpg.py │ ├── dqn.py │ ├── model.py │ ├── pg.py │ ├── ppo_offpolicy.py │ ├── ppof.py │ ├── sac.py │ ├── sql.py │ └── td3.py ├── compatibility.py ├── config │ ├── __init__.py │ ├── config.py │ ├── example │ │ ├── A2C │ │ │ ├── __init__.py │ │ │ ├── gym_bipedalwalker_v3.py │ │ │ └── gym_lunarlander_v2.py │ │ ├── C51 │ │ │ ├── __init__.py │ │ │ ├── gym_lunarlander_v2.py │ │ │ ├── gym_pongnoframeskip_v4.py │ │ │ ├── gym_qbertnoframeskip_v4.py │ │ │ └── gym_spaceInvadersnoframeskip_v4.py │ │ ├── DDPG │ │ │ ├── __init__.py │ │ │ ├── gym_bipedalwalker_v3.py │ │ │ ├── gym_halfcheetah_v3.py │ │ │ ├── gym_hopper_v3.py │ │ │ ├── gym_lunarlandercontinuous_v2.py │ │ │ ├── gym_pendulum_v1.py │ │ │ └── gym_walker2d_v3.py │ │ ├── DQN │ │ │ ├── __init__.py │ │ │ ├── gym_lunarlander_v2.py │ │ │ ├── gym_pongnoframeskip_v4.py │ │ │ ├── gym_qbertnoframeskip_v4.py │ │ │ └── gym_spaceInvadersnoframeskip_v4.py │ │ ├── PG │ │ │ ├── __init__.py │ │ │ └── gym_pendulum_v1.py │ │ ├── PPOF │ │ │ ├── __init__.py │ │ │ ├── gym_lunarlander_v2.py │ │ │ └── gym_lunarlandercontinuous_v2.py │ │ ├── PPOOffPolicy │ │ │ ├── __init__.py │ │ │ ├── gym_lunarlander_v2.py │ │ │ ├── gym_pongnoframeskip_v4.py │ │ │ ├── gym_qbertnoframeskip_v4.py │ │ │ └── gym_spaceInvadersnoframeskip_v4.py │ │ ├── SAC │ │ │ ├── __init__.py │ │ │ ├── gym_bipedalwalker_v3.py │ │ │ ├── gym_halfcheetah_v3.py │ │ │ ├── gym_hopper_v3.py │ │ │ ├── gym_lunarlandercontinuous_v2.py │ │ │ ├── gym_pendulum_v1.py │ │ │ └── gym_walker2d_v3.py │ │ ├── SQL │ │ │ ├── __init__.py │ │ │ └── gym_lunarlander_v2.py │ │ ├── TD3 │ │ │ ├── __init__.py │ │ │ ├── gym_bipedalwalker_v3.py │ │ │ ├── gym_halfcheetah_v3.py │ │ │ ├── gym_hopper_v3.py │ │ │ ├── gym_lunarlandercontinuous_v2.py │ │ │ ├── gym_pendulum_v1.py │ │ │ └── gym_walker2d_v3.py │ │ └── __init__.py │ ├── tests │ │ └── test_config_formatted.py │ └── utils.py ├── data │ ├── __init__.py │ ├── buffer │ │ ├── __init__.py │ │ ├── buffer.py │ │ ├── deque_buffer.py │ │ ├── deque_buffer_wrapper.py │ │ ├── middleware │ │ │ ├── __init__.py │ │ │ ├── clone_object.py │ │ │ ├── group_sample.py │ │ │ ├── padding.py │ │ │ ├── priority.py │ │ │ ├── sample_range_view.py │ │ │ ├── staleness_check.py │ │ │ └── use_time_check.py │ │ └── tests │ │ │ ├── test_buffer.py │ │ │ ├── test_buffer_benchmark.py │ │ │ └── test_middleware.py │ ├── level_replay │ │ ├── __init__.py │ │ ├── level_sampler.py │ │ └── tests │ │ │ └── test_level_sampler.py │ ├── model_loader.py │ ├── shm_buffer.py │ ├── storage │ │ ├── __init__.py │ │ ├── file.py │ │ ├── storage.py │ │ └── tests │ │ │ └── test_storage.py │ ├── storage_loader.py │ └── tests │ │ ├── test_model_loader.py │ │ ├── test_shm_buffer.py │ │ └── test_storage_loader.py ├── design │ ├── dataloader-sequence.png │ ├── dataloader-sequence.puml │ ├── env_state.png │ ├── parallel_main-sequence.png │ ├── parallel_main-sequence.puml │ ├── serial_collector-activity.png │ ├── serial_collector-activity.puml │ ├── serial_evaluator-activity.png │ ├── serial_evaluator-activity.puml │ ├── serial_learner-activity.png │ ├── serial_learner-activity.puml │ ├── serial_main-sequence.png │ └── serial_main.puml ├── entry │ ├── __init__.py │ ├── application_entry.py │ ├── application_entry_trex_collect_data.py │ ├── cli.py │ ├── cli_ditask.py │ ├── cli_parsers │ │ ├── __init__.py │ │ ├── k8s_parser.py │ │ ├── slurm_parser.py │ │ └── tests │ │ │ ├── test_k8s_parser.py │ │ │ └── test_slurm_parser.py │ ├── dist_entry.py │ ├── parallel_entry.py │ ├── predefined_config.py │ ├── serial_entry.py │ ├── serial_entry_bc.py │ ├── serial_entry_bco.py │ ├── serial_entry_dqfd.py │ ├── serial_entry_gail.py │ ├── serial_entry_guided_cost.py │ ├── serial_entry_mbrl.py │ ├── serial_entry_ngu.py │ ├── serial_entry_offline.py │ ├── serial_entry_onpolicy.py │ ├── serial_entry_onpolicy_ppg.py │ ├── serial_entry_pc.py │ ├── serial_entry_plr.py │ ├── serial_entry_preference_based_irl.py │ ├── serial_entry_preference_based_irl_onpolicy.py │ ├── serial_entry_r2d3.py │ ├── serial_entry_reward_model_offpolicy.py │ ├── serial_entry_reward_model_onpolicy.py │ ├── serial_entry_sqil.py │ ├── serial_entry_td3_vae.py │ ├── tests │ │ ├── config │ │ │ ├── agconfig.yaml │ │ │ ├── dijob-cartpole.yaml │ │ │ └── k8s-config.yaml │ │ ├── test_application_entry.py │ │ ├── test_application_entry_trex_collect_data.py │ │ ├── test_cli_ditask.py │ │ ├── test_parallel_entry.py │ │ ├── test_random_collect.py │ │ ├── test_serial_entry.py │ │ ├── test_serial_entry_algo.py │ │ ├── test_serial_entry_bc.py │ │ ├── test_serial_entry_bco.py │ │ ├── test_serial_entry_dqfd.py │ │ ├── test_serial_entry_for_anytrading.py │ │ ├── test_serial_entry_guided_cost.py │ │ ├── test_serial_entry_mbrl.py │ │ ├── test_serial_entry_onpolicy.py │ │ ├── test_serial_entry_preference_based_irl.py │ │ ├── test_serial_entry_preference_based_irl_onpolicy.py │ │ ├── test_serial_entry_reward_model.py │ │ └── test_serial_entry_sqil.py │ └── utils.py ├── envs │ ├── __init__.py │ ├── common │ │ ├── __init__.py │ │ ├── common_function.py │ │ ├── env_element.py │ │ ├── env_element_runner.py │ │ └── tests │ │ │ └── test_common_function.py │ ├── env │ │ ├── __init__.py │ │ ├── base_env.py │ │ ├── default_wrapper.py │ │ ├── ding_env_wrapper.py │ │ ├── env_implementation_check.py │ │ └── tests │ │ │ ├── __init__.py │ │ │ ├── demo_env.py │ │ │ ├── test_ding_env_wrapper.py │ │ │ └── test_env_implementation_check.py │ ├── env_manager │ │ ├── __init__.py │ │ ├── base_env_manager.py │ │ ├── ding_env_manager.py │ │ ├── env_supervisor.py │ │ ├── envpool_env_manager.py │ │ ├── gym_vector_env_manager.py │ │ ├── subprocess_env_manager.py │ │ └── tests │ │ │ ├── __init__.py │ │ │ ├── conftest.py │ │ │ ├── test_base_env_manager.py │ │ │ ├── test_env_supervisor.py │ │ │ ├── test_envpool_env_manager.py │ │ │ ├── test_gym_vector_env_manager.py │ │ │ ├── test_shm.py │ │ │ └── test_subprocess_env_manager.py │ ├── env_wrappers │ │ ├── __init__.py │ │ └── env_wrappers.py │ └── gym_env.py ├── example │ ├── __init__.py │ ├── bcq.py │ ├── c51_nstep.py │ ├── collect_demo_data.py │ ├── cql.py │ ├── d4pg.py │ ├── ddpg.py │ ├── dqn.py │ ├── dqn_eval.py │ ├── dqn_frozen_lake.py │ ├── dqn_her.py │ ├── dqn_new_env.py │ ├── dqn_nstep.py │ ├── dqn_nstep_gymnasium.py │ ├── dqn_per.py │ ├── dqn_rnd.py │ ├── dt.py │ ├── edac.py │ ├── impala.py │ ├── iqn_nstep.py │ ├── mappo.py │ ├── masac.py │ ├── pdqn.py │ ├── ppg_offpolicy.py │ ├── ppo.py │ ├── ppo_lunarlander.py │ ├── ppo_lunarlander_continuous.py │ ├── ppo_offpolicy.py │ ├── ppo_with_complex_obs.py │ ├── qgpo.py │ ├── qrdqn_nstep.py │ ├── r2d2.py │ ├── sac.py │ ├── sqil.py │ ├── sqil_continuous.py │ ├── sql.py │ ├── td3.py │ └── trex.py ├── framework │ ├── __init__.py │ ├── context.py │ ├── event_loop.py │ ├── message_queue │ │ ├── __init__.py │ │ ├── mq.py │ │ ├── nng.py │ │ ├── redis.py │ │ └── tests │ │ │ ├── test_nng.py │ │ │ └── test_redis.py │ ├── middleware │ │ ├── __init__.py │ │ ├── barrier.py │ │ ├── ckpt_handler.py │ │ ├── collector.py │ │ ├── data_fetcher.py │ │ ├── distributer.py │ │ ├── functional │ │ │ ├── __init__.py │ │ │ ├── advantage_estimator.py │ │ │ ├── collector.py │ │ │ ├── ctx_helper.py │ │ │ ├── data_processor.py │ │ │ ├── enhancer.py │ │ │ ├── evaluator.py │ │ │ ├── explorer.py │ │ │ ├── logger.py │ │ │ ├── priority.py │ │ │ ├── termination_checker.py │ │ │ ├── timer.py │ │ │ └── trainer.py │ │ ├── learner.py │ │ └── tests │ │ │ ├── __init__.py │ │ │ ├── mock_for_test.py │ │ │ ├── test_advantage_estimator.py │ │ │ ├── test_barrier.py │ │ │ ├── test_ckpt_handler.py │ │ │ ├── test_collector.py │ │ │ ├── test_data_processor.py │ │ │ ├── test_distributer.py │ │ │ ├── test_enhancer.py │ │ │ ├── test_evaluator.py │ │ │ ├── test_explorer.py │ │ │ ├── test_logger.py │ │ │ ├── test_priority.py │ │ │ └── test_trainer.py │ ├── parallel.py │ ├── supervisor.py │ ├── task.py │ ├── tests │ │ ├── context_fake_data.py │ │ ├── test_context.py │ │ ├── test_event_loop.py │ │ ├── test_parallel.py │ │ ├── test_supervisor.py │ │ ├── test_task.py │ │ └── test_wrapper.py │ └── wrapper │ │ ├── __init__.py │ │ └── step_timer.py ├── hpc_rl │ ├── README.md │ ├── __init__.py │ ├── tests │ │ ├── test_dntd.py │ │ ├── test_gae.py │ │ ├── test_lstm.py │ │ ├── test_ppo.py │ │ ├── test_qntd.py │ │ ├── test_qntd_rescale.py │ │ ├── test_scatter.py │ │ ├── test_tdlambda.py │ │ ├── test_upgo.py │ │ ├── test_vtrace.py │ │ └── testbase.py │ └── wrapper.py ├── interaction │ ├── __init__.py │ ├── base │ │ ├── __init__.py │ │ ├── app.py │ │ ├── common.py │ │ ├── network.py │ │ └── threading.py │ ├── config │ │ ├── __init__.py │ │ └── base.py │ ├── exception │ │ ├── __init__.py │ │ ├── base.py │ │ ├── master.py │ │ └── slave.py │ ├── master │ │ ├── __init__.py │ │ ├── base.py │ │ ├── connection.py │ │ ├── master.py │ │ └── task.py │ ├── slave │ │ ├── __init__.py │ │ ├── action.py │ │ └── slave.py │ └── tests │ │ ├── __init__.py │ │ ├── base │ │ ├── __init__.py │ │ ├── test_app.py │ │ ├── test_common.py │ │ ├── test_network.py │ │ └── test_threading.py │ │ ├── config │ │ ├── __init__.py │ │ └── test_base.py │ │ ├── exception │ │ ├── __init__.py │ │ ├── test_base.py │ │ ├── test_master.py │ │ └── test_slave.py │ │ ├── interaction │ │ ├── __init__.py │ │ ├── bases.py │ │ ├── test_errors.py │ │ └── test_simple.py │ │ └── test_utils │ │ ├── __init__.py │ │ ├── random.py │ │ └── stream.py ├── league │ ├── __init__.py │ ├── algorithm.py │ ├── base_league.py │ ├── metric.py │ ├── one_vs_one_league.py │ ├── player.py │ ├── shared_payoff.py │ ├── starcraft_player.py │ └── tests │ │ ├── conftest.py │ │ ├── league_test_default_config.py │ │ ├── test_league_metric.py │ │ ├── test_one_vs_one_league.py │ │ ├── test_payoff.py │ │ └── test_player.py ├── model │ ├── __init__.py │ ├── common │ │ ├── __init__.py │ │ ├── encoder.py │ │ ├── head.py │ │ ├── tests │ │ │ ├── test_encoder.py │ │ │ └── test_head.py │ │ └── utils.py │ ├── template │ │ ├── __init__.py │ │ ├── acer.py │ │ ├── atoc.py │ │ ├── bc.py │ │ ├── bcq.py │ │ ├── collaq.py │ │ ├── coma.py │ │ ├── decision_transformer.py │ │ ├── diffusion.py │ │ ├── ebm.py │ │ ├── edac.py │ │ ├── havac.py │ │ ├── hpt.py │ │ ├── language_transformer.py │ │ ├── madqn.py │ │ ├── maqac.py │ │ ├── mavac.py │ │ ├── ngu.py │ │ ├── pdqn.py │ │ ├── pg.py │ │ ├── ppg.py │ │ ├── procedure_cloning.py │ │ ├── q_learning.py │ │ ├── qac.py │ │ ├── qac_dist.py │ │ ├── qgpo.py │ │ ├── qmix.py │ │ ├── qtran.py │ │ ├── qvac.py │ │ ├── sqn.py │ │ ├── tests │ │ │ ├── test_acer.py │ │ │ ├── test_atoc.py │ │ │ ├── test_bc.py │ │ │ ├── test_bcq.py │ │ │ ├── test_collaq.py │ │ │ ├── test_coma_nn.py │ │ │ ├── test_decision_transformer.py │ │ │ ├── test_ebm.py │ │ │ ├── test_edac.py │ │ │ ├── test_havac.py │ │ │ ├── test_hpt.py │ │ │ ├── test_hybrid_qac.py │ │ │ ├── test_language_transformer.py │ │ │ ├── test_madqn.py │ │ │ ├── test_maqac.py │ │ │ ├── test_mavac.py │ │ │ ├── test_ngu.py │ │ │ ├── test_pdqn.py │ │ │ ├── test_pg.py │ │ │ ├── test_procedure_cloning.py │ │ │ ├── test_q_learning.py │ │ │ ├── test_qac.py │ │ │ ├── test_qac_dist.py │ │ │ ├── test_qmix.py │ │ │ ├── test_qtran.py │ │ │ ├── test_vac.py │ │ │ ├── test_vae.py │ │ │ └── test_wqmix.py │ │ ├── vac.py │ │ ├── vae.py │ │ └── wqmix.py │ └── wrapper │ │ ├── __init__.py │ │ ├── model_wrappers.py │ │ └── test_model_wrappers.py ├── policy │ ├── __init__.py │ ├── a2c.py │ ├── acer.py │ ├── atoc.py │ ├── base_policy.py │ ├── bc.py │ ├── bcq.py │ ├── bdq.py │ ├── c51.py │ ├── collaq.py │ ├── coma.py │ ├── command_mode_policy_instance.py │ ├── common_utils.py │ ├── cql.py │ ├── d4pg.py │ ├── ddpg.py │ ├── dqfd.py │ ├── dqn.py │ ├── dt.py │ ├── edac.py │ ├── fqf.py │ ├── happo.py │ ├── ibc.py │ ├── il.py │ ├── impala.py │ ├── iql.py │ ├── iqn.py │ ├── madqn.py │ ├── mbpolicy │ │ ├── __init__.py │ │ ├── dreamer.py │ │ ├── mbsac.py │ │ ├── tests │ │ │ └── test_mbpolicy_utils.py │ │ └── utils.py │ ├── mdqn.py │ ├── ngu.py │ ├── offppo_collect_traj.py │ ├── pc.py │ ├── pdqn.py │ ├── pg.py │ ├── plan_diffuser.py │ ├── policy_factory.py │ ├── ppg.py │ ├── ppo.py │ ├── ppof.py │ ├── prompt_awr.py │ ├── prompt_pg.py │ ├── qgpo.py │ ├── qmix.py │ ├── qrdqn.py │ ├── qtran.py │ ├── r2d2.py │ ├── r2d2_collect_traj.py │ ├── r2d2_gtrxl.py │ ├── r2d3.py │ ├── rainbow.py │ ├── sac.py │ ├── sql.py │ ├── sqn.py │ ├── td3.py │ ├── td3_bc.py │ ├── td3_vae.py │ ├── tests │ │ ├── test_common_utils.py │ │ ├── test_cql.py │ │ ├── test_r2d3.py │ │ └── test_stdim.py │ └── wqmix.py ├── reward_model │ ├── __init__.py │ ├── base_reward_model.py │ ├── drex_reward_model.py │ ├── gail_irl_model.py │ ├── guided_cost_reward_model.py │ ├── her_reward_model.py │ ├── icm_reward_model.py │ ├── ngu_reward_model.py │ ├── pdeil_irl_model.py │ ├── pwil_irl_model.py │ ├── red_irl_model.py │ ├── rnd_reward_model.py │ ├── tests │ │ └── test_gail_irl_model.py │ └── trex_reward_model.py ├── rl_utils │ ├── README.md │ ├── __init__.py │ ├── a2c.py │ ├── acer.py │ ├── adder.py │ ├── beta_function.py │ ├── coma.py │ ├── exploration.py │ ├── gae.py │ ├── grpo.py │ ├── happo.py │ ├── isw.py │ ├── log_prob_utils.py │ ├── ppg.py │ ├── ppo.py │ ├── retrace.py │ ├── rloo.py │ ├── sampler.py │ ├── td.py │ ├── tests │ │ ├── test_a2c.py │ │ ├── test_adder.py │ │ ├── test_coma.py │ │ ├── test_exploration.py │ │ ├── test_gae.py │ │ ├── test_grpo_rlhf.py │ │ ├── test_happo.py │ │ ├── test_log_prob_fn.py │ │ ├── test_log_prob_utils.py │ │ ├── test_ppg.py │ │ ├── test_ppo.py │ │ ├── test_ppo_rlhf.py │ │ ├── test_retrace.py │ │ ├── test_rloo_rlhf.py │ │ ├── test_td.py │ │ ├── test_upgo.py │ │ ├── test_value_rescale.py │ │ └── test_vtrace.py │ ├── upgo.py │ ├── value_rescale.py │ └── vtrace.py ├── scripts │ ├── dijob-qbert.yaml │ ├── docker-test-entry.sh │ ├── docker-test.sh │ ├── install-k8s-tools.sh │ ├── kill.sh │ ├── local_parallel.sh │ ├── local_serial.sh │ ├── main_league.sh │ ├── main_league_slurm.sh │ └── tests │ │ ├── test_parallel_socket.py │ │ └── test_parallel_socket.sh ├── torch_utils │ ├── __init__.py │ ├── backend_helper.py │ ├── checkpoint_helper.py │ ├── data_helper.py │ ├── dataparallel.py │ ├── diffusion_SDE │ │ ├── __init__.py │ │ └── dpm_solver_pytorch.py │ ├── distribution.py │ ├── loss │ │ ├── __init__.py │ │ ├── contrastive_loss.py │ │ ├── cross_entropy_loss.py │ │ ├── multi_logits_loss.py │ │ └── tests │ │ │ ├── test_contrastive_loss.py │ │ │ ├── test_cross_entropy_loss.py │ │ │ └── test_multi_logits_loss.py │ ├── lr_scheduler.py │ ├── math_helper.py │ ├── metric.py │ ├── model_helper.py │ ├── network │ │ ├── __init__.py │ │ ├── activation.py │ │ ├── diffusion.py │ │ ├── dreamer.py │ │ ├── gtrxl.py │ │ ├── gumbel_softmax.py │ │ ├── merge.py │ │ ├── nn_module.py │ │ ├── normalization.py │ │ ├── popart.py │ │ ├── res_block.py │ │ ├── resnet.py │ │ ├── rnn.py │ │ ├── scatter_connection.py │ │ ├── soft_argmax.py │ │ ├── tests │ │ │ ├── test_activation.py │ │ │ ├── test_diffusion.py │ │ │ ├── test_dreamer.py │ │ │ ├── test_gtrxl.py │ │ │ ├── test_gumbel_softmax.py │ │ │ ├── test_merge.py │ │ │ ├── test_nn_module.py │ │ │ ├── test_normalization.py │ │ │ ├── test_popart.py │ │ │ ├── test_res_block.py │ │ │ ├── test_resnet.py │ │ │ ├── test_rnn.py │ │ │ ├── test_scatter.py │ │ │ ├── test_soft_argmax.py │ │ │ └── test_transformer.py │ │ └── transformer.py │ ├── nn_test_helper.py │ ├── optimizer_helper.py │ ├── parameter.py │ ├── reshape_helper.py │ └── tests │ │ ├── test_backend_helper.py │ │ ├── test_ckpt_helper.py │ │ ├── test_data_helper.py │ │ ├── test_distribution.py │ │ ├── test_feature_merge.py │ │ ├── test_lr_scheduler.py │ │ ├── test_math_helper.py │ │ ├── test_metric.py │ │ ├── test_model_helper.py │ │ ├── test_nn_test_helper.py │ │ ├── test_optimizer.py │ │ ├── test_parameter.py │ │ └── test_reshape_helper.py ├── utils │ ├── __init__.py │ ├── autolog │ │ ├── __init__.py │ │ ├── base.py │ │ ├── data.py │ │ ├── model.py │ │ ├── tests │ │ │ ├── __init__.py │ │ │ ├── test_data.py │ │ │ ├── test_model.py │ │ │ └── test_time.py │ │ ├── time_ctl.py │ │ └── value.py │ ├── bfs_helper.py │ ├── collection_helper.py │ ├── compression_helper.py │ ├── data │ │ ├── __init__.py │ │ ├── base_dataloader.py │ │ ├── collate_fn.py │ │ ├── dataloader.py │ │ ├── dataset.py │ │ ├── rlhf_offline_dataset.py │ │ ├── rlhf_online_dataset.py │ │ ├── structure │ │ │ ├── __init__.py │ │ │ ├── cache.py │ │ │ └── lifo_deque.py │ │ └── tests │ │ │ ├── dataloader_speed │ │ │ └── experiment_dataloader_speed.py │ │ │ ├── test_cache.py │ │ │ ├── test_collate_fn.py │ │ │ ├── test_dataloader.py │ │ │ ├── test_dataset.py │ │ │ ├── test_rlhf_offline_dataset.py │ │ │ └── test_rlhf_online_dataset.py │ ├── default_helper.py │ ├── deprecation.py │ ├── design_helper.py │ ├── dict_helper.py │ ├── fake_linklink.py │ ├── fast_copy.py │ ├── file_helper.py │ ├── import_helper.py │ ├── k8s_helper.py │ ├── linklink_dist_helper.py │ ├── loader │ │ ├── __init__.py │ │ ├── base.py │ │ ├── collection.py │ │ ├── dict.py │ │ ├── exception.py │ │ ├── mapping.py │ │ ├── norm.py │ │ ├── number.py │ │ ├── string.py │ │ ├── tests │ │ │ ├── __init__.py │ │ │ ├── loader │ │ │ │ ├── __init__.py │ │ │ │ ├── test_base.py │ │ │ │ ├── test_collection.py │ │ │ │ ├── test_dict.py │ │ │ │ ├── test_mapping.py │ │ │ │ ├── test_norm.py │ │ │ │ ├── test_number.py │ │ │ │ ├── test_string.py │ │ │ │ ├── test_types.py │ │ │ │ └── test_utils.py │ │ │ └── test_cartpole_dqn_serial_config_loader.py │ │ ├── types.py │ │ └── utils.py │ ├── lock_helper.py │ ├── log_helper.py │ ├── log_writer_helper.py │ ├── memory_helper.py │ ├── normalizer_helper.py │ ├── orchestrator_launcher.py │ ├── profiler_helper.py │ ├── pytorch_ddp_dist_helper.py │ ├── registry.py │ ├── registry_factory.py │ ├── render_helper.py │ ├── scheduler_helper.py │ ├── segment_tree.py │ ├── slurm_helper.py │ ├── system_helper.py │ ├── tests │ │ ├── config │ │ │ └── k8s-config.yaml │ │ ├── test_bfs_helper.py │ │ ├── test_collection_helper.py │ │ ├── test_compression_helper.py │ │ ├── test_config_helper.py │ │ ├── test_default_helper.py │ │ ├── test_deprecation.py │ │ ├── test_design_helper.py │ │ ├── test_file_helper.py │ │ ├── test_import_helper.py │ │ ├── test_k8s_launcher.py │ │ ├── test_lock.py │ │ ├── test_log_helper.py │ │ ├── test_log_writer_helper.py │ │ ├── test_memory_helper.py │ │ ├── test_normalizer_helper.py │ │ ├── test_profiler_helper.py │ │ ├── test_registry.py │ │ ├── test_scheduler_helper.py │ │ ├── test_segment_tree.py │ │ ├── test_system_helper.py │ │ └── test_time_helper.py │ ├── time_helper.py │ ├── time_helper_base.py │ ├── time_helper_cuda.py │ └── type_helper.py ├── worker │ ├── __init__.py │ ├── adapter │ │ ├── __init__.py │ │ ├── learner_aggregator.py │ │ └── tests │ │ │ └── test_learner_aggregator.py │ ├── collector │ │ ├── __init__.py │ │ ├── base_parallel_collector.py │ │ ├── base_serial_collector.py │ │ ├── base_serial_evaluator.py │ │ ├── battle_episode_serial_collector.py │ │ ├── battle_interaction_serial_evaluator.py │ │ ├── battle_sample_serial_collector.py │ │ ├── comm │ │ │ ├── __init__.py │ │ │ ├── base_comm_collector.py │ │ │ ├── flask_fs_collector.py │ │ │ ├── tests │ │ │ │ └── test_collector_with_coordinator.py │ │ │ └── utils.py │ │ ├── episode_serial_collector.py │ │ ├── interaction_serial_evaluator.py │ │ ├── marine_parallel_collector.py │ │ ├── metric_serial_evaluator.py │ │ ├── sample_serial_collector.py │ │ ├── tests │ │ │ ├── __init__.py │ │ │ ├── fake_cls_policy.py │ │ │ ├── fake_cpong_dqn_config.py │ │ │ ├── speed_test │ │ │ │ ├── __init__.py │ │ │ │ ├── fake_env.py │ │ │ │ ├── fake_policy.py │ │ │ │ ├── test_collector_profile.py │ │ │ │ └── utils.py │ │ │ ├── test_base_serial_collector.py │ │ │ ├── test_episode_serial_collector.py │ │ │ ├── test_marine_parallel_collector.py │ │ │ ├── test_metric_serial_evaluator.py │ │ │ └── test_sample_serial_collector.py │ │ └── zergling_parallel_collector.py │ ├── coordinator │ │ ├── __init__.py │ │ ├── base_parallel_commander.py │ │ ├── base_serial_commander.py │ │ ├── comm_coordinator.py │ │ ├── coordinator.py │ │ ├── one_vs_one_parallel_commander.py │ │ ├── operator_server.py │ │ ├── resource_manager.py │ │ ├── solo_parallel_commander.py │ │ └── tests │ │ │ ├── conftest.py │ │ │ ├── test_coordinator.py │ │ │ ├── test_fake_operator_server.py │ │ │ └── test_one_vs_one_commander.py │ ├── learner │ │ ├── __init__.py │ │ ├── base_learner.py │ │ ├── comm │ │ │ ├── __init__.py │ │ │ ├── base_comm_learner.py │ │ │ ├── flask_fs_learner.py │ │ │ ├── tests │ │ │ │ └── test_learner_with_coordinator.py │ │ │ └── utils.py │ │ ├── learner_hook.py │ │ └── tests │ │ │ ├── test_base_learner.py │ │ │ └── test_learner_hook.py │ └── replay_buffer │ │ ├── __init__.py │ │ ├── advanced_buffer.py │ │ ├── base_buffer.py │ │ ├── episode_buffer.py │ │ ├── naive_buffer.py │ │ ├── tests │ │ ├── conftest.py │ │ ├── test_advanced_buffer.py │ │ └── test_naive_buffer.py │ │ └── utils.py └── world_model │ ├── __init__.py │ ├── base_world_model.py │ ├── ddppo.py │ ├── dreamer.py │ ├── idm.py │ ├── mbpo.py │ ├── model │ ├── __init__.py │ ├── ensemble.py │ ├── networks.py │ └── tests │ │ ├── test_ensemble.py │ │ └── test_networks.py │ ├── tests │ ├── test_ddppo.py │ ├── test_dreamerv3.py │ ├── test_idm.py │ ├── test_mbpo.py │ ├── test_world_model.py │ └── test_world_model_utils.py │ └── utils.py ├── dizoo ├── __init__.py ├── atari │ ├── __init__.py │ ├── atari.gif │ ├── config │ │ ├── __init__.py │ │ └── serial │ │ │ ├── __init__.py │ │ │ ├── asterix │ │ │ ├── __init__.py │ │ │ └── asterix_mdqn_config.py │ │ │ ├── demon_attack │ │ │ └── demon_attack_dqn_config.py │ │ │ ├── enduro │ │ │ ├── __init__.py │ │ │ ├── enduro_dqn_config.py │ │ │ ├── enduro_impala_config.py │ │ │ ├── enduro_mdqn_config.py │ │ │ ├── enduro_onppo_config.py │ │ │ ├── enduro_qrdqn_config.py │ │ │ └── enduro_rainbow_config.py │ │ │ ├── montezuma │ │ │ └── montezuma_ngu_config.py │ │ │ ├── phoenix │ │ │ ├── phoenix_fqf_config.py │ │ │ └── phoenix_iqn_config.py │ │ │ ├── pitfall │ │ │ └── pitfall_ngu_config.py │ │ │ ├── pong │ │ │ ├── __init__.py │ │ │ ├── pong_a2c_config.py │ │ │ ├── pong_acer_config.py │ │ │ ├── pong_c51_config.py │ │ │ ├── pong_cql_config.py │ │ │ ├── pong_dqfd_config.py │ │ │ ├── pong_dqn_config.py │ │ │ ├── pong_dqn_ddp_config.py │ │ │ ├── pong_dqn_envpool_config.py │ │ │ ├── pong_dqn_multi_gpu_config.py │ │ │ ├── pong_dqn_render_config.py │ │ │ ├── pong_dqn_stdim_config.py │ │ │ ├── pong_dt_config.py │ │ │ ├── pong_fqf_config.py │ │ │ ├── pong_gail_dqn_config.py │ │ │ ├── pong_impala_config.py │ │ │ ├── pong_iqn_config.py │ │ │ ├── pong_ngu_config.py │ │ │ ├── pong_ppg_config.py │ │ │ ├── pong_ppo_config.py │ │ │ ├── pong_ppo_ddp_config.py │ │ │ ├── pong_qrdqn_config.py │ │ │ ├── pong_qrdqn_generation_data_config.py │ │ │ ├── pong_r2d2_config.py │ │ │ ├── pong_r2d2_gtrxl_config.py │ │ │ ├── pong_r2d2_residual_config.py │ │ │ ├── pong_r2d3_offppoexpert_config.py │ │ │ ├── pong_r2d3_r2d2expert_config.py │ │ │ ├── pong_rainbow_config.py │ │ │ ├── pong_sqil_config.py │ │ │ ├── pong_sql_config.py │ │ │ ├── pong_trex_offppo_config.py │ │ │ └── pong_trex_sql_config.py │ │ │ ├── qbert │ │ │ ├── __init__.py │ │ │ ├── qbert_a2c_config.py │ │ │ ├── qbert_acer_config.py │ │ │ ├── qbert_c51_config.py │ │ │ ├── qbert_cql_config.py │ │ │ ├── qbert_dqfd_config.py │ │ │ ├── qbert_dqn_config.py │ │ │ ├── qbert_fqf_config.py │ │ │ ├── qbert_impala_config.py │ │ │ ├── qbert_iqn_config.py │ │ │ ├── qbert_ngu_config.py │ │ │ ├── qbert_offppo_config.py │ │ │ ├── qbert_onppo_config.py │ │ │ ├── qbert_ppg_config.py │ │ │ ├── qbert_qrdqn_config.py │ │ │ ├── qbert_qrdqn_generation_data_config.py │ │ │ ├── qbert_r2d2_config.py │ │ │ ├── qbert_r2d2_gtrxl_config.py │ │ │ ├── qbert_rainbow_config.py │ │ │ ├── qbert_sqil_config.py │ │ │ ├── qbert_sql_config.py │ │ │ ├── qbert_trex_dqn_config.py │ │ │ └── qbert_trex_offppo_config.py │ │ │ └── spaceinvaders │ │ │ ├── __init__.py │ │ │ ├── spaceinvaders_a2c_config.py │ │ │ ├── spaceinvaders_acer_config.py │ │ │ ├── spaceinvaders_c51_config.py │ │ │ ├── spaceinvaders_dqfd_config.py │ │ │ ├── spaceinvaders_dqn_config.py │ │ │ ├── spaceinvaders_dqn_config_multi_gpu_ddp.py │ │ │ ├── spaceinvaders_dqn_config_multi_gpu_dp.py │ │ │ ├── spaceinvaders_fqf_config.py │ │ │ ├── spaceinvaders_impala_config.py │ │ │ ├── spaceinvaders_iqn_config.py │ │ │ ├── spaceinvaders_mdqn_config.py │ │ │ ├── spaceinvaders_ngu_config.py │ │ │ ├── spaceinvaders_offppo_config.py │ │ │ ├── spaceinvaders_onppo_config.py │ │ │ ├── spaceinvaders_ppg_config.py │ │ │ ├── spaceinvaders_qrdqn_config.py │ │ │ ├── spaceinvaders_r2d2_config.py │ │ │ ├── spaceinvaders_r2d2_gtrxl_config.py │ │ │ ├── spaceinvaders_r2d2_residual_config.py │ │ │ ├── spaceinvaders_rainbow_config.py │ │ │ ├── spaceinvaders_sqil_config.py │ │ │ ├── spaceinvaders_sql_config.py │ │ │ ├── spaceinvaders_trex_dqn_config.py │ │ │ └── spaceinvaders_trex_offppo_config.py │ ├── entry │ │ ├── __init__.py │ │ ├── atari_dqn_main.py │ │ ├── atari_dt_main.py │ │ ├── atari_impala_main.py │ │ ├── atari_ppg_main.py │ │ ├── phoenix_fqf_main.py │ │ ├── phoenix_iqn_main.py │ │ ├── pong_cql_main.py │ │ ├── pong_dqn_envpool_main.py │ │ ├── pong_fqf_main.py │ │ ├── qbert_cql_main.py │ │ ├── qbert_fqf_main.py │ │ ├── spaceinvaders_dqn_eval.py │ │ ├── spaceinvaders_dqn_main_multi_gpu_ddp.py │ │ ├── spaceinvaders_dqn_main_multi_gpu_dp.py │ │ └── spaceinvaders_fqf_main.py │ ├── envs │ │ ├── __init__.py │ │ ├── atari_env.py │ │ ├── atari_wrappers.py │ │ └── test_atari_env.py │ └── example │ │ ├── atari_dqn.py │ │ ├── atari_dqn_ddp.py │ │ ├── atari_dqn_dist.py │ │ ├── atari_dqn_dist_ddp.py │ │ ├── atari_dqn_dist_rdma.py │ │ ├── atari_dqn_dp.py │ │ ├── atari_ppo.py │ │ └── atari_ppo_ddp.py ├── beergame │ ├── __init__.py │ ├── beergame.png │ ├── config │ │ └── beergame_onppo_config.py │ ├── entry │ │ └── beergame_eval.py │ └── envs │ │ ├── BGAgent.py │ │ ├── __init__.py │ │ ├── beergame_core.py │ │ ├── beergame_env.py │ │ ├── clBeergame.py │ │ ├── plotting.py │ │ └── utils.py ├── bitflip │ ├── README.md │ ├── __init__.py │ ├── bitflip.gif │ ├── config │ │ ├── __init__.py │ │ ├── bitflip_her_dqn_config.py │ │ └── bitflip_pure_dqn_config.py │ ├── entry │ │ ├── __init__.py │ │ └── bitflip_dqn_main.py │ └── envs │ │ ├── __init__.py │ │ ├── bitflip_env.py │ │ └── test_bitfilp_env.py ├── box2d │ ├── __init__.py │ ├── bipedalwalker │ │ ├── __init__.py │ │ ├── config │ │ │ ├── __init__.py │ │ │ ├── bipedalwalker_a2c_config.py │ │ │ ├── bipedalwalker_bco_config.py │ │ │ ├── bipedalwalker_ddpg_config.py │ │ │ ├── bipedalwalker_dt_config.py │ │ │ ├── bipedalwalker_gail_sac_config.py │ │ │ ├── bipedalwalker_impala_config.py │ │ │ ├── bipedalwalker_pg_config.py │ │ │ ├── bipedalwalker_ppo_config.py │ │ │ ├── bipedalwalker_ppopg_config.py │ │ │ ├── bipedalwalker_sac_config.py │ │ │ └── bipedalwalker_td3_config.py │ │ ├── entry │ │ │ ├── __init__.py │ │ │ └── bipedalwalker_ppo_eval.py │ │ ├── envs │ │ │ ├── __init__.py │ │ │ ├── bipedalwalker_env.py │ │ │ └── test_bipedalwalker.py │ │ └── original.gif │ ├── carracing │ │ ├── __init__.py │ │ ├── car_racing.gif │ │ ├── config │ │ │ ├── __init__.py │ │ │ └── carracing_dqn_config.py │ │ └── envs │ │ │ ├── __init__.py │ │ │ ├── carracing_env.py │ │ │ └── test_carracing_env.py │ └── lunarlander │ │ ├── __init__.py │ │ ├── config │ │ ├── __init__.py │ │ ├── lunarlander_a2c_config.py │ │ ├── lunarlander_acer_config.py │ │ ├── lunarlander_bco_config.py │ │ ├── lunarlander_c51_config.py │ │ ├── lunarlander_cont_ddpg_config.py │ │ ├── lunarlander_cont_sac_config.py │ │ ├── lunarlander_cont_td3_config.py │ │ ├── lunarlander_cont_td3_vae_config.py │ │ ├── lunarlander_discrete_sac_config.py │ │ ├── lunarlander_dqfd_config.py │ │ ├── lunarlander_dqn_config.py │ │ ├── lunarlander_dqn_deque_config.py │ │ ├── lunarlander_dt_config.py │ │ ├── lunarlander_gail_dqn_config.py │ │ ├── lunarlander_gcl_config.py │ │ ├── lunarlander_hpt_config.py │ │ ├── lunarlander_impala_config.py │ │ ├── lunarlander_ngu_config.py │ │ ├── lunarlander_offppo_config.py │ │ ├── lunarlander_pg_config.py │ │ ├── lunarlander_ppo_config.py │ │ ├── lunarlander_ppo_continuous_config.py │ │ ├── lunarlander_qrdqn_config.py │ │ ├── lunarlander_r2d2_config.py │ │ ├── lunarlander_r2d2_gtrxl_config.py │ │ ├── lunarlander_r2d3_ppoexpert_config.py │ │ ├── lunarlander_r2d3_r2d2expert_config.py │ │ ├── lunarlander_rnd_onppo_config.py │ │ ├── lunarlander_sqil_config.py │ │ ├── lunarlander_sql_config.py │ │ ├── lunarlander_trex_dqn_config.py │ │ └── lunarlander_trex_offppo_config.py │ │ ├── entry │ │ ├── __init__.py │ │ ├── lunarlander_dqn_eval.py │ │ ├── lunarlander_dqn_example.py │ │ └── lunarlander_hpt_example.py │ │ ├── envs │ │ ├── __init__.py │ │ ├── lunarlander_env.py │ │ └── test_lunarlander_env.py │ │ ├── lunarlander.gif │ │ └── offline_data │ │ ├── collect_dqn_data_config.py │ │ ├── lunarlander_collect_data.py │ │ └── lunarlander_show_data.py ├── bsuite │ ├── __init__.py │ ├── bsuite.png │ ├── config │ │ ├── __init__.py │ │ └── serial │ │ │ ├── bandit_noise │ │ │ └── bandit_noise_0_dqn_config.py │ │ │ ├── cartpole_swingup │ │ │ └── cartpole_swingup_0_dqn_config.py │ │ │ └── memory_len │ │ │ ├── memory_len_0_a2c_config.py │ │ │ ├── memory_len_0_dqn_config.py │ │ │ ├── memory_len_15_r2d2_config.py │ │ │ └── memory_len_15_r2d2_gtrxl_config.py │ └── envs │ │ ├── __init__.py │ │ ├── bsuite_env.py │ │ └── test_bsuite_env.py ├── classic_control │ ├── __init__.py │ ├── acrobot │ │ ├── __init__.py │ │ ├── acrobot.gif │ │ ├── config │ │ │ ├── __init__.py │ │ │ └── acrobot_dqn_config.py │ │ └── envs │ │ │ ├── __init__.py │ │ │ ├── acrobot_env.py │ │ │ └── test_acrobot_env.py │ ├── cartpole │ │ ├── __init__.py │ │ ├── cartpole.gif │ │ ├── config │ │ │ ├── __init__.py │ │ │ ├── cartpole_a2c_config.py │ │ │ ├── cartpole_acer_config.py │ │ │ ├── cartpole_bc_config.py │ │ │ ├── cartpole_bco_config.py │ │ │ ├── cartpole_c51_config.py │ │ │ ├── cartpole_cql_config.py │ │ │ ├── cartpole_decision_transformer.py │ │ │ ├── cartpole_dqfd_config.py │ │ │ ├── cartpole_dqn_config.py │ │ │ ├── cartpole_dqn_ddp_config.py │ │ │ ├── cartpole_dqn_gail_config.py │ │ │ ├── cartpole_dqn_rnd_config.py │ │ │ ├── cartpole_dqn_stdim_config.py │ │ │ ├── cartpole_drex_dqn_config.py │ │ │ ├── cartpole_dt_config.py │ │ │ ├── cartpole_fqf_config.py │ │ │ ├── cartpole_gcl_config.py │ │ │ ├── cartpole_impala_config.py │ │ │ ├── cartpole_iqn_config.py │ │ │ ├── cartpole_mdqn_config.py │ │ │ ├── cartpole_ngu_config.py │ │ │ ├── cartpole_pg_config.py │ │ │ ├── cartpole_ppg_config.py │ │ │ ├── cartpole_ppo_config.py │ │ │ ├── cartpole_ppo_ddp_config.py │ │ │ ├── cartpole_ppo_icm_config.py │ │ │ ├── cartpole_ppo_offpolicy_config.py │ │ │ ├── cartpole_ppo_stdim_config.py │ │ │ ├── cartpole_ppopg_config.py │ │ │ ├── cartpole_qrdqn_config.py │ │ │ ├── cartpole_qrdqn_generation_data_config.py │ │ │ ├── cartpole_r2d2_config.py │ │ │ ├── cartpole_r2d2_gtrxl_config.py │ │ │ ├── cartpole_r2d2_residual_config.py │ │ │ ├── cartpole_rainbow_config.py │ │ │ ├── cartpole_rnd_onppo_config.py │ │ │ ├── cartpole_sac_config.py │ │ │ ├── cartpole_sqil_config.py │ │ │ ├── cartpole_sql_config.py │ │ │ ├── cartpole_sqn_config.py │ │ │ ├── cartpole_trex_dqn_config.py │ │ │ ├── cartpole_trex_offppo_config.py │ │ │ ├── cartpole_trex_onppo_config.py │ │ │ └── parallel │ │ │ │ ├── __init__.py │ │ │ │ ├── cartpole_dqn_config.py │ │ │ │ ├── cartpole_dqn_config_k8s.py │ │ │ │ └── cartpole_dqn_dist.sh │ │ ├── entry │ │ │ ├── __init__.py │ │ │ ├── cartpole_c51_deploy.py │ │ │ ├── cartpole_c51_main.py │ │ │ ├── cartpole_cql_main.py │ │ │ ├── cartpole_dqn_buffer_main.py │ │ │ ├── cartpole_dqn_eval.py │ │ │ ├── cartpole_dqn_main.py │ │ │ ├── cartpole_dqn_pwil_main.py │ │ │ ├── cartpole_fqf_main.py │ │ │ ├── cartpole_ppg_main.py │ │ │ ├── cartpole_ppo_main.py │ │ │ └── cartpole_ppo_offpolicy_main.py │ │ └── envs │ │ │ ├── __init__.py │ │ │ ├── cartpole_env.py │ │ │ ├── test_cartpole_env.py │ │ │ └── test_cartpole_env_manager.py │ ├── mountain_car │ │ ├── __init__.py │ │ ├── config │ │ │ └── mtcar_rainbow_config.py │ │ └── envs │ │ │ ├── __init__.py │ │ │ ├── mtcar_env.py │ │ │ └── test_mtcar_env.py │ └── pendulum │ │ ├── __init__.py │ │ ├── config │ │ ├── __init__.py │ │ ├── mbrl │ │ │ ├── pendulum_mbsac_ddppo_config.py │ │ │ ├── pendulum_mbsac_mbpo_config.py │ │ │ ├── pendulum_sac_ddppo_config.py │ │ │ ├── pendulum_sac_mbpo_config.py │ │ │ └── pendulum_stevesac_mbpo_config.py │ │ ├── pendulum_a2c_config.py │ │ ├── pendulum_bdq_config.py │ │ ├── pendulum_cql_config.py │ │ ├── pendulum_d4pg_config.py │ │ ├── pendulum_ddpg_config.py │ │ ├── pendulum_dqn_config.py │ │ ├── pendulum_ibc_config.py │ │ ├── pendulum_pg_config.py │ │ ├── pendulum_ppo_config.py │ │ ├── pendulum_sac_config.py │ │ ├── pendulum_sac_data_generation_config.py │ │ ├── pendulum_sqil_sac_config.py │ │ ├── pendulum_td3_bc_config.py │ │ ├── pendulum_td3_config.py │ │ └── pendulum_td3_data_generation_config.py │ │ ├── entry │ │ ├── __init__.py │ │ ├── pendulum_cql_ddpg_main.py │ │ ├── pendulum_cql_main.py │ │ ├── pendulum_d4pg_main.py │ │ ├── pendulum_ddpg_main.py │ │ ├── pendulum_dqn_eval.py │ │ ├── pendulum_ppo_main.py │ │ ├── pendulum_td3_bc_main.py │ │ └── pendulum_td3_main.py │ │ ├── envs │ │ ├── __init__.py │ │ ├── pendulum_env.py │ │ └── test_pendulum_env.py │ │ └── pendulum.gif ├── cliffwalking │ ├── __init__.py │ ├── cliff_walking.gif │ ├── config │ │ └── cliffwalking_dqn_config.py │ ├── entry │ │ ├── cliffwalking_dqn_deploy.py │ │ └── cliffwalking_dqn_main.py │ └── envs │ │ ├── __init__.py │ │ ├── cliffwalking_env.py │ │ └── test_cliffwalking_env.py ├── common │ ├── __init__.py │ └── policy │ │ ├── __init__.py │ │ ├── md_dqn.py │ │ ├── md_ppo.py │ │ └── md_rainbow_dqn.py ├── competitive_rl │ ├── README.md │ ├── __init__.py │ ├── competitive_rl.gif │ ├── config │ │ └── cpong_dqn_config.py │ └── envs │ │ ├── __init__.py │ │ ├── competitive_rl_env.py │ │ ├── competitive_rl_env_wrapper.py │ │ ├── resources │ │ └── pong │ │ │ ├── checkpoint-alphapong.pkl │ │ │ ├── checkpoint-medium.pkl │ │ │ ├── checkpoint-strong.pkl │ │ │ └── checkpoint-weak.pkl │ │ └── test_competitive_rl.py ├── d4rl │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ ├── antmaze_umaze_pd_config.py │ │ ├── halfcheetah_expert_cql_config.py │ │ ├── halfcheetah_expert_dt_config.py │ │ ├── halfcheetah_expert_td3bc_config.py │ │ ├── halfcheetah_medium_bcq_config.py │ │ ├── halfcheetah_medium_cql_config.py │ │ ├── halfcheetah_medium_dt_config.py │ │ ├── halfcheetah_medium_edac_config.py │ │ ├── halfcheetah_medium_expert_bcq_config.py │ │ ├── halfcheetah_medium_expert_cql_config.py │ │ ├── halfcheetah_medium_expert_dt_config.py │ │ ├── halfcheetah_medium_expert_edac_config.py │ │ ├── halfcheetah_medium_expert_iql_config.py │ │ ├── halfcheetah_medium_expert_pd_config.py │ │ ├── halfcheetah_medium_expert_qgpo_config.py │ │ ├── halfcheetah_medium_expert_td3bc_config.py │ │ ├── halfcheetah_medium_iql_config.py │ │ ├── halfcheetah_medium_pd_config.py │ │ ├── halfcheetah_medium_replay_cql_config.py │ │ ├── halfcheetah_medium_replay_dt_config.py │ │ ├── halfcheetah_medium_replay_iql_config.py │ │ ├── halfcheetah_medium_replay_td3bc_config.py │ │ ├── halfcheetah_medium_td3bc_config.py │ │ ├── halfcheetah_random_cql_config.py │ │ ├── halfcheetah_random_dt_config.py │ │ ├── halfcheetah_random_td3bc_config.py │ │ ├── hopper_expert_cql_config.py │ │ ├── hopper_expert_dt_config.py │ │ ├── hopper_expert_td3bc_config.py │ │ ├── hopper_medium_bcq_config.py │ │ ├── hopper_medium_cql_config.py │ │ ├── hopper_medium_dt_config.py │ │ ├── hopper_medium_edac_config.py │ │ ├── hopper_medium_expert_bc_config.py │ │ ├── hopper_medium_expert_bcq_config.py │ │ ├── hopper_medium_expert_cql_config.py │ │ ├── hopper_medium_expert_dt_config.py │ │ ├── hopper_medium_expert_edac_config.py │ │ ├── hopper_medium_expert_ibc_ar_config.py │ │ ├── hopper_medium_expert_ibc_config.py │ │ ├── hopper_medium_expert_ibc_mcmc_config.py │ │ ├── hopper_medium_expert_iql_config.py │ │ ├── hopper_medium_expert_pd_config.py │ │ ├── hopper_medium_expert_qgpo_config.py │ │ ├── hopper_medium_expert_td3bc_config.py │ │ ├── hopper_medium_iql_config.py │ │ ├── hopper_medium_pd_config.py │ │ ├── hopper_medium_replay_cql_config.py │ │ ├── hopper_medium_replay_dt_config.py │ │ ├── hopper_medium_replay_iql_config.py │ │ ├── hopper_medium_replay_td3bc_config.py │ │ ├── hopper_medium_td3bc_config.py │ │ ├── hopper_random_cql_config.py │ │ ├── hopper_random_dt_config.py │ │ ├── hopper_random_td3bc_config.py │ │ ├── kitchen_complete_bc_config.py │ │ ├── kitchen_complete_ibc_ar_config.py │ │ ├── kitchen_complete_ibc_config.py │ │ ├── kitchen_complete_ibc_mcmc_config.py │ │ ├── maze2d_large_pd_config.py │ │ ├── maze2d_medium_pd_config.py │ │ ├── maze2d_umaze_pd_config.py │ │ ├── pen_human_bc_config.py │ │ ├── pen_human_ibc_ar_config.py │ │ ├── pen_human_ibc_config.py │ │ ├── pen_human_ibc_mcmc_config.py │ │ ├── walker2d_expert_cql_config.py │ │ ├── walker2d_expert_dt_config.py │ │ ├── walker2d_expert_td3bc_config.py │ │ ├── walker2d_medium_cql_config.py │ │ ├── walker2d_medium_dt_config.py │ │ ├── walker2d_medium_expert_cql_config.py │ │ ├── walker2d_medium_expert_dt_config.py │ │ ├── walker2d_medium_expert_iql_config.py │ │ ├── walker2d_medium_expert_pd_config.py │ │ ├── walker2d_medium_expert_qgpo_config.py │ │ ├── walker2d_medium_expert_td3bc_config.py │ │ ├── walker2d_medium_iql_config.py │ │ ├── walker2d_medium_pd_config.py │ │ ├── walker2d_medium_replay_cql_config.py │ │ ├── walker2d_medium_replay_dt_config.py │ │ ├── walker2d_medium_replay_iql_config.py │ │ ├── walker2d_medium_replay_td3bc_config.py │ │ ├── walker2d_medium_td3bc_config.py │ │ ├── walker2d_random_cql_config.py │ │ ├── walker2d_random_dt_config.py │ │ └── walker2d_random_td3bc_config.py │ ├── d4rl.gif │ ├── entry │ │ ├── __init__.py │ │ ├── d4rl_bcq_main.py │ │ ├── d4rl_cql_main.py │ │ ├── d4rl_dt_mujoco.py │ │ ├── d4rl_edac_main.py │ │ ├── d4rl_ibc_main.py │ │ ├── d4rl_iql_main.py │ │ ├── d4rl_pd_main.py │ │ └── d4rl_td3_bc_main.py │ └── envs │ │ ├── __init__.py │ │ ├── d4rl_env.py │ │ └── d4rl_wrappers.py ├── dmc2gym │ ├── __init__.py │ ├── config │ │ ├── cartpole_balance │ │ │ └── cartpole_balance_dreamer_config.py │ │ ├── cheetah_run │ │ │ └── cheetah_run_dreamer_config.py │ │ ├── dmc2gym_dreamer_config.py │ │ ├── dmc2gym_ppo_config.py │ │ ├── dmc2gym_sac_pixel_config.py │ │ ├── dmc2gym_sac_state_config.py │ │ └── walker_walk │ │ │ └── walker_walk_dreamer_config.py │ ├── dmc2gym_cheetah.png │ ├── entry │ │ ├── dmc2gym_onppo_main.py │ │ ├── dmc2gym_sac_pixel_main.py │ │ ├── dmc2gym_sac_state_main.py │ │ └── dmc2gym_save_replay_example.py │ └── envs │ │ ├── __init__.py │ │ ├── dmc2gym_env.py │ │ └── test_dmc2gym_env.py ├── evogym │ ├── __init__.py │ ├── config │ │ ├── bridgewalker_ddpg_config.py │ │ ├── carrier_ppo_config.py │ │ ├── walker_ddpg_config.py │ │ └── walker_ppo_config.py │ ├── entry │ │ └── walker_ppo_eval.py │ ├── envs │ │ ├── __init__.py │ │ ├── evogym_env.py │ │ ├── test │ │ │ ├── test_evogym_env.py │ │ │ └── visualize_simple_env.py │ │ └── world_data │ │ │ ├── carry_bot.json │ │ │ ├── simple_evironment.json │ │ │ └── speed_bot.json │ └── evogym.gif ├── frozen_lake │ ├── FrozenLake.gif │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ └── frozen_lake_dqn_config.py │ └── envs │ │ ├── __init__.py │ │ ├── frozen_lake_env.py │ │ └── test_frozen_lake_env.py ├── gfootball │ ├── README.md │ ├── __init__.py │ ├── config │ │ ├── gfootball_counter_mappo_config.py │ │ ├── gfootball_counter_masac_config.py │ │ ├── gfootball_keeper_mappo_config.py │ │ └── gfootball_keeper_masac_config.py │ ├── entry │ │ ├── __init__.py │ │ ├── gfootball_bc_config.py │ │ ├── gfootball_bc_kaggle5th_main.py │ │ ├── gfootball_bc_rule_lt0_main.py │ │ ├── gfootball_bc_rule_main.py │ │ ├── gfootball_dqn_config.py │ │ ├── parallel │ │ │ ├── gfootball_il_parallel_config.py │ │ │ └── gfootball_ppo_parallel_config.py │ │ ├── show_dataset.py │ │ └── test_accuracy.py │ ├── envs │ │ ├── __init__.py │ │ ├── action │ │ │ ├── gfootball_action.py │ │ │ └── gfootball_action_runner.py │ │ ├── fake_dataset.py │ │ ├── gfootball_academy_env.py │ │ ├── gfootball_env.py │ │ ├── gfootballsp_env.py │ │ ├── obs │ │ │ ├── encoder.py │ │ │ ├── gfootball_obs.py │ │ │ └── gfootball_obs_runner.py │ │ ├── reward │ │ │ ├── gfootball_reward.py │ │ │ └── gfootball_reward_runner.py │ │ └── tests │ │ │ ├── test_env_gfootball.py │ │ │ └── test_env_gfootball_academy.py │ ├── gfootball.gif │ ├── model │ │ ├── __init__.py │ │ ├── bots │ │ │ ├── TamakEriFever │ │ │ │ ├── config.yaml │ │ │ │ ├── football │ │ │ │ │ └── util.py │ │ │ │ ├── football_ikki.py │ │ │ │ ├── handyrl_core │ │ │ │ │ ├── model.py │ │ │ │ │ └── util.py │ │ │ │ ├── readme.md │ │ │ │ ├── submission.py │ │ │ │ └── view_test.py │ │ │ ├── __init__.py │ │ │ ├── kaggle_5th_place_model.py │ │ │ └── rule_based_bot_model.py │ │ ├── conv1d │ │ │ ├── conv1d.py │ │ │ └── conv1d_default_config.py │ │ └── q_network │ │ │ ├── football_q_network.py │ │ │ ├── football_q_network_default_config.py │ │ │ └── tests │ │ │ └── test_football_model.py │ ├── policy │ │ ├── __init__.py │ │ └── ppo_lstm.py │ └── replay.py ├── gobigger_overview.gif ├── gym_anytrading │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ └── stocks_dqn_config.py │ ├── envs │ │ ├── README.md │ │ ├── __init__.py │ │ ├── data │ │ │ └── README.md │ │ ├── position.png │ │ ├── profit.png │ │ ├── statemachine.png │ │ ├── stocks_env.py │ │ ├── test_stocks_env.py │ │ └── trading_env.py │ └── worker │ │ ├── __init__.py │ │ └── trading_serial_evaluator.py ├── gym_hybrid │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ ├── gym_hybrid_ddpg_config.py │ │ ├── gym_hybrid_hppo_config.py │ │ ├── gym_hybrid_mpdqn_config.py │ │ └── gym_hybrid_pdqn_config.py │ ├── entry │ │ ├── __init__.py │ │ ├── gym_hybrid_ddpg_eval.py │ │ └── gym_hybrid_ddpg_main.py │ ├── envs │ │ ├── README.md │ │ ├── __init__.py │ │ ├── gym-hybrid │ │ │ ├── README.md │ │ │ ├── gym_hybrid │ │ │ │ ├── __init__.py │ │ │ │ ├── agents.py │ │ │ │ ├── bg.jpg │ │ │ │ ├── environments.py │ │ │ │ └── target.png │ │ │ ├── setup.py │ │ │ └── tests │ │ │ │ ├── hardmove.py │ │ │ │ ├── moving.py │ │ │ │ ├── record.py │ │ │ │ ├── render.py │ │ │ │ └── sliding.py │ │ ├── gym_hybrid_env.py │ │ └── test_gym_hybrid_env.py │ └── moving_v0.gif ├── gym_pybullet_drones │ ├── __init__.py │ ├── config │ │ ├── flythrugate_onppo_config.py │ │ └── takeoffaviary_onppo_config.py │ ├── entry │ │ ├── flythrugate_onppo_eval.py │ │ └── takeoffaviary_onppo_eval.py │ ├── envs │ │ ├── __init__.py │ │ ├── gym_pybullet_drones_env.py │ │ ├── test_ding_env.py │ │ └── test_ori_env.py │ └── gym_pybullet_drones.gif ├── gym_soccer │ ├── __init__.py │ ├── config │ │ └── gym_soccer_pdqn_config.py │ ├── envs │ │ ├── README.md │ │ ├── __init__.py │ │ ├── gym_soccer_env.py │ │ └── test_gym_soccer_env.py │ └── half_offensive.gif ├── image_classification │ ├── __init__.py │ ├── data │ │ ├── __init__.py │ │ ├── dataset.py │ │ └── sampler.py │ ├── entry │ │ ├── imagenet_res18_config.py │ │ └── imagenet_res18_main.py │ ├── imagenet.png │ └── policy │ │ ├── __init__.py │ │ └── policy.py ├── ising_env │ ├── __init__.py │ ├── config │ │ └── ising_mfq_config.py │ ├── entry │ │ └── ising_mfq_eval.py │ ├── envs │ │ ├── __init__.py │ │ ├── ising_model │ │ │ ├── Ising.py │ │ │ ├── __init__.py │ │ │ └── multiagent │ │ │ │ ├── __init__.py │ │ │ │ ├── core.py │ │ │ │ └── environment.py │ │ ├── ising_model_env.py │ │ └── test_ising_model_env.py │ └── ising_env.gif ├── league_demo │ ├── __init__.py │ ├── demo_league.py │ ├── game_env.py │ ├── league_demo.png │ ├── league_demo_collector.py │ ├── league_demo_ppo_config.py │ ├── league_demo_ppo_main.py │ ├── selfplay_demo_ppo_config.py │ └── selfplay_demo_ppo_main.py ├── mario │ ├── __init__.py │ ├── mario.gif │ ├── mario_dqn_config.py │ ├── mario_dqn_example.py │ └── mario_dqn_main.py ├── maze │ ├── __init__.py │ ├── config │ │ ├── maze_bc_config.py │ │ └── maze_pc_config.py │ ├── entry │ │ └── maze_bc_main.py │ └── envs │ │ ├── __init__.py │ │ ├── maze_env.py │ │ └── test_maze_env.py ├── metadrive │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ ├── metadrive_onppo_config.py │ │ └── metadrive_onppo_eval_config.py │ ├── env │ │ ├── __init__.py │ │ ├── drive_env.py │ │ ├── drive_utils.py │ │ └── drive_wrapper.py │ └── metadrive_env.gif ├── minigrid │ ├── __init__.py │ ├── config │ │ ├── minigrid_dreamer_config.py │ │ ├── minigrid_icm_offppo_config.py │ │ ├── minigrid_icm_onppo_config.py │ │ ├── minigrid_ngu_config.py │ │ ├── minigrid_offppo_config.py │ │ ├── minigrid_onppo_config.py │ │ ├── minigrid_onppo_stdim_config.py │ │ ├── minigrid_r2d2_config.py │ │ └── minigrid_rnd_onppo_config.py │ ├── entry │ │ └── minigrid_onppo_main.py │ ├── envs │ │ ├── __init__.py │ │ ├── app_key_to_door_treasure.py │ │ ├── minigrid_env.py │ │ ├── minigrid_wrapper.py │ │ ├── noisy_tv.py │ │ └── test_minigrid_env.py │ ├── minigrid.gif │ └── utils │ │ └── eval.py ├── mujoco │ ├── __init__.py │ ├── addition │ │ └── install_mesa.sh │ ├── config │ │ ├── __init__.py │ │ ├── ant_ddpg_config.py │ │ ├── ant_gail_sac_config.py │ │ ├── ant_onppo_config.py │ │ ├── ant_ppo_config.py │ │ ├── ant_sac_config.py │ │ ├── ant_td3_config.py │ │ ├── ant_trex_onppo_config.py │ │ ├── ant_trex_sac_config.py │ │ ├── halfcheetah_bco_config.py │ │ ├── halfcheetah_bdq_config.py │ │ ├── halfcheetah_d4pg_config.py │ │ ├── halfcheetah_ddpg_config.py │ │ ├── halfcheetah_gail_sac_config.py │ │ ├── halfcheetah_gcl_sac_config.py │ │ ├── halfcheetah_onppo_config.py │ │ ├── halfcheetah_sac_config.py │ │ ├── halfcheetah_sqil_sac_config.py │ │ ├── halfcheetah_td3_config.py │ │ ├── halfcheetah_trex_onppo_config.py │ │ ├── halfcheetah_trex_sac_config.py │ │ ├── hopper_bco_config.py │ │ ├── hopper_bdq_config.py │ │ ├── hopper_cql_config.py │ │ ├── hopper_d4pg_config.py │ │ ├── hopper_ddpg_config.py │ │ ├── hopper_gail_sac_config.py │ │ ├── hopper_gcl_config.py │ │ ├── hopper_onppo_config.py │ │ ├── hopper_sac_config.py │ │ ├── hopper_sac_data_generation_config.py │ │ ├── hopper_sqil_sac_config.py │ │ ├── hopper_td3_bc_config.py │ │ ├── hopper_td3_config.py │ │ ├── hopper_td3_data_generation_config.py │ │ ├── hopper_trex_onppo_config.py │ │ ├── hopper_trex_sac_config.py │ │ ├── mbrl │ │ │ ├── halfcheetah_mbsac_mbpo_config.py │ │ │ ├── halfcheetah_sac_mbpo_config.py │ │ │ ├── halfcheetah_stevesac_mbpo_config.py │ │ │ ├── hopper_mbsac_mbpo_config.py │ │ │ ├── hopper_sac_mbpo_config.py │ │ │ ├── hopper_stevesac_mbpo_config.py │ │ │ ├── walker2d_mbsac_mbpo_config.py │ │ │ ├── walker2d_sac_mbpo_config.py │ │ │ └── walker2d_stevesac_mbpo_config.py │ │ ├── walker2d_d4pg_config.py │ │ ├── walker2d_ddpg_config.py │ │ ├── walker2d_gail_ddpg_config.py │ │ ├── walker2d_gail_sac_config.py │ │ ├── walker2d_gcl_config.py │ │ ├── walker2d_onppo_config.py │ │ ├── walker2d_sac_config.py │ │ ├── walker2d_sqil_sac_config.py │ │ ├── walker2d_td3_config.py │ │ ├── walker2d_trex_onppo_config.py │ │ └── walker2d_trex_sac_config.py │ ├── entry │ │ ├── __init__.py │ │ ├── mujoco_cql_generation_main.py │ │ ├── mujoco_cql_main.py │ │ ├── mujoco_d4pg_main.py │ │ ├── mujoco_ddpg_eval.py │ │ ├── mujoco_ddpg_main.py │ │ ├── mujoco_ppo_main.py │ │ └── mujoco_td3_bc_main.py │ ├── envs │ │ ├── __init__.py │ │ ├── mujoco_disc_env.py │ │ ├── mujoco_env.py │ │ ├── mujoco_gym_env.py │ │ ├── mujoco_wrappers.py │ │ └── test │ │ │ ├── test_mujoco_disc_env.py │ │ │ ├── test_mujoco_env.py │ │ │ └── test_mujoco_gym_env.py │ ├── example │ │ ├── mujoco_bc_main.py │ │ └── mujoco_sac.py │ └── mujoco.gif ├── multiagent_mujoco │ ├── README.md │ ├── __init__.py │ ├── config │ │ ├── ant_maddpg_config.py │ │ ├── ant_mappo_config.py │ │ ├── ant_masac_config.py │ │ ├── ant_matd3_config.py │ │ ├── halfcheetah_happo_config.py │ │ ├── halfcheetah_mappo_config.py │ │ └── walker2d_happo_config.py │ └── envs │ │ ├── __init__.py │ │ ├── assets │ │ ├── .gitignore │ │ ├── __init__.py │ │ ├── coupled_half_cheetah.xml │ │ ├── manyagent_ant.xml │ │ ├── manyagent_ant.xml.template │ │ ├── manyagent_ant__stage1.xml │ │ ├── manyagent_swimmer.xml.template │ │ ├── manyagent_swimmer__bckp2.xml │ │ └── manyagent_swimmer_bckp.xml │ │ ├── coupled_half_cheetah.py │ │ ├── manyagent_ant.py │ │ ├── manyagent_swimmer.py │ │ ├── mujoco_multi.py │ │ ├── multi_mujoco_env.py │ │ ├── multiagentenv.py │ │ └── obsk.py ├── overcooked │ ├── README.md │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ └── overcooked_ppo_config.py │ ├── envs │ │ ├── __init__.py │ │ ├── overcooked_env.py │ │ └── test_overcooked_env.py │ └── overcooked.gif ├── petting_zoo │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ ├── ptz_pistonball_qmix_config.py │ │ ├── ptz_simple_spread_atoc_config.py │ │ ├── ptz_simple_spread_collaq_config.py │ │ ├── ptz_simple_spread_coma_config.py │ │ ├── ptz_simple_spread_happo_config.py │ │ ├── ptz_simple_spread_maddpg_config.py │ │ ├── ptz_simple_spread_madqn_config.py │ │ ├── ptz_simple_spread_mappo_config.py │ │ ├── ptz_simple_spread_masac_config.py │ │ ├── ptz_simple_spread_qmix_config.py │ │ ├── ptz_simple_spread_qtran_config.py │ │ ├── ptz_simple_spread_vdn_config.py │ │ └── ptz_simple_spread_wqmix_config.py │ ├── entry │ │ └── ptz_simple_spread_eval.py │ ├── envs │ │ ├── __init__.py │ │ ├── petting_zoo_pistonball_env.py │ │ ├── petting_zoo_simple_spread_env.py │ │ ├── test_petting_zoo_pistonball_env.py │ │ └── test_petting_zoo_simple_spread_env.py │ └── petting_zoo_mpe_simple_spread.gif ├── pomdp │ ├── __init__.py │ ├── config │ │ ├── pomdp_dqn_config.py │ │ └── pomdp_ppo_config.py │ └── envs │ │ ├── __init__.py │ │ ├── atari_env.py │ │ ├── atari_wrappers.py │ │ └── test_atari_env.py ├── procgen │ ├── README.md │ ├── __init__.py │ ├── coinrun.gif │ ├── coinrun.png │ ├── coinrun_dqn.svg │ ├── coinrun_ppo.svg │ ├── config │ │ ├── __init__.py │ │ ├── bigfish_plr_config.py │ │ ├── bigfish_ppg_config.py │ │ ├── coinrun_dqn_config.py │ │ ├── coinrun_ppg_config.py │ │ ├── coinrun_ppo_config.py │ │ ├── maze_dqn_config.py │ │ ├── maze_ppg_config.py │ │ └── maze_ppo_config.py │ ├── entry │ │ └── coinrun_onppo_main.py │ ├── envs │ │ ├── __init__.py │ │ ├── procgen_env.py │ │ └── test_coinrun_env.py │ ├── maze.gif │ ├── maze.png │ └── maze_dqn.svg ├── pybullet │ ├── __init__.py │ ├── envs │ │ ├── __init__.py │ │ ├── pybullet_env.py │ │ └── pybullet_wrappers.py │ └── pybullet.gif ├── rocket │ ├── README.md │ ├── __init__.py │ ├── config │ │ ├── __init__.py │ │ ├── rocket_hover_ppo_config.py │ │ └── rocket_landing_ppo_config.py │ ├── entry │ │ ├── __init__.py │ │ ├── rocket_hover_onppo_main_v2.py │ │ ├── rocket_hover_ppo_main.py │ │ ├── rocket_landing_onppo_main_v2.py │ │ └── rocket_landing_ppo_main.py │ └── envs │ │ ├── __init__.py │ │ ├── rocket_env.py │ │ └── test_rocket_env.py ├── slime_volley │ ├── __init__.py │ ├── config │ │ ├── slime_volley_league_ppo_config.py │ │ └── slime_volley_ppo_config.py │ ├── entry │ │ ├── slime_volley_league_ppo_main.py │ │ └── slime_volley_selfplay_ppo_main.py │ ├── envs │ │ ├── __init__.py │ │ ├── slime_volley_env.py │ │ └── test_slime_volley_env.py │ └── slime_volley.gif ├── smac │ ├── README.md │ ├── __init__.py │ ├── config │ │ ├── smac_10m11m_mappo_config.py │ │ ├── smac_10m11m_masac_config.py │ │ ├── smac_25m_mappo_config.py │ │ ├── smac_25m_masac_config.py │ │ ├── smac_27m30m_mappo_config.py │ │ ├── smac_2c64zg_mappo_config.py │ │ ├── smac_2c64zg_masac_config.py │ │ ├── smac_2c64zg_qmix_config.py │ │ ├── smac_2s3z_qmix_config.py │ │ ├── smac_2s3z_qtran_config.py │ │ ├── smac_3m_masac_config.py │ │ ├── smac_3s5z_collaq_config.py │ │ ├── smac_3s5z_collaq_per_config.py │ │ ├── smac_3s5z_coma_config.py │ │ ├── smac_3s5z_madqn_config.py │ │ ├── smac_3s5z_mappo_config.py │ │ ├── smac_3s5z_masac_config.py │ │ ├── smac_3s5z_qmix_config.py │ │ ├── smac_3s5z_qtran_config.py │ │ ├── smac_3s5z_wqmix_config.py │ │ ├── smac_3s5zvs3s6z_madqn_config.py │ │ ├── smac_3s5zvs3s6z_mappo_config.py │ │ ├── smac_3s5zvs3s6z_masac_config.py │ │ ├── smac_5m6m_collaq_config.py │ │ ├── smac_5m6m_madqn_config.py │ │ ├── smac_5m6m_mappo_config.py │ │ ├── smac_5m6m_masac_config.py │ │ ├── smac_5m6m_qmix_config.py │ │ ├── smac_5m6m_qtran_config.py │ │ ├── smac_5m6m_wqmix_config.py │ │ ├── smac_8m9m_madqn_config.py │ │ ├── smac_8m9m_mappo_config.py │ │ ├── smac_8m9m_masac_config.py │ │ ├── smac_MMM2_collaq_config.py │ │ ├── smac_MMM2_coma_config.py │ │ ├── smac_MMM2_madqn_config.py │ │ ├── smac_MMM2_mappo_config.py │ │ ├── smac_MMM2_masac_config.py │ │ ├── smac_MMM2_qmix_config.py │ │ ├── smac_MMM2_wqmix_config.py │ │ ├── smac_MMM_collaq_config.py │ │ ├── smac_MMM_coma_config.py │ │ ├── smac_MMM_madqn_config.py │ │ ├── smac_MMM_mappo_config.py │ │ ├── smac_MMM_masac_config.py │ │ ├── smac_MMM_qmix_config.py │ │ ├── smac_MMM_qtran_config.py │ │ ├── smac_MMM_wqmix_config.py │ │ ├── smac_corridor_mappo_config.py │ │ └── smac_corridor_masac_config.py │ ├── envs │ │ ├── __init__.py │ │ ├── fake_smac_env.py │ │ ├── maps │ │ │ ├── README.md │ │ │ ├── SMAC_Maps │ │ │ │ ├── 10m_vs_11m.SC2Map │ │ │ │ ├── 1c3s5z.SC2Map │ │ │ │ ├── 25m.SC2Map │ │ │ │ ├── 27m_vs_30m.SC2Map │ │ │ │ ├── 2c_vs_64zg.SC2Map │ │ │ │ ├── 2m_vs_1z.SC2Map │ │ │ │ ├── 2s3z.SC2Map │ │ │ │ ├── 2s_vs_1sc.SC2Map │ │ │ │ ├── 3m.SC2Map │ │ │ │ ├── 3s5z.SC2Map │ │ │ │ ├── 3s5z_vs_3s6z.SC2Map │ │ │ │ ├── 3s_vs_3z.SC2Map │ │ │ │ ├── 3s_vs_4z.SC2Map │ │ │ │ ├── 3s_vs_5z.SC2Map │ │ │ │ ├── 5m_vs_6m.SC2Map │ │ │ │ ├── 6h_vs_8z.SC2Map │ │ │ │ ├── 8m.SC2Map │ │ │ │ ├── 8m_vs_9m.SC2Map │ │ │ │ ├── MMM.SC2Map │ │ │ │ ├── MMM2.SC2Map │ │ │ │ ├── __init__.py │ │ │ │ ├── bane_vs_bane.SC2Map │ │ │ │ ├── corridor.SC2Map │ │ │ │ ├── infestor_viper.SC2Map │ │ │ │ └── so_many_baneling.SC2Map │ │ │ ├── SMAC_Maps_two_player │ │ │ │ ├── 3m.SC2Map │ │ │ │ ├── 3s5z.SC2Map │ │ │ │ └── __init__.py │ │ │ └── __init__.py │ │ ├── smac_action.py │ │ ├── smac_env.py │ │ ├── smac_map.py │ │ ├── smac_reward.py │ │ └── test_smac_env.py │ ├── smac.gif │ └── utils │ │ └── eval.py ├── sokoban │ ├── __init__.py │ └── envs │ │ ├── __init__.py │ │ ├── sokoban_env.py │ │ ├── sokoban_wrappers.py │ │ └── test_sokoban_env.py ├── tabmwp │ ├── README.md │ ├── __init__.py │ ├── benchmark.png │ ├── config │ │ ├── tabmwp_awr_config.py │ │ └── tabmwp_pg_config.py │ ├── envs │ │ ├── __init__.py │ │ ├── tabmwp_env.py │ │ ├── test_tabmwp_env.py │ │ └── utils.py │ └── tabmwp.jpeg └── taxi │ ├── Taxi-v3_episode_0.gif │ ├── __init__.py │ ├── config │ ├── __init__.py │ └── taxi_dqn_config.py │ ├── entry │ └── taxi_dqn_deploy.py │ └── envs │ ├── __init__.py │ ├── taxi_env.py │ └── test_taxi_env.py ├── docker ├── Dockerfile.base ├── Dockerfile.env ├── Dockerfile.hpc └── Dockerfile.rpc ├── format.sh ├── pytest.ini └── setup.py /.coveragerc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.coveragerc -------------------------------------------------------------------------------- /.flake8: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.flake8 -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/custom.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/ISSUE_TEMPLATE/custom.md -------------------------------------------------------------------------------- /.github/PULL_REQUEST_TEMPLATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/PULL_REQUEST_TEMPLATE.md -------------------------------------------------------------------------------- /.github/workflows/algo_test.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/algo_test.yml -------------------------------------------------------------------------------- /.github/workflows/badge.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/badge.yml -------------------------------------------------------------------------------- /.github/workflows/deploy.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/deploy.yml -------------------------------------------------------------------------------- /.github/workflows/doc.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/doc.yml -------------------------------------------------------------------------------- /.github/workflows/envpool_test.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/envpool_test.yml -------------------------------------------------------------------------------- /.github/workflows/platform_test.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/platform_test.yml -------------------------------------------------------------------------------- /.github/workflows/release.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/release.yml -------------------------------------------------------------------------------- /.github/workflows/release_conda.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/release_conda.yml -------------------------------------------------------------------------------- /.github/workflows/style.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/style.yml -------------------------------------------------------------------------------- /.github/workflows/unit_test.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.github/workflows/unit_test.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.gitignore -------------------------------------------------------------------------------- /.style.yapf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/.style.yapf -------------------------------------------------------------------------------- /CHANGELOG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/CHANGELOG -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/README.md -------------------------------------------------------------------------------- /SECURITY.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/SECURITY.md -------------------------------------------------------------------------------- /assets/wechat.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/assets/wechat.jpeg -------------------------------------------------------------------------------- /cloc.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/cloc.sh -------------------------------------------------------------------------------- /codecov.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/codecov.yml -------------------------------------------------------------------------------- /conda/conda_build_config.yaml: -------------------------------------------------------------------------------- 1 | python: 2 | - 3.7 3 | -------------------------------------------------------------------------------- /conda/meta.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/conda/meta.yaml -------------------------------------------------------------------------------- /ding/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/__init__.py -------------------------------------------------------------------------------- /ding/bonus/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/__init__.py -------------------------------------------------------------------------------- /ding/bonus/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/a2c.py -------------------------------------------------------------------------------- /ding/bonus/c51.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/c51.py -------------------------------------------------------------------------------- /ding/bonus/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/common.py -------------------------------------------------------------------------------- /ding/bonus/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/config.py -------------------------------------------------------------------------------- /ding/bonus/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/ddpg.py -------------------------------------------------------------------------------- /ding/bonus/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/dqn.py -------------------------------------------------------------------------------- /ding/bonus/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/model.py -------------------------------------------------------------------------------- /ding/bonus/pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/pg.py -------------------------------------------------------------------------------- /ding/bonus/ppo_offpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/ppo_offpolicy.py -------------------------------------------------------------------------------- /ding/bonus/ppof.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/ppof.py -------------------------------------------------------------------------------- /ding/bonus/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/sac.py -------------------------------------------------------------------------------- /ding/bonus/sql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/sql.py -------------------------------------------------------------------------------- /ding/bonus/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/bonus/td3.py -------------------------------------------------------------------------------- /ding/compatibility.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/compatibility.py -------------------------------------------------------------------------------- /ding/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/__init__.py -------------------------------------------------------------------------------- /ding/config/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/config.py -------------------------------------------------------------------------------- /ding/config/example/A2C/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/A2C/__init__.py -------------------------------------------------------------------------------- /ding/config/example/C51/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/C51/__init__.py -------------------------------------------------------------------------------- /ding/config/example/DDPG/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/DDPG/__init__.py -------------------------------------------------------------------------------- /ding/config/example/DDPG/gym_hopper_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/DDPG/gym_hopper_v3.py -------------------------------------------------------------------------------- /ding/config/example/DQN/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/DQN/__init__.py -------------------------------------------------------------------------------- /ding/config/example/PG/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/PG/__init__.py -------------------------------------------------------------------------------- /ding/config/example/PG/gym_pendulum_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/PG/gym_pendulum_v1.py -------------------------------------------------------------------------------- /ding/config/example/PPOF/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/PPOF/__init__.py -------------------------------------------------------------------------------- /ding/config/example/SAC/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/SAC/__init__.py -------------------------------------------------------------------------------- /ding/config/example/SAC/gym_hopper_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/SAC/gym_hopper_v3.py -------------------------------------------------------------------------------- /ding/config/example/SQL/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/SQL/__init__.py -------------------------------------------------------------------------------- /ding/config/example/TD3/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/TD3/__init__.py -------------------------------------------------------------------------------- /ding/config/example/TD3/gym_hopper_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/TD3/gym_hopper_v3.py -------------------------------------------------------------------------------- /ding/config/example/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/example/__init__.py -------------------------------------------------------------------------------- /ding/config/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/config/utils.py -------------------------------------------------------------------------------- /ding/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/__init__.py -------------------------------------------------------------------------------- /ding/data/buffer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/__init__.py -------------------------------------------------------------------------------- /ding/data/buffer/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/buffer.py -------------------------------------------------------------------------------- /ding/data/buffer/deque_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/deque_buffer.py -------------------------------------------------------------------------------- /ding/data/buffer/deque_buffer_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/deque_buffer_wrapper.py -------------------------------------------------------------------------------- /ding/data/buffer/middleware/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/middleware/__init__.py -------------------------------------------------------------------------------- /ding/data/buffer/middleware/padding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/middleware/padding.py -------------------------------------------------------------------------------- /ding/data/buffer/middleware/priority.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/middleware/priority.py -------------------------------------------------------------------------------- /ding/data/buffer/tests/test_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/tests/test_buffer.py -------------------------------------------------------------------------------- /ding/data/buffer/tests/test_middleware.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/buffer/tests/test_middleware.py -------------------------------------------------------------------------------- /ding/data/level_replay/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/data/level_replay/level_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/level_replay/level_sampler.py -------------------------------------------------------------------------------- /ding/data/model_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/model_loader.py -------------------------------------------------------------------------------- /ding/data/shm_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/shm_buffer.py -------------------------------------------------------------------------------- /ding/data/storage/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/storage/__init__.py -------------------------------------------------------------------------------- /ding/data/storage/file.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/storage/file.py -------------------------------------------------------------------------------- /ding/data/storage/storage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/storage/storage.py -------------------------------------------------------------------------------- /ding/data/storage/tests/test_storage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/storage/tests/test_storage.py -------------------------------------------------------------------------------- /ding/data/storage_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/storage_loader.py -------------------------------------------------------------------------------- /ding/data/tests/test_model_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/tests/test_model_loader.py -------------------------------------------------------------------------------- /ding/data/tests/test_shm_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/tests/test_shm_buffer.py -------------------------------------------------------------------------------- /ding/data/tests/test_storage_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/data/tests/test_storage_loader.py -------------------------------------------------------------------------------- /ding/design/dataloader-sequence.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/dataloader-sequence.png -------------------------------------------------------------------------------- /ding/design/dataloader-sequence.puml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/dataloader-sequence.puml -------------------------------------------------------------------------------- /ding/design/env_state.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/env_state.png -------------------------------------------------------------------------------- /ding/design/parallel_main-sequence.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/parallel_main-sequence.png -------------------------------------------------------------------------------- /ding/design/parallel_main-sequence.puml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/parallel_main-sequence.puml -------------------------------------------------------------------------------- /ding/design/serial_collector-activity.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/serial_collector-activity.png -------------------------------------------------------------------------------- /ding/design/serial_evaluator-activity.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/serial_evaluator-activity.png -------------------------------------------------------------------------------- /ding/design/serial_learner-activity.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/serial_learner-activity.png -------------------------------------------------------------------------------- /ding/design/serial_learner-activity.puml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/serial_learner-activity.puml -------------------------------------------------------------------------------- /ding/design/serial_main-sequence.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/serial_main-sequence.png -------------------------------------------------------------------------------- /ding/design/serial_main.puml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/design/serial_main.puml -------------------------------------------------------------------------------- /ding/entry/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/__init__.py -------------------------------------------------------------------------------- /ding/entry/application_entry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/application_entry.py -------------------------------------------------------------------------------- /ding/entry/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/cli.py -------------------------------------------------------------------------------- /ding/entry/cli_ditask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/cli_ditask.py -------------------------------------------------------------------------------- /ding/entry/cli_parsers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/cli_parsers/__init__.py -------------------------------------------------------------------------------- /ding/entry/cli_parsers/k8s_parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/cli_parsers/k8s_parser.py -------------------------------------------------------------------------------- /ding/entry/cli_parsers/slurm_parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/cli_parsers/slurm_parser.py -------------------------------------------------------------------------------- /ding/entry/dist_entry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/dist_entry.py -------------------------------------------------------------------------------- /ding/entry/parallel_entry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/parallel_entry.py -------------------------------------------------------------------------------- /ding/entry/predefined_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/predefined_config.py -------------------------------------------------------------------------------- /ding/entry/serial_entry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_bc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_bc.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_bco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_bco.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_dqfd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_dqfd.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_gail.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_gail.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_guided_cost.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_guided_cost.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_mbrl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_mbrl.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_ngu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_ngu.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_offline.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_onpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_onpolicy.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_onpolicy_ppg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_onpolicy_ppg.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_pc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_pc.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_plr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_plr.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_r2d3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_r2d3.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_sqil.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_sqil.py -------------------------------------------------------------------------------- /ding/entry/serial_entry_td3_vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/serial_entry_td3_vae.py -------------------------------------------------------------------------------- /ding/entry/tests/config/agconfig.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/config/agconfig.yaml -------------------------------------------------------------------------------- /ding/entry/tests/config/k8s-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/config/k8s-config.yaml -------------------------------------------------------------------------------- /ding/entry/tests/test_cli_ditask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/test_cli_ditask.py -------------------------------------------------------------------------------- /ding/entry/tests/test_parallel_entry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/test_parallel_entry.py -------------------------------------------------------------------------------- /ding/entry/tests/test_random_collect.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/test_random_collect.py -------------------------------------------------------------------------------- /ding/entry/tests/test_serial_entry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/test_serial_entry.py -------------------------------------------------------------------------------- /ding/entry/tests/test_serial_entry_bc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/test_serial_entry_bc.py -------------------------------------------------------------------------------- /ding/entry/tests/test_serial_entry_bco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/tests/test_serial_entry_bco.py -------------------------------------------------------------------------------- /ding/entry/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/entry/utils.py -------------------------------------------------------------------------------- /ding/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/__init__.py -------------------------------------------------------------------------------- /ding/envs/common/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/common/__init__.py -------------------------------------------------------------------------------- /ding/envs/common/common_function.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/common/common_function.py -------------------------------------------------------------------------------- /ding/envs/common/env_element.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/common/env_element.py -------------------------------------------------------------------------------- /ding/envs/common/env_element_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/common/env_element_runner.py -------------------------------------------------------------------------------- /ding/envs/env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env/__init__.py -------------------------------------------------------------------------------- /ding/envs/env/base_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env/base_env.py -------------------------------------------------------------------------------- /ding/envs/env/default_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env/default_wrapper.py -------------------------------------------------------------------------------- /ding/envs/env/ding_env_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env/ding_env_wrapper.py -------------------------------------------------------------------------------- /ding/envs/env/env_implementation_check.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env/env_implementation_check.py -------------------------------------------------------------------------------- /ding/envs/env/tests/__init__.py: -------------------------------------------------------------------------------- 1 | from .demo_env import DemoEnv 2 | -------------------------------------------------------------------------------- /ding/envs/env/tests/demo_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env/tests/demo_env.py -------------------------------------------------------------------------------- /ding/envs/env_manager/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env_manager/__init__.py -------------------------------------------------------------------------------- /ding/envs/env_manager/base_env_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env_manager/base_env_manager.py -------------------------------------------------------------------------------- /ding/envs/env_manager/ding_env_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env_manager/ding_env_manager.py -------------------------------------------------------------------------------- /ding/envs/env_manager/env_supervisor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env_manager/env_supervisor.py -------------------------------------------------------------------------------- /ding/envs/env_manager/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/envs/env_manager/tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env_manager/tests/conftest.py -------------------------------------------------------------------------------- /ding/envs/env_manager/tests/test_shm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env_manager/tests/test_shm.py -------------------------------------------------------------------------------- /ding/envs/env_wrappers/__init__.py: -------------------------------------------------------------------------------- 1 | from .env_wrappers import * 2 | -------------------------------------------------------------------------------- /ding/envs/env_wrappers/env_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/env_wrappers/env_wrappers.py -------------------------------------------------------------------------------- /ding/envs/gym_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/envs/gym_env.py -------------------------------------------------------------------------------- /ding/example/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/example/bcq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/bcq.py -------------------------------------------------------------------------------- /ding/example/c51_nstep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/c51_nstep.py -------------------------------------------------------------------------------- /ding/example/collect_demo_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/collect_demo_data.py -------------------------------------------------------------------------------- /ding/example/cql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/cql.py -------------------------------------------------------------------------------- /ding/example/d4pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/d4pg.py -------------------------------------------------------------------------------- /ding/example/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/ddpg.py -------------------------------------------------------------------------------- /ding/example/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn.py -------------------------------------------------------------------------------- /ding/example/dqn_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_eval.py -------------------------------------------------------------------------------- /ding/example/dqn_frozen_lake.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_frozen_lake.py -------------------------------------------------------------------------------- /ding/example/dqn_her.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_her.py -------------------------------------------------------------------------------- /ding/example/dqn_new_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_new_env.py -------------------------------------------------------------------------------- /ding/example/dqn_nstep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_nstep.py -------------------------------------------------------------------------------- /ding/example/dqn_nstep_gymnasium.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_nstep_gymnasium.py -------------------------------------------------------------------------------- /ding/example/dqn_per.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_per.py -------------------------------------------------------------------------------- /ding/example/dqn_rnd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dqn_rnd.py -------------------------------------------------------------------------------- /ding/example/dt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/dt.py -------------------------------------------------------------------------------- /ding/example/edac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/edac.py -------------------------------------------------------------------------------- /ding/example/impala.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/impala.py -------------------------------------------------------------------------------- /ding/example/iqn_nstep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/iqn_nstep.py -------------------------------------------------------------------------------- /ding/example/mappo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/mappo.py -------------------------------------------------------------------------------- /ding/example/masac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/masac.py -------------------------------------------------------------------------------- /ding/example/pdqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/pdqn.py -------------------------------------------------------------------------------- /ding/example/ppg_offpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/ppg_offpolicy.py -------------------------------------------------------------------------------- /ding/example/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/ppo.py -------------------------------------------------------------------------------- /ding/example/ppo_lunarlander.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/ppo_lunarlander.py -------------------------------------------------------------------------------- /ding/example/ppo_offpolicy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/ppo_offpolicy.py -------------------------------------------------------------------------------- /ding/example/ppo_with_complex_obs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/ppo_with_complex_obs.py -------------------------------------------------------------------------------- /ding/example/qgpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/qgpo.py -------------------------------------------------------------------------------- /ding/example/qrdqn_nstep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/qrdqn_nstep.py -------------------------------------------------------------------------------- /ding/example/r2d2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/r2d2.py -------------------------------------------------------------------------------- /ding/example/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/sac.py -------------------------------------------------------------------------------- /ding/example/sqil.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/sqil.py -------------------------------------------------------------------------------- /ding/example/sqil_continuous.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/sqil_continuous.py -------------------------------------------------------------------------------- /ding/example/sql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/sql.py -------------------------------------------------------------------------------- /ding/example/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/td3.py -------------------------------------------------------------------------------- /ding/example/trex.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/example/trex.py -------------------------------------------------------------------------------- /ding/framework/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/__init__.py -------------------------------------------------------------------------------- /ding/framework/context.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/context.py -------------------------------------------------------------------------------- /ding/framework/event_loop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/event_loop.py -------------------------------------------------------------------------------- /ding/framework/message_queue/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/message_queue/__init__.py -------------------------------------------------------------------------------- /ding/framework/message_queue/mq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/message_queue/mq.py -------------------------------------------------------------------------------- /ding/framework/message_queue/nng.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/message_queue/nng.py -------------------------------------------------------------------------------- /ding/framework/message_queue/redis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/message_queue/redis.py -------------------------------------------------------------------------------- /ding/framework/middleware/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/middleware/__init__.py -------------------------------------------------------------------------------- /ding/framework/middleware/barrier.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/middleware/barrier.py -------------------------------------------------------------------------------- /ding/framework/middleware/ckpt_handler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/middleware/ckpt_handler.py -------------------------------------------------------------------------------- /ding/framework/middleware/collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/middleware/collector.py -------------------------------------------------------------------------------- /ding/framework/middleware/learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/middleware/learner.py -------------------------------------------------------------------------------- /ding/framework/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/parallel.py -------------------------------------------------------------------------------- /ding/framework/supervisor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/supervisor.py -------------------------------------------------------------------------------- /ding/framework/task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/task.py -------------------------------------------------------------------------------- /ding/framework/tests/test_context.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/tests/test_context.py -------------------------------------------------------------------------------- /ding/framework/tests/test_event_loop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/tests/test_event_loop.py -------------------------------------------------------------------------------- /ding/framework/tests/test_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/tests/test_parallel.py -------------------------------------------------------------------------------- /ding/framework/tests/test_supervisor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/tests/test_supervisor.py -------------------------------------------------------------------------------- /ding/framework/tests/test_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/tests/test_task.py -------------------------------------------------------------------------------- /ding/framework/tests/test_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/tests/test_wrapper.py -------------------------------------------------------------------------------- /ding/framework/wrapper/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/wrapper/__init__.py -------------------------------------------------------------------------------- /ding/framework/wrapper/step_timer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/framework/wrapper/step_timer.py -------------------------------------------------------------------------------- /ding/hpc_rl/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/README.md -------------------------------------------------------------------------------- /ding/hpc_rl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/__init__.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_dntd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_dntd.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_gae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_gae.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_lstm.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_ppo.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_qntd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_qntd.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_qntd_rescale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_qntd_rescale.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_scatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_scatter.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_tdlambda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_tdlambda.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_upgo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_upgo.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/test_vtrace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/test_vtrace.py -------------------------------------------------------------------------------- /ding/hpc_rl/tests/testbase.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/tests/testbase.py -------------------------------------------------------------------------------- /ding/hpc_rl/wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/hpc_rl/wrapper.py -------------------------------------------------------------------------------- /ding/interaction/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/__init__.py -------------------------------------------------------------------------------- /ding/interaction/base/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/base/__init__.py -------------------------------------------------------------------------------- /ding/interaction/base/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/base/app.py -------------------------------------------------------------------------------- /ding/interaction/base/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/base/common.py -------------------------------------------------------------------------------- /ding/interaction/base/network.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/base/network.py -------------------------------------------------------------------------------- /ding/interaction/base/threading.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/base/threading.py -------------------------------------------------------------------------------- /ding/interaction/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/config/__init__.py -------------------------------------------------------------------------------- /ding/interaction/config/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/config/base.py -------------------------------------------------------------------------------- /ding/interaction/exception/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/exception/__init__.py -------------------------------------------------------------------------------- /ding/interaction/exception/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/exception/base.py -------------------------------------------------------------------------------- /ding/interaction/exception/master.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/exception/master.py -------------------------------------------------------------------------------- /ding/interaction/exception/slave.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/exception/slave.py -------------------------------------------------------------------------------- /ding/interaction/master/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/master/__init__.py -------------------------------------------------------------------------------- /ding/interaction/master/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/master/base.py -------------------------------------------------------------------------------- /ding/interaction/master/connection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/master/connection.py -------------------------------------------------------------------------------- /ding/interaction/master/master.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/master/master.py -------------------------------------------------------------------------------- /ding/interaction/master/task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/master/task.py -------------------------------------------------------------------------------- /ding/interaction/slave/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/slave/__init__.py -------------------------------------------------------------------------------- /ding/interaction/slave/action.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/slave/action.py -------------------------------------------------------------------------------- /ding/interaction/slave/slave.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/slave/slave.py -------------------------------------------------------------------------------- /ding/interaction/tests/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/tests/__init__.py -------------------------------------------------------------------------------- /ding/interaction/tests/base/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/tests/base/__init__.py -------------------------------------------------------------------------------- /ding/interaction/tests/base/test_app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/interaction/tests/base/test_app.py -------------------------------------------------------------------------------- /ding/interaction/tests/config/__init__.py: -------------------------------------------------------------------------------- 1 | from .test_base import TestInteractionConfig 2 | -------------------------------------------------------------------------------- /ding/league/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/__init__.py -------------------------------------------------------------------------------- /ding/league/algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/algorithm.py -------------------------------------------------------------------------------- /ding/league/base_league.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/base_league.py -------------------------------------------------------------------------------- /ding/league/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/metric.py -------------------------------------------------------------------------------- /ding/league/one_vs_one_league.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/one_vs_one_league.py -------------------------------------------------------------------------------- /ding/league/player.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/player.py -------------------------------------------------------------------------------- /ding/league/shared_payoff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/shared_payoff.py -------------------------------------------------------------------------------- /ding/league/starcraft_player.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/starcraft_player.py -------------------------------------------------------------------------------- /ding/league/tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/tests/conftest.py -------------------------------------------------------------------------------- /ding/league/tests/test_league_metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/tests/test_league_metric.py -------------------------------------------------------------------------------- /ding/league/tests/test_payoff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/tests/test_payoff.py -------------------------------------------------------------------------------- /ding/league/tests/test_player.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/league/tests/test_player.py -------------------------------------------------------------------------------- /ding/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/__init__.py -------------------------------------------------------------------------------- /ding/model/common/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/common/__init__.py -------------------------------------------------------------------------------- /ding/model/common/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/common/encoder.py -------------------------------------------------------------------------------- /ding/model/common/head.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/common/head.py -------------------------------------------------------------------------------- /ding/model/common/tests/test_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/common/tests/test_encoder.py -------------------------------------------------------------------------------- /ding/model/common/tests/test_head.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/common/tests/test_head.py -------------------------------------------------------------------------------- /ding/model/common/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/common/utils.py -------------------------------------------------------------------------------- /ding/model/template/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/__init__.py -------------------------------------------------------------------------------- /ding/model/template/acer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/acer.py -------------------------------------------------------------------------------- /ding/model/template/atoc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/atoc.py -------------------------------------------------------------------------------- /ding/model/template/bc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/bc.py -------------------------------------------------------------------------------- /ding/model/template/bcq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/bcq.py -------------------------------------------------------------------------------- /ding/model/template/collaq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/collaq.py -------------------------------------------------------------------------------- /ding/model/template/coma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/coma.py -------------------------------------------------------------------------------- /ding/model/template/diffusion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/diffusion.py -------------------------------------------------------------------------------- /ding/model/template/ebm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/ebm.py -------------------------------------------------------------------------------- /ding/model/template/edac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/edac.py -------------------------------------------------------------------------------- /ding/model/template/havac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/havac.py -------------------------------------------------------------------------------- /ding/model/template/hpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/hpt.py -------------------------------------------------------------------------------- /ding/model/template/madqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/madqn.py -------------------------------------------------------------------------------- /ding/model/template/maqac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/maqac.py -------------------------------------------------------------------------------- /ding/model/template/mavac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/mavac.py -------------------------------------------------------------------------------- /ding/model/template/ngu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/ngu.py -------------------------------------------------------------------------------- /ding/model/template/pdqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/pdqn.py -------------------------------------------------------------------------------- /ding/model/template/pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/pg.py -------------------------------------------------------------------------------- /ding/model/template/ppg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/ppg.py -------------------------------------------------------------------------------- /ding/model/template/q_learning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/q_learning.py -------------------------------------------------------------------------------- /ding/model/template/qac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/qac.py -------------------------------------------------------------------------------- /ding/model/template/qac_dist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/qac_dist.py -------------------------------------------------------------------------------- /ding/model/template/qgpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/qgpo.py -------------------------------------------------------------------------------- /ding/model/template/qmix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/qmix.py -------------------------------------------------------------------------------- /ding/model/template/qtran.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/qtran.py -------------------------------------------------------------------------------- /ding/model/template/qvac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/qvac.py -------------------------------------------------------------------------------- /ding/model/template/sqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/sqn.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_acer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_acer.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_atoc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_atoc.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_bc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_bc.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_bcq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_bcq.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_ebm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_ebm.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_edac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_edac.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_havac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_havac.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_hpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_hpt.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_madqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_madqn.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_maqac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_maqac.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_mavac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_mavac.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_ngu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_ngu.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_pdqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_pdqn.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_pg.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_qac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_qac.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_qmix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_qmix.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_qtran.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_qtran.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_vac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_vac.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_vae.py -------------------------------------------------------------------------------- /ding/model/template/tests/test_wqmix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/tests/test_wqmix.py -------------------------------------------------------------------------------- /ding/model/template/vac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/vac.py -------------------------------------------------------------------------------- /ding/model/template/vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/vae.py -------------------------------------------------------------------------------- /ding/model/template/wqmix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/template/wqmix.py -------------------------------------------------------------------------------- /ding/model/wrapper/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/wrapper/__init__.py -------------------------------------------------------------------------------- /ding/model/wrapper/model_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/model/wrapper/model_wrappers.py -------------------------------------------------------------------------------- /ding/policy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/__init__.py -------------------------------------------------------------------------------- /ding/policy/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/a2c.py -------------------------------------------------------------------------------- /ding/policy/acer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/acer.py -------------------------------------------------------------------------------- /ding/policy/atoc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/atoc.py -------------------------------------------------------------------------------- /ding/policy/base_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/base_policy.py -------------------------------------------------------------------------------- /ding/policy/bc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/bc.py -------------------------------------------------------------------------------- /ding/policy/bcq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/bcq.py -------------------------------------------------------------------------------- /ding/policy/bdq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/bdq.py -------------------------------------------------------------------------------- /ding/policy/c51.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/c51.py -------------------------------------------------------------------------------- /ding/policy/collaq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/collaq.py -------------------------------------------------------------------------------- /ding/policy/coma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/coma.py -------------------------------------------------------------------------------- /ding/policy/common_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/common_utils.py -------------------------------------------------------------------------------- /ding/policy/cql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/cql.py -------------------------------------------------------------------------------- /ding/policy/d4pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/d4pg.py -------------------------------------------------------------------------------- /ding/policy/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/ddpg.py -------------------------------------------------------------------------------- /ding/policy/dqfd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/dqfd.py -------------------------------------------------------------------------------- /ding/policy/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/dqn.py -------------------------------------------------------------------------------- /ding/policy/dt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/dt.py -------------------------------------------------------------------------------- /ding/policy/edac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/edac.py -------------------------------------------------------------------------------- /ding/policy/fqf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/fqf.py -------------------------------------------------------------------------------- /ding/policy/happo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/happo.py -------------------------------------------------------------------------------- /ding/policy/ibc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/ibc.py -------------------------------------------------------------------------------- /ding/policy/il.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/il.py -------------------------------------------------------------------------------- /ding/policy/impala.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/impala.py -------------------------------------------------------------------------------- /ding/policy/iql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/iql.py -------------------------------------------------------------------------------- /ding/policy/iqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/iqn.py -------------------------------------------------------------------------------- /ding/policy/madqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/madqn.py -------------------------------------------------------------------------------- /ding/policy/mbpolicy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/mbpolicy/__init__.py -------------------------------------------------------------------------------- /ding/policy/mbpolicy/dreamer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/mbpolicy/dreamer.py -------------------------------------------------------------------------------- /ding/policy/mbpolicy/mbsac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/mbpolicy/mbsac.py -------------------------------------------------------------------------------- /ding/policy/mbpolicy/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/mbpolicy/utils.py -------------------------------------------------------------------------------- /ding/policy/mdqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/mdqn.py -------------------------------------------------------------------------------- /ding/policy/ngu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/ngu.py -------------------------------------------------------------------------------- /ding/policy/offppo_collect_traj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/offppo_collect_traj.py -------------------------------------------------------------------------------- /ding/policy/pc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/pc.py -------------------------------------------------------------------------------- /ding/policy/pdqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/pdqn.py -------------------------------------------------------------------------------- /ding/policy/pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/pg.py -------------------------------------------------------------------------------- /ding/policy/plan_diffuser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/plan_diffuser.py -------------------------------------------------------------------------------- /ding/policy/policy_factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/policy_factory.py -------------------------------------------------------------------------------- /ding/policy/ppg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/ppg.py -------------------------------------------------------------------------------- /ding/policy/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/ppo.py -------------------------------------------------------------------------------- /ding/policy/ppof.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/ppof.py -------------------------------------------------------------------------------- /ding/policy/prompt_awr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/prompt_awr.py -------------------------------------------------------------------------------- /ding/policy/prompt_pg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/prompt_pg.py -------------------------------------------------------------------------------- /ding/policy/qgpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/qgpo.py -------------------------------------------------------------------------------- /ding/policy/qmix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/qmix.py -------------------------------------------------------------------------------- /ding/policy/qrdqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/qrdqn.py -------------------------------------------------------------------------------- /ding/policy/qtran.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/qtran.py -------------------------------------------------------------------------------- /ding/policy/r2d2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/r2d2.py -------------------------------------------------------------------------------- /ding/policy/r2d2_collect_traj.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/r2d2_collect_traj.py -------------------------------------------------------------------------------- /ding/policy/r2d2_gtrxl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/r2d2_gtrxl.py -------------------------------------------------------------------------------- /ding/policy/r2d3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/r2d3.py -------------------------------------------------------------------------------- /ding/policy/rainbow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/rainbow.py -------------------------------------------------------------------------------- /ding/policy/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/sac.py -------------------------------------------------------------------------------- /ding/policy/sql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/sql.py -------------------------------------------------------------------------------- /ding/policy/sqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/sqn.py -------------------------------------------------------------------------------- /ding/policy/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/td3.py -------------------------------------------------------------------------------- /ding/policy/td3_bc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/td3_bc.py -------------------------------------------------------------------------------- /ding/policy/td3_vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/td3_vae.py -------------------------------------------------------------------------------- /ding/policy/tests/test_common_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/tests/test_common_utils.py -------------------------------------------------------------------------------- /ding/policy/tests/test_cql.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/tests/test_cql.py -------------------------------------------------------------------------------- /ding/policy/tests/test_r2d3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/tests/test_r2d3.py -------------------------------------------------------------------------------- /ding/policy/tests/test_stdim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/tests/test_stdim.py -------------------------------------------------------------------------------- /ding/policy/wqmix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/policy/wqmix.py -------------------------------------------------------------------------------- /ding/reward_model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/__init__.py -------------------------------------------------------------------------------- /ding/reward_model/base_reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/base_reward_model.py -------------------------------------------------------------------------------- /ding/reward_model/drex_reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/drex_reward_model.py -------------------------------------------------------------------------------- /ding/reward_model/gail_irl_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/gail_irl_model.py -------------------------------------------------------------------------------- /ding/reward_model/her_reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/her_reward_model.py -------------------------------------------------------------------------------- /ding/reward_model/icm_reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/icm_reward_model.py -------------------------------------------------------------------------------- /ding/reward_model/ngu_reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/ngu_reward_model.py -------------------------------------------------------------------------------- /ding/reward_model/pdeil_irl_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/pdeil_irl_model.py -------------------------------------------------------------------------------- /ding/reward_model/pwil_irl_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/pwil_irl_model.py -------------------------------------------------------------------------------- /ding/reward_model/red_irl_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/red_irl_model.py -------------------------------------------------------------------------------- /ding/reward_model/rnd_reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/rnd_reward_model.py -------------------------------------------------------------------------------- /ding/reward_model/trex_reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/reward_model/trex_reward_model.py -------------------------------------------------------------------------------- /ding/rl_utils/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/README.md -------------------------------------------------------------------------------- /ding/rl_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/__init__.py -------------------------------------------------------------------------------- /ding/rl_utils/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/a2c.py -------------------------------------------------------------------------------- /ding/rl_utils/acer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/acer.py -------------------------------------------------------------------------------- /ding/rl_utils/adder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/adder.py -------------------------------------------------------------------------------- /ding/rl_utils/beta_function.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/beta_function.py -------------------------------------------------------------------------------- /ding/rl_utils/coma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/coma.py -------------------------------------------------------------------------------- /ding/rl_utils/exploration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/exploration.py -------------------------------------------------------------------------------- /ding/rl_utils/gae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/gae.py -------------------------------------------------------------------------------- /ding/rl_utils/grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/grpo.py -------------------------------------------------------------------------------- /ding/rl_utils/happo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/happo.py -------------------------------------------------------------------------------- /ding/rl_utils/isw.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/isw.py -------------------------------------------------------------------------------- /ding/rl_utils/log_prob_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/log_prob_utils.py -------------------------------------------------------------------------------- /ding/rl_utils/ppg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/ppg.py -------------------------------------------------------------------------------- /ding/rl_utils/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/ppo.py -------------------------------------------------------------------------------- /ding/rl_utils/retrace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/retrace.py -------------------------------------------------------------------------------- /ding/rl_utils/rloo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/rloo.py -------------------------------------------------------------------------------- /ding/rl_utils/sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/sampler.py -------------------------------------------------------------------------------- /ding/rl_utils/td.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/td.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_a2c.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_adder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_adder.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_coma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_coma.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_exploration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_exploration.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_gae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_gae.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_grpo_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_grpo_rlhf.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_happo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_happo.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_log_prob_fn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_log_prob_fn.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_ppg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_ppg.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_ppo.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_ppo_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_ppo_rlhf.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_retrace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_retrace.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_rloo_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_rloo_rlhf.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_td.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_td.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_upgo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_upgo.py -------------------------------------------------------------------------------- /ding/rl_utils/tests/test_vtrace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/tests/test_vtrace.py -------------------------------------------------------------------------------- /ding/rl_utils/upgo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/upgo.py -------------------------------------------------------------------------------- /ding/rl_utils/value_rescale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/value_rescale.py -------------------------------------------------------------------------------- /ding/rl_utils/vtrace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/rl_utils/vtrace.py -------------------------------------------------------------------------------- /ding/scripts/dijob-qbert.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/scripts/dijob-qbert.yaml -------------------------------------------------------------------------------- /ding/scripts/docker-test-entry.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/scripts/docker-test-entry.sh -------------------------------------------------------------------------------- /ding/scripts/docker-test.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/scripts/docker-test.sh -------------------------------------------------------------------------------- /ding/scripts/install-k8s-tools.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/scripts/install-k8s-tools.sh -------------------------------------------------------------------------------- /ding/scripts/kill.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/scripts/kill.sh -------------------------------------------------------------------------------- /ding/scripts/local_parallel.sh: -------------------------------------------------------------------------------- 1 | ding -m parallel -c $1 -s $2 2 | -------------------------------------------------------------------------------- /ding/scripts/local_serial.sh: -------------------------------------------------------------------------------- 1 | ding -m serial -c $1 -s $2 2 | -------------------------------------------------------------------------------- /ding/scripts/main_league.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/scripts/main_league.sh -------------------------------------------------------------------------------- /ding/scripts/main_league_slurm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/scripts/main_league_slurm.sh -------------------------------------------------------------------------------- /ding/torch_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/__init__.py -------------------------------------------------------------------------------- /ding/torch_utils/backend_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/backend_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/checkpoint_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/checkpoint_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/data_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/data_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/dataparallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/dataparallel.py -------------------------------------------------------------------------------- /ding/torch_utils/diffusion_SDE/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/torch_utils/distribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/distribution.py -------------------------------------------------------------------------------- /ding/torch_utils/loss/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/loss/__init__.py -------------------------------------------------------------------------------- /ding/torch_utils/lr_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/lr_scheduler.py -------------------------------------------------------------------------------- /ding/torch_utils/math_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/math_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/metric.py -------------------------------------------------------------------------------- /ding/torch_utils/model_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/model_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/network/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/__init__.py -------------------------------------------------------------------------------- /ding/torch_utils/network/activation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/activation.py -------------------------------------------------------------------------------- /ding/torch_utils/network/diffusion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/diffusion.py -------------------------------------------------------------------------------- /ding/torch_utils/network/dreamer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/dreamer.py -------------------------------------------------------------------------------- /ding/torch_utils/network/gtrxl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/gtrxl.py -------------------------------------------------------------------------------- /ding/torch_utils/network/merge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/merge.py -------------------------------------------------------------------------------- /ding/torch_utils/network/nn_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/nn_module.py -------------------------------------------------------------------------------- /ding/torch_utils/network/popart.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/popart.py -------------------------------------------------------------------------------- /ding/torch_utils/network/res_block.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/res_block.py -------------------------------------------------------------------------------- /ding/torch_utils/network/resnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/resnet.py -------------------------------------------------------------------------------- /ding/torch_utils/network/rnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/rnn.py -------------------------------------------------------------------------------- /ding/torch_utils/network/soft_argmax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/soft_argmax.py -------------------------------------------------------------------------------- /ding/torch_utils/network/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/network/transformer.py -------------------------------------------------------------------------------- /ding/torch_utils/nn_test_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/nn_test_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/optimizer_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/optimizer_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/parameter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/parameter.py -------------------------------------------------------------------------------- /ding/torch_utils/reshape_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/reshape_helper.py -------------------------------------------------------------------------------- /ding/torch_utils/tests/test_metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/torch_utils/tests/test_metric.py -------------------------------------------------------------------------------- /ding/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/__init__.py -------------------------------------------------------------------------------- /ding/utils/autolog/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/__init__.py -------------------------------------------------------------------------------- /ding/utils/autolog/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/base.py -------------------------------------------------------------------------------- /ding/utils/autolog/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/data.py -------------------------------------------------------------------------------- /ding/utils/autolog/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/model.py -------------------------------------------------------------------------------- /ding/utils/autolog/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/utils/autolog/tests/test_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/tests/test_data.py -------------------------------------------------------------------------------- /ding/utils/autolog/tests/test_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/tests/test_model.py -------------------------------------------------------------------------------- /ding/utils/autolog/tests/test_time.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/tests/test_time.py -------------------------------------------------------------------------------- /ding/utils/autolog/time_ctl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/time_ctl.py -------------------------------------------------------------------------------- /ding/utils/autolog/value.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/autolog/value.py -------------------------------------------------------------------------------- /ding/utils/bfs_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/bfs_helper.py -------------------------------------------------------------------------------- /ding/utils/collection_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/collection_helper.py -------------------------------------------------------------------------------- /ding/utils/compression_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/compression_helper.py -------------------------------------------------------------------------------- /ding/utils/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/__init__.py -------------------------------------------------------------------------------- /ding/utils/data/base_dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/base_dataloader.py -------------------------------------------------------------------------------- /ding/utils/data/collate_fn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/collate_fn.py -------------------------------------------------------------------------------- /ding/utils/data/dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/dataloader.py -------------------------------------------------------------------------------- /ding/utils/data/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/dataset.py -------------------------------------------------------------------------------- /ding/utils/data/rlhf_offline_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/rlhf_offline_dataset.py -------------------------------------------------------------------------------- /ding/utils/data/rlhf_online_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/rlhf_online_dataset.py -------------------------------------------------------------------------------- /ding/utils/data/structure/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/structure/__init__.py -------------------------------------------------------------------------------- /ding/utils/data/structure/cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/structure/cache.py -------------------------------------------------------------------------------- /ding/utils/data/structure/lifo_deque.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/structure/lifo_deque.py -------------------------------------------------------------------------------- /ding/utils/data/tests/test_cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/tests/test_cache.py -------------------------------------------------------------------------------- /ding/utils/data/tests/test_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/data/tests/test_dataset.py -------------------------------------------------------------------------------- /ding/utils/default_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/default_helper.py -------------------------------------------------------------------------------- /ding/utils/deprecation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/deprecation.py -------------------------------------------------------------------------------- /ding/utils/design_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/design_helper.py -------------------------------------------------------------------------------- /ding/utils/dict_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/dict_helper.py -------------------------------------------------------------------------------- /ding/utils/fake_linklink.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/fake_linklink.py -------------------------------------------------------------------------------- /ding/utils/fast_copy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/fast_copy.py -------------------------------------------------------------------------------- /ding/utils/file_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/file_helper.py -------------------------------------------------------------------------------- /ding/utils/import_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/import_helper.py -------------------------------------------------------------------------------- /ding/utils/k8s_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/k8s_helper.py -------------------------------------------------------------------------------- /ding/utils/linklink_dist_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/linklink_dist_helper.py -------------------------------------------------------------------------------- /ding/utils/loader/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/__init__.py -------------------------------------------------------------------------------- /ding/utils/loader/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/base.py -------------------------------------------------------------------------------- /ding/utils/loader/collection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/collection.py -------------------------------------------------------------------------------- /ding/utils/loader/dict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/dict.py -------------------------------------------------------------------------------- /ding/utils/loader/exception.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/exception.py -------------------------------------------------------------------------------- /ding/utils/loader/mapping.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/mapping.py -------------------------------------------------------------------------------- /ding/utils/loader/norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/norm.py -------------------------------------------------------------------------------- /ding/utils/loader/number.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/number.py -------------------------------------------------------------------------------- /ding/utils/loader/string.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/string.py -------------------------------------------------------------------------------- /ding/utils/loader/tests/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/tests/__init__.py -------------------------------------------------------------------------------- /ding/utils/loader/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/types.py -------------------------------------------------------------------------------- /ding/utils/loader/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/loader/utils.py -------------------------------------------------------------------------------- /ding/utils/lock_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/lock_helper.py -------------------------------------------------------------------------------- /ding/utils/log_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/log_helper.py -------------------------------------------------------------------------------- /ding/utils/log_writer_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/log_writer_helper.py -------------------------------------------------------------------------------- /ding/utils/memory_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/memory_helper.py -------------------------------------------------------------------------------- /ding/utils/normalizer_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/normalizer_helper.py -------------------------------------------------------------------------------- /ding/utils/orchestrator_launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/orchestrator_launcher.py -------------------------------------------------------------------------------- /ding/utils/profiler_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/profiler_helper.py -------------------------------------------------------------------------------- /ding/utils/pytorch_ddp_dist_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/pytorch_ddp_dist_helper.py -------------------------------------------------------------------------------- /ding/utils/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/registry.py -------------------------------------------------------------------------------- /ding/utils/registry_factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/registry_factory.py -------------------------------------------------------------------------------- /ding/utils/render_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/render_helper.py -------------------------------------------------------------------------------- /ding/utils/scheduler_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/scheduler_helper.py -------------------------------------------------------------------------------- /ding/utils/segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/segment_tree.py -------------------------------------------------------------------------------- /ding/utils/slurm_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/slurm_helper.py -------------------------------------------------------------------------------- /ding/utils/system_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/system_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/config/k8s-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/config/k8s-config.yaml -------------------------------------------------------------------------------- /ding/utils/tests/test_bfs_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_bfs_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_config_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_config_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_default_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_default_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_deprecation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_deprecation.py -------------------------------------------------------------------------------- /ding/utils/tests/test_design_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_design_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_file_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_file_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_import_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_import_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_k8s_launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_k8s_launcher.py -------------------------------------------------------------------------------- /ding/utils/tests/test_lock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_lock.py -------------------------------------------------------------------------------- /ding/utils/tests/test_log_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_log_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_memory_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_memory_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_registry.py -------------------------------------------------------------------------------- /ding/utils/tests/test_segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_segment_tree.py -------------------------------------------------------------------------------- /ding/utils/tests/test_system_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_system_helper.py -------------------------------------------------------------------------------- /ding/utils/tests/test_time_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/tests/test_time_helper.py -------------------------------------------------------------------------------- /ding/utils/time_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/time_helper.py -------------------------------------------------------------------------------- /ding/utils/time_helper_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/time_helper_base.py -------------------------------------------------------------------------------- /ding/utils/time_helper_cuda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/time_helper_cuda.py -------------------------------------------------------------------------------- /ding/utils/type_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/utils/type_helper.py -------------------------------------------------------------------------------- /ding/worker/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/__init__.py -------------------------------------------------------------------------------- /ding/worker/adapter/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/adapter/__init__.py -------------------------------------------------------------------------------- /ding/worker/collector/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/collector/__init__.py -------------------------------------------------------------------------------- /ding/worker/collector/comm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/collector/comm/__init__.py -------------------------------------------------------------------------------- /ding/worker/collector/comm/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/collector/comm/utils.py -------------------------------------------------------------------------------- /ding/worker/collector/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/worker/collector/tests/speed_test/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/worker/coordinator/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/coordinator/__init__.py -------------------------------------------------------------------------------- /ding/worker/coordinator/coordinator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/coordinator/coordinator.py -------------------------------------------------------------------------------- /ding/worker/learner/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/learner/__init__.py -------------------------------------------------------------------------------- /ding/worker/learner/base_learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/learner/base_learner.py -------------------------------------------------------------------------------- /ding/worker/learner/comm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/learner/comm/__init__.py -------------------------------------------------------------------------------- /ding/worker/learner/comm/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/learner/comm/utils.py -------------------------------------------------------------------------------- /ding/worker/learner/learner_hook.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/learner/learner_hook.py -------------------------------------------------------------------------------- /ding/worker/replay_buffer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/replay_buffer/__init__.py -------------------------------------------------------------------------------- /ding/worker/replay_buffer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/worker/replay_buffer/utils.py -------------------------------------------------------------------------------- /ding/world_model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/__init__.py -------------------------------------------------------------------------------- /ding/world_model/base_world_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/base_world_model.py -------------------------------------------------------------------------------- /ding/world_model/ddppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/ddppo.py -------------------------------------------------------------------------------- /ding/world_model/dreamer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/dreamer.py -------------------------------------------------------------------------------- /ding/world_model/idm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/idm.py -------------------------------------------------------------------------------- /ding/world_model/mbpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/mbpo.py -------------------------------------------------------------------------------- /ding/world_model/model/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ding/world_model/model/ensemble.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/model/ensemble.py -------------------------------------------------------------------------------- /ding/world_model/model/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/model/networks.py -------------------------------------------------------------------------------- /ding/world_model/tests/test_ddppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/tests/test_ddppo.py -------------------------------------------------------------------------------- /ding/world_model/tests/test_idm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/tests/test_idm.py -------------------------------------------------------------------------------- /ding/world_model/tests/test_mbpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/tests/test_mbpo.py -------------------------------------------------------------------------------- /ding/world_model/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/ding/world_model/utils.py -------------------------------------------------------------------------------- /dizoo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/atari/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/atari/atari.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/atari.gif -------------------------------------------------------------------------------- /dizoo/atari/config/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/atari/config/serial/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/config/serial/__init__.py -------------------------------------------------------------------------------- /dizoo/atari/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/atari/entry/atari_dqn_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/atari_dqn_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/atari_dt_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/atari_dt_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/atari_impala_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/atari_impala_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/atari_ppg_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/atari_ppg_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/phoenix_fqf_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/phoenix_fqf_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/phoenix_iqn_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/phoenix_iqn_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/pong_cql_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/pong_cql_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/pong_fqf_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/pong_fqf_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/qbert_cql_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/qbert_cql_main.py -------------------------------------------------------------------------------- /dizoo/atari/entry/qbert_fqf_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/entry/qbert_fqf_main.py -------------------------------------------------------------------------------- /dizoo/atari/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/atari/envs/atari_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/envs/atari_env.py -------------------------------------------------------------------------------- /dizoo/atari/envs/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/envs/atari_wrappers.py -------------------------------------------------------------------------------- /dizoo/atari/envs/test_atari_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/envs/test_atari_env.py -------------------------------------------------------------------------------- /dizoo/atari/example/atari_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/example/atari_dqn.py -------------------------------------------------------------------------------- /dizoo/atari/example/atari_dqn_ddp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/example/atari_dqn_ddp.py -------------------------------------------------------------------------------- /dizoo/atari/example/atari_dqn_dist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/example/atari_dqn_dist.py -------------------------------------------------------------------------------- /dizoo/atari/example/atari_dqn_dp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/example/atari_dqn_dp.py -------------------------------------------------------------------------------- /dizoo/atari/example/atari_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/example/atari_ppo.py -------------------------------------------------------------------------------- /dizoo/atari/example/atari_ppo_ddp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/atari/example/atari_ppo_ddp.py -------------------------------------------------------------------------------- /dizoo/beergame/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/beergame/beergame.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/beergame.png -------------------------------------------------------------------------------- /dizoo/beergame/entry/beergame_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/entry/beergame_eval.py -------------------------------------------------------------------------------- /dizoo/beergame/envs/BGAgent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/envs/BGAgent.py -------------------------------------------------------------------------------- /dizoo/beergame/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/beergame/envs/beergame_core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/envs/beergame_core.py -------------------------------------------------------------------------------- /dizoo/beergame/envs/beergame_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/envs/beergame_env.py -------------------------------------------------------------------------------- /dizoo/beergame/envs/clBeergame.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/envs/clBeergame.py -------------------------------------------------------------------------------- /dizoo/beergame/envs/plotting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/envs/plotting.py -------------------------------------------------------------------------------- /dizoo/beergame/envs/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/beergame/envs/utils.py -------------------------------------------------------------------------------- /dizoo/bitflip/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bitflip/README.md -------------------------------------------------------------------------------- /dizoo/bitflip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/bitflip/bitflip.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bitflip/bitflip.gif -------------------------------------------------------------------------------- /dizoo/bitflip/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bitflip/config/__init__.py -------------------------------------------------------------------------------- /dizoo/bitflip/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/bitflip/entry/bitflip_dqn_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bitflip/entry/bitflip_dqn_main.py -------------------------------------------------------------------------------- /dizoo/bitflip/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .bitflip_env import BitFlipEnv 2 | -------------------------------------------------------------------------------- /dizoo/bitflip/envs/bitflip_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bitflip/envs/bitflip_env.py -------------------------------------------------------------------------------- /dizoo/bitflip/envs/test_bitfilp_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bitflip/envs/test_bitfilp_env.py -------------------------------------------------------------------------------- /dizoo/box2d/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/box2d/bipedalwalker/__init__.py: -------------------------------------------------------------------------------- 1 | from dizoo.box2d.bipedalwalker.config import * 2 | -------------------------------------------------------------------------------- /dizoo/box2d/bipedalwalker/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/box2d/bipedalwalker/original.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/box2d/bipedalwalker/original.gif -------------------------------------------------------------------------------- /dizoo/box2d/carracing/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/box2d/carracing/car_racing.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/box2d/carracing/car_racing.gif -------------------------------------------------------------------------------- /dizoo/box2d/carracing/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/box2d/carracing/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/box2d/lunarlander/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/box2d/lunarlander/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/box2d/lunarlander/lunarlander.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/box2d/lunarlander/lunarlander.gif -------------------------------------------------------------------------------- /dizoo/bsuite/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/bsuite/bsuite.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bsuite/bsuite.png -------------------------------------------------------------------------------- /dizoo/bsuite/config/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /dizoo/bsuite/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .bsuite_env import BSuiteEnv 2 | -------------------------------------------------------------------------------- /dizoo/bsuite/envs/bsuite_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bsuite/envs/bsuite_env.py -------------------------------------------------------------------------------- /dizoo/bsuite/envs/test_bsuite_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/bsuite/envs/test_bsuite_env.py -------------------------------------------------------------------------------- /dizoo/classic_control/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/classic_control/acrobot/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/classic_control/acrobot/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .acrobot_env import AcroBotEnv 2 | -------------------------------------------------------------------------------- /dizoo/classic_control/cartpole/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/classic_control/cartpole/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/classic_control/mountain_car/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/classic_control/mountain_car/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .mtcar_env import MountainCarEnv 2 | -------------------------------------------------------------------------------- /dizoo/classic_control/pendulum/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/classic_control/pendulum/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/cliffwalking/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/cliffwalking/cliff_walking.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/cliffwalking/cliff_walking.gif -------------------------------------------------------------------------------- /dizoo/cliffwalking/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/cliffwalking/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/common/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/common/policy/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/common/policy/md_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/common/policy/md_dqn.py -------------------------------------------------------------------------------- /dizoo/common/policy/md_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/common/policy/md_ppo.py -------------------------------------------------------------------------------- /dizoo/common/policy/md_rainbow_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/common/policy/md_rainbow_dqn.py -------------------------------------------------------------------------------- /dizoo/competitive_rl/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/competitive_rl/README.md -------------------------------------------------------------------------------- /dizoo/competitive_rl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/competitive_rl/competitive_rl.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/competitive_rl/competitive_rl.gif -------------------------------------------------------------------------------- /dizoo/competitive_rl/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/competitive_rl/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/d4rl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/d4rl/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/config/__init__.py -------------------------------------------------------------------------------- /dizoo/d4rl/d4rl.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/d4rl.gif -------------------------------------------------------------------------------- /dizoo/d4rl/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_bcq_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_bcq_main.py -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_cql_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_cql_main.py -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_dt_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_dt_mujoco.py -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_edac_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_edac_main.py -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_ibc_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_ibc_main.py -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_iql_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_iql_main.py -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_pd_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_pd_main.py -------------------------------------------------------------------------------- /dizoo/d4rl/entry/d4rl_td3_bc_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/entry/d4rl_td3_bc_main.py -------------------------------------------------------------------------------- /dizoo/d4rl/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .d4rl_env import D4RLEnv 2 | -------------------------------------------------------------------------------- /dizoo/d4rl/envs/d4rl_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/envs/d4rl_env.py -------------------------------------------------------------------------------- /dizoo/d4rl/envs/d4rl_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/d4rl/envs/d4rl_wrappers.py -------------------------------------------------------------------------------- /dizoo/dmc2gym/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/dmc2gym/dmc2gym_cheetah.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/dmc2gym/dmc2gym_cheetah.png -------------------------------------------------------------------------------- /dizoo/dmc2gym/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .dmc2gym_env import DMC2GymEnv 2 | -------------------------------------------------------------------------------- /dizoo/dmc2gym/envs/dmc2gym_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/dmc2gym/envs/dmc2gym_env.py -------------------------------------------------------------------------------- /dizoo/dmc2gym/envs/test_dmc2gym_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/dmc2gym/envs/test_dmc2gym_env.py -------------------------------------------------------------------------------- /dizoo/evogym/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/evogym/entry/walker_ppo_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/evogym/entry/walker_ppo_eval.py -------------------------------------------------------------------------------- /dizoo/evogym/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .evogym_env import EvoGymEnv 2 | -------------------------------------------------------------------------------- /dizoo/evogym/envs/evogym_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/evogym/envs/evogym_env.py -------------------------------------------------------------------------------- /dizoo/evogym/evogym.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/evogym/evogym.gif -------------------------------------------------------------------------------- /dizoo/frozen_lake/FrozenLake.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/frozen_lake/FrozenLake.gif -------------------------------------------------------------------------------- /dizoo/frozen_lake/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/frozen_lake/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/frozen_lake/config/__init__.py -------------------------------------------------------------------------------- /dizoo/frozen_lake/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/frozen_lake/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/gfootball/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/README.md -------------------------------------------------------------------------------- /dizoo/gfootball/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gfootball/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gfootball/entry/show_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/entry/show_dataset.py -------------------------------------------------------------------------------- /dizoo/gfootball/entry/test_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/entry/test_accuracy.py -------------------------------------------------------------------------------- /dizoo/gfootball/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/gfootball/envs/fake_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/envs/fake_dataset.py -------------------------------------------------------------------------------- /dizoo/gfootball/envs/gfootball_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/envs/gfootball_env.py -------------------------------------------------------------------------------- /dizoo/gfootball/envs/gfootballsp_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/envs/gfootballsp_env.py -------------------------------------------------------------------------------- /dizoo/gfootball/envs/obs/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/envs/obs/encoder.py -------------------------------------------------------------------------------- /dizoo/gfootball/gfootball.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/gfootball.gif -------------------------------------------------------------------------------- /dizoo/gfootball/model/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gfootball/model/bots/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/model/bots/__init__.py -------------------------------------------------------------------------------- /dizoo/gfootball/model/conv1d/conv1d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/model/conv1d/conv1d.py -------------------------------------------------------------------------------- /dizoo/gfootball/policy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/policy/__init__.py -------------------------------------------------------------------------------- /dizoo/gfootball/policy/ppo_lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/policy/ppo_lstm.py -------------------------------------------------------------------------------- /dizoo/gfootball/replay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gfootball/replay.py -------------------------------------------------------------------------------- /dizoo/gobigger_overview.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gobigger_overview.gif -------------------------------------------------------------------------------- /dizoo/gym_anytrading/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gym_anytrading/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_anytrading/config/__init__.py -------------------------------------------------------------------------------- /dizoo/gym_anytrading/envs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_anytrading/envs/README.md -------------------------------------------------------------------------------- /dizoo/gym_anytrading/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_anytrading/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/gym_anytrading/envs/position.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_anytrading/envs/position.png -------------------------------------------------------------------------------- /dizoo/gym_anytrading/envs/profit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_anytrading/envs/profit.png -------------------------------------------------------------------------------- /dizoo/gym_anytrading/envs/stocks_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_anytrading/envs/stocks_env.py -------------------------------------------------------------------------------- /dizoo/gym_anytrading/worker/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_anytrading/worker/__init__.py -------------------------------------------------------------------------------- /dizoo/gym_hybrid/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gym_hybrid/config/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gym_hybrid/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gym_hybrid/envs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_hybrid/envs/README.md -------------------------------------------------------------------------------- /dizoo/gym_hybrid/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_hybrid/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/gym_hybrid/envs/gym_hybrid_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_hybrid/envs/gym_hybrid_env.py -------------------------------------------------------------------------------- /dizoo/gym_hybrid/moving_v0.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_hybrid/moving_v0.gif -------------------------------------------------------------------------------- /dizoo/gym_pybullet_drones/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gym_soccer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gym_soccer/envs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_soccer/envs/README.md -------------------------------------------------------------------------------- /dizoo/gym_soccer/envs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/gym_soccer/envs/gym_soccer_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_soccer/envs/gym_soccer_env.py -------------------------------------------------------------------------------- /dizoo/gym_soccer/half_offensive.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/gym_soccer/half_offensive.gif -------------------------------------------------------------------------------- /dizoo/image_classification/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/image_classification/imagenet.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/image_classification/imagenet.png -------------------------------------------------------------------------------- /dizoo/ising_env/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/ising_env/entry/ising_mfq_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/ising_env/entry/ising_mfq_eval.py -------------------------------------------------------------------------------- /dizoo/ising_env/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/ising_env/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/ising_env/envs/ising_model/multiagent/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/ising_env/envs/ising_model_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/ising_env/envs/ising_model_env.py -------------------------------------------------------------------------------- /dizoo/ising_env/ising_env.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/ising_env/ising_env.gif -------------------------------------------------------------------------------- /dizoo/league_demo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/league_demo/demo_league.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/league_demo/demo_league.py -------------------------------------------------------------------------------- /dizoo/league_demo/game_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/league_demo/game_env.py -------------------------------------------------------------------------------- /dizoo/league_demo/league_demo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/league_demo/league_demo.png -------------------------------------------------------------------------------- /dizoo/mario/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/mario/mario.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mario/mario.gif -------------------------------------------------------------------------------- /dizoo/mario/mario_dqn_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mario/mario_dqn_config.py -------------------------------------------------------------------------------- /dizoo/mario/mario_dqn_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mario/mario_dqn_example.py -------------------------------------------------------------------------------- /dizoo/mario/mario_dqn_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mario/mario_dqn_main.py -------------------------------------------------------------------------------- /dizoo/maze/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/maze/__init__.py -------------------------------------------------------------------------------- /dizoo/maze/config/maze_bc_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/maze/config/maze_bc_config.py -------------------------------------------------------------------------------- /dizoo/maze/config/maze_pc_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/maze/config/maze_pc_config.py -------------------------------------------------------------------------------- /dizoo/maze/entry/maze_bc_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/maze/entry/maze_bc_main.py -------------------------------------------------------------------------------- /dizoo/maze/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .maze_env import Maze 2 | -------------------------------------------------------------------------------- /dizoo/maze/envs/maze_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/maze/envs/maze_env.py -------------------------------------------------------------------------------- /dizoo/maze/envs/test_maze_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/maze/envs/test_maze_env.py -------------------------------------------------------------------------------- /dizoo/metadrive/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/metadrive/config/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/metadrive/env/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/metadrive/env/drive_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/metadrive/env/drive_env.py -------------------------------------------------------------------------------- /dizoo/metadrive/env/drive_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/metadrive/env/drive_utils.py -------------------------------------------------------------------------------- /dizoo/metadrive/env/drive_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/metadrive/env/drive_wrapper.py -------------------------------------------------------------------------------- /dizoo/metadrive/metadrive_env.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/metadrive/metadrive_env.gif -------------------------------------------------------------------------------- /dizoo/minigrid/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/minigrid/__init__.py -------------------------------------------------------------------------------- /dizoo/minigrid/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/minigrid/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/minigrid/envs/minigrid_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/minigrid/envs/minigrid_env.py -------------------------------------------------------------------------------- /dizoo/minigrid/envs/minigrid_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/minigrid/envs/minigrid_wrapper.py -------------------------------------------------------------------------------- /dizoo/minigrid/envs/noisy_tv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/minigrid/envs/noisy_tv.py -------------------------------------------------------------------------------- /dizoo/minigrid/minigrid.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/minigrid/minigrid.gif -------------------------------------------------------------------------------- /dizoo/minigrid/utils/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/minigrid/utils/eval.py -------------------------------------------------------------------------------- /dizoo/mujoco/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/mujoco/addition/install_mesa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/addition/install_mesa.sh -------------------------------------------------------------------------------- /dizoo/mujoco/config/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/mujoco/config/ant_ddpg_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/config/ant_ddpg_config.py -------------------------------------------------------------------------------- /dizoo/mujoco/config/ant_onppo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/config/ant_onppo_config.py -------------------------------------------------------------------------------- /dizoo/mujoco/config/ant_ppo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/config/ant_ppo_config.py -------------------------------------------------------------------------------- /dizoo/mujoco/config/ant_sac_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/config/ant_sac_config.py -------------------------------------------------------------------------------- /dizoo/mujoco/config/ant_td3_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/config/ant_td3_config.py -------------------------------------------------------------------------------- /dizoo/mujoco/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/mujoco/entry/mujoco_cql_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/entry/mujoco_cql_main.py -------------------------------------------------------------------------------- /dizoo/mujoco/entry/mujoco_d4pg_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/entry/mujoco_d4pg_main.py -------------------------------------------------------------------------------- /dizoo/mujoco/entry/mujoco_ddpg_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/entry/mujoco_ddpg_eval.py -------------------------------------------------------------------------------- /dizoo/mujoco/entry/mujoco_ddpg_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/entry/mujoco_ddpg_main.py -------------------------------------------------------------------------------- /dizoo/mujoco/entry/mujoco_ppo_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/entry/mujoco_ppo_main.py -------------------------------------------------------------------------------- /dizoo/mujoco/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/mujoco/envs/mujoco_disc_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/envs/mujoco_disc_env.py -------------------------------------------------------------------------------- /dizoo/mujoco/envs/mujoco_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/envs/mujoco_env.py -------------------------------------------------------------------------------- /dizoo/mujoco/envs/mujoco_gym_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/envs/mujoco_gym_env.py -------------------------------------------------------------------------------- /dizoo/mujoco/envs/mujoco_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/envs/mujoco_wrappers.py -------------------------------------------------------------------------------- /dizoo/mujoco/example/mujoco_bc_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/example/mujoco_bc_main.py -------------------------------------------------------------------------------- /dizoo/mujoco/example/mujoco_sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/example/mujoco_sac.py -------------------------------------------------------------------------------- /dizoo/mujoco/mujoco.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/mujoco/mujoco.gif -------------------------------------------------------------------------------- /dizoo/multiagent_mujoco/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/multiagent_mujoco/README.md -------------------------------------------------------------------------------- /dizoo/multiagent_mujoco/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/multiagent_mujoco/envs/assets/.gitignore: -------------------------------------------------------------------------------- 1 | *.auto.xml 2 | -------------------------------------------------------------------------------- /dizoo/multiagent_mujoco/envs/assets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/multiagent_mujoco/envs/obsk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/multiagent_mujoco/envs/obsk.py -------------------------------------------------------------------------------- /dizoo/overcooked/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/overcooked/README.md -------------------------------------------------------------------------------- /dizoo/overcooked/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/overcooked/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/overcooked/config/__init__.py -------------------------------------------------------------------------------- /dizoo/overcooked/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/overcooked/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/overcooked/envs/overcooked_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/overcooked/envs/overcooked_env.py -------------------------------------------------------------------------------- /dizoo/overcooked/overcooked.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/overcooked/overcooked.gif -------------------------------------------------------------------------------- /dizoo/petting_zoo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/petting_zoo/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/petting_zoo/config/__init__.py -------------------------------------------------------------------------------- /dizoo/petting_zoo/envs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/pomdp/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/pomdp/config/pomdp_dqn_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pomdp/config/pomdp_dqn_config.py -------------------------------------------------------------------------------- /dizoo/pomdp/config/pomdp_ppo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pomdp/config/pomdp_ppo_config.py -------------------------------------------------------------------------------- /dizoo/pomdp/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .atari_env import PomdpAtariEnv 2 | -------------------------------------------------------------------------------- /dizoo/pomdp/envs/atari_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pomdp/envs/atari_env.py -------------------------------------------------------------------------------- /dizoo/pomdp/envs/atari_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pomdp/envs/atari_wrappers.py -------------------------------------------------------------------------------- /dizoo/pomdp/envs/test_atari_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pomdp/envs/test_atari_env.py -------------------------------------------------------------------------------- /dizoo/procgen/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/README.md -------------------------------------------------------------------------------- /dizoo/procgen/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/procgen/coinrun.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/coinrun.gif -------------------------------------------------------------------------------- /dizoo/procgen/coinrun.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/coinrun.png -------------------------------------------------------------------------------- /dizoo/procgen/coinrun_dqn.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/coinrun_dqn.svg -------------------------------------------------------------------------------- /dizoo/procgen/coinrun_ppo.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/coinrun_ppo.svg -------------------------------------------------------------------------------- /dizoo/procgen/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/config/__init__.py -------------------------------------------------------------------------------- /dizoo/procgen/config/maze_dqn_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/config/maze_dqn_config.py -------------------------------------------------------------------------------- /dizoo/procgen/config/maze_ppg_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/config/maze_ppg_config.py -------------------------------------------------------------------------------- /dizoo/procgen/config/maze_ppo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/config/maze_ppo_config.py -------------------------------------------------------------------------------- /dizoo/procgen/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/procgen/envs/procgen_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/envs/procgen_env.py -------------------------------------------------------------------------------- /dizoo/procgen/envs/test_coinrun_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/envs/test_coinrun_env.py -------------------------------------------------------------------------------- /dizoo/procgen/maze.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/maze.gif -------------------------------------------------------------------------------- /dizoo/procgen/maze.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/maze.png -------------------------------------------------------------------------------- /dizoo/procgen/maze_dqn.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/procgen/maze_dqn.svg -------------------------------------------------------------------------------- /dizoo/pybullet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/pybullet/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pybullet/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/pybullet/envs/pybullet_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pybullet/envs/pybullet_env.py -------------------------------------------------------------------------------- /dizoo/pybullet/pybullet.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/pybullet/pybullet.gif -------------------------------------------------------------------------------- /dizoo/rocket/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/rocket/README.md -------------------------------------------------------------------------------- /dizoo/rocket/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/rocket/config/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/rocket/entry/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/rocket/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/rocket/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/rocket/envs/rocket_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/rocket/envs/rocket_env.py -------------------------------------------------------------------------------- /dizoo/rocket/envs/test_rocket_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/rocket/envs/test_rocket_env.py -------------------------------------------------------------------------------- /dizoo/slime_volley/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/slime_volley/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/slime_volley/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/slime_volley/slime_volley.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/slime_volley/slime_volley.gif -------------------------------------------------------------------------------- /dizoo/smac/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/README.md -------------------------------------------------------------------------------- /dizoo/smac/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/smac/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/smac/envs/fake_smac_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/fake_smac_env.py -------------------------------------------------------------------------------- /dizoo/smac/envs/maps/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/maps/README.md -------------------------------------------------------------------------------- /dizoo/smac/envs/maps/SMAC_Maps/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/smac/envs/maps/SMAC_Maps_two_player/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/smac/envs/maps/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/smac/envs/smac_action.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/smac_action.py -------------------------------------------------------------------------------- /dizoo/smac/envs/smac_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/smac_env.py -------------------------------------------------------------------------------- /dizoo/smac/envs/smac_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/smac_map.py -------------------------------------------------------------------------------- /dizoo/smac/envs/smac_reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/smac_reward.py -------------------------------------------------------------------------------- /dizoo/smac/envs/test_smac_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/envs/test_smac_env.py -------------------------------------------------------------------------------- /dizoo/smac/smac.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/smac.gif -------------------------------------------------------------------------------- /dizoo/smac/utils/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/smac/utils/eval.py -------------------------------------------------------------------------------- /dizoo/sokoban/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/sokoban/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/sokoban/envs/__init__.py -------------------------------------------------------------------------------- /dizoo/sokoban/envs/sokoban_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/sokoban/envs/sokoban_env.py -------------------------------------------------------------------------------- /dizoo/sokoban/envs/sokoban_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/sokoban/envs/sokoban_wrappers.py -------------------------------------------------------------------------------- /dizoo/sokoban/envs/test_sokoban_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/sokoban/envs/test_sokoban_env.py -------------------------------------------------------------------------------- /dizoo/tabmwp/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/tabmwp/README.md -------------------------------------------------------------------------------- /dizoo/tabmwp/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/tabmwp/benchmark.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/tabmwp/benchmark.png -------------------------------------------------------------------------------- /dizoo/tabmwp/config/tabmwp_pg_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/tabmwp/config/tabmwp_pg_config.py -------------------------------------------------------------------------------- /dizoo/tabmwp/envs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dizoo/tabmwp/envs/tabmwp_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/tabmwp/envs/tabmwp_env.py -------------------------------------------------------------------------------- /dizoo/tabmwp/envs/test_tabmwp_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/tabmwp/envs/test_tabmwp_env.py -------------------------------------------------------------------------------- /dizoo/tabmwp/envs/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/tabmwp/envs/utils.py -------------------------------------------------------------------------------- /dizoo/tabmwp/tabmwp.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/tabmwp/tabmwp.jpeg -------------------------------------------------------------------------------- /dizoo/taxi/Taxi-v3_episode_0.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/taxi/Taxi-v3_episode_0.gif -------------------------------------------------------------------------------- /dizoo/taxi/__init__.py: -------------------------------------------------------------------------------- 1 | from .envs import * 2 | -------------------------------------------------------------------------------- /dizoo/taxi/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/taxi/config/__init__.py -------------------------------------------------------------------------------- /dizoo/taxi/config/taxi_dqn_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/taxi/config/taxi_dqn_config.py -------------------------------------------------------------------------------- /dizoo/taxi/entry/taxi_dqn_deploy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/taxi/entry/taxi_dqn_deploy.py -------------------------------------------------------------------------------- /dizoo/taxi/envs/__init__.py: -------------------------------------------------------------------------------- 1 | from .taxi_env import TaxiEnv 2 | -------------------------------------------------------------------------------- /dizoo/taxi/envs/taxi_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/taxi/envs/taxi_env.py -------------------------------------------------------------------------------- /dizoo/taxi/envs/test_taxi_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/dizoo/taxi/envs/test_taxi_env.py -------------------------------------------------------------------------------- /docker/Dockerfile.base: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/docker/Dockerfile.base -------------------------------------------------------------------------------- /docker/Dockerfile.env: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/docker/Dockerfile.env -------------------------------------------------------------------------------- /docker/Dockerfile.hpc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/docker/Dockerfile.hpc -------------------------------------------------------------------------------- /docker/Dockerfile.rpc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/docker/Dockerfile.rpc -------------------------------------------------------------------------------- /format.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/format.sh -------------------------------------------------------------------------------- /pytest.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/pytest.ini -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opendilab/DI-engine/HEAD/setup.py --------------------------------------------------------------------------------