├── .gitignore ├── .readthedocs.yaml ├── LICENSE.txt ├── README.md ├── config ├── a2c │ └── mujoco.yaml ├── ddpg │ └── mujoco.yaml ├── ddqn │ └── atari.yaml ├── dqn │ └── atari.yaml ├── duelingdqn │ └── atari.yaml ├── ppo │ ├── mujoco.yaml │ └── walkerStand.yaml └── td3 │ └── mujoco.yaml ├── docs ├── Makefile ├── api │ ├── xuance.agent.rst │ ├── xuance.environment.rst │ ├── xuance.learner.rst │ ├── xuance.policy.rst │ ├── xuance.representation.rst │ └── xuance.utils.rst ├── conf.py ├── index.rst ├── make.bat └── tutorials │ ├── concept.rst │ ├── configuration.rst │ ├── custom_env.rst │ ├── custom_loss.rst │ ├── custom_network.rst │ ├── logger.rst │ └── multi_inputs.rst ├── example ├── run_a2c.py ├── run_ddpg.py ├── run_ddqn.py ├── run_dqn.py ├── run_dueldqn.py ├── run_ppo.py └── run_td3.py ├── example_win ├── run_dmc_ppo.py ├── run_gym_ppo.py └── test_dmc_ppo.py ├── figures ├── Ant.png ├── Hopper.png ├── InvertedPendulum.png ├── halfcheetah.png ├── mujoco_benchmark.png ├── plotter.png ├── tensorboard.png ├── tensorboard_vis.png └── wandb_vis.png ├── setup.py └── xuance ├── agent ├── __init__.py ├── a2c.py ├── ddpg.py ├── dqn.py ├── ppo.py └── td3.py ├── environment ├── __init__.py ├── custom_envs │ ├── __pycache__ │ │ └── dmc.cpython-39.pyc │ ├── atari.py │ └── dmc.py ├── env_utils.py ├── envpool_utils.py ├── normalizer.py ├── vectorize.py └── wrappers.py ├── learner ├── __init__.py ├── a2c.py ├── ddpg.py ├── ddqn.py ├── dqn.py ├── ppo.py └── td3.py ├── policy ├── __init__.py ├── categorical.py ├── deterministic.py ├── dqn.py └── gaussian.py ├── representation ├── __init__.py └── network.py └── utils ├── __init__.py ├── block.py ├── common.py ├── distribution.py ├── layer.py └── memory.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/.gitignore -------------------------------------------------------------------------------- /.readthedocs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/.readthedocs.yaml -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/LICENSE.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/README.md -------------------------------------------------------------------------------- /config/a2c/mujoco.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/a2c/mujoco.yaml -------------------------------------------------------------------------------- /config/ddpg/mujoco.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/ddpg/mujoco.yaml -------------------------------------------------------------------------------- /config/ddqn/atari.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/ddqn/atari.yaml -------------------------------------------------------------------------------- /config/dqn/atari.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/dqn/atari.yaml -------------------------------------------------------------------------------- /config/duelingdqn/atari.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/duelingdqn/atari.yaml -------------------------------------------------------------------------------- /config/ppo/mujoco.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/ppo/mujoco.yaml -------------------------------------------------------------------------------- /config/ppo/walkerStand.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/ppo/walkerStand.yaml -------------------------------------------------------------------------------- /config/td3/mujoco.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/config/td3/mujoco.yaml -------------------------------------------------------------------------------- /docs/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/Makefile -------------------------------------------------------------------------------- /docs/api/xuance.agent.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/api/xuance.agent.rst -------------------------------------------------------------------------------- /docs/api/xuance.environment.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/api/xuance.environment.rst -------------------------------------------------------------------------------- /docs/api/xuance.learner.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/api/xuance.learner.rst -------------------------------------------------------------------------------- /docs/api/xuance.policy.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/api/xuance.policy.rst -------------------------------------------------------------------------------- /docs/api/xuance.representation.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/api/xuance.representation.rst -------------------------------------------------------------------------------- /docs/api/xuance.utils.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/api/xuance.utils.rst -------------------------------------------------------------------------------- /docs/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/conf.py -------------------------------------------------------------------------------- /docs/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/index.rst -------------------------------------------------------------------------------- /docs/make.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/make.bat -------------------------------------------------------------------------------- /docs/tutorials/concept.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/tutorials/concept.rst -------------------------------------------------------------------------------- /docs/tutorials/configuration.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/tutorials/configuration.rst -------------------------------------------------------------------------------- /docs/tutorials/custom_env.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/tutorials/custom_env.rst -------------------------------------------------------------------------------- /docs/tutorials/custom_loss.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/tutorials/custom_loss.rst -------------------------------------------------------------------------------- /docs/tutorials/custom_network.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/tutorials/custom_network.rst -------------------------------------------------------------------------------- /docs/tutorials/logger.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/tutorials/logger.rst -------------------------------------------------------------------------------- /docs/tutorials/multi_inputs.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/docs/tutorials/multi_inputs.rst -------------------------------------------------------------------------------- /example/run_a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example/run_a2c.py -------------------------------------------------------------------------------- /example/run_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example/run_ddpg.py -------------------------------------------------------------------------------- /example/run_ddqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example/run_ddqn.py -------------------------------------------------------------------------------- /example/run_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example/run_dqn.py -------------------------------------------------------------------------------- /example/run_dueldqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example/run_dueldqn.py -------------------------------------------------------------------------------- /example/run_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example/run_ppo.py -------------------------------------------------------------------------------- /example/run_td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example/run_td3.py -------------------------------------------------------------------------------- /example_win/run_dmc_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example_win/run_dmc_ppo.py -------------------------------------------------------------------------------- /example_win/run_gym_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example_win/run_gym_ppo.py -------------------------------------------------------------------------------- /example_win/test_dmc_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/example_win/test_dmc_ppo.py -------------------------------------------------------------------------------- /figures/Ant.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/Ant.png -------------------------------------------------------------------------------- /figures/Hopper.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/Hopper.png -------------------------------------------------------------------------------- /figures/InvertedPendulum.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/InvertedPendulum.png -------------------------------------------------------------------------------- /figures/halfcheetah.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/halfcheetah.png -------------------------------------------------------------------------------- /figures/mujoco_benchmark.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/mujoco_benchmark.png -------------------------------------------------------------------------------- /figures/plotter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/plotter.png -------------------------------------------------------------------------------- /figures/tensorboard.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/tensorboard.png -------------------------------------------------------------------------------- /figures/tensorboard_vis.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/tensorboard_vis.png -------------------------------------------------------------------------------- /figures/wandb_vis.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/figures/wandb_vis.png -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/setup.py -------------------------------------------------------------------------------- /xuance/agent/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/agent/__init__.py -------------------------------------------------------------------------------- /xuance/agent/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/agent/a2c.py -------------------------------------------------------------------------------- /xuance/agent/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/agent/ddpg.py -------------------------------------------------------------------------------- /xuance/agent/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/agent/dqn.py -------------------------------------------------------------------------------- /xuance/agent/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/agent/ppo.py -------------------------------------------------------------------------------- /xuance/agent/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/agent/td3.py -------------------------------------------------------------------------------- /xuance/environment/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/__init__.py -------------------------------------------------------------------------------- /xuance/environment/custom_envs/__pycache__/dmc.cpython-39.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/custom_envs/__pycache__/dmc.cpython-39.pyc -------------------------------------------------------------------------------- /xuance/environment/custom_envs/atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/custom_envs/atari.py -------------------------------------------------------------------------------- /xuance/environment/custom_envs/dmc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/custom_envs/dmc.py -------------------------------------------------------------------------------- /xuance/environment/env_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/env_utils.py -------------------------------------------------------------------------------- /xuance/environment/envpool_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/envpool_utils.py -------------------------------------------------------------------------------- /xuance/environment/normalizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/normalizer.py -------------------------------------------------------------------------------- /xuance/environment/vectorize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/vectorize.py -------------------------------------------------------------------------------- /xuance/environment/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/environment/wrappers.py -------------------------------------------------------------------------------- /xuance/learner/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/learner/__init__.py -------------------------------------------------------------------------------- /xuance/learner/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/learner/a2c.py -------------------------------------------------------------------------------- /xuance/learner/ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/learner/ddpg.py -------------------------------------------------------------------------------- /xuance/learner/ddqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/learner/ddqn.py -------------------------------------------------------------------------------- /xuance/learner/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/learner/dqn.py -------------------------------------------------------------------------------- /xuance/learner/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/learner/ppo.py -------------------------------------------------------------------------------- /xuance/learner/td3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/learner/td3.py -------------------------------------------------------------------------------- /xuance/policy/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/policy/__init__.py -------------------------------------------------------------------------------- /xuance/policy/categorical.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/policy/categorical.py -------------------------------------------------------------------------------- /xuance/policy/deterministic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/policy/deterministic.py -------------------------------------------------------------------------------- /xuance/policy/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/policy/dqn.py -------------------------------------------------------------------------------- /xuance/policy/gaussian.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/policy/gaussian.py -------------------------------------------------------------------------------- /xuance/representation/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/representation/__init__.py -------------------------------------------------------------------------------- /xuance/representation/network.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/representation/network.py -------------------------------------------------------------------------------- /xuance/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /xuance/utils/block.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/utils/block.py -------------------------------------------------------------------------------- /xuance/utils/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/utils/common.py -------------------------------------------------------------------------------- /xuance/utils/distribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/utils/distribution.py -------------------------------------------------------------------------------- /xuance/utils/layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/utils/layer.py -------------------------------------------------------------------------------- /xuance/utils/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/wzcai99/XuanCE-Tiny/HEAD/xuance/utils/memory.py --------------------------------------------------------------------------------