├── DSAC1.0_environment.yml ├── README.md ├── dsac_v1.py ├── env_gym ├── __init__.py ├── __pycache__ │ └── gym_pendulum_data.cpython-38.pyc ├── gym_acrobot_data.py ├── gym_ant_data.py ├── gym_bipedalwalker_data.py ├── gym_bipedalwalkerhardcore_data.py ├── gym_blackjack_data.py ├── gym_boxing_data.py ├── gym_breakout_data.py ├── gym_carracing_data.py ├── gym_cartpole_data.py ├── gym_cartpoleconti_data.py ├── gym_cartpolecontiwithstack_data.py ├── gym_enduro_data.py ├── gym_frozenlake88_data.py ├── gym_frozenlake_data.py ├── gym_halfcheetah_data.py ├── gym_hopper_data.py ├── gym_humanoid_data.py ├── gym_humanoidstandup_data.py ├── gym_inverteddoublependulum_data.py ├── gym_invertedpendulum_data.py ├── gym_lunarlander_data.py ├── gym_lunarlanderconti_data.py ├── gym_mountaincar_data.py ├── gym_mountaincarconti_data.py ├── gym_pendulum_data.py ├── gym_phoenix_data.py ├── gym_pusher_data.py ├── gym_reacher_data.py ├── gym_spaceinvaders_data.py ├── gym_swimmer_data.py ├── gym_taxi_data.py └── gym_walker2d_data.py ├── example_train ├── dsac_mlp_humanoidconti_offserial.py └── main.py ├── figures └── test ├── networks ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-38.pyc │ └── mlp.cpython-38.pyc ├── cnn_shared.py └── mlp.py ├── results └── DSAC_V1_gym_pendulum │ └── 240223-002301 │ ├── apprfunc │ ├── apprfunc_0.pkl │ ├── apprfunc_10000.pkl │ ├── apprfunc_10900_opt.pkl │ ├── apprfunc_12000.pkl │ └── apprfunc_5000.pkl │ ├── config.json │ ├── data │ ├── DSAC_alpha-RL iter.csv │ ├── DSAC_critic_avg_q-RL iter.csv │ ├── DSAC_critic_avg_std-RL iter.csv │ ├── DSAC_entropy-RL iter.csv │ ├── DSAC_policy_mean-RL iter.csv │ ├── DSAC_policy_std-RL iter.csv │ ├── Evaluation_1. TAR-RL iter.csv │ ├── Evaluation_2. TAR-Total time [s].csv │ ├── Evaluation_3. TAR-Collected samples.csv │ ├── Evaluation_4. TAR-Replay samples.csv │ ├── Loss_Actor loss-RL iter.csv │ ├── RAM_RAM [MB]-RL iter.csv │ ├── Time_Algorithm time [ms]-RL iter.csv │ └── Time_Sampler time [ms]-RL iter.csv │ └── events.out.tfevents.1708618981.DESKTOP-ULVFR8S.6968.0 ├── run_policy.py ├── setup.py ├── training ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-38.pyc │ ├── evaluator.cpython-38.pyc │ ├── off_sampler.cpython-38.pyc │ ├── replay_buffer.cpython-38.pyc │ └── trainer.cpython-38.pyc ├── evaluator.py ├── off_sampler.py ├── replay_buffer.py └── trainer.py └── utils ├── __init__.py ├── __pycache__ ├── __init__.cpython-38.pyc ├── act_distribution_cls.cpython-38.pyc ├── common_utils.cpython-38.pyc ├── explore_noise.cpython-38.pyc ├── init_args.cpython-38.pyc ├── initialization.cpython-38.pyc ├── plot_evaluation.cpython-38.pyc ├── sys_run.cpython-38.pyc ├── tensorboard_setup.cpython-38.pyc └── wrapping_env.cpython-38.pyc ├── act_distribution_cls.py ├── common_utils.py ├── explore_noise.py ├── init_args.py ├── initialization.py ├── plot_evaluation.py ├── sys_run.py ├── tensorboard_setup.py └── wrapping_env.py /DSAC1.0_environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/DSAC1.0_environment.yml -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/README.md -------------------------------------------------------------------------------- /dsac_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/dsac_v1.py -------------------------------------------------------------------------------- /env_gym/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /env_gym/__pycache__/gym_pendulum_data.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/__pycache__/gym_pendulum_data.cpython-38.pyc -------------------------------------------------------------------------------- /env_gym/gym_acrobot_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_acrobot_data.py -------------------------------------------------------------------------------- /env_gym/gym_ant_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_ant_data.py -------------------------------------------------------------------------------- /env_gym/gym_bipedalwalker_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_bipedalwalker_data.py -------------------------------------------------------------------------------- /env_gym/gym_bipedalwalkerhardcore_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_bipedalwalkerhardcore_data.py -------------------------------------------------------------------------------- /env_gym/gym_blackjack_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_blackjack_data.py -------------------------------------------------------------------------------- /env_gym/gym_boxing_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_boxing_data.py -------------------------------------------------------------------------------- /env_gym/gym_breakout_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_breakout_data.py -------------------------------------------------------------------------------- /env_gym/gym_carracing_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_carracing_data.py -------------------------------------------------------------------------------- /env_gym/gym_cartpole_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_cartpole_data.py -------------------------------------------------------------------------------- /env_gym/gym_cartpoleconti_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_cartpoleconti_data.py -------------------------------------------------------------------------------- /env_gym/gym_cartpolecontiwithstack_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_cartpolecontiwithstack_data.py -------------------------------------------------------------------------------- /env_gym/gym_enduro_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_enduro_data.py -------------------------------------------------------------------------------- /env_gym/gym_frozenlake88_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_frozenlake88_data.py -------------------------------------------------------------------------------- /env_gym/gym_frozenlake_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_frozenlake_data.py -------------------------------------------------------------------------------- /env_gym/gym_halfcheetah_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_halfcheetah_data.py -------------------------------------------------------------------------------- /env_gym/gym_hopper_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_hopper_data.py -------------------------------------------------------------------------------- /env_gym/gym_humanoid_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_humanoid_data.py -------------------------------------------------------------------------------- /env_gym/gym_humanoidstandup_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_humanoidstandup_data.py -------------------------------------------------------------------------------- /env_gym/gym_inverteddoublependulum_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_inverteddoublependulum_data.py -------------------------------------------------------------------------------- /env_gym/gym_invertedpendulum_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_invertedpendulum_data.py -------------------------------------------------------------------------------- /env_gym/gym_lunarlander_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_lunarlander_data.py -------------------------------------------------------------------------------- /env_gym/gym_lunarlanderconti_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_lunarlanderconti_data.py -------------------------------------------------------------------------------- /env_gym/gym_mountaincar_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_mountaincar_data.py -------------------------------------------------------------------------------- /env_gym/gym_mountaincarconti_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_mountaincarconti_data.py -------------------------------------------------------------------------------- /env_gym/gym_pendulum_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_pendulum_data.py -------------------------------------------------------------------------------- /env_gym/gym_phoenix_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_phoenix_data.py -------------------------------------------------------------------------------- /env_gym/gym_pusher_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_pusher_data.py -------------------------------------------------------------------------------- /env_gym/gym_reacher_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_reacher_data.py -------------------------------------------------------------------------------- /env_gym/gym_spaceinvaders_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_spaceinvaders_data.py -------------------------------------------------------------------------------- /env_gym/gym_swimmer_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_swimmer_data.py -------------------------------------------------------------------------------- /env_gym/gym_taxi_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_taxi_data.py -------------------------------------------------------------------------------- /env_gym/gym_walker2d_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/env_gym/gym_walker2d_data.py -------------------------------------------------------------------------------- /example_train/dsac_mlp_humanoidconti_offserial.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/example_train/dsac_mlp_humanoidconti_offserial.py -------------------------------------------------------------------------------- /example_train/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/example_train/main.py -------------------------------------------------------------------------------- /figures/test: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /networks/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /networks/__pycache__/__init__.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/networks/__pycache__/__init__.cpython-38.pyc -------------------------------------------------------------------------------- /networks/__pycache__/mlp.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/networks/__pycache__/mlp.cpython-38.pyc -------------------------------------------------------------------------------- /networks/cnn_shared.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/networks/cnn_shared.py -------------------------------------------------------------------------------- /networks/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/networks/mlp.py -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_0.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_0.pkl -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_10000.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_10000.pkl -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_10900_opt.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_10900_opt.pkl -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_12000.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_12000.pkl -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_5000.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/apprfunc/apprfunc_5000.pkl -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/config.json -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_alpha-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_alpha-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_critic_avg_q-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_critic_avg_q-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_critic_avg_std-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_critic_avg_std-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_entropy-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_entropy-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_policy_mean-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_policy_mean-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_policy_std-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/DSAC_policy_std-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_1. TAR-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_1. TAR-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_2. TAR-Total time [s].csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_2. TAR-Total time [s].csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_3. TAR-Collected samples.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_3. TAR-Collected samples.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_4. TAR-Replay samples.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/Evaluation_4. TAR-Replay samples.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/Loss_Actor loss-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/Loss_Actor loss-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/RAM_RAM [MB]-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/RAM_RAM [MB]-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/Time_Algorithm time [ms]-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/Time_Algorithm time [ms]-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/data/Time_Sampler time [ms]-RL iter.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/data/Time_Sampler time [ms]-RL iter.csv -------------------------------------------------------------------------------- /results/DSAC_V1_gym_pendulum/240223-002301/events.out.tfevents.1708618981.DESKTOP-ULVFR8S.6968.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/results/DSAC_V1_gym_pendulum/240223-002301/events.out.tfevents.1708618981.DESKTOP-ULVFR8S.6968.0 -------------------------------------------------------------------------------- /run_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/run_policy.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/setup.py -------------------------------------------------------------------------------- /training/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/__init__.py -------------------------------------------------------------------------------- /training/__pycache__/__init__.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/__pycache__/__init__.cpython-38.pyc -------------------------------------------------------------------------------- /training/__pycache__/evaluator.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/__pycache__/evaluator.cpython-38.pyc -------------------------------------------------------------------------------- /training/__pycache__/off_sampler.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/__pycache__/off_sampler.cpython-38.pyc -------------------------------------------------------------------------------- /training/__pycache__/replay_buffer.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/__pycache__/replay_buffer.cpython-38.pyc -------------------------------------------------------------------------------- /training/__pycache__/trainer.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/__pycache__/trainer.cpython-38.pyc -------------------------------------------------------------------------------- /training/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/evaluator.py -------------------------------------------------------------------------------- /training/off_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/off_sampler.py -------------------------------------------------------------------------------- /training/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/replay_buffer.py -------------------------------------------------------------------------------- /training/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/training/trainer.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__init__.py -------------------------------------------------------------------------------- /utils/__pycache__/__init__.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/__init__.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/act_distribution_cls.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/act_distribution_cls.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/common_utils.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/common_utils.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/explore_noise.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/explore_noise.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/init_args.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/init_args.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/initialization.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/initialization.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/plot_evaluation.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/plot_evaluation.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/sys_run.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/sys_run.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/tensorboard_setup.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/tensorboard_setup.cpython-38.pyc -------------------------------------------------------------------------------- /utils/__pycache__/wrapping_env.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/__pycache__/wrapping_env.cpython-38.pyc -------------------------------------------------------------------------------- /utils/act_distribution_cls.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/act_distribution_cls.py -------------------------------------------------------------------------------- /utils/common_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/common_utils.py -------------------------------------------------------------------------------- /utils/explore_noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/explore_noise.py -------------------------------------------------------------------------------- /utils/init_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/init_args.py -------------------------------------------------------------------------------- /utils/initialization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/initialization.py -------------------------------------------------------------------------------- /utils/plot_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/plot_evaluation.py -------------------------------------------------------------------------------- /utils/sys_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/sys_run.py -------------------------------------------------------------------------------- /utils/tensorboard_setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/tensorboard_setup.py -------------------------------------------------------------------------------- /utils/wrapping_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Jingliang-Duan/DSAC-v1/HEAD/utils/wrapping_env.py --------------------------------------------------------------------------------