├── .gitignore ├── LICENSE ├── README.md ├── agents ├── ActorCritic.py ├── AveragedDQN.py ├── BaseAgent.py ├── BootstrappedDQN.py ├── DDPG.py ├── DDQN.py ├── DQN.py ├── EnsembleDQN.py ├── LSVI_PHE.py ├── MaxminDQN.py ├── MeDQN_Real.py ├── MeDQN_Uniform.py ├── NoisyNetDQN.py ├── PPO.py ├── REINFORCE.py ├── RPG.py ├── SAC.py ├── TD3.py ├── VanillaDQN.py └── __init__.py ├── analysis.py ├── clean.sh ├── components ├── exploration.py ├── network.py ├── normalizer.py └── replay.py ├── configs ├── MERL_acrobot_dqn.json ├── MERL_acrobot_medqn.json ├── MERL_catcher_dqn.json ├── MERL_catcher_medqn.json ├── MERL_copter_dqn.json ├── MERL_copter_medqn.json ├── MERL_mc_dqn.json ├── MERL_mc_dqn_small.json ├── MERL_mc_medqn.json ├── MERL_mc_medqn_lambda.json ├── MERL_minatar_dqn.json ├── MERL_minatar_medqn_r.json ├── MERL_minatar_medqn_u.json ├── MERL_seaquest_dqn.json ├── MERL_seaquest_medqn_r.json ├── MERL_seaquest_medqn_u.json ├── Maxmin_catcher.json ├── Maxmin_copter.json ├── Maxmin_lunar.json ├── Maxmin_minatar.json ├── RPG.json ├── dmc_ppo.json ├── dmc_rpg.json ├── mujoco_actorcritic.json ├── mujoco_ddpg.json ├── mujoco_reponpg.json ├── mujoco_sac.json ├── mujoco_td3.json └── nchain.json ├── envs ├── env.py └── wrapper.py ├── experiment.py ├── find_config.py ├── git_commit_id.sh ├── main.py ├── move_log.sh ├── plot.py ├── procfile ├── requirements.txt ├── run.py ├── run.sh ├── sbatch_m.sh ├── sbatch_s.sh ├── unfinish_job.py └── utils ├── helper.py ├── logger.py ├── plotter.py ├── submitter.py └── sweeper.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/README.md -------------------------------------------------------------------------------- /agents/ActorCritic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/ActorCritic.py -------------------------------------------------------------------------------- /agents/AveragedDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/AveragedDQN.py -------------------------------------------------------------------------------- /agents/BaseAgent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/BaseAgent.py -------------------------------------------------------------------------------- /agents/BootstrappedDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/BootstrappedDQN.py -------------------------------------------------------------------------------- /agents/DDPG.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/DDPG.py -------------------------------------------------------------------------------- /agents/DDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/DDQN.py -------------------------------------------------------------------------------- /agents/DQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/DQN.py -------------------------------------------------------------------------------- /agents/EnsembleDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/EnsembleDQN.py -------------------------------------------------------------------------------- /agents/LSVI_PHE.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/LSVI_PHE.py -------------------------------------------------------------------------------- /agents/MaxminDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/MaxminDQN.py -------------------------------------------------------------------------------- /agents/MeDQN_Real.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/MeDQN_Real.py -------------------------------------------------------------------------------- /agents/MeDQN_Uniform.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/MeDQN_Uniform.py -------------------------------------------------------------------------------- /agents/NoisyNetDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/NoisyNetDQN.py -------------------------------------------------------------------------------- /agents/PPO.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/PPO.py -------------------------------------------------------------------------------- /agents/REINFORCE.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/REINFORCE.py -------------------------------------------------------------------------------- /agents/RPG.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/RPG.py -------------------------------------------------------------------------------- /agents/SAC.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/SAC.py -------------------------------------------------------------------------------- /agents/TD3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/TD3.py -------------------------------------------------------------------------------- /agents/VanillaDQN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/VanillaDQN.py -------------------------------------------------------------------------------- /agents/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/agents/__init__.py -------------------------------------------------------------------------------- /analysis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/analysis.py -------------------------------------------------------------------------------- /clean.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/clean.sh -------------------------------------------------------------------------------- /components/exploration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/components/exploration.py -------------------------------------------------------------------------------- /components/network.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/components/network.py -------------------------------------------------------------------------------- /components/normalizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/components/normalizer.py -------------------------------------------------------------------------------- /components/replay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/components/replay.py -------------------------------------------------------------------------------- /configs/MERL_acrobot_dqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_acrobot_dqn.json -------------------------------------------------------------------------------- /configs/MERL_acrobot_medqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_acrobot_medqn.json -------------------------------------------------------------------------------- /configs/MERL_catcher_dqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_catcher_dqn.json -------------------------------------------------------------------------------- /configs/MERL_catcher_medqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_catcher_medqn.json -------------------------------------------------------------------------------- /configs/MERL_copter_dqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_copter_dqn.json -------------------------------------------------------------------------------- /configs/MERL_copter_medqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_copter_medqn.json -------------------------------------------------------------------------------- /configs/MERL_mc_dqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_mc_dqn.json -------------------------------------------------------------------------------- /configs/MERL_mc_dqn_small.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_mc_dqn_small.json -------------------------------------------------------------------------------- /configs/MERL_mc_medqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_mc_medqn.json -------------------------------------------------------------------------------- /configs/MERL_mc_medqn_lambda.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_mc_medqn_lambda.json -------------------------------------------------------------------------------- /configs/MERL_minatar_dqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_minatar_dqn.json -------------------------------------------------------------------------------- /configs/MERL_minatar_medqn_r.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_minatar_medqn_r.json -------------------------------------------------------------------------------- /configs/MERL_minatar_medqn_u.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_minatar_medqn_u.json -------------------------------------------------------------------------------- /configs/MERL_seaquest_dqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_seaquest_dqn.json -------------------------------------------------------------------------------- /configs/MERL_seaquest_medqn_r.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_seaquest_medqn_r.json -------------------------------------------------------------------------------- /configs/MERL_seaquest_medqn_u.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/MERL_seaquest_medqn_u.json -------------------------------------------------------------------------------- /configs/Maxmin_catcher.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/Maxmin_catcher.json -------------------------------------------------------------------------------- /configs/Maxmin_copter.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/Maxmin_copter.json -------------------------------------------------------------------------------- /configs/Maxmin_lunar.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/Maxmin_lunar.json -------------------------------------------------------------------------------- /configs/Maxmin_minatar.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/Maxmin_minatar.json -------------------------------------------------------------------------------- /configs/RPG.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/RPG.json -------------------------------------------------------------------------------- /configs/dmc_ppo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/dmc_ppo.json -------------------------------------------------------------------------------- /configs/dmc_rpg.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/dmc_rpg.json -------------------------------------------------------------------------------- /configs/mujoco_actorcritic.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/mujoco_actorcritic.json -------------------------------------------------------------------------------- /configs/mujoco_ddpg.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/mujoco_ddpg.json -------------------------------------------------------------------------------- /configs/mujoco_reponpg.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/mujoco_reponpg.json -------------------------------------------------------------------------------- /configs/mujoco_sac.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/mujoco_sac.json -------------------------------------------------------------------------------- /configs/mujoco_td3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/mujoco_td3.json -------------------------------------------------------------------------------- /configs/nchain.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/configs/nchain.json -------------------------------------------------------------------------------- /envs/env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/envs/env.py -------------------------------------------------------------------------------- /envs/wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/envs/wrapper.py -------------------------------------------------------------------------------- /experiment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/experiment.py -------------------------------------------------------------------------------- /find_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/find_config.py -------------------------------------------------------------------------------- /git_commit_id.sh: -------------------------------------------------------------------------------- 1 | git rev-parse --short HEAD -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/main.py -------------------------------------------------------------------------------- /move_log.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/move_log.sh -------------------------------------------------------------------------------- /plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/plot.py -------------------------------------------------------------------------------- /procfile: -------------------------------------------------------------------------------- 1 | 60 -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/requirements.txt -------------------------------------------------------------------------------- /run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/run.py -------------------------------------------------------------------------------- /run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/run.sh -------------------------------------------------------------------------------- /sbatch_m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/sbatch_m.sh -------------------------------------------------------------------------------- /sbatch_s.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/sbatch_s.sh -------------------------------------------------------------------------------- /unfinish_job.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/unfinish_job.py -------------------------------------------------------------------------------- /utils/helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/utils/helper.py -------------------------------------------------------------------------------- /utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/utils/logger.py -------------------------------------------------------------------------------- /utils/plotter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/utils/plotter.py -------------------------------------------------------------------------------- /utils/submitter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/utils/submitter.py -------------------------------------------------------------------------------- /utils/sweeper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/qlan3/Explorer/HEAD/utils/sweeper.py --------------------------------------------------------------------------------