├── LICENSE ├── README.md ├── attackers ├── attacker.py └── data_mean_std.py ├── data └── img.png ├── experiment_configs ├── algorithms │ ├── batch.py │ ├── batch_mbrl.py │ ├── mbrl.py │ ├── offline.py │ ├── offline_mbrl.py │ └── online.py ├── base_experiment.py └── configs │ └── q_learning │ └── sac_config.py ├── experiment_utils ├── __init__.py ├── launch_experiment.py ├── prepare_data.py └── utils.py ├── lifelong_rl ├── __init__.py ├── baselines │ ├── __init__.py │ └── base │ │ ├── base.py │ │ └── mlp_baseline.py ├── core │ ├── __init__.py │ ├── logging │ │ ├── logging.py │ │ ├── logging_setup.py │ │ └── tabulate.py │ └── rl_algorithms │ │ ├── __init__.py │ │ ├── batch │ │ ├── __init__.py │ │ ├── batch_rl_algorithm.py │ │ └── mb_batch_rl_algorithm.py │ │ ├── offline │ │ ├── __init__.py │ │ ├── mb_offline_rl_algorithm.py │ │ └── offline_rl_algorithm.py │ │ ├── online │ │ ├── __init__.py │ │ ├── mbrl_algorithm.py │ │ └── online_rl_algorithm.py │ │ ├── rl_algorithm.py │ │ └── torch_rl_algorithm.py ├── data_management │ ├── replay_buffers │ │ ├── env_replay_buffer.py │ │ ├── mujoco_replay_buffer.py │ │ ├── replay_buffer.py │ │ └── simple_replay_buffer.py │ └── utils │ │ └── path_builder.py ├── envs │ ├── __init__.py │ ├── env_processor.py │ ├── env_utils.py │ ├── environments │ │ ├── __init__.py │ │ ├── ant_env.py │ │ ├── assets │ │ │ ├── ant.xml │ │ │ └── inverted_pendulum.xml │ │ ├── continuous_gridworld │ │ │ ├── __init__.py │ │ │ ├── cont_gridworld.py │ │ │ ├── grids │ │ │ │ ├── blank.txt │ │ │ │ ├── minecraft │ │ │ │ │ └── world_1.txt │ │ │ │ ├── one_goal.txt │ │ │ │ ├── volcano_1.txt │ │ │ │ └── volcano_2.txt │ │ │ └── tiles.py │ │ ├── hopper_env.py │ │ └── humanoid_env.py │ └── wrappers.py ├── exploration_strategies │ ├── __init__.py │ ├── base.py │ ├── epsilon_greedy.py │ ├── gaussian_and_epsilon_strategy.py │ ├── gaussian_strategy.py │ └── ou_strategy.py ├── models │ ├── __init__.py │ ├── dynamics_models │ │ ├── __init__.py │ │ └── probabilistic_ensemble.py │ └── networks.py ├── optimizers │ ├── __init__.py │ ├── optimizer.py │ └── random_shooting │ │ ├── __init__.py │ │ ├── cem.py │ │ ├── mppi.py │ │ └── rs_optimizer.py ├── policies │ ├── __init__.py │ ├── base │ │ ├── base.py │ │ ├── latent_prior_policy.py │ │ └── simple.py │ ├── models │ │ ├── gaussian_policy.py │ │ └── tanh_gaussian_policy.py │ └── mpc │ │ ├── mpc.py │ │ └── policy_mpc.py ├── samplers │ ├── __init__.py │ ├── data_collector │ │ ├── __init__.py │ │ ├── base.py │ │ ├── path_collector.py │ │ └── step_collector.py │ └── utils │ │ ├── model_rollout_functions.py │ │ ├── path_functions.py │ │ └── rollout_functions.py ├── torch │ ├── distributions.py │ ├── modules.py │ ├── pytorch_util.py │ └── risk_aversion.py ├── trainers │ ├── __init__.py │ ├── multi_trainer.py │ ├── q_learning │ │ ├── __init__.py │ │ └── sac.py │ └── trainer.py └── util │ ├── eval_util.py │ ├── pythonplusplus.py │ └── visualize_mujoco.py ├── requirements.txt └── scripts ├── get_config.py ├── get_dataset_return.py └── sac.py /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/README.md -------------------------------------------------------------------------------- /attackers/attacker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/attackers/attacker.py -------------------------------------------------------------------------------- /attackers/data_mean_std.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/attackers/data_mean_std.py -------------------------------------------------------------------------------- /data/img.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/data/img.png -------------------------------------------------------------------------------- /experiment_configs/algorithms/batch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/algorithms/batch.py -------------------------------------------------------------------------------- /experiment_configs/algorithms/batch_mbrl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/algorithms/batch_mbrl.py -------------------------------------------------------------------------------- /experiment_configs/algorithms/mbrl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/algorithms/mbrl.py -------------------------------------------------------------------------------- /experiment_configs/algorithms/offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/algorithms/offline.py -------------------------------------------------------------------------------- /experiment_configs/algorithms/offline_mbrl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/algorithms/offline_mbrl.py -------------------------------------------------------------------------------- /experiment_configs/algorithms/online.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/algorithms/online.py -------------------------------------------------------------------------------- /experiment_configs/base_experiment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/base_experiment.py -------------------------------------------------------------------------------- /experiment_configs/configs/q_learning/sac_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_configs/configs/q_learning/sac_config.py -------------------------------------------------------------------------------- /experiment_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /experiment_utils/launch_experiment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_utils/launch_experiment.py -------------------------------------------------------------------------------- /experiment_utils/prepare_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_utils/prepare_data.py -------------------------------------------------------------------------------- /experiment_utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/experiment_utils/utils.py -------------------------------------------------------------------------------- /lifelong_rl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/baselines/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/baselines/base/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/baselines/base/base.py -------------------------------------------------------------------------------- /lifelong_rl/baselines/base/mlp_baseline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/baselines/base/mlp_baseline.py -------------------------------------------------------------------------------- /lifelong_rl/core/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/__init__.py -------------------------------------------------------------------------------- /lifelong_rl/core/logging/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/logging/logging.py -------------------------------------------------------------------------------- /lifelong_rl/core/logging/logging_setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/logging/logging_setup.py -------------------------------------------------------------------------------- /lifelong_rl/core/logging/tabulate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/logging/tabulate.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/batch/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/batch/batch_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/batch/batch_rl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/batch/mb_batch_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/batch/mb_batch_rl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/offline/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/offline/mb_offline_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/offline/mb_offline_rl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/offline/offline_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/offline/offline_rl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/online/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/online/mbrl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/online/mbrl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/online/online_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/online/online_rl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/rl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/core/rl_algorithms/torch_rl_algorithm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/core/rl_algorithms/torch_rl_algorithm.py -------------------------------------------------------------------------------- /lifelong_rl/data_management/replay_buffers/env_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/data_management/replay_buffers/env_replay_buffer.py -------------------------------------------------------------------------------- /lifelong_rl/data_management/replay_buffers/mujoco_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/data_management/replay_buffers/mujoco_replay_buffer.py -------------------------------------------------------------------------------- /lifelong_rl/data_management/replay_buffers/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/data_management/replay_buffers/replay_buffer.py -------------------------------------------------------------------------------- /lifelong_rl/data_management/replay_buffers/simple_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/data_management/replay_buffers/simple_replay_buffer.py -------------------------------------------------------------------------------- /lifelong_rl/data_management/utils/path_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/data_management/utils/path_builder.py -------------------------------------------------------------------------------- /lifelong_rl/envs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/envs/env_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/env_processor.py -------------------------------------------------------------------------------- /lifelong_rl/envs/env_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/env_utils.py -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/ant_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/ant_env.py -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/assets/ant.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/assets/ant.xml -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/assets/inverted_pendulum.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/assets/inverted_pendulum.xml -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/cont_gridworld.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/continuous_gridworld/cont_gridworld.py -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/grids/blank.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/continuous_gridworld/grids/blank.txt -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/grids/minecraft/world_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/continuous_gridworld/grids/minecraft/world_1.txt -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/grids/one_goal.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/continuous_gridworld/grids/one_goal.txt -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/grids/volcano_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/continuous_gridworld/grids/volcano_1.txt -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/grids/volcano_2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/continuous_gridworld/grids/volcano_2.txt -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/continuous_gridworld/tiles.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/continuous_gridworld/tiles.py -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/hopper_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/hopper_env.py -------------------------------------------------------------------------------- /lifelong_rl/envs/environments/humanoid_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/environments/humanoid_env.py -------------------------------------------------------------------------------- /lifelong_rl/envs/wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/envs/wrappers.py -------------------------------------------------------------------------------- /lifelong_rl/exploration_strategies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/exploration_strategies/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/exploration_strategies/base.py -------------------------------------------------------------------------------- /lifelong_rl/exploration_strategies/epsilon_greedy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/exploration_strategies/epsilon_greedy.py -------------------------------------------------------------------------------- /lifelong_rl/exploration_strategies/gaussian_and_epsilon_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/exploration_strategies/gaussian_and_epsilon_strategy.py -------------------------------------------------------------------------------- /lifelong_rl/exploration_strategies/gaussian_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/exploration_strategies/gaussian_strategy.py -------------------------------------------------------------------------------- /lifelong_rl/exploration_strategies/ou_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/exploration_strategies/ou_strategy.py -------------------------------------------------------------------------------- /lifelong_rl/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/models/dynamics_models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/models/dynamics_models/probabilistic_ensemble.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/models/dynamics_models/probabilistic_ensemble.py -------------------------------------------------------------------------------- /lifelong_rl/models/networks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/models/networks.py -------------------------------------------------------------------------------- /lifelong_rl/optimizers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/optimizers/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/optimizers/optimizer.py -------------------------------------------------------------------------------- /lifelong_rl/optimizers/random_shooting/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/optimizers/random_shooting/cem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/optimizers/random_shooting/cem.py -------------------------------------------------------------------------------- /lifelong_rl/optimizers/random_shooting/mppi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/optimizers/random_shooting/mppi.py -------------------------------------------------------------------------------- /lifelong_rl/optimizers/random_shooting/rs_optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/optimizers/random_shooting/rs_optimizer.py -------------------------------------------------------------------------------- /lifelong_rl/policies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/policies/base/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/policies/base/base.py -------------------------------------------------------------------------------- /lifelong_rl/policies/base/latent_prior_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/policies/base/latent_prior_policy.py -------------------------------------------------------------------------------- /lifelong_rl/policies/base/simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/policies/base/simple.py -------------------------------------------------------------------------------- /lifelong_rl/policies/models/gaussian_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/policies/models/gaussian_policy.py -------------------------------------------------------------------------------- /lifelong_rl/policies/models/tanh_gaussian_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/policies/models/tanh_gaussian_policy.py -------------------------------------------------------------------------------- /lifelong_rl/policies/mpc/mpc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/policies/mpc/mpc.py -------------------------------------------------------------------------------- /lifelong_rl/policies/mpc/policy_mpc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/policies/mpc/policy_mpc.py -------------------------------------------------------------------------------- /lifelong_rl/samplers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/samplers/__init__.py -------------------------------------------------------------------------------- /lifelong_rl/samplers/data_collector/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/samplers/data_collector/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/samplers/data_collector/base.py -------------------------------------------------------------------------------- /lifelong_rl/samplers/data_collector/path_collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/samplers/data_collector/path_collector.py -------------------------------------------------------------------------------- /lifelong_rl/samplers/data_collector/step_collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/samplers/data_collector/step_collector.py -------------------------------------------------------------------------------- /lifelong_rl/samplers/utils/model_rollout_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/samplers/utils/model_rollout_functions.py -------------------------------------------------------------------------------- /lifelong_rl/samplers/utils/path_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/samplers/utils/path_functions.py -------------------------------------------------------------------------------- /lifelong_rl/samplers/utils/rollout_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/samplers/utils/rollout_functions.py -------------------------------------------------------------------------------- /lifelong_rl/torch/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/torch/distributions.py -------------------------------------------------------------------------------- /lifelong_rl/torch/modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/torch/modules.py -------------------------------------------------------------------------------- /lifelong_rl/torch/pytorch_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/torch/pytorch_util.py -------------------------------------------------------------------------------- /lifelong_rl/torch/risk_aversion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/torch/risk_aversion.py -------------------------------------------------------------------------------- /lifelong_rl/trainers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/trainers/multi_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/trainers/multi_trainer.py -------------------------------------------------------------------------------- /lifelong_rl/trainers/q_learning/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lifelong_rl/trainers/q_learning/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/trainers/q_learning/sac.py -------------------------------------------------------------------------------- /lifelong_rl/trainers/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/trainers/trainer.py -------------------------------------------------------------------------------- /lifelong_rl/util/eval_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/util/eval_util.py -------------------------------------------------------------------------------- /lifelong_rl/util/pythonplusplus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/util/pythonplusplus.py -------------------------------------------------------------------------------- /lifelong_rl/util/visualize_mujoco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/lifelong_rl/util/visualize_mujoco.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/get_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/scripts/get_config.py -------------------------------------------------------------------------------- /scripts/get_dataset_return.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/scripts/get_dataset_return.py -------------------------------------------------------------------------------- /scripts/sac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/YangRui2015/RORL/HEAD/scripts/sac.py --------------------------------------------------------------------------------