├── .gitignore ├── LICENSE ├── docs ├── atari_iqn_lstm.md ├── distributed_acting.md └── json_syntax.md ├── readme.md ├── rltime ├── __init__.py ├── acting │ ├── __init__.py │ ├── acting_interface.py │ ├── actor.py │ ├── actor_pool.py │ ├── actor_wrapper.py │ ├── async_actor.py │ ├── create.py │ └── ray_pool.py ├── configs │ ├── atari_iqn_lstm.json │ ├── atari_ppo.json │ ├── cartpole_a2c.json │ ├── cartpole_common.json │ ├── cartpole_dqn.json │ ├── cartpole_iqn.json │ ├── cartpole_ppo.json │ ├── env_wrappers │ │ ├── atari.json │ │ └── atari_lstm.json │ ├── exploration │ │ ├── decay_0.01_10p.json │ │ ├── decay_0.01_50p.json │ │ ├── decay_0.01_5p.json │ │ ├── per_actor_0.4_factor7.json │ │ └── per_actor_0.4_to_0.01_factor7_50p.json │ ├── models │ │ ├── mlp_2x64.json │ │ ├── modules │ │ │ ├── fc256.json │ │ │ ├── fc512.json │ │ │ ├── fc64.json │ │ │ ├── lstm512.json │ │ │ ├── nature_cnn.json │ │ │ └── nature_cnn_small.json │ │ ├── nature_cnn_fc512.json │ │ ├── nature_cnn_fc512_lstm512.json │ │ ├── nature_cnn_fc512_lstm512_fc512.json │ │ └── nature_cnn_lstm512_fc512.json │ ├── mountaincar_continuous_ppo.json │ └── ple_flappy_bird_iqn_lstm.json ├── env_wrappers │ ├── __init__.py │ ├── atari.py │ ├── common.py │ └── vec_env │ │ ├── __init__.py │ │ ├── common.py │ │ ├── simple.py │ │ └── sub_proc.py ├── eval.py ├── exploration │ ├── __init__.py │ ├── base.py │ └── epsilon_greedy.py ├── general │ ├── __init__.py │ ├── allowed_modules.py │ ├── backend.py │ ├── compression.py │ ├── config.py │ ├── config_template.py │ ├── loggers.py │ ├── object_wrapper.py │ ├── preceiver.py │ ├── singleton.py │ ├── type_registry.py │ ├── utils.py │ └── value_log.py ├── history │ ├── __init__.py │ ├── data_structures │ │ ├── __init__.py │ │ ├── cyclic_array.py │ │ └── segment_tree.py │ ├── history.py │ ├── online_history.py │ ├── parallel_history.py │ ├── prioritized_replay_history.py │ └── replay_history.py ├── models │ ├── __init__.py │ └── torch │ │ ├── __init__.py │ │ ├── modules │ │ ├── __init__.py │ │ ├── base.py │ │ ├── cnn.py │ │ ├── fc.py │ │ └── lstm.py │ │ ├── sequential.py │ │ ├── torch_model.py │ │ └── utils.py ├── policies │ ├── __init__.py │ ├── policy.py │ └── torch │ │ ├── __init__.py │ │ ├── actor_critic.py │ │ ├── dist_dqn.py │ │ ├── distributions │ │ ├── __init__.py │ │ ├── categorical.py │ │ ├── distribution_layer.py │ │ └── normal.py │ │ ├── dqn.py │ │ ├── iqn.py │ │ └── torch_policy.py ├── train.py └── training │ ├── __init__.py │ ├── multi_step_trainer.py │ ├── policy_trainer.py │ └── torch │ ├── __init__.py │ ├── a2c.py │ ├── dist_dqn.py │ ├── dqn.py │ ├── iqn.py │ ├── ppo.py │ └── torch_trainer.py └── setup.py /.gitignore: -------------------------------------------------------------------------------- 1 | *.pyc 2 | *.egg-info -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/LICENSE -------------------------------------------------------------------------------- /docs/atari_iqn_lstm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/docs/atari_iqn_lstm.md -------------------------------------------------------------------------------- /docs/distributed_acting.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/docs/distributed_acting.md -------------------------------------------------------------------------------- /docs/json_syntax.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/docs/json_syntax.md -------------------------------------------------------------------------------- /readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/readme.md -------------------------------------------------------------------------------- /rltime/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/acting/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/acting/acting_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/acting/acting_interface.py -------------------------------------------------------------------------------- /rltime/acting/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/acting/actor.py -------------------------------------------------------------------------------- /rltime/acting/actor_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/acting/actor_pool.py -------------------------------------------------------------------------------- /rltime/acting/actor_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/acting/actor_wrapper.py -------------------------------------------------------------------------------- /rltime/acting/async_actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/acting/async_actor.py -------------------------------------------------------------------------------- /rltime/acting/create.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/acting/create.py -------------------------------------------------------------------------------- /rltime/acting/ray_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/acting/ray_pool.py -------------------------------------------------------------------------------- /rltime/configs/atari_iqn_lstm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/atari_iqn_lstm.json -------------------------------------------------------------------------------- /rltime/configs/atari_ppo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/atari_ppo.json -------------------------------------------------------------------------------- /rltime/configs/cartpole_a2c.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/cartpole_a2c.json -------------------------------------------------------------------------------- /rltime/configs/cartpole_common.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/cartpole_common.json -------------------------------------------------------------------------------- /rltime/configs/cartpole_dqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/cartpole_dqn.json -------------------------------------------------------------------------------- /rltime/configs/cartpole_iqn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/cartpole_iqn.json -------------------------------------------------------------------------------- /rltime/configs/cartpole_ppo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/cartpole_ppo.json -------------------------------------------------------------------------------- /rltime/configs/env_wrappers/atari.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/env_wrappers/atari.json -------------------------------------------------------------------------------- /rltime/configs/env_wrappers/atari_lstm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/env_wrappers/atari_lstm.json -------------------------------------------------------------------------------- /rltime/configs/exploration/decay_0.01_10p.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/exploration/decay_0.01_10p.json -------------------------------------------------------------------------------- /rltime/configs/exploration/decay_0.01_50p.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/exploration/decay_0.01_50p.json -------------------------------------------------------------------------------- /rltime/configs/exploration/decay_0.01_5p.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/exploration/decay_0.01_5p.json -------------------------------------------------------------------------------- /rltime/configs/exploration/per_actor_0.4_factor7.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/exploration/per_actor_0.4_factor7.json -------------------------------------------------------------------------------- /rltime/configs/exploration/per_actor_0.4_to_0.01_factor7_50p.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/exploration/per_actor_0.4_to_0.01_factor7_50p.json -------------------------------------------------------------------------------- /rltime/configs/models/mlp_2x64.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/mlp_2x64.json -------------------------------------------------------------------------------- /rltime/configs/models/modules/fc256.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/modules/fc256.json -------------------------------------------------------------------------------- /rltime/configs/models/modules/fc512.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/modules/fc512.json -------------------------------------------------------------------------------- /rltime/configs/models/modules/fc64.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/modules/fc64.json -------------------------------------------------------------------------------- /rltime/configs/models/modules/lstm512.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/modules/lstm512.json -------------------------------------------------------------------------------- /rltime/configs/models/modules/nature_cnn.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/modules/nature_cnn.json -------------------------------------------------------------------------------- /rltime/configs/models/modules/nature_cnn_small.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/modules/nature_cnn_small.json -------------------------------------------------------------------------------- /rltime/configs/models/nature_cnn_fc512.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/nature_cnn_fc512.json -------------------------------------------------------------------------------- /rltime/configs/models/nature_cnn_fc512_lstm512.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/nature_cnn_fc512_lstm512.json -------------------------------------------------------------------------------- /rltime/configs/models/nature_cnn_fc512_lstm512_fc512.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/nature_cnn_fc512_lstm512_fc512.json -------------------------------------------------------------------------------- /rltime/configs/models/nature_cnn_lstm512_fc512.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/models/nature_cnn_lstm512_fc512.json -------------------------------------------------------------------------------- /rltime/configs/mountaincar_continuous_ppo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/mountaincar_continuous_ppo.json -------------------------------------------------------------------------------- /rltime/configs/ple_flappy_bird_iqn_lstm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/configs/ple_flappy_bird_iqn_lstm.json -------------------------------------------------------------------------------- /rltime/env_wrappers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/env_wrappers/atari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/env_wrappers/atari.py -------------------------------------------------------------------------------- /rltime/env_wrappers/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/env_wrappers/common.py -------------------------------------------------------------------------------- /rltime/env_wrappers/vec_env/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/env_wrappers/vec_env/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/env_wrappers/vec_env/common.py -------------------------------------------------------------------------------- /rltime/env_wrappers/vec_env/simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/env_wrappers/vec_env/simple.py -------------------------------------------------------------------------------- /rltime/env_wrappers/vec_env/sub_proc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/env_wrappers/vec_env/sub_proc.py -------------------------------------------------------------------------------- /rltime/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/eval.py -------------------------------------------------------------------------------- /rltime/exploration/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/exploration/__init__.py -------------------------------------------------------------------------------- /rltime/exploration/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/exploration/base.py -------------------------------------------------------------------------------- /rltime/exploration/epsilon_greedy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/exploration/epsilon_greedy.py -------------------------------------------------------------------------------- /rltime/general/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/general/allowed_modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/allowed_modules.py -------------------------------------------------------------------------------- /rltime/general/backend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/backend.py -------------------------------------------------------------------------------- /rltime/general/compression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/compression.py -------------------------------------------------------------------------------- /rltime/general/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/config.py -------------------------------------------------------------------------------- /rltime/general/config_template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/config_template.py -------------------------------------------------------------------------------- /rltime/general/loggers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/loggers.py -------------------------------------------------------------------------------- /rltime/general/object_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/object_wrapper.py -------------------------------------------------------------------------------- /rltime/general/preceiver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/preceiver.py -------------------------------------------------------------------------------- /rltime/general/singleton.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/singleton.py -------------------------------------------------------------------------------- /rltime/general/type_registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/type_registry.py -------------------------------------------------------------------------------- /rltime/general/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/utils.py -------------------------------------------------------------------------------- /rltime/general/value_log.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/general/value_log.py -------------------------------------------------------------------------------- /rltime/history/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/__init__.py -------------------------------------------------------------------------------- /rltime/history/data_structures/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/history/data_structures/cyclic_array.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/data_structures/cyclic_array.py -------------------------------------------------------------------------------- /rltime/history/data_structures/segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/data_structures/segment_tree.py -------------------------------------------------------------------------------- /rltime/history/history.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/history.py -------------------------------------------------------------------------------- /rltime/history/online_history.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/online_history.py -------------------------------------------------------------------------------- /rltime/history/parallel_history.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/parallel_history.py -------------------------------------------------------------------------------- /rltime/history/prioritized_replay_history.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/prioritized_replay_history.py -------------------------------------------------------------------------------- /rltime/history/replay_history.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/history/replay_history.py -------------------------------------------------------------------------------- /rltime/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/__init__.py -------------------------------------------------------------------------------- /rltime/models/torch/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/models/torch/modules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/modules/__init__.py -------------------------------------------------------------------------------- /rltime/models/torch/modules/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/modules/base.py -------------------------------------------------------------------------------- /rltime/models/torch/modules/cnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/modules/cnn.py -------------------------------------------------------------------------------- /rltime/models/torch/modules/fc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/modules/fc.py -------------------------------------------------------------------------------- /rltime/models/torch/modules/lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/modules/lstm.py -------------------------------------------------------------------------------- /rltime/models/torch/sequential.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/sequential.py -------------------------------------------------------------------------------- /rltime/models/torch/torch_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/torch_model.py -------------------------------------------------------------------------------- /rltime/models/torch/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/models/torch/utils.py -------------------------------------------------------------------------------- /rltime/policies/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/policies/policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/policy.py -------------------------------------------------------------------------------- /rltime/policies/torch/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rltime/policies/torch/actor_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/actor_critic.py -------------------------------------------------------------------------------- /rltime/policies/torch/dist_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/dist_dqn.py -------------------------------------------------------------------------------- /rltime/policies/torch/distributions/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/distributions/__init__.py -------------------------------------------------------------------------------- /rltime/policies/torch/distributions/categorical.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/distributions/categorical.py -------------------------------------------------------------------------------- /rltime/policies/torch/distributions/distribution_layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/distributions/distribution_layer.py -------------------------------------------------------------------------------- /rltime/policies/torch/distributions/normal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/distributions/normal.py -------------------------------------------------------------------------------- /rltime/policies/torch/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/dqn.py -------------------------------------------------------------------------------- /rltime/policies/torch/iqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/iqn.py -------------------------------------------------------------------------------- /rltime/policies/torch/torch_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/policies/torch/torch_policy.py -------------------------------------------------------------------------------- /rltime/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/train.py -------------------------------------------------------------------------------- /rltime/training/__init__.py: -------------------------------------------------------------------------------- 1 | from .torch import get_types 2 | -------------------------------------------------------------------------------- /rltime/training/multi_step_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/multi_step_trainer.py -------------------------------------------------------------------------------- /rltime/training/policy_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/policy_trainer.py -------------------------------------------------------------------------------- /rltime/training/torch/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/torch/__init__.py -------------------------------------------------------------------------------- /rltime/training/torch/a2c.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/torch/a2c.py -------------------------------------------------------------------------------- /rltime/training/torch/dist_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/torch/dist_dqn.py -------------------------------------------------------------------------------- /rltime/training/torch/dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/torch/dqn.py -------------------------------------------------------------------------------- /rltime/training/torch/iqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/torch/iqn.py -------------------------------------------------------------------------------- /rltime/training/torch/ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/torch/ppo.py -------------------------------------------------------------------------------- /rltime/training/torch/torch_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/rltime/training/torch/torch_trainer.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/opherlieber/rltime/HEAD/setup.py --------------------------------------------------------------------------------