├── .gitignore ├── LICENSE ├── README.md ├── config ├── __init__.py ├── get_euler_args.py ├── get_n_input.py ├── mujoco_config.py └── postprocess_misc_args.py ├── diagram ├── diagram.pdf ├── diagram.png ├── display2.png ├── display_template.pdf └── display_template.png ├── lib ├── __init__.py ├── agent.py ├── distributions │ ├── __init__.py │ ├── ar_normal.py │ ├── boltzmann.py │ ├── delta.py │ ├── distribution.py │ ├── kl_divergence.py │ ├── mixture_of_normals.py │ ├── mixture_of_tanh_normals.py │ ├── mixture_same_family.py │ ├── normal_uniform.py │ ├── tanh_ar_normal.py │ ├── tanh_normal.py │ └── transforms │ │ ├── __init__.py │ │ ├── autoregressive.py │ │ ├── reverse.py │ │ ├── tanh.py │ │ └── transform_module.py ├── inference │ ├── __init__.py │ ├── cem.py │ ├── direct.py │ ├── direct_goal.py │ ├── direct_gradient.py │ ├── gradient.py │ ├── iterative.py │ └── non_parametric.py ├── layers │ ├── __init__.py │ ├── ar_fully_connected.py │ ├── convolutional.py │ ├── fully_connected.py │ ├── layer.py │ ├── recurrent.py │ └── transposed_conv.py ├── models │ ├── __init__.py │ └── model.py ├── networks │ ├── __init__.py │ ├── ar_fully_connected.py │ ├── convolutional.py │ ├── fully_connected.py │ ├── minigrid │ │ ├── __init__.py │ │ ├── minigrid_conv.py │ │ └── minigrid_deconv.py │ ├── network.py │ ├── network_ensemble.py │ ├── recurrent.py │ └── vizdoom │ │ ├── __init__.py │ │ ├── conv_decoder.py │ │ ├── conv_discrim.py │ │ ├── conv_encoder.py │ │ ├── skip_conv_decoder.py │ │ └── skip_conv_encoder.py ├── value_estimators │ ├── __init__.py │ ├── direct_q.py │ ├── direct_v.py │ ├── goal_based.py │ ├── model_based_q.py │ └── simulator_q.py └── variables │ ├── __init__.py │ ├── latent_variables │ ├── __init__.py │ ├── convolutional.py │ ├── fully_connected.py │ └── latent_variable.py │ ├── observed_variables │ ├── __init__.py │ ├── convolutional.py │ ├── fully_connected.py │ ├── observed_variable.py │ └── transposed_conv.py │ └── value_variable.py ├── local_vars.py ├── main.py ├── misc ├── __init__.py ├── buffer.py ├── collector.py ├── estimators.py ├── euler.py ├── gradients.py ├── initialization.py ├── normalization.py ├── one_hot.py └── optimizer.py ├── requirements.txt └── util ├── __init__.py ├── analysis ├── __init__.py ├── analyze_agent_kl.py ├── analyze_inf.py ├── goal_optimization.py ├── test_value_est.py └── visualize_optimization.py ├── env_util ├── __init__.py ├── mujoco │ ├── __init__.py │ ├── ant.py │ └── humanoid.py ├── registration.py ├── synchronous_env.py └── wrappers │ ├── __init__.py │ ├── action_wrappers.py │ ├── observation_wrappers.py │ └── reward_wrappers.py ├── plot_util.py └── train_util ├── __init__.py ├── agent_kl.py ├── collect_episode.py ├── collect_optimized_episode.py ├── test_model.py ├── train.py └── train_batch.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/README.md -------------------------------------------------------------------------------- /config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/config/__init__.py -------------------------------------------------------------------------------- /config/get_euler_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/config/get_euler_args.py -------------------------------------------------------------------------------- /config/get_n_input.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/config/get_n_input.py -------------------------------------------------------------------------------- /config/mujoco_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/config/mujoco_config.py -------------------------------------------------------------------------------- /config/postprocess_misc_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/config/postprocess_misc_args.py -------------------------------------------------------------------------------- /diagram/diagram.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/diagram/diagram.pdf -------------------------------------------------------------------------------- /diagram/diagram.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/diagram/diagram.png -------------------------------------------------------------------------------- /diagram/display2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/diagram/display2.png -------------------------------------------------------------------------------- /diagram/display_template.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/diagram/display_template.pdf -------------------------------------------------------------------------------- /diagram/display_template.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/diagram/display_template.png -------------------------------------------------------------------------------- /lib/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/__init__.py -------------------------------------------------------------------------------- /lib/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/agent.py -------------------------------------------------------------------------------- /lib/distributions/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/__init__.py -------------------------------------------------------------------------------- /lib/distributions/ar_normal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/ar_normal.py -------------------------------------------------------------------------------- /lib/distributions/boltzmann.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/boltzmann.py -------------------------------------------------------------------------------- /lib/distributions/delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/delta.py -------------------------------------------------------------------------------- /lib/distributions/distribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/distribution.py -------------------------------------------------------------------------------- /lib/distributions/kl_divergence.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/kl_divergence.py -------------------------------------------------------------------------------- /lib/distributions/mixture_of_normals.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/mixture_of_normals.py -------------------------------------------------------------------------------- /lib/distributions/mixture_of_tanh_normals.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/mixture_of_tanh_normals.py -------------------------------------------------------------------------------- /lib/distributions/mixture_same_family.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/mixture_same_family.py -------------------------------------------------------------------------------- /lib/distributions/normal_uniform.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/normal_uniform.py -------------------------------------------------------------------------------- /lib/distributions/tanh_ar_normal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/tanh_ar_normal.py -------------------------------------------------------------------------------- /lib/distributions/tanh_normal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/tanh_normal.py -------------------------------------------------------------------------------- /lib/distributions/transforms/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/transforms/__init__.py -------------------------------------------------------------------------------- /lib/distributions/transforms/autoregressive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/transforms/autoregressive.py -------------------------------------------------------------------------------- /lib/distributions/transforms/reverse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/transforms/reverse.py -------------------------------------------------------------------------------- /lib/distributions/transforms/tanh.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/transforms/tanh.py -------------------------------------------------------------------------------- /lib/distributions/transforms/transform_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/distributions/transforms/transform_module.py -------------------------------------------------------------------------------- /lib/inference/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/__init__.py -------------------------------------------------------------------------------- /lib/inference/cem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/cem.py -------------------------------------------------------------------------------- /lib/inference/direct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/direct.py -------------------------------------------------------------------------------- /lib/inference/direct_goal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/direct_goal.py -------------------------------------------------------------------------------- /lib/inference/direct_gradient.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/direct_gradient.py -------------------------------------------------------------------------------- /lib/inference/gradient.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/gradient.py -------------------------------------------------------------------------------- /lib/inference/iterative.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/iterative.py -------------------------------------------------------------------------------- /lib/inference/non_parametric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/inference/non_parametric.py -------------------------------------------------------------------------------- /lib/layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/layers/__init__.py -------------------------------------------------------------------------------- /lib/layers/ar_fully_connected.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/layers/ar_fully_connected.py -------------------------------------------------------------------------------- /lib/layers/convolutional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/layers/convolutional.py -------------------------------------------------------------------------------- /lib/layers/fully_connected.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/layers/fully_connected.py -------------------------------------------------------------------------------- /lib/layers/layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/layers/layer.py -------------------------------------------------------------------------------- /lib/layers/recurrent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/layers/recurrent.py -------------------------------------------------------------------------------- /lib/layers/transposed_conv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/layers/transposed_conv.py -------------------------------------------------------------------------------- /lib/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/models/__init__.py -------------------------------------------------------------------------------- /lib/models/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/models/model.py -------------------------------------------------------------------------------- /lib/networks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/__init__.py -------------------------------------------------------------------------------- /lib/networks/ar_fully_connected.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/ar_fully_connected.py -------------------------------------------------------------------------------- /lib/networks/convolutional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/convolutional.py -------------------------------------------------------------------------------- /lib/networks/fully_connected.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/fully_connected.py -------------------------------------------------------------------------------- /lib/networks/minigrid/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/minigrid/__init__.py -------------------------------------------------------------------------------- /lib/networks/minigrid/minigrid_conv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/minigrid/minigrid_conv.py -------------------------------------------------------------------------------- /lib/networks/minigrid/minigrid_deconv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/minigrid/minigrid_deconv.py -------------------------------------------------------------------------------- /lib/networks/network.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/network.py -------------------------------------------------------------------------------- /lib/networks/network_ensemble.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/network_ensemble.py -------------------------------------------------------------------------------- /lib/networks/recurrent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/recurrent.py -------------------------------------------------------------------------------- /lib/networks/vizdoom/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/vizdoom/__init__.py -------------------------------------------------------------------------------- /lib/networks/vizdoom/conv_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/vizdoom/conv_decoder.py -------------------------------------------------------------------------------- /lib/networks/vizdoom/conv_discrim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/vizdoom/conv_discrim.py -------------------------------------------------------------------------------- /lib/networks/vizdoom/conv_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/vizdoom/conv_encoder.py -------------------------------------------------------------------------------- /lib/networks/vizdoom/skip_conv_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/vizdoom/skip_conv_decoder.py -------------------------------------------------------------------------------- /lib/networks/vizdoom/skip_conv_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/networks/vizdoom/skip_conv_encoder.py -------------------------------------------------------------------------------- /lib/value_estimators/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/value_estimators/__init__.py -------------------------------------------------------------------------------- /lib/value_estimators/direct_q.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/value_estimators/direct_q.py -------------------------------------------------------------------------------- /lib/value_estimators/direct_v.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/value_estimators/direct_v.py -------------------------------------------------------------------------------- /lib/value_estimators/goal_based.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/value_estimators/goal_based.py -------------------------------------------------------------------------------- /lib/value_estimators/model_based_q.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/value_estimators/model_based_q.py -------------------------------------------------------------------------------- /lib/value_estimators/simulator_q.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/value_estimators/simulator_q.py -------------------------------------------------------------------------------- /lib/variables/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/__init__.py -------------------------------------------------------------------------------- /lib/variables/latent_variables/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/latent_variables/__init__.py -------------------------------------------------------------------------------- /lib/variables/latent_variables/convolutional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/latent_variables/convolutional.py -------------------------------------------------------------------------------- /lib/variables/latent_variables/fully_connected.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/latent_variables/fully_connected.py -------------------------------------------------------------------------------- /lib/variables/latent_variables/latent_variable.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/latent_variables/latent_variable.py -------------------------------------------------------------------------------- /lib/variables/observed_variables/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/observed_variables/__init__.py -------------------------------------------------------------------------------- /lib/variables/observed_variables/convolutional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/observed_variables/convolutional.py -------------------------------------------------------------------------------- /lib/variables/observed_variables/fully_connected.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/observed_variables/fully_connected.py -------------------------------------------------------------------------------- /lib/variables/observed_variables/observed_variable.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/observed_variables/observed_variable.py -------------------------------------------------------------------------------- /lib/variables/observed_variables/transposed_conv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/observed_variables/transposed_conv.py -------------------------------------------------------------------------------- /lib/variables/value_variable.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/lib/variables/value_variable.py -------------------------------------------------------------------------------- /local_vars.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/local_vars.py -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/main.py -------------------------------------------------------------------------------- /misc/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/__init__.py -------------------------------------------------------------------------------- /misc/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/buffer.py -------------------------------------------------------------------------------- /misc/collector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/collector.py -------------------------------------------------------------------------------- /misc/estimators.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/estimators.py -------------------------------------------------------------------------------- /misc/euler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/euler.py -------------------------------------------------------------------------------- /misc/gradients.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/gradients.py -------------------------------------------------------------------------------- /misc/initialization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/initialization.py -------------------------------------------------------------------------------- /misc/normalization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/normalization.py -------------------------------------------------------------------------------- /misc/one_hot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/one_hot.py -------------------------------------------------------------------------------- /misc/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/misc/optimizer.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/requirements.txt -------------------------------------------------------------------------------- /util/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /util/analysis/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/analysis/__init__.py -------------------------------------------------------------------------------- /util/analysis/analyze_agent_kl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/analysis/analyze_agent_kl.py -------------------------------------------------------------------------------- /util/analysis/analyze_inf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/analysis/analyze_inf.py -------------------------------------------------------------------------------- /util/analysis/goal_optimization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/analysis/goal_optimization.py -------------------------------------------------------------------------------- /util/analysis/test_value_est.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/analysis/test_value_est.py -------------------------------------------------------------------------------- /util/analysis/visualize_optimization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/analysis/visualize_optimization.py -------------------------------------------------------------------------------- /util/env_util/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/__init__.py -------------------------------------------------------------------------------- /util/env_util/mujoco/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /util/env_util/mujoco/ant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/mujoco/ant.py -------------------------------------------------------------------------------- /util/env_util/mujoco/humanoid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/mujoco/humanoid.py -------------------------------------------------------------------------------- /util/env_util/registration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/registration.py -------------------------------------------------------------------------------- /util/env_util/synchronous_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/synchronous_env.py -------------------------------------------------------------------------------- /util/env_util/wrappers/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /util/env_util/wrappers/action_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/wrappers/action_wrappers.py -------------------------------------------------------------------------------- /util/env_util/wrappers/observation_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/wrappers/observation_wrappers.py -------------------------------------------------------------------------------- /util/env_util/wrappers/reward_wrappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/env_util/wrappers/reward_wrappers.py -------------------------------------------------------------------------------- /util/plot_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/plot_util.py -------------------------------------------------------------------------------- /util/train_util/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/train_util/__init__.py -------------------------------------------------------------------------------- /util/train_util/agent_kl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/train_util/agent_kl.py -------------------------------------------------------------------------------- /util/train_util/collect_episode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/train_util/collect_episode.py -------------------------------------------------------------------------------- /util/train_util/collect_optimized_episode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/train_util/collect_optimized_episode.py -------------------------------------------------------------------------------- /util/train_util/test_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/train_util/test_model.py -------------------------------------------------------------------------------- /util/train_util/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/train_util/train.py -------------------------------------------------------------------------------- /util/train_util/train_batch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/joelouismarino/variational_rl/HEAD/util/train_util/train_batch.py --------------------------------------------------------------------------------