├── .gitignore
├── README.md
└── docs
    ├── img
        ├── double_pendulum
        │   ├── combination_logsumexp.png
        │   └── combination_mean.png
        ├── ibm_pendulum
        │   ├── bayes_sim
        │   │   ├── bayessim_ibm_pendulum_mdn_difference.png
        │   │   ├── bayessim_ibm_pendulum_mdn_difference_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdn_downsampled_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdn_signature_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdn_summary_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_matern_difference_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_matern_downsampled_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_matern_signature_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_matern_summary_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_rbf_difference_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_rbf_downsampled_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_rbf_signature_trajectories.png
        │   │   ├── bayessim_ibm_pendulum_mdrff_rbf_summary_trajectories.png
        │   │   ├── ibm_groundtruth_difference.png
        │   │   ├── ibm_groundtruth_downsampled.png
        │   │   ├── ibm_groundtruth_raw.png
        │   │   ├── ibm_groundtruth_signature.png
        │   │   └── ibm_groundtruth_summary.png
        │   ├── cem_trajectories.png
        │   ├── ibm-pendulum-timelapse.png
        │   ├── mcmc_trajectories.png
        │   ├── nuts_trajectories.png
        │   ├── sgld_ms.png
        │   ├── sgld_trajectories.png
        │   ├── svgd_ms_test.png
        │   ├── svgd_multiple_shooting.png
        │   ├── svgd_multiple_shooting_q.png
        │   ├── svgd_single_shooting.png
        │   ├── svgd_single_shooting_q.png
        │   └── svgd_ss_test.png
        ├── panda
        │   ├── box_position_cem.png
        │   ├── box_position_emcee.png
        │   ├── box_position_nuts.png
        │   ├── box_position_sgld.png
        │   ├── box_position_svgd_ms.png
        │   ├── box_position_svgd_ss.png
        │   ├── panda_box_2.jpg
        │   ├── panda_box_4.jpg
        │   ├── panda_box_initial_trajectory.png
        │   ├── panda_box_trajectory.png
        │   ├── panda_box_weights_cem.png
        │   ├── panda_sim.png
        │   ├── panda_sim_array.png
        │   ├── panda_sim_array2.png
        │   ├── panda_sim_array3.png
        │   ├── panda_sim_array4.png
        │   ├── panda_sim_array5.png
        │   ├── panda_sim_array6.png
        │   ├── panda_sim_array7.png
        │   └── panda_sim_markers.png
        ├── pds_diagram.png
        ├── pds_diagram.svg
        └── synthetic_param_uncertainty
        │   ├── bayessim_two_param_mdn_downsampled_trajectories.png
        │   ├── bayessim_twoparam_mdn_difference.png
        │   ├── bayessim_twoparam_mdn_downsampled.png
        │   ├── bayessim_twoparam_mdrff_rbf_downsampled.png
        │   ├── knn_kl.png
        │   ├── knn_kl_real_sim.png
        │   ├── knn_kl_sim_real.png
        │   ├── mmd.png
        │   ├── synthetic_param_uncertainty_cem.png
        │   ├── synthetic_param_uncertainty_mcmc.png
        │   ├── synthetic_param_uncertainty_nuts.png
        │   ├── synthetic_param_uncertainty_sgld.png
        │   ├── synthetic_param_uncertainty_svgd.png
        │   └── synthetic_params_loglikelihood.png
    └── index.html


/.gitignore:
--------------------------------------------------------------------------------
  1 | # Byte-compiled / optimized / DLL files
  2 | __pycache__/
  3 | *.py[cod]
  4 | *$py.class
  5 | 
  6 | # C extensions
  7 | *.so
  8 | 
  9 | # Distribution / packaging
 10 | .Python
 11 | build/
 12 | develop-eggs/
 13 | dist/
 14 | downloads/
 15 | eggs/
 16 | .eggs/
 17 | lib/
 18 | lib64/
 19 | parts/
 20 | sdist/
 21 | var/
 22 | wheels/
 23 | pip-wheel-metadata/
 24 | share/python-wheels/
 25 | *.egg-info/
 26 | .installed.cfg
 27 | *.egg
 28 | MANIFEST
 29 | 
 30 | # PyInstaller
 31 | #  Usually these files are written by a python script from a template
 32 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 33 | *.manifest
 34 | *.spec
 35 | 
 36 | # Installer logs
 37 | pip-log.txt
 38 | pip-delete-this-directory.txt
 39 | 
 40 | # Unit test / coverage reports
 41 | htmlcov/
 42 | .tox/
 43 | .nox/
 44 | .coverage
 45 | .coverage.*
 46 | .cache
 47 | nosetests.xml
 48 | coverage.xml
 49 | *.cover
 50 | *.py,cover
 51 | .hypothesis/
 52 | .pytest_cache/
 53 | 
 54 | # Translations
 55 | *.mo
 56 | *.pot
 57 | 
 58 | # Django stuff:
 59 | *.log
 60 | local_settings.py
 61 | db.sqlite3
 62 | db.sqlite3-journal
 63 | 
 64 | # Flask stuff:
 65 | instance/
 66 | .webassets-cache
 67 | 
 68 | # Scrapy stuff:
 69 | .scrapy
 70 | 
 71 | # Sphinx documentation
 72 | docs/_build/
 73 | 
 74 | # PyBuilder
 75 | target/
 76 | 
 77 | # Jupyter Notebook
 78 | .ipynb_checkpoints
 79 | 
 80 | # IPython
 81 | profile_default/
 82 | ipython_config.py
 83 | 
 84 | # pyenv
 85 | .python-version
 86 | 
 87 | # pipenv
 88 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
 89 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
 90 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
 91 | #   install all needed dependencies.
 92 | #Pipfile.lock
 93 | 
 94 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow
 95 | __pypackages__/
 96 | 
 97 | # Celery stuff
 98 | celerybeat-schedule
 99 | celerybeat.pid
100 | 
101 | # SageMath parsed files
102 | *.sage.py
103 | 
104 | # Environments
105 | .env
106 | .venv
107 | env/
108 | venv/
109 | ENV/
110 | env.bak/
111 | venv.bak/
112 | 
113 | # Spyder project settings
114 | .spyderproject
115 | .spyproject
116 | 
117 | # Rope project settings
118 | .ropeproject
119 | 
120 | # mkdocs documentation
121 | /site
122 | 
123 | # mypy
124 | .mypy_cache/
125 | .dmypy.json
126 | dmypy.json
127 | 
128 | # Pyre type checker
129 | .pyre/
130 | 
131 | .history


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | # prob-diff-sim
2 | Probabilistic Inference of Simulation Parameters via Parallel Differentiable Simulation
3 | 


--------------------------------------------------------------------------------
/docs/img/double_pendulum/combination_logsumexp.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/double_pendulum/combination_logsumexp.png


--------------------------------------------------------------------------------
/docs/img/double_pendulum/combination_mean.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/double_pendulum/combination_mean.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_difference.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_difference.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_difference_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_difference_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_downsampled_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_downsampled_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_signature_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_signature_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_summary_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_summary_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_difference_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_difference_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_downsampled_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_downsampled_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_signature_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_signature_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_summary_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_summary_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_difference_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_difference_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_downsampled_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_downsampled_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_signature_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_signature_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_summary_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_summary_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_difference.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_difference.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_downsampled.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_downsampled.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_raw.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_raw.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_signature.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_signature.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_summary.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/bayes_sim/ibm_groundtruth_summary.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/cem_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/cem_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/ibm-pendulum-timelapse.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/ibm-pendulum-timelapse.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/mcmc_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/mcmc_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/nuts_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/nuts_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/sgld_ms.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/sgld_ms.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/sgld_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/sgld_trajectories.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/svgd_ms_test.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/svgd_ms_test.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/svgd_multiple_shooting.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/svgd_multiple_shooting.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/svgd_multiple_shooting_q.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/svgd_multiple_shooting_q.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/svgd_single_shooting.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/svgd_single_shooting.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/svgd_single_shooting_q.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/svgd_single_shooting_q.png


--------------------------------------------------------------------------------
/docs/img/ibm_pendulum/svgd_ss_test.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/ibm_pendulum/svgd_ss_test.png


--------------------------------------------------------------------------------
/docs/img/panda/box_position_cem.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/box_position_cem.png


--------------------------------------------------------------------------------
/docs/img/panda/box_position_emcee.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/box_position_emcee.png


--------------------------------------------------------------------------------
/docs/img/panda/box_position_nuts.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/box_position_nuts.png


--------------------------------------------------------------------------------
/docs/img/panda/box_position_sgld.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/box_position_sgld.png


--------------------------------------------------------------------------------
/docs/img/panda/box_position_svgd_ms.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/box_position_svgd_ms.png


--------------------------------------------------------------------------------
/docs/img/panda/box_position_svgd_ss.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/box_position_svgd_ss.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_box_2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_box_2.jpg


--------------------------------------------------------------------------------
/docs/img/panda/panda_box_4.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_box_4.jpg


--------------------------------------------------------------------------------
/docs/img/panda/panda_box_initial_trajectory.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_box_initial_trajectory.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_box_trajectory.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_box_trajectory.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_box_weights_cem.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_box_weights_cem.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_array.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_array.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_array2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_array2.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_array3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_array3.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_array4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_array4.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_array5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_array5.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_array6.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_array6.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_array7.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_array7.png


--------------------------------------------------------------------------------
/docs/img/panda/panda_sim_markers.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/panda/panda_sim_markers.png


--------------------------------------------------------------------------------
/docs/img/pds_diagram.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/pds_diagram.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/bayessim_two_param_mdn_downsampled_trajectories.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/bayessim_two_param_mdn_downsampled_trajectories.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/bayessim_twoparam_mdn_difference.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/bayessim_twoparam_mdn_difference.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/bayessim_twoparam_mdn_downsampled.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/bayessim_twoparam_mdn_downsampled.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/bayessim_twoparam_mdrff_rbf_downsampled.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/bayessim_twoparam_mdrff_rbf_downsampled.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/knn_kl.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/knn_kl.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/knn_kl_real_sim.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/knn_kl_real_sim.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/knn_kl_sim_real.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/knn_kl_sim_real.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/mmd.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/mmd.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_cem.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_cem.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_mcmc.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_mcmc.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_nuts.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_nuts.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_sgld.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_sgld.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_svgd.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/synthetic_param_uncertainty_svgd.png


--------------------------------------------------------------------------------
/docs/img/synthetic_param_uncertainty/synthetic_params_loglikelihood.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/uscresl/prob-diff-sim/c7793e2cc2d326922c5dd8367224927ff46b1ef6/docs/img/synthetic_param_uncertainty/synthetic_params_loglikelihood.png


--------------------------------------------------------------------------------
/docs/index.html:
--------------------------------------------------------------------------------
   1 | <!doctype html>
   2 | <html lang="en">
   3 | 
   4 | <head>
   5 |     <meta charset="utf-8">
   6 |     <meta name="viewport" content="width=device-width, initial-scale=1">
   7 | 
   8 |     <meta property="og:site_name" content="Probabilistic Differentiable Simulation">
   9 |     <meta property="og:title" content="Probabilistic Differentiable Simulation">
  10 |     <meta property="og:description"
  11 |         content="Bayesian inference of simulation parameters that leverages parallel differentiable simulators">
  12 |     <meta property="og:url" content="https://uscresl.github.io/prob-diff-sim/">
  13 |     <meta property="og:image" content="https://uscresl.github.io/prob-diff-sim/img/pds_diagram.png">
  14 |     <meta property="og:image:type" content="image/png">
  15 | 
  16 |     <meta name="twitter:card" content="summary_large_image">
  17 |     <meta name="twitter:title" content="Probabilistic Differentiable Simulation">
  18 |     <meta name="twitter:description"
  19 |         content="Bayesian inference of simulation parameters that leverages parallel differentiable simulators">
  20 |     <meta name="twitter:creator" content="@eric_heiden">
  21 |     <meta name="twitter:url" content="https://uscresl.github.io/prob-diff-sim/">
  22 |     <meta name="twitter:image:src" content="https://uscresl.github.io/prob-diff-sim/img/pds_diagram.png">
  23 | 
  24 |     <meta name="description"
  25 |         content="Bayesian inference of simulation parameters that leverages parallel differentiable simulators">
  26 |     <meta name="author" content="Eric Heiden, Christopher E. Denniston, David Millard, Fabio Ramos, Gaurav S. Sukhatme">
  27 | 
  28 |     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.0.0-beta3/dist/css/bootstrap.min.css" rel="stylesheet"
  29 |         integrity="sha384-eOJMYsd53ii+scO/bJGFsiCZc+5NDVN2yr8+0RDqr0Ql0h+rP48ckxlpbzKgwra6" crossorigin="anonymous">
  30 | 
  31 |     <title>Probabilistic Differentiable Simulation</title>
  32 | 
  33 |     <style>
  34 |         div.authors p:first-of-type { /* larger text for the first paragraph inside each author column */
  35 |             font-size: 1.4em;
  36 |         }
  37 | 
  38 |         div.authors p { /* center the author names */
  39 |             text-align: center;
  40 |         }
  41 | 
  42 |         div.affiliations p { /* center the affiliation lines */
  43 |             text-align: center;
  44 |         }
  45 | 
  46 |         h1,
  47 |         h2 { /* centered page and section headings with vertical spacing */
  48 |             margin: 1em 0;
  49 |             text-align: center;
  50 |         }
  51 | 
  52 |         a:link { /* no underline on :link anchors */
  53 |             text-decoration: none;
  54 |         }
  55 | 
  56 |         #video { /* center the contents of the video section */
  57 |             text-align: center;
  58 |         }
  59 | 
  60 |         div.container { /* top padding; presumably leaves room below the fixed-top navbar - confirm */
  61 |             padding-top: 60px;
  62 |         }
  63 | 
  64 |         .navbar { /* inner padding of the navigation bar */
  65 |             padding: 0.4em 2em;
  66 |         }
  67 | 
  68 |         #abstract p { /* justified abstract paragraphs */
  69 |             text-align: justify;
  70 |         }
  71 | 
  72 |         #results .label { /* bold labels inside #results (that section is outside this excerpt) */
  73 |             margin-top: 1em;
  74 |             margin-bottom: 0.3em;
  75 |             font-weight: bold;
  76 |         }
  77 | 
  78 |         #results h3,
  79 |         #results h5 { /* extra space above sub-headings inside #results */
  80 |             margin-top: 2em;
  81 |         }
  82 | 
  83 |         .btn { /* buttons take 75% of the width of their containing block */
  84 |             width: 75%;
  85 |         }
  86 | 
  87 |         .actions .col { /* center the action buttons within their columns */
  88 |             text-align: center;
  89 |         }
  90 | 
  91 |         p { /* default: justify every paragraph; more specific rules above/below override this */
  92 |             text-align: justify;
  93 |         }
  94 | 
  95 |         table.numbers td { /* numeric tables: monospace, right-aligned cells */
  96 |             font-family: monospace !important;
  97 |             text-align: right;
  98 |             padding-right: 5%;
  99 |         }
 100 | 
 101 |         table.centered td,
 102 |         table.centered p { /* !important so centering wins over the justify rules for paragraphs */
 103 |             text-align: center !important;
 104 |         }
 105 |     </style>
 106 |     <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/katex@0.13.18/dist/katex.min.css"
 107 |         integrity="sha384-zTROYFVGOfTw7JV7KUu8udsvW2fx4lWOsCEDqhBreBwlHI4ioVRtmIvEThzJHGET" crossorigin="anonymous">
 108 | 
 109 |     <!-- The loading of KaTeX is deferred to speed up page rendering -->
 110 |     <script defer src="https://cdn.jsdelivr.net/npm/katex@0.13.18/dist/katex.min.js"
 111 |         integrity="sha384-GxNFqL3r9uRJQhR+47eDxuPoNE7yLftQM8LcxzgS4HT73tp970WS/wV5p8UzCOmb"
 112 |         crossorigin="anonymous"></script>
 113 | 
 114 |     <!-- To automatically render math in text elements, include the auto-render extension: -->
 115 |     <script defer src="https://cdn.jsdelivr.net/npm/katex@0.13.18/dist/contrib/auto-render.min.js"
 116 |         integrity="sha384-vZTG03m+2yp6N6BNi5iM4rW4oIwk5DfcNdFfxkk9ZWpDriOkXX8voJBFrAO7MpVl"
 117 |         crossorigin="anonymous"></script>
 118 | 
 119 |     <script>
 120 |         document.addEventListener("DOMContentLoaded", function () {
 121 |             renderMathInElement(document.body, {
 122 |                 // customised options
 123 |                 // • auto-render specific keys, e.g.:
 124 |                 delimiters: [
 125 |                     { left: '$$', right: '$$', display: true },
 126 |                     { left: '$', right: '$', display: false },
 127 |                     { left: '\\(', right: '\\)', display: false },
 128 |                     { left: '\\[', right: '\\]', display: true }
 129 |                 ],
 130 |                 // • rendering keys, e.g.:
 131 |                 throwOnError: false
 132 |             });
 133 |         });
 134 |     </script>
 135 | </head>
 136 | 
 137 | <body>
 138 |     <nav class="navbar navbar-expand-md navbar-light fixed-top bg-light">
 139 |         <a class="navbar-brand" href="#">Probabilistic Differentiable Simulation (PDS)</a>
 140 | 
 141 |         <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbarToggle">
 142 |             <span class="navbar-toggler-icon"></span>
 143 |         </button>
 144 | 
 145 |         <div class="collapse navbar-collapse justify-content-end position-relative" id="navbarToggle">
 146 |             <ul class="navbar-nav ml-auto">
 147 |                 <li class="nav-item">
 148 |                     <a class="nav-link" href="#" target="_self">Home</a>
 149 |                 </li>
 150 |                 <li class="nav-item">
 151 |                     <a class="nav-link" href="#abstract" target="_self">Abstract</a>
 152 |                 </li>
 153 |                 <li class="nav-item">
 154 |                     <a class="nav-link" href="#video" target="_self">Video</a>
 155 |                 </li>
 156 |                 <li class="nav-item">
 157 |                     <a class="nav-link" href="#appendix" target="_self">Appendix</a>
 158 |                 </li>
 159 |                 <li class="nav-item">
 160 |                     <a class="nav-link" href="#acknowledgements" target="_self">Acknowledgements</a>
 161 |                 </li>
 162 |             </ul>
 163 |         </div>
 164 |     </nav>
 165 | 
 166 |     <div class="container">
 167 | 
 168 |         <h1>Probabilistic Inference of Simulation Parameters via <br /> Parallel Differentiable Simulation</h1>
 169 | 
 170 |         <h2>ICRA 2022</h2>
 171 | 
 172 |         <div class="row authors">
 173 |             <div class="col">
 174 |                 <p>
 175 |                     <a target="_blank" href="https://eric-heiden.com">Eric Heiden</a><sup>1</sup>
 176 |                 </p>
 177 |             </div>
 178 |             <div class="col">
 179 |                 <p>
 180 |                     <a target="_blank" href="https://www.cdenniston.com">Christopher E. Denniston</a><sup>1</sup>
 181 |                 </p>
 182 |             </div>
 183 |             <div class="col">
 184 |                 <p>
 185 |                     <a target="_blank" href="https://dmillard.github.io">David Millard</a><sup>1</sup>
 186 |                 </p>
 187 |             </div>
 188 |             <div class="col">
 189 |                 <p>
 190 |                     <a target="_blank" href="https://fabioramos.github.io">Fabio Ramos</a><sup>2,3</sup>
 191 |                 </p>
 192 |             </div>
 193 |             <div class="col">
 194 |                 <p>
 195 |                     <a target="_blank" href="http://robotics.usc.edu/~gaurav/">Gaurav S. Sukhatme</a><sup>1,4</sup>
 196 |                 </p>
 197 |             </div>
 198 |         </div>
 199 |         <div class="row affiliations">
 200 |             <div class="col">
 201 |                 <p><sup>1</sup>University of Southern California</p>
 202 |             </div>
 203 |             <div class="col">
 204 |                 <p><sup>2</sup>NVIDIA</p>
 205 |             </div>
 206 |             <div class="col">
 207 |                 <p><sup>3</sup>University of Sydney</p>
 208 |             </div>
 209 |             <div class="col">
 210 |                 <p><sup>4</sup>Amazon</p>
 211 |             </div>
 212 |         </div>
 213 |     </div>
 214 | 
 215 |     <div class="container" id="summary">
 216 |         <div class="row">
 217 |             <figure class="figure">
 218 |                 <img class="figure-img img-fluid p-5" src="img/pds_diagram.png" alt="PDS" />
 219 |                 <figcaption class="figure-caption">We reduce the reality gap in robotics simulators by introducing a
 220 |                     Bayesian inference approach named <em>Constrained Stein Variational Gradient Descent</em> (CSVGD).
 221 |                     Through a
 222 |                     multiple-shooting likelihood model for trajectories, and by leveraging parallel differentiable
 223 |                     simulators, CSVGD can infer complex, non-parametric posterior distributions over simulation
 224 |                     parameters for highly nonlinear systems.</figcaption>
 225 |             </figure>
 226 |             <!-- <div class="col-2">
 227 |                 <video autoplay muted loop class="img-fluid">
 228 |                     <source src="apple_springs_damage.mp4" type="video/mp4">
 229 |                     Your browser does not support the video tag.
 230 |                 </video>
 231 |             </div> -->
 232 |         </div>
 233 |     </div>
 234 | 
 235 |     <div class="container" id="abstract">
 236 |         <div class="row">
 237 |             <h2>Abstract</h2>
 238 |             <!-- <p class="col-sm-10 fs-5"> -->
 239 |             <p>
 240 |                 To accurately reproduce measurements from the real world, simulators need to have an adequate model of
 241 |                 the physical system and require the parameters of the model be identified.
 242 |             </p>
 243 |             <p>
 244 |                 We address the latter problem of estimating parameters through a Bayesian inference approach that
 245 |                 approximates a posterior distribution over simulation parameters given real sensor measurements.
 246 |                 By extending the commonly used Gaussian likelihood model for trajectories via the
 247 |                 <em>multiple-shooting</em> formulation, our chosen particle-based inference algorithm <em>Stein
 248 |                     Variational Gradient
 249 |                     Descent</em> is able to identify highly nonlinear, underactuated systems. We leverage GPU code
 250 |                 generation
 251 |                 and differentiable simulation to evaluate the likelihood and its gradient for many particles in
 252 |                 parallel.
 253 |             </p>
 254 |             <p>
 255 |                 Our algorithm infers non-parametric distributions over simulation parameters more accurately than
 256 |                 comparable baselines and handles constraints over parameters efficiently through gradient-based
 257 |                 optimization. We evaluate estimation performance on several physical experiments. On an underactuated
 258 |                 mechanism where a 7-DOF robot arm excites an object with an unknown mass configuration, we demonstrate
 259 |                 how our inference technique can identify symmetries between the parameters and provide highly accurate
 260 |                 predictions.
 261 |             </p>
 262 |             <!-- <div class="card col align-self-center border-0">
 263 |                 <a href="">
 264 |                     <img src="paper-thumbnail.png" class="card-img-top" alt="PDS paper" />
 265 |                     <div class="card-body" align="center">
 266 |                         <h5 class="card-title">Paper on ArXiv</h5>
 267 |                     </div>
 268 |                 </a>
 269 |             </div> -->
 270 |         </div>
 271 | 
 272 |         <div class="row actions">
 273 |             <div class="col"><a href="https://arxiv.org/abs/2109.08815" target="_blank"
 274 |                     class="btn btn-primary col">Paper on arXiv</a></div>
 275 |             <div class="col"><a href="#" class="btn btn-primary col">Code (coming soon!)</a></div>
 276 |             <div class="col"><a href="#" data-bs-toggle="modal" data-bs-target="#citationModal"
 277 |                     class="btn btn-primary col">Citation</a></div>
 278 |         </div>
 279 |     </div>
 280 | 
 281 |     <div class="modal fade" id="citationModal" tabindex="-1" role="dialog" aria-labelledby="citationModalLongTitle">
 282 |         <div class="modal-dialog modal-dialog-centered" role="document">
 283 |             <div class="modal-content">
 284 |                 <div class="modal-header">
 285 |                     <h5 class="modal-title" id="citationModalLongTitle">Citation</h5>
 286 |                     <button type="button" class="btn-close" data-bs-dismiss="modal" aria-label="Close"></button>
 287 |                 </div>
 288 |                 <div class="modal-body">
 289 |                     <pre>
 290 | @article{heiden2022pds,
 291 | author    = {Eric Heiden and
 292 |              Christopher E. Denniston and
 293 |              David Millard and
 294 |              Fabio Ramos and
 295 |              Gaurav S. Sukhatme},
 296 | title     = {Probabilistic Inference of Simulation Parameters via Parallel Differentiable Simulation},
 297 | journal   = {International Conference on Robotics and Automation (ICRA)},
 298 | year      = {2022}
 299 | }
 300 |                     </pre>
 301 |                 </div>
 302 |             </div>
 303 |         </div>
 304 |     </div>
 305 | 
 306 |     <div class="container" id="video">
 307 |         <h2>Video</h2>
 308 |         <div class="row justify-content-md-center">
 309 |             <div class="ratio ratio-16x9 w-75">
 310 |                 <iframe src="https://www.youtube-nocookie.com/embed/QfhsWlKbfYM" title="YouTube video player"
 311 |                     frameborder="0"
 312 |                     allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture"
 313 |                     allowfullscreen></iframe>
 314 |             </div>
 315 |         </div>
 316 |     </div>
 317 | 
 318 |     <div class="container" id="appendix">
 319 |         <h2>Appendix</h2>
 320 | 
 321 |         <p>
 322 |             The following sections provide additional technical details that supplement our paper. Please consult our
 323 |             paper for the definition of the symbols used in the following sections.
 324 |         </p>
 325 | 
 326 |         $
 327 |         \gdef\paramdim{M}
 328 |         \gdef\params{\theta}
 329 |         \gdef\particles{\Theta}
 330 |         \gdef\numparticles{N}
 331 |         \gdef\statedim{D}
 332 |         \gdef\statevec{\mathbf{s}}
 333 |         \gdef\controlvec{\mathbf{u}}
 334 |         \gdef\observationdim{N}
 335 |         \gdef\observationvec{\mathbf{x}}
 336 |         \gdef\timedim{T}
 337 |         \gdef\trajectory{\mathcal{X}}
 338 |         \gdef\trajectoryset{D_\trajectory}
 339 |         \gdef\trajectorysetsub#1{D_{\trajectory,#1}}
 340 |         \gdef\particleset{\xi}
 341 |         \gdef\simu{^{\text{sim}}}
 342 |         \gdef\real{^{\text{real}}}
 343 |         \gdef\fsim{f_{\text{sim}}}
 344 |         \gdef\fobs{f_{\text{obs}}}
 345 |         \gdef\fstep{f_{\text{step}}}
 346 |         \gdef\pobs{p_{\text{obs}}}
 347 | 
 348 |         \gdef\xp{\params^\prime}
 349 |         \gdef\kxx{k(\params, \xp)}
 350 |         \gdef\logprob{\log \mathcal{L}(\params)}
 351 |         \gdef\logprobp{\log \mathcal{L}(\xp)}
 352 | 
 353 |         \gdef\gradx{\nabla_{\params}}
 354 |         \gdef\gradxp{\nabla_{\xp}}
 355 |         \gdef\gradxxp{\nabla_{\params\xp}}
 356 | 
 357 |         \gdef\exparams{\bar{\params}}
 358 | 
 359 |         \gdef\jointpos{\mathbf{q}}
 360 |         \gdef\jointvel{\mathbf{\dot{q}}}
 361 |         \gdef\jointacc{\mathbf{\ddot{q}}}
 362 |         \gdef\jointtorque{\tau}
 363 |         \gdef\externalforce{\mathbf{f}^{\text{ext}}}
 364 |         \gdef\timestep{\Delta t}
 365 | 
 366 |         \gdef\pdef{p_{\text{def}}}
 367 |         \gdef\plim{p_{\text{lim}}}
 368 | 
 369 |         \gdef\second{\text{s}}
 370 |         \gdef\kg{\text{kg}}
 371 |         \gdef\meter{\text{m}}
 372 |         \gdef\Hz{\text{Hz}}
 373 |         $
 374 | 
 375 |         <h3>1 Technical Details</h3>
 376 |         <h4>1.1 Initializing the Estimators</h4>
 377 |         <p>
 378 |             For each experiment, we initialize the particles for the estimators via the deterministic Sobol sequence on
 379 |             the intervals specified through the parameter limits. Our code uses the Sobol sequence implementation
 380 |             from Burkardt [<a href="#sec:references">1</a>] which is based on a Fortran77 implementation by Fox [<a
 381 |                 href="#sec:references">2</a>].
 382 |             For the MCMC methods that sample a single Markov chain, we used the center point between the parameter
 383 |             limits as initial guess.
 384 |         </p>
 385 | 
 386 |         <h4>1.2 Likelihood Model for Sets of Trajectories</h4>
 387 | 
 388 |         <p>
 389 |             In this work we assume that trajectories may have been generated by a distribution over parameters.
 390 |             In the case of a replicable experimental setup, this could be a point distribution at the only true
 391 |             parameters.
 392 |             However, when trajectories are collected from multiple robots, or with slightly different experimental
 393 |             setups between experiments, there may be a multimodal distribution over parameters which generated the set
 394 |             of trajectories.
 395 |         </p>
 396 |         <p>
 397 |             Note that, irrespective of the choice of likelihood function, we do not make any assumption about the shape
 398 |             of the posterior distribution by leveraging SVGD which is a non-parametric inference algorithm. In
 399 |             trajectory space, the Gaussian likelihood function is a common choice as it corresponds to the typical
 400 |             least-squares estimation methodology. Other likelihood distributions may be integrated with our method,
 401 |             which we leave up to future work.
 402 |         </p>
 403 |         <p>
 404 |             The likelihood which we use is a mixture of equally-weighted Gaussians centered at each reference
 405 |             trajectory $\trajectory\real$:
 406 |             $$
 407 |             \begin{equation}
 408 |             p_{sum} (\trajectoryset\real | \params) = \sum_{\trajectory\real \in \trajectoryset\real}
 409 |             p_{ss}(\trajectory\real | \params).
 410 |             \end{equation}
 411 |             $$
 412 | 
 413 |             If we were to consider each trajectory as an independent sample from the same trajectory distribution (the
 414 |             product), the likelihood function would be
 415 |             $$\begin{equation}
 416 |             p_{product} (\trajectoryset\real | \params) = \prod_{\trajectory\real \in \trajectoryset\real}
 417 |             p_{ss}(\trajectory\real | \params).
 418 |             \end{equation}$$
 419 | 
 420 |             While both equations define the likelihood for
 421 |             a combination of single-shooting likelihood functions $p_{ss}$ for a set of real trajectories
 422 |             $\trajectoryset\real$, the same combination operators (sum or product) apply to the combination of
 423 |             multiple-shooting likelihood functions $p_{ms}$ analogously.
 424 |         </p>
 425 |         <p>
 426 |             The consequence of using these likelihoods can be seen in the following figure where
 427 |             <a href="#fig:double-pendulum-prod">Figure 1 (a)</a> shows the resulting posterior distribution (in parameter space) when
 428 |             treating a set of trajectories as independent and taking the product of their likelihoods
 429 |             (Equation 2), while <a href="#fig:double-pendulum-sum">Figure 1 (b)</a> shows the result of treating
 430 |             them as a sum of Gaussian likelihoods (Equation 1).
 431 |             In <a href="#fig:double-pendulum-prod">Figure 1 (a)</a> the posterior becomes the average of the two
 432 |             distributions since that
 433 |             is the most likely position that generated both of the distinct trajectories. In contrast, the posterior
 434 |             approximated by the same algorithm (CSVGD) but using the sum of Gaussian likelihoods, successfully captures
 435 |             the multimodality in the trajectory space since most particles have aligned near the two modes of the true
 436 |             distribution in parameter space.
 437 | 
 438 |         </p>
 439 | 
 440 |         <div class="row">
 441 |             <div class="col"></div>
 442 |             <div class="col-4" id="fig:double-pendulum-prod">
 443 |                 <img class="img-fluid" src="img/double_pendulum/combination_mean.png" />
 444 |                 <p style="text-align: center;">(a) Product</p>
 445 |             </div>
 446 |             <div class="col-4" id="fig:double-pendulum-sum">
 447 |                 <img class="img-fluid" src="img/double_pendulum/combination_logsumexp.png" />
 448 |                 <p style="text-align: center;">(b) Sum</p>
 449 |             </div>
 450 |             <div class="col"></div>
 451 |         </div>
 452 | 
 453 |         <div class="row">
 454 |             <div class="col"></div>
 455 |             <div class="col-8">
 456 |                 <p align="justify">
 457 |                     <b>Figure 1.</b> Comparison of posterior parameter distributions obtained from fitting the
 458 |                     parameters to two
 459 |                     ground-truth trajectories generated from different link lengths of a simulated double pendulum
 460 |                     (units of the axes in meters). The trajectories were 300 steps long (which corresponds to a length
 461 |                     of 3s) and contain the 2 joint positions and 2 joint velocities of the uncontrolled
 462 |                     double pendulum which starts from a zero-velocity initial configuration where the first angle is at
 463 |                     $90^\circ$ (sideways) and the other at $0^\circ$. In (a), the product of the individual
 464 |                     per-trajectory likelihoods is maximized (Equation 2). In (b), the sum
 465 |                     of the likelihoods is maximized (Equation 1).
 466 |                 </p>
 467 |             </div>
 468 |             <div class="col"></div>
 469 |         </div>
 470 | 
 471 |         <h4 id="sec:normalization">1.3 State and Parameter Normalization</h4>
 472 | 
 473 |         <p>
 474 |             The parameters we are estimating are valid over only particular ranges of values. These ranges are often
 475 |             widely different - in the case of our real-world pendulum experiment, the center of mass of a link in a
 476 |             pendulum may be in the order of centimeters, while the angular velocity at the beginning of the recorded
 477 |             motion can reach values on the order of several radians per second. It is therefore important to scale the
 478 |             parameters to a common range to prevent any dimension from dominating smaller parameter ranges during the
 479 |             estimation.
 480 |         </p>
 481 |         <p>
 482 |             Similarly, the state dimensions are of different units - for example, we typically include velocities and
 483 |             positions in the recorded data over which we compute the likelihood. Therefore, we also normalize the range
 484 |             over the state dimensions. Given the state vector or, respectively, the parameter vector $w$, we normalize each
 485 |             dimension $i$ by its statistical variance $\sigma^2$, i.e. $\frac{w_i}{\sigma_i^2}$.
 486 |         </p>
 487 | 
 488 |         <h4>1.4 KNN-based Approximation for KL Divergence</h4>
 489 |         <p>
 490 |             In this work, we compare a set of parameter guesses (particles) to the ground-truth parameters, or a set of
 491 |             trajectories generated by simulating trajectories from each parameter in the particle distribution to a set
 492 |             of trajectories created on a physical system.
 493 |             To compare these distributions, we use the KL divergence to determine how the two distributions differ from
 494 |             each other.
 495 |             Formally, the KL divergence is the expected value of the log likelihood ratio between two distributions, and
 496 |             is an asymmetric divergence that does not satisfy the triangle inequality.
 497 |         </p>
 498 |         <p>
 499 |             The KL divergence is easily computable in the case of discrete distributions or simple parametric
 500 |             distributions, but is not easily calculable for samples from non-parametric distributions such as those over
 501 |             trajectories.
 502 |             Instead, we use an approximation to the KL divergence which uses the relative distances between samples in a
 503 |             set to estimate the KL divergence between particle distributions.
 504 |             This method has been used to compare particle distributions over robot poses to assess the performance of
 505 |             particle filter distributions [<a href="#sec:references">3</a>].
 506 |             To estimate the KL divergence between particle distributions over trajectories $\trajectoryset^{p}$ and
 507 |             $\trajectoryset^{q}$ we adopt the formulation from [<a href="#sec:references">4</a>,<a
 508 |                 href="#sec:references">3</a>]:
 509 |             $$
 510 |             \begin{equation}
 511 |             \tilde{d}_{KL} (\trajectoryset^{p} \parallel \trajectoryset^{q}) =
 512 |             \frac{\observationdim}{|\trajectoryset^p|} \sum_{i=1}^{|\trajectoryset^p|}
 513 |             \log\frac{\operatorname{KNN}^p_{k_i}(i)}{\operatorname{KNN}^q_{l_i}(i)}+ \frac{1}{|\trajectoryset^p|}
 514 |             \sum_{i=1}^{|\trajectoryset^p|} [\psi(l_i) - \psi(k_i)] +
 515 |             \log\frac{|\trajectoryset^q|}{|\trajectoryset^p|-1},
 516 |             \end{equation}
 517 |             $$
 518 |             where $\observationdim$ is the dimensionality of the trajectories, $|\trajectoryset^p|$ is the number of
 519 |             trajectories in the $\trajectoryset^{p}$ dataset, $|\trajectoryset^q|$ is the number of particles in the
 520 |             $\trajectoryset^{q}$ dataset, $\operatorname{KNN}^p_{k_i}(i)$ is the distance from trajectory $\trajectory_i
 521 |             \in \trajectoryset^{p}$ to its $k_i$-th nearest neighbor in $\trajectoryset^{q}$,
 522 |             $\operatorname{KNN}^q_{l_i}(i)$ is the distance from trajectory $\trajectory_i \in \trajectoryset^{p}$ to
 523 |             its $l_i$-th nearest neighbor in $\trajectoryset^{p} \backslash \trajectory_i$, and $\psi$ is the digamma
 524 |             function. Note that this approximation of KL divergence can also be applied to compare parameter
 525 |             distributions, as we show in the synthetic data experiment from subsection 5.1 of our main paper (cf. Figure
 526 |             4 (a) and (b) from the main paper) where the ground-truth parameter distribution is known.
 527 |         </p>
 528 |         <p>
 529 |             Throughout this work, we set $k_i$ and $l_i$ to 3 as this reduces the bias in the approximation, but does
 530 |             not require a large amount of samples from the ground-truth distribution.
 531 |         </p>
 532 | 
 533 |         <h3>2 Experiments</h3>
 534 |         <p>We provide further technical details and results from the experiments we present in the main paper.</p>
 535 | 
 536 |         <h4 id="sec:dynamics">2.1 Differentiable Simulator</h4>
 537 | 
 538 |         <p>
 539 |             Other than requiring a differentiable forward dynamics model which allows simulating the system in its
 540 |             entirety following the Markov assumption, our proposed algorithm does not rely on a particular choice of
 541 |             dynamical system or simulator for which its parameters need to be estimated.
 542 |             For our experiments, we use the <em><a
 543 |                     href="https://github.com/google-research/tiny-differentiable-simulator" target="_blank">Tiny
 544 |                     Differentiable Simulator</a></em> [<a href="#sec:references">5</a>] that implements end-to-end
 545 |             differentiable contact models and the Articulated Body Algorithm (ABA) [<a href="#sec:references">6</a>] to
 546 |             compute the forward dynamics (FD) for articulated rigid-body mechanisms. Given joint positions $\jointpos$,
 547 |             velocities $\jointvel$, torques $\jointtorque$ in generalized coordinates, and external forces
 548 |             $\externalforce$, ABA calculates the joint accelerations $\jointacc$.
 549 |             We use semi-implicit Euler integration to advance the system dynamics in time for a time step $\Delta t$:
 550 |             $$
 551 |             \begin{align}
 552 |             \jointacc_{t+1} = \operatorname{ABA}(\jointpos_t, \jointvel_t, \jointtorque_t, \externalforce_t; \params),
 553 |             \qquad
 554 |             \jointvel_{t+1} = \jointvel_t + \jointacc_{t+1} \timestep, \qquad
 555 |             \jointpos_{t+1} = \jointpos_t + \jointvel_{t+1} \timestep.
 556 |             \end{align}
 557 |             $$
 558 |         </p>
 559 |         <p>
 560 |             The second-order ODE described by Equation 4 is lowered to a first-order system, with state
 561 |             $\statevec_t = \begin{bmatrix}\jointpos_t & \jointvel_t\end{bmatrix}$. Furthermore, we deal primarily with
 562 |             the discrete
 563 |             time-stepped dynamics function
 564 |             $\statevec_{t+1} = \fstep(\statevec_t, t, \params)$,
 565 |             assuming that $\timestep$ is constant. The function $\fsim(\params, \statevec_0)$ uses $\fstep$ iteratively
 566 |             to produce a trajectory of states $[\statevec_t]_{t=1}^T$ given an initial state $\statevec_0$ and the
 567 |             parameters $\params$. Many systems of practical interest for robotics are controlled by an external input.
 568 |             In our formulation for parameter estimation, we include controls as explicit dependencies on the time
 569 |             parameter $t$.
 570 |         </p>
 571 |         <p>
 572 |             For an articulated rigid body system, the parameters $\params$ may include (but are not limited to) the
 573 |             masses, inertial properties and geometrical properties of the bodies in the mechanism, as well as joint and
 574 |             contact friction coefficients. Given $\frac{\partial \fstep}{\partial\params}$ and
 575 |             $\frac{\partial\fstep}{\partial\statevec}$, gradients of the state trajectories with respect to the
 576 |             simulation parameters can be computed directly through the chain rule, or via the adjoint sensitivity
 577 |             method [<a href="#sec:references">7</a>].
 578 |         </p>
 579 | 
 580 | 
 581 |         <h4 id="sec:ibm-pendulum">2.2 Identify Real-world Double Pendulum</h4>
 582 |         <p>
 583 |             We set up the double pendulum estimation experiment with the 11 parameters shown in
 584 |             <a href="#tab:params-ibm-pendulum">Table 1</a> to be estimated. The state space consists of the two
 585 |             positions and
 586 |             velocities of both joints: $\statevec = \begin{bmatrix}\mathbf{q}_{0:1} &
 587 |             \mathbf{\dot{q}}_{0:1}\end{bmatrix}$. The dataset of
 588 |             trajectories contains image sequences (see time lapse of an excerpt from a trajectory in
 589 |             <a href="#fig:ibm-pendulum-timelapse">Figure 2</a>) and annotated pixel coordinates of the three vertices in
 590 |             the double
 591 |             pendulum, from which we extracted joint positions and velocities (via finite differencing given the known
 592 |             recording frequency of 400Hz).
 593 | 
 594 |         </p>
 595 | 
 596 |         <div class="row">
 597 |             <div class="col-md-8" id="tab:params-ibm-pendulum">
 598 |                 <table class="table">
 599 |                     <thead>
 600 |                         <tr>
 601 |                             <th scope="col">Link</th>
 602 |                             <th scope="col">Parameter</th>
 603 |                             <th scope="col" colspan="2" style="text-align:center">Minimum</th>
 604 |                             <th scope="col" colspan="2" style="text-align:center">Maximum</th>
 605 |                         </tr>
 606 |                     </thead>
 607 |                     <tbody>
 608 |                         <tr>
 609 |                             <th rowspan="5">Link 1</th>
 610 |                             <th>Mass</th>
 611 |                             <td align="right">0.05 </td>
 612 |                             <td> $\kg$ </td>
 613 |                             <td align="right"> 0.5 </td>
 614 |                             <td> $\kg$ </td>
 615 |                         </tr>
 616 |                         <tr>
 617 |                             <th> $I_{xx}$ </th>
 618 |                             <td align="right"> 0.002 </td>
 619 |                             <td> $\kg\cdot\meter^2$ </td>
 620 |                             <td align="right"> 1.0 </td>
 621 |                             <td> $\kg\cdot\meter^2$</td>
 622 |                         </tr>
 623 |                         <tr>
 624 |                             <th> COM $x$ </th>
 625 |                             <td align="right"> -0.2 </td>
 626 |                             <td> $\meter$ </td>
 627 |                             <td align="right"> 0.2 </td>
 628 |                             <td> $\meter$ </td>
 629 |                         </tr>
 630 |                         <tr>
 631 |                             <th> COM $y$ </th>
 632 |                             <td align="right"> -0.2 </td>
 633 |                             <td> $\meter$ </td>
 634 |                             <td align="right"> 0.2 </td>
 635 |                             <td> $\meter$ </td>
 636 |                         </tr>
 637 |                         <tr>
 638 |                             <th> Joint friction </th>
 639 |                             <td align="right"> 0.0 </td>
 640 |                             <td> </td>
 641 |                             <td align="right"> 0.5 </td>
 642 |                             <td> </td>
 643 |                         </tr>
 644 |                         <tr>
 645 |                             <th rowspan="6">Link 2</th>
 646 |                             <th>Length </th>
 647 |                             <td align="right"> 0.08 </td>
 648 |                             <td> $\meter$ </td>
 649 |                             <td align="right"> 0.3 </td>
 650 |                             <td> $\meter$ </td>
 651 |                         </tr>
 652 |                         <tr>
 653 |                             <th> Mass </th>
 654 |                             <td align="right"> 0.05 </td>
 655 |                             <td> $\kg$ </td>
 656 |                             <td align="right"> 0.5 </td>
 657 |                             <td> $\kg$ </td>
 658 |                         </tr>
 659 |                         <tr>
 660 |                             <th> $I_{xx}$ </th>
 661 |                             <td align="right"> 0.002 </td>
 662 |                             <td> $\kg\cdot\meter^2$ </td>
 663 |                             <td align="right"> 1.0 </td>
 664 |                             <td> $\kg\cdot\meter^2$ </td>
 665 |                         </tr>
 666 |                         <tr>
 667 |                             <th> COM $x$ </th>
 668 |                             <td align="right"> -0.2 </td>
 669 |                             <td> $\meter$ </td>
 670 |                             <td align="right"> 0.2 </td>
 671 |                             <td> $\meter$ </td>
 672 |                         </tr>
 673 |                         <tr>
 674 |                             <th> COM $y$ </th>
 675 |                             <td align="right"> -0.2 </td>
 676 |                             <td> $\meter$ </td>
 677 |                             <td align="right"> 0.2 </td>
 678 |                             <td> $\meter$ </td>
 679 |                         </tr>
 680 |                         <tr>
 681 |                             <th> Joint friction </th>
 682 |                             <td align="right"> 0.0 </td>
 683 |                             <td> </td>
 684 |                             <td align="right"> 0.5 </td>
 685 |                             <td> </td>
 686 |                         </tr>
 687 |                     </tbody>
 688 |                 </table>
 689 |             </div>
 690 |             <div class="col-md-4" id="fig:ibm-pendulum-timelapse">
 691 |                 <img src="img/ibm_pendulum/ibm-pendulum-timelapse.png" alt="IBM Pendulum" class="img-fluid" />
 692 |             </div>
 693 |         </div>
 694 |         <div class="row">
 695 |             <div class="col-md-8">
 696 |                 <p>
 697 |                     <b>Table 1.</b> Parameters to be estimated. $I$ refers to the $3\times3$ inertia matrix, COM stands
 698 |                     for center of mass.
 699 |                 </p>
 700 |             </div>
 701 |             <div class="col-md-4">
 702 |                 <p><b>Figure 2.</b> Time lapse of a double pendulum trajectory from the IBM
 703 |                     dataset [<a href="#sec:references">8</a>].</p>
 704 |             </div>
 705 |         </div>
 706 |         <p>
 707 |             Since we know that all trajectories in this dataset stem from the same double
 708 |             pendulum [<a href="#sec:references">8</a>], we only used a single reference trajectory as target trajectory
 709 |             $\trajectory\real$ during the estimation. We let each estimator run for 2000 iterations. For evaluation, we
 710 |             calculate the consistency metrics from Tab. 1 of the main paper over 10 held-out trajectories from a test
 711 |             dataset. For comparison, we visualize the trajectory density over simulations rolled out from the last 100
 712 |             Markov samples (or 100 particles in the case of particle-based approaches) in
 713 |             <a href="#fig:ibm-pendulum-rollouts">Figure 3</a>. The ground-truth shown in these plots again stems from
 714 |             the unseen test
 715 |             dataset. This experiment further demonstrates the generalizability of simulation-based inference, which,
 716 |             when an adequate model has been implemented and its parameters identified, can predict outcomes under
 717 |             various novel conditions even though the training dataset consisted of only a single trajectory in this
 718 |             example.
 719 |         </p>
 720 | 
 721 | 
 722 |         <div class="row" id="fig:ibm-pendulum-rollouts">
 723 |             <div class="col"></div>
 724 |             <div class="col-8">
 725 |                 <table class="table table-borderless table-hover align-middle">
 726 |                     <tr>
 727 |                         <th>
 728 |                             Emcee </th>
 729 |                         <td>
 730 |                             <img src="img/ibm_pendulum/mcmc_trajectories.png" alt="Emcee" class="img-fluid" />
 731 |                         </td>
 732 |                     </tr>
 733 |                     <tr>
 734 |                         <th>
 735 |                             CEM </th>
 736 |                         <td>
 737 |                             <img src="img/ibm_pendulum/cem_trajectories.png" class="img-fluid" alt="CEM" />
 738 |                         </td>
 739 |                     </tr>
 740 |                     <tr>
 741 |                         <th>
 742 |                             NUTS </th>
 743 |                         <td>
 744 |                             <img src="img/ibm_pendulum/nuts_trajectories.png" class="img-fluid" alt="NUTS" />
 745 |                         </td>
 746 |                     </tr>
 747 |                     <tr>
 748 |                         <th>
 749 |                             SGLD </th>
 750 |                         <td>
 751 |                             <img src="img/ibm_pendulum/sgld_trajectories.png" class="img-fluid" alt="SGLD" />
 752 |                         </td>
 753 |                     </tr>
 754 |                     <tr>
 755 |                         <th>
 756 |                             SVGD </th>
 757 |                         <td>
 758 |                             <img src="img/ibm_pendulum/svgd_ss_test.png" class="img-fluid" alt="SVGD" />
 759 |                         </td>
 760 |                     </tr>
 761 |                     <tr>
 762 |                         <th>
 763 |                             CSVGD </th>
 764 |                         <td>
 765 |                             <img src="img/ibm_pendulum/svgd_ms_test.png" class="img-fluid" alt="CSVGD" />
 766 |                         </td>
 767 |                     </tr>
 768 |                 </table>
 769 |                 <p>
 770 |                     <b>Figure 3.</b> Kernel density estimation over trajectory roll-outs from the last estimated 100
 771 |                     parameter guesses of each method, applied to the physical double pendulum dataset from
 772 |                     <a href="#sec:ibm-pendulum">Section 2.2</a>. The ground-truth trajectory here stems from the test
 773 |                     dataset of 10
 774 |                     trajectories that were held out during training. The particle-based approaches (CEM, SVGD, CSVGD)
 775 |                     use 100 particles.
 776 |                 </p>
 777 |             </div>
 778 |             <div class="col"></div>
 779 |         </div>
 780 | 
 781 |         <h4 id="sec:exp-multiple-shooting">2.3 Ablation Study on Multiple Shooting</h4>
 782 | 
 783 |         <p>
 784 |             We evaluate the baseline estimation algorithms with our proposed multiple-shooting likelihood
 785 |             function
 786 |             (using
 787 |             10 shooting windows) on the physical double pendulum dataset from before. To make the constrained
 788 |             optimization problem amenable to the MCMC samplers, we formulate the defect constraint through the
 789 |             following
 790 |             likelihood:
 791 |             $$
 792 |             \begin{align}
 793 |             \pdef(\statevec_t^s, \statevec_t) = \mathcal{N}(\statevec_t^s | \statevec_t,\sigma^2_{\text{def}})
 794 |             \qquad
 795 |             t\in [h, 2h, \dots],
 796 |             \end{align}
 797 |             $$
 798 |             where we tune $\sigma^2_{\text{def}}$ to a small value (on the order of $10^{-2}$) such that the
 799 |             defects are
 800 |             minimized during the estimation. As we describe in Sec. 4.4 from our main paper, the parameter space
 801 |             is
 802 |             augmented by the shooting variables $\statevec_t^s$.
 803 |         </p>
 804 |         <p>
 805 |             As shown in <a href="#tab:ms-baselines">Table 2</a>, the MCMC approaches Emcee and NUTS do not benefit
 806 |             meaningfully from
 807 |             the multiple-shooting approach. Emcee often yields unstable simulations from which we are not able
 808 |             to
 809 |             compute some of the metrics. The increased dimensionality of the parameter space appears to add a
 810 |             significant challenge to these methods, which are known to scale poorly to higher dimensions.
 811 |             Despite being configured to use a Gaussian mixture model of 3 kernels, the CEM posterior immediately
 812 |             collapses to a single point such that the KL divergence of simulated against real trajectories
 813 |             cannot be computed.
 814 |         </p>
 815 | 
 816 |         <table class="table numbers" id="tab:ms-baselines">
 817 |             <thead>
 818 |                 <tr>
 819 |                     <th scope="col"></th>
 820 |                     <th scope="col" colspan="2" style="text-align:center">$d_{\text{KL}} (\trajectoryset\real
 821 |                         \parallel
 822 |                         \trajectoryset\simu)$</th>
 823 |                     <th scope="col" colspan="2" style="text-align:center">$d_{\text{KL}} (\trajectoryset\simu
 824 |                         \parallel
 825 |                         \trajectoryset\real)$</th>
 826 |                     <th scope="col" colspan="2" style="text-align:center">MMD</th>
 827 |                 </tr>
 828 |                 <tr>
 829 |                     <th>Algorithm</th>
 830 |                     <th style="text-align:center">SS</th>
 831 |                     <th style="text-align:center">MS</th>
 832 |                     <th style="text-align:center">SS</th>
 833 |                     <th style="text-align:center">MS</th>
 834 |                     <th style="text-align:center">SS</th>
 835 |                     <th style="text-align:center">MS</th>
 836 |                 </tr>
 837 |             </thead>
 838 |             <tbody>
 839 |                 <tr>
 840 |                     <th> Emcee </th>
 841 |                     <td class="text-primary"> 8542.2466 </td>
 842 |                     <td> 8950.4574 </td>
 843 |                     <td> 4060.6312 </td>
 844 |                     <td>N/A </td>
 845 |                     <td> 1.1365 </td>
 846 |                     <td> N/A </td>
 847 |                 </tr>
 848 |                 <tr>
 849 |                     <th> CEM </th>
 850 |                     <td> 8911.1798 </td>
 851 |                     <td class="text-primary"> 8860.5115 </td>
 852 |                     <td> 8549.5927 </td>
 853 |                     <td>N/A </td>
 854 |                     <td> 0.9687 </td>
 855 |                     <td class="text-primary"> 0.5682 </td>
 856 |                 </tr>
 857 |                 <tr>
 858 |                     <th> SGLD </th>
 859 |                     <td> 8788.0962 </td>
 860 |                     <td class="text-primary"> 5863.2728 </td>
 861 |                     <td> 7876.0310 </td>
 862 |                     <td class="text-primary">2187.2825 </td>
 863 |                     <td> 2.1220 </td>
 864 |                     <td class="text-primary"> 0.0759 </td>
 865 |                 </tr>
 866 |                 <tr>
 867 |                     <th> NUTS </th>
 868 |                     <td> 9196.7461 </td>
 869 |                     <td class="text-primary"> 8785.5326 </td>
 870 |                     <td> 6432.2131 </td>
 871 |                     <td class="text-primary">4935.8983 </td>
 872 |                     <td class="text-primary"> 0.5371 </td>
 873 |                     <td> 1.1642 </td>
 874 |                 </tr>
 875 |                 <tr>
 876 |                     <th> (C)SVGD </th>
 877 |                     <td> 8803.5683 </td>
 878 |                     <td class="text-primary"> 5204.5336 </td>
 879 |                     <td> 10283.6659</td>
 880 |                     <td class="text-primary"> 2773.1751 </td>
 881 |                     <td> 0.7177 </td>
 882 |                     <td class="text-primary"> 0.0366 </td>
 883 |                 </tr>
 884 |             </tbody>
 885 |         </table>
 886 |         <p>
 887 |             <b>Table 2.</b> Consistency metrics of the posterior distributions approximated from the physical
 888 |             double pendulum dataset (<a href="#sec:ibm-pendulum">Section 2.2</a>) by the different estimation algorithms
 889 |             using the
 890 |             single-shooting likelihood $p_{ss}(\trajectory\real | \params)$ (column "SS") and the
 891 |             multiple-shooting
 892 |             likelihood $p_{ms}(\trajectory\real | \params)$ (column "MS") with 10 shooting windows. Note that
 893 |             SVGD with multiple-shooting corresponds to CSVGD.
 894 |         </p>
 895 | 
 896 |         <p>
 897 |             We observe a significant improvement in estimation accuracy on SGLD, where the multiple-shooting
 898 |             approach
 899 |             allowed it to converge to closely matching trajectories, as shown in <a href="#fig:sgld-ms">Figure 4</a>. As
 900 |             with
 901 |             SVGD,
 902 |             the availability of gradients allows this method to scale better to the higher dimensional parameter
 903 |             space,
 904 |             while the smoothed likelihood landscape further helps the approach to find better fitting
 905 |             parameters.
 906 |         </p>
 907 | 
 908 |         <div class="row" id="fig:sgld-ms">
 909 |             <div class="col"></div>
 910 |             <div class="col-8">
 911 |                 <img src="img/ibm_pendulum/sgld_ms.png" class="img-fluid" alt="SGLD with Multiple Shooting" />
 912 |                 <p>
 913 |                     <b>Figure 4.</b> Kernel density estimation over trajectory roll-outs from the last estimated 100
 914 |                     parameter guesses of SGLD with the multiple-shooting likelihood model (see
 915 |                     <a href="#sec:exp-multiple-shooting">Section 2.3</a>), applied to the physical double pendulum
 916 |                     dataset from
 917 |                     <a href="#sec:ibm-pendulum">Section 2.2</a>. Similarly to SVGD, SGLD benefits significantly from the
 918 |                     smoother
 919 |                     likelihood function while being able to cope with the augmented parameter space thanks to its
 920 |                     gradient-based approach.
 921 |                 </p>
 922 |             </div>
 923 |             <div class="col"></div>
 924 |         </div>
 925 | 
 926 |         <h4 id="sec:likelihoodfree">2.4 Comparison to Likelihood-free Inference</h4>
 927 |         <p>
 928 |             Our Bayesian inference approach leverages the simulator as part of the likelihood model to
 929 |             approximate posterior distributions over simulation parameters, which means the simulator is indispensable
 930 |             in our estimation process. In the following, we compare our approach against the likelihood-free inference
 931 |             approach BayesSim [<a href="#sec:references">9</a>] that leverages approximate Bayesian computation (ABC)
 932 |             which is
 933 |             the most popular family of algorithms within likelihood-free methods.
 934 |         </p>
 935 | 
 936 |         <p>
 937 |             Likelihood-free methods assume the simulator is a black box that can generate a trajectory given a parameter
 938 |             setting. Instead of querying the simulator to evaluate the likelihood (as in our approach), a conditional
 939 |             density $q(\params | \trajectoryset)$ is learned directly from a dataset of simulation parameters and their
 940 |             corresponding rolled-out trajectories via supervised learning to approximate the posterior. A common choice
 941 |             of model for such a density is a mixture density network [<a href="#sec:references">10</a>], which
 942 |             parameterizes a
 943 |             Gaussian mixture model. This is in contrast to our (C)SVGD algorithm which can approximate
 944 |             any shape of posterior by being a nonparametric inference algorithm.
 945 |         </p>
 946 | 
 947 | 
 948 |         <p>
 949 |             For our experiments we collect a dataset of 10,000 simulated trajectories of parameters randomly sampled
 950 |             from the prior distribution. We train the density network via the Adam optimizer with a learning rate of
 951 |             $10^{-3}$ for 3000 epochs, after which we observed no meaningful improvement to the calculated
 952 |             log-likelihood loss during training. In the following, we provide further details on the likelihood-free
 953 |             inference pipeline we consider, by describing the input data processing and the model used for approximating
 954 |             the posterior.
 955 |         </p>
 956 |         <h5 id="sec:bayessim-input">2.4.1 Input Data Processing</h5>
 957 |         <p>
 958 |             The input to the learned density model has to be a sufficient statistic of the underlying data, while being
 959 |             low-dimensional in order to keep the learning problem computationally tractable. We consider the following
 960 |             four methods of processing the trajectories that are the input to the likelihood-free methods, as
 961 |             visualized for an example trajectory in <a href="#fig:bayessim-inputs">Figure 5</a>. Note that we configured
 962 |             the following
 963 |             input processing methods to generate a one-dimensional input vector that has a reasonable length to be
 964 |             computationally feasible to train on (given the 10,000 trajectories from the training dataset), while
 965 |             achieving acceptable performance which we validated through testing various settings.
 966 |         </p>
 967 | 
 968 |         <p>
 969 |             <b>Downsampled:</b> we down-sample the trajectory so that for the double pendulum experiment
 970 |             (<a href="#sec:ibm-pendulum">Section 2.2</a>) we use only every 20th state, for the Panda arm experiment
 971 |             (<a href="#sec:panda-box">Section 2.5</a>) only every 200th state of the trajectory. Finally, the state
 972 |             dimensions per
 973 |             trajectory are concatenated to a one-dimensional vector.
 974 |         </p>
 975 |         <p>
 976 |             <b>Difference:</b> we adapt the input statistic from the original BayesSim approach in [<a
 977 |                 href="#sec:references">9</a>, Eq. (22)] where the differences of two consecutive states along the
 978 |             trajectory are used in
 979 |             concatenation with their mean and variance:
 980 |             $$
 981 |             \psi(\trajectory) = (\operatorname{downsample}(\tau), \mathbb{E}[\tau], \operatorname{Var}[\tau])
 982 |             \qquad\text{where}\qquad
 983 |             \tau = \{\statevec_t - \statevec_{t-1}\}_{t=1}^T
 984 |             $$
 985 |             As before, we down-sample these state differences and concatenate them to a vector.
 986 |         </p>
 987 |         <p>
 988 |             <b>Summary:</b> for each state dimension of the trajectory, we compute the following statistics typical for
 989 |             time series: mean, variance, cross correlation between state dimensions of the trajectory, as well as
 990 |             auto-correlations for each dimension at 5 different time delays: [5, 10, 20, 50, 100] time steps.
 991 |             These numbers are concatenated for all state dimensions to a one-dimensional vector per input
 992 |             trajectory.
 993 |         </p>
 994 |         <p>
 995 |             <b>Signature:</b> we compute the signature transform from the signatory package [<a
 996 |                 href="#sec:references">11</a>]
 997 |             over the input trajectory. Such so-called path signatures have been recently introduced to extract
 998 |             information about order and area, thereby preserving features inherent to nonlinear trajectories. We select
 999 |             a depth for the signature transform of 3 for the double pendulum experiment, and 2 for the Panda arm
1000 |             experiment, to obtain feature vectors of comparable size to the aforementioned input techniques.
1001 |         </p>
1002 | 
1003 |         <div class="row" id="fig:bayessim-inputs">
1004 |             <div class="col">
1005 |                 <img src="img/ibm_pendulum/bayes_sim/ibm_groundtruth_raw.png" class="img-fluid" alt="Ground Truth" />
1006 |                 <p style="text-align: center;">(a) Raw Input</p>
1007 |             </div>
1008 |             <div class="col">
1009 |                 <img src="img/ibm_pendulum/bayes_sim/ibm_groundtruth_downsampled.png" class="img-fluid"
1010 |                     alt="Downsampled" />
1011 |                 <p style="text-align: center;">(b) Downsampled</p>
1012 |             </div>
1013 |             <div class="col">
1014 |                 <img src="img/ibm_pendulum/bayes_sim/ibm_groundtruth_difference.png" class="img-fluid"
1015 |                     alt="Difference" />
1016 |                 <p style="text-align: center;">(c) Difference</p>
1017 |             </div>
1018 |             <div class="col">
1019 |                 <img src="img/ibm_pendulum/bayes_sim/ibm_groundtruth_summary.png" class="img-fluid" alt="Summary" />
1020 |                 <p style="text-align: center;">(d) Summary</p>
1021 |             </div>
1022 |             <div class="col">
1023 |                 <img src="img/ibm_pendulum/bayes_sim/ibm_groundtruth_signature.png" class="img-fluid" alt="Signature" />
1024 |                 <p style="text-align: center;">(e) Signature</p>
1025 |             </div>
1026 |         </div>
1027 |         <p>
1028 |             <b>Figure 5.</b> Exemplary visualization of the input processing methods for the likelihood-free baselines
1029 |             from <a href="#sec:likelihoodfree">Section 2.4</a> applied to a trajectory from the double pendulum
1030 |             experiment in
1031 |             <a href="#sec:ibm-pendulum">Section 2.2</a>.
1032 |         </p>
1033 | 
1034 |         <h5 id="sec:bayessim-model">2.4.2 Density Model</h5>
1035 |         <p>
1036 |             As the density model for the learned posterior $q(\params | \trajectoryset)$, we select the following
1037 |             commonly used representations.
1038 |         </p>
1039 |         <p>
1040 |             <b>Mixture density network (<b>MDN</b>):</b> uses neural network features from a feed-forward neural network
1041 |             using two hidden layers with 24 units each.
1042 |         </p>
1043 |         <p>
1044 |             <b>Mixture density random Fourier features (<b>MDRFF</b>):</b> this density model uses Fourier features and
1045 |             a kernel. We evaluate the MDRFF with the following common choices for the kernel:
1046 |         <ul>
1047 |             <li> Radial Basis Function (<b>RBF</b>) kernel </li>
1048 |             <li> <b>Matérn</b> kernel [<a href="#sec:references">12</a>, Eq. (4.14)] with $\nu=\frac{5}{2}$ </li>
1049 |         </ul>
1050 | 
1051 |         <h5 id="sec:bayessim-eval">2.4.3 Evaluation</h5>
1052 |         <p>
1053 |             Note that instead of action generation, which is part of the proposed BayesSim
1054 |             pipeline [<a href="#sec:references">9</a>], we only focus on the inference of the posterior density over
1055 |             simulation
1056 |             parameters in order to compare such a likelihood-free inference approach against our method.
1057 |         </p>
1058 |         <p>
1059 |             To evaluate the metrics shown in <a href="#tab:likelihoodfree-results">Table 3</a> for each BayesSim
1060 |             instantiation (input method and density model), we sample 100 parameter vectors from the learned
1061 |             posterior $q(\params | \trajectoryset)$ and simulate them to obtain 100 trajectories which are compared
1062 |             against the reference trajectory sets, as we did in the comparison for the other Bayesian inference methods
1063 |             in Tab. 1 of the main paper.
1064 |         </p>
1065 | 
1066 |         <table class="table numbers" id="tab:likelihoodfree-results">
1067 |             <thead>
1068 |                 <tr>
1069 |                 <td></td><td></td>
1070 |                 <th colspan="3" style="text-align:center" class="border-start border-end">Double Pendulum Experiment
1071 |                 </th>
1072 |                 <th style="text-align:center"> Panda Arm Experiment </th>
1073 |                 </tr>
1074 |                 <tr>
1075 |                     <th> Input </th>
1076 |                     <th> Model </th>
1077 |                     <th class="border-start" style="text-align:center"> $d_{\text{KL}} (\trajectoryset\real \parallel
1078 |                         \trajectoryset\simu)$
1079 |                     </th>
1080 |                     <th style="text-align:center"> $d_{\text{KL}} (\trajectoryset\simu \parallel \trajectoryset\real)$
1081 |                     </th>
1082 |                     <th class="border-end" style="text-align:center"> MMD
1083 |                     </th>
1084 |                     <th style="text-align:center"> $\log\pobs(\trajectoryset\real \parallel \trajectoryset\simu)$ </th>
1085 |                 </tr>
1086 |             </thead>
1087 |             <tbody>
1088 |                 <tr>
1089 |                     <th>Downsampled </th>
1090 |                     <th class="border-end"> MDN </th>
1091 |                     <td> 8817.9222 </td>
1092 |                     <td> 4050.4666 </td>
1093 |                     <td class="border-end"> 0.6748 </td>
1094 |                     <td> -17.4039 </td>
1095 |                 </tr>
1096 |                 <tr>
1097 |                     <th>Difference </th>
1098 |                     <th class="border-end"> MDN </th>
1099 |                     <td> 8919.2463 </td>
1100 |                     <td> 4633.2637 </td>
1101 |                     <td class="border-end"> 0.6285 </td>
1102 |                     <td> -17.1646 </td>
1103 |                 </tr>
1104 |                 <tr>
1105 |                     <th>Summary </th>
1106 |                     <th class="border-end"> MDN </th>
1107 |                     <td> 9092.5575 </td>
1108 |                     <td> 5093.8851 </td>
1109 |                     <td class="border-end"> 0.5664 </td>
1110 |                     <td> -18.3481 </td>
1111 |                 </tr>
1112 |                 <tr>
1113 |                     <th>Signature </th>
1114 |                     <th class="border-end"> MDN </th>
1115 |                     <td> 8985.8056 </td>
1116 |                     <td> 4610.5438 </td>
1117 |                     <td class="border-end"> 0.5807 </td>
1118 |                     <td> -19.3432 </td>
1119 |                 </tr>
1120 |                 <tr>
1121 |                     <th>Downsampled </th>
1122 |                     <th class="border-end"> MDRFF (RBF) </th>
1123 |                     <td> 9027.9474 </td>
1124 |                     <td> 5091.5283 </td>
1125 |                     <td class="border-end"> 0.5593 </td>
1126 |                     <td> -17.2335 </td>
1127 |                 </tr>
1128 |                 <tr>
1129 |                     <th>Difference </th>
1130 |                     <th class="border-end"> MDRFF (RBF) </th>
1131 |                     <td> 8936.3823 </td>
1132 |                     <td> 4282.8599 </td>
1133 |                     <td class="border-end"> 0.5988 </td>
1134 |                     <td> -18.4892 </td>
1135 |                 </tr>
1136 |                 <tr>
1137 |                     <th>Summary </th>
1138 |                     <th class="border-end"> MDRFF (RBF) </th>
1139 |                     <td> 9063.1753 </td>
1140 |                     <td> 4884.1398 </td>
1141 |                     <td class="border-end"> 0.5672 </td>
1142 |                     <td> -19.5430 </td>
1143 |                 </tr>
1144 |                 <tr>
1145 |                     <th>Signature </th>
1146 |                     <th class="border-end"> MDRFF (RBF) </th>
1147 |                     <td> 8980.9080 </td>
1148 |                     <td> 4081.1160 </td>
1149 |                     <td class="border-end"> 0.6016 </td>
1150 |                     <td> -18.3458 </td>
1151 |                 </tr>
1152 |                 <tr>
1153 |                     <th>Downsampled </th>
1154 |                     <th class="border-end"> MDRFF (Matérn) </th>
1155 |                     <td> 8818.1830 </td>
1156 |                     <td> 3794.9873 </td>
1157 |                     <td class="border-end"> 0.6110 </td>
1158 |                     <td> -17.6395 </td>
1159 |                 </tr>
1160 |                 <tr>
1161 |                     <th>Difference </th>
1162 |                     <th class="border-end"> MDRFF (Matérn) </th>
1163 |                     <td> 8859.2156 </td>
1164 |                     <td> 4349.9971 </td>
1165 |                     <td class="border-end"> 0.6176 </td>
1166 |                     <td> -17.2752 </td>
1167 |                 </tr>
1168 |                 <tr>
1169 |                     <th>Summary </th>
1170 |                     <th class="border-end"> MDRFF (Matérn) </th>
1171 |                     <td> 8962.0501 </td>
1172 |                     <td> 4241.4551 </td>
1173 |                     <td class="border-end"> 0.5999 </td>
1174 |                     <td> -19.6672 </td>
1175 |                 </tr>
1176 |                 <tr>
1177 |                     <th>Signature </th>
1178 |                     <th class="border-end"> MDRFF (Matérn) </th>
1179 |                     <td> 9036.9626 </td>
1180 |                     <td> 4620.9517 </td>
1181 |                     <td class="border-end"> 0.5715 </td>
1182 |                     <td> -18.1652 </td>
1183 |                 </tr>
1184 |                 <tr>
1185 |                     <th colspan="2" style="text-align:center" class="border-end">CSVGD </th>
1186 |                     <td class="text-primary"> 5204.5336 </td>
1187 |                     <td class="text-primary"> 2773.1751 </td>
1188 |                     <td class="text-primary border-end"> 0.0366 </td>
1189 |                     <td class="text-primary"> -15.1671 </td>
1190 |                 </tr>
1191 |             </tbody>
1192 |         </table>
1193 |         <p>
1194 |             <b>Table 2.</b>
1195 |             Consistency metrics of the posterior distributions approximated by the different BayesSim instantiations,
1196 |             where the input method and model name (including the kernel type for the MDRFF model) are given. Each metric
1197 |             is calculated across simulated and real trajectories. Lower is better on all metrics except the
1198 |             log-likelihood $\log\pobs(\trajectoryset\real \parallel \trajectoryset\simu)$ from the Panda arm experiment.
1199 |             For comparison, in the last row, we reproduce the numbers from CSVGD shown in Tab. 1 of the main paper.
1200 |         </p>
1201 | 
1202 | 
1203 |         <table class="table table-borderless table-hover centered" id="fig:ibm-pendulum-rollouts-bayessim">
1204 |             <tr>
1205 |                 <td width="50%">
1206 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_downsampled_trajectories.png"
1207 |                         class="img-fluid" />
1208 |                     <p><b>MDN</b> - Downsampled</p>
1209 | 
1210 |                 </td>
1211 |                 <td width="50%">
1212 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_difference_trajectories.png"
1213 |                         class="img-fluid" />
1214 |                     <p><b>MDN</b> - Difference </p>
1215 |                 </td>
1216 |             </tr>
1217 |             <tr>
1218 |                 <td>
1219 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_summary_trajectories.png"
1220 |                         class="img-fluid" />
1221 |                     <p><b>MDN</b> - Summary </p>
1222 |                 </td>
1223 |                 <td>
1224 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdn_signature_trajectories.png"
1225 |                         class="img-fluid" />
1226 |                     <p><b>MDN</b> - Signature </p>
1227 |                 </td>
1228 |             </tr>
1229 |             <tr>
1230 |                 <td>
1231 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_downsampled_trajectories.png"
1232 |                         class="img-fluid" />
1233 |                     <p><b>MDRFF (RBF)</b> - Downsampled </p>
1234 |                 </td>
1235 |                 <td>
1236 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_difference_trajectories.png"
1237 |                         class="img-fluid" />
1238 |                     <p><b>MDRFF (RBF)</b> - Difference </p>
1239 |                 </td>
1240 |             </tr>
1241 |             <tr>
1242 |                 <td>
1243 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_summary_trajectories.png"
1244 |                         class="img-fluid" />
1245 |                     <p><b>MDRFF (RBF)</b> - Summary </p>
1246 |                 </td>
1247 |                 <td>
1248 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_rbf_signature_trajectories.png"
1249 |                         class="img-fluid" />
1250 |                     <p><b>MDRFF (RBF)</b> - Signature </p>
1251 |                 </td>
1252 |             </tr>
1253 |             <tr>
1254 |                 <td>
1255 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_downsampled_trajectories.png"
1256 |                         class="img-fluid" />
1257 |                     <p><b>MDRFF (Matérn)</b> - Downsampled </p>
1258 |                 </td>
1259 |                 <td>
1260 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_difference_trajectories.png"
1261 |                         class="img-fluid" />
1262 |                     <p><b>MDRFF (Matérn)</b> - Difference </p>
1263 |                 </td>
1264 |             </tr>
1265 |             <tr>
1266 |                 <td>
1267 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_summary_trajectories.png"
1268 |                         class="img-fluid" />
1269 |                     <p><b>MDRFF (Matérn)</b> - Summary </p>
1270 |                 </td>
1271 |                 <td>
1272 |                     <img src="img/ibm_pendulum/bayes_sim/bayessim_ibm_pendulum_mdrff_matern_signature_trajectories.png"
1273 |                         class="img-fluid" />
1274 |                     <p><b>MDRFF (Matérn)</b> - Signature </p>
1275 |                 </td>
1276 |             </tr>
1277 |         </table>
1278 |         <p>
1279 |             <b>Figure 6.</b> Kernel density estimation over trajectory roll-outs from 100 parameter samples drawn from
1280 |             the posterior of each BayesSim method (model name with kernel choice in bold font + input method, see
1281 |             <a href="#sec:likelihoodfree">Section 2.4</a>), applied to the physical double pendulum dataset from
1282 |             <a href="#sec:ibm-pendulum">Section 2.2</a>. The ground-truth trajectory here stems from the test dataset of
1283 |             10 trajectories
1284 |             that were held out during training.
1285 |         </p>
1286 | 
1287 |         <h5>2.4.4 Discussion</h5>
1288 | 
1289 |         <p>
1290 |             The results from our experiments with the various likelihood-free approaches in
1291 |             <a href="#tab:likelihoodfree-results">Table 2</a> indicate that, among the tested pipelines, the MDRFF model
1292 |             with Matérn
1293 |             kernel and downsampled trajectory input overall performed the strongest, followed by the MDN with
1294 |             downsampled input. In comparison to the likelihood-based algorithms from Tab. 1 of the main paper, these
1295 |             results are comparable on the double pendulum experiment. However, in comparison to CSVGD, the estimated
1296 |             likelihood-free posteriors are significantly less accurate, which can also be clearly seen in the density
1297 |             plots over the rolled out trajectories from such learned densities in
1298 |             <a href="#fig:ibm-pendulum-rollouts-bayessim">Figure 6</a>. On the Panda arm experiment, the likelihood-free
1299 |             methods are
1300 |             outperformed by the likelihood-based algorithms (such as the Emcee sampler) more often on the likelihood of
1301 |             the learned parameter densities. CSVGD again achieves a much more accurate posterior in this experiment than
1302 |             any likelihood-free approach.
1303 |         </p>
1304 | 
1305 |         <p class="lead">Why do these likelihood-free methods perform so poorly on a seemingly simple double pendulum?
1306 |         </p>
1307 |         <p>
1308 |             One would expect that this kind of dynamical system poses no greater challenge to BayesSim when it was shown
1309 |             to identify a cartpole's link length and cart mass successfully [<a href="#sec:references">9</a>]. To
1310 |             investigate
1311 |             this problem, we revisit the simplified double pendulum estimation experiment from Sec. 5.1 of our main
1312 |             paper, where only the two link lengths need to be estimated from simulated trajectories. As before, we
1313 |             create a dataset with 10,000 trajectories of 400 time steps based on the two simulation parameters sampled
1314 |             from a uniform distribution ranging between 0.5m and 5m. While keeping all
1315 |             parameters the same as in our previous double-pendulum experiment where eleven parameters had to be
1316 |             inferred, all of the density models in combination with both the "difference" and "downsampled" input
1317 |             statistic infer a highly accurate parameter distribution, as shown in
1318 |             <a href="#fig:bayessim-twoparam-posterior">Figure 7 (a)</a>. The trajectories produced by sampling from the
1319 |             BayesSim posterior
1320 |             (<a href="#fig:bayessim-twoparam-trajectories">Figure 7 (b)</a>) also match the reference observations much
1321 |             more closely than
1322 |             any of the BayesSim models on the previous 11-parameter double
1323 |             pendulum (<a href="#fig:ibm-pendulum-rollouts-bayessim">Figure 6</a>). These results suggest that BayesSim and
1324 |             potentially
1325 |             other likelihood-free methods have problems in inferring higher dimensional parameter distributions. The
1326 |             experiments in [<a href="#sec:references">9</a>] demonstrated as many as four parameters being estimated
1327 |             (for the
1328 |             acrobot), while showing inference results for simulated systems only. While our double pendulum system from
1329 |             <a href="#sec:ibm-pendulum">Section 2.2</a> is basic in principle, the higher dimensional parameter space
1330 |             (see parameters in
1331 |             <a href="#tab:params-ibm-pendulum">Table 1</a>) and the fact that we need to fit against real-world data
1332 |             make it a
1333 |             significantly harder problem for most state-of-the-art inference algorithms. CSVGD is able to achieve a
1334 |             close fit thanks to the multiple-shooting segmentation of the trajectory which improves the convergence (see
1335 |             more ablation results for multiple-shooting on this experiment in <a
1336 |                 href="#sec:exp-multiple-shooting">Section 2.3</a>).
1337 |         </p>
1338 | 
1339 |         <div class="row">
1340 |             <div class="col"></div>
1341 |             <div class="col-4" id="fig:bayessim-twoparam-posterior">
1342 |                 <img src="img/synthetic_param_uncertainty/bayessim_twoparam_mdn_downsampled.png" class="img-fluid" />
1343 |                 <p style="text-align: center;">(a) Posterior</p>
1344 |             </div>
1345 |             <div class="col-4" id="fig:bayessim-twoparam-trajectories">
1346 |                 <img src="img/synthetic_param_uncertainty/bayessim_two_param_mdn_downsampled_trajectories.png"
1347 |                     class="img-fluid" />
1348 |                 <p style="text-align: center;">(b) Trajectory density</p>
1349 |             </div>
1350 |             <div class="col"></div>
1351 |         </div>
1352 |         <div class="row">
1353 |             <div class="col"></div>
1354 |             <div class="col-8">
1355 |                 <p>
1356 |                     <b>Figure 7.</b> Results from BayesSim on the simplified double pendulum experiment where only the
1357 |                     two link lengths need to be inferred. (a) shows the posterior distribution approximated by the MDN
1358 |                     model with "downsampled" input statistics. The diagonal plots show the marginal parameter
1359 |                     distributions, the bottom-left heatmap and the top-right contour plot show the 2D posterior where
1360 |                     the ground-truth parameters at (1.5m, 2m) are indicated by a red star. The
1361 |                     black dots in the top-right plot are 100 parameters sampled from the posterior which are rolled out
1362 |                     to generate trajectories for the trajectory density plot in (b). (b) shows a kernel density
1363 |                     estimation over these 100 trajectories for the four state dimensions
1364 |                     $(\jointpos_{[0:1]},\jointvel_{[0:1]})$ of the double pendulum.
1365 |                 </p>
1366 |             </div>
1367 |             <div class="col"></div>
1368 |         </div>
1369 | 
1370 |         <h4 id="sec:panda-box">2.5 Identify Inertia of an Articulated Rigid Object</h4>
1371 |         <p>
1372 |             The state space consists of the positions and velocities of the seven degrees of freedom of the robot arm
1373 |             and the two degrees of freedom in the universal joint, resulting in a 20-dimensional state vector
1374 |             $\statevec=\begin{bmatrix}\mathbf{q}_{0:8} & \mathbf{\dot{q}}_{0:8} & \mathbf{q}^d_{0:6} &
1375 |             \mathbf{\dot{q}}^d_{0:6}\end{bmatrix}$
1376 |             consisting of nine joint positions and velocities, plus the PD control position and velocity targets,
1377 |             $\mathbf{q}^d$ and $\mathbf{\dot{q}}^d$, for the actuated joints of the robot arm. We control the arm using
1378 |             the <em>MoveIt!</em> motion planning framework [<a href="#sec:references">13</a>] by moving joints 6 and 7
1379 |             to
1380 |             predefined joint-space offsets of $0.1$ and $-0.1$ radians, in sequence. We use the default Iterative
1381 |             Parabolic Time Parameterization algorithm with a velocity scaling factor of $0.1$. We track the motion of
1382 |             the acrylic box via a Vicon motion capture system and derive four Cartesian coordinates as observation
1383 |             $\observationvec=\begin{bmatrix}\mathbf{p}_{o} & \mathbf{p}_{x} & \mathbf{p}_{y} &
1384 |             \mathbf{p}_{z}\end{bmatrix}$ to represent the
1385 |             frame of the box (shown in <a href="#fig:panda-markers">Figure 8</a>): a point of origin located at the
1386 |             center of the
1387 |             upper lid of the box, and three points located 1m away from the origin in the x, y, and z
1388 |             directions (transformed by the reference frame of the box). We chose this state representation to ease the
1389 |             computation of the likelihood, since we only need to compute differences between 3D points instead of
1390 |             computing the distances over 3D rotations which requires special treatment [<a
1391 |                 href="#sec:references">14</a>].
1392 |         </p>
1393 |         <div class="row" id="fig:panda-markers">
1394 |             <div class="col"></div>
1395 |             <div class="col-8">
1396 |                 <img src="img/panda/panda_sim_markers.png" class="img-fluid" />
1397 |                 <p>
1398 |                     <b>Figure 8.</b> Rendering of the simulation for the underactuated mechanism from
1399 |                     <a href="#sec:panda-box">Section 2.5</a>, where the four reference points for the origin, unit x, y,
1400 |                     and z vectors
1401 |                     are shown. The trace of the simulated trajectory is visualized by the solid lines, the ground-truth
1402 |                     trajectories of the markers are shown as dotted lines.
1403 |                 </p>
1404 |             </div>
1405 |             <div class="col"></div>
1406 |         </div>
1407 |         <p>
1408 |             We first identify the simulation parameters pertaining to the inertial properties of the box and the
1409 |             friction parameters of the universal joint. As shown in <a href="#tab:params-panda-box-phase1">Table 3
1410 |                 (a)</a>, the symmetric
1411 |             inertia matrix of the box is fully determined by the first six parameters, followed by the 3D center of
1412 |             mass. We have measured the mass to be 920g, so we do not need to estimate it. We simulate the
1413 |             universal joint with velocity-dependent damping, with possibly different friction coefficients for both
1414 |             degrees of freedom. The simulated trajectory for the parameters yielding the most accurate fit to a ground-truth trajectory
1415 |             from the physical robot shaking an empty box is shown in <a href="#fig:panda-box-trajectory">Figure 9</a>.
1416 |             We were able to
1417 |             find such parameters via SVGD, CSVGD and Emcee (shown is a parameter configuration from the particle
1418 |             distribution estimated by CSVGD with the highest likelihood).
1419 |         </p>
1420 | 
1421 |         <p>
1422 |             While the simulated trajectory matches the real data significantly better after the inertial parameters of
1423 |             the empty box have been identified (<a href="#fig:panda-box-trajectory-after">Figure 9 (b)</a>) than before
1424 |             (<a href="#fig:panda-box-trajectory-before">Figure 9 (a)</a>), a reality gap remains. We believe this to be a
1425 |             result of a
1426 |             slight modeling error that the rigid body simulator cannot capture, e.g. the top of the box where the
1427 |             universal joint is attached bends slightly while the box is moving, and there may be slight geometric
1428 |             offsets between the real system and the model of it we use in the simulator. The latter parameters could
1429 |             have been further identified with our approach; nonetheless, the simulation given the identified parameters
1430 |             is sufficient to be used in the next phase of the inference experiment.
1431 |         </p>
1432 | 
1433 |         <div class="row" id="fig:panda-box-trajectory">
1434 |             <div class="col-6" id="fig:panda-box-trajectory-before">
1435 |                 <img src="img/panda/panda_box_initial_trajectory.png" class="img-fluid" />
1436 |                 <p style="text-align: center;">(a) Before identification of empty box</p>
1437 |             </div>
1438 |             <div class="col-6" id="fig:panda-box-trajectory-after">
1439 |                 <img src="img/panda/panda_box_trajectory.png" class="img-fluid" />
1440 |                 <p style="text-align: center;">(b) After identification of empty box</p>
1441 |             </div>
1442 |         </div>
1443 |         <p>
1444 |             <b>Figure 9.</b> Trajectories from the Panda robot arm shaking an empty box. Visualized are the
1445 |             simulated (red) and real (black) observations before (a) and after (b) the inertial parameters of
1446 |             the empty box and the friction from the universal joint (<a href="#tab:params-panda-box-phase1">Table 3
1447 |                 (a)</a>) have been
1448 |             identified. The columns correspond to the four reference points in the frame of the box (see a rendering of
1449 |             them in <a href="#fig:panda-markers">Figure 8</a>), the rows show the $x$, $y$, and $z$ axes of these
1450 |             reference points in
1451 |             meters. The horizontal axes show the time step.
1452 |         </p>
1453 | 
1454 |         <p>
1455 |             Given the parameters found in the first phase, we now investigate how well the various approaches can cope
1456 |             with dependent variables. By fixing two 500g weights to the bottom of the acrylic box, the 2D locations
1457 |             of such weights need to be inferred. Naturally, such assignment is symmetric, i.e. weight 1 and 2 can swap
1458 |             locations without affecting the dynamics. What would significantly alter the dynamics, however, is an
1459 |             unbalanced configuration of the weights which would cause the box to tilt.
1460 |         </p>
1461 | 
1462 |         <div class="row" id='tab:params-panda-box'>
1463 |             <div class="col"></div>
1464 |             <div class="col-5">
1465 |                 <table class="table" id="tab:params-panda-box-phase1">
1466 |                     <thead>
1467 |                         <tr>
1468 |                             <th scope="col"></th>
1469 |                             <th scope="col">Parameter</th>
1470 |                             <th scope="col" colspan="2" style="text-align:center">Minimum</th>
1471 |                             <th scope="col" colspan="2" style="text-align:center">Maximum</th>
1472 |                         </tr>
1473 |                     </thead>
1474 |                     <tbody>
1475 |                         <tr>
1476 |                             <th rowspan="9">Box</th>
1477 |                             <th> $I_{xx}$ </th>
1478 |                             <td align="right"> 0.05 </td>
1479 |                             <td> $\kg\cdot\meter^2$ </td>
1480 |                             <td align="right"> 0.1 </td>
1481 |                             <td> $\kg\cdot\meter^2$ </td>
1482 |                         </tr>
1483 |                         <tr>
1484 |                             <th> $I_{yy}$ </th>
1485 |                             <td align="right"> 0.05 </td>
1486 |                             <td> $\kg\cdot\meter^2$ </td>
1487 |                             <td align="right"> 0.1 </td>
1488 |                             <td> $\kg\cdot\meter^2$ </td>
1489 |                         </tr>
1490 |                         <tr>
1491 |                             <th> $I_{zz}$ </th>
1492 |                             <td align="right"> 0.05 </td>
1493 |                             <td> $\kg\cdot\meter^2$ </td>
1494 |                             <td align="right"> 0.1 </td>
1495 |                             <td> $\kg\cdot\meter^2$ </td>
1496 |                         </tr>
1497 |                         <tr>
1498 |                             <th> $I_{xy}$ </th>
1499 |                             <td align="right"> -0.01 </td>
1500 |                             <td> $\kg\cdot\meter^2$ </td>
1501 |                             <td align="right"> 0.01 </td>
1502 |                             <td> $\kg\cdot\meter^2$ </td>
1503 |                         </tr>
1504 |                         <tr>
1505 |                             <th> $I_{xz}$ </th>
1506 |                             <td align="right"> -0.01 </td>
1507 |                             <td> $\kg\cdot\meter^2$ </td>
1508 |                             <td align="right"> 0.01 </td>
1509 |                             <td> $\kg\cdot\meter^2$ </td>
1510 |                         </tr>
1511 |                         <tr>
1512 |                             <th> $I_{yz}$ </th>
1513 |                             <td align="right"> -0.01 </td>
1514 |                             <td> $\kg\cdot\meter^2$ </td>
1515 |                             <td align="right"> 0.01 </td>
1516 |                             <td> $\kg\cdot\meter^2$ </td>
1517 |                         </tr>
1518 |                         <tr>
1519 |                             <th> COM $x$ </th>
1520 |                             <td align="right"> -0.005 </td>
1521 |                             <td> $\meter$ </td>
1522 |                             <td align="right"> 0.005 </td>
1523 |                             <td> $\meter$ </td>
1524 |                         </tr>
1525 |                         <tr>
1526 |                             <th> COM $y$ </th>
1527 |                             <td align="right"> -0.005 </td>
1528 |                             <td> $\meter$ </td>
1529 |                             <td align="right"> 0.005 </td>
1530 |                             <td> $\meter$ </td>
1531 |                         </tr>
1532 |                         <tr>
1533 |                             <th> COM $z$ </th>
1534 |                             <td align="right"> 0.1 </td>
1535 |                             <td> $\meter$ </td>
1536 |                             <td align="right"> 0.4 </td>
1537 |                             <td> $\meter$</td>
1538 |                         </tr>
1539 | 
1540 |                         <tr>
1541 |                             <th rowspan="2">U-Joint</th>
1542 |                             <th> Friction DOF 1 </th>
1543 |                             <td align="right"> 0.0 </td>
1544 |                             <td> </td>
1545 |                             <td align="right"> 0.15 </td>
1546 |                             <td></td>
1547 |                         </tr>
1548 |                         <tr>
1549 |                             <th> Friction DOF 2 </th>
1550 |                             <td align="right"> 0.0 </td>
1551 |                             <td> </td>
1552 |                             <td align="right"> 0.15 </td>
1553 |                             <td> </td>
1554 |                         </tr>
1555 |                     </tbody>
1556 |                 </table>
1557 |                 <p style="text-align: center;">(a) Phase I</p>
1558 | 
1559 |             </div>
1560 |             <div class="col"></div>
1561 |             <div class="col-4">
1562 |                 <table class="table" id="tab:params-panda-box-phase2">
1563 |                     <thead>
1564 |                         <tr>
1565 |                             <th scope="col"></th>
1566 |                             <th scope="col">Parameter</th>
1567 |                             <th scope="col" colspan="2" style="text-align:center">Minimum</th>
1568 |                             <th scope="col" colspan="2" style="text-align:center">Maximum</th>
1569 |                         </tr>
1570 |                     </thead>
1571 |                     <tbody>
1572 |                         <tr>
1573 |                             <th rowspan="2">Weight 1</th>
1574 |                             <th> Position $x$ </th>
1575 |                             <td align="right"> -0.14 </td>
1576 |                             <td> $\meter$ </td>
1577 |                             <td align="right"> 0.14 </td>
1578 |                             <td>$\meter$</td>
1579 |                         </tr>
1580 |                         <tr>
1581 |                             <th> Position $y$ </th>
1582 |                             <td align="right"> -0.08 </td>
1583 |                             <td> $\meter$ </td>
1584 |                             <td align="right"> 0.08 </td>
1585 |                             <td>$\meter$</td>
1586 |                         </tr>
1587 |                         <tr>
1588 |                             <th rowspan="2">Weight 2</th>
1589 |                             <th> Position $x$ </th>
1590 |                             <td align="right"> -0.14 </td>
1591 |                             <td> $\meter$ </td>
1592 |                             <td align="right"> 0.14 </td>
1593 |                             <td>$\meter$</td>
1594 |                         </tr>
1595 |                         <tr>
1596 |                             <th> Position $y$ </th>
1597 |                             <td align="right"> -0.08 </td>
1598 |                             <td> $\meter$ </td>
1599 |                             <td align="right"> 0.08 </td>
1600 |                             <td>$\meter$</td>
1601 |                         </tr>
1602 |                     </tbody>
1603 |                 </table>
1604 |                 <p style="text-align: center;">(b) Phase II</p>
1605 | 
1606 |             </div>
1607 |             <div class="col"></div>
1608 |         </div>
1609 |         <p>
1610 |             <b>Table 3.</b> Parameters to be estimated and their ranges for the two estimation phases of the
1611 |             underactuated mechanism experiment from <a href="#sec:panda-box">Section 2.5</a>.
1612 |         </p>
1613 | 
1614 |         <p>
1615 |             We use 50 particles and run each estimation algorithm for 500 iterations. For each baseline method, we
1616 |             carefully tuned the hyperparameters to facilitate a fair comparison. Such tuning included selecting an
1617 |             appropriate measurement noise variance, which, as we observed on Emcee and SGLD in particular, had a
1618 |             significant influence on the exploration behavior of these algorithms. With a larger observation noise
1619 |             variance, the resulting posterior distribution became wider; however, we were unable to attain such behavior
1620 |             with the NUTS estimator whose iterates quickly collapsed to a single point at the center of the box (see
1621 |             <a href="#fig:panda-box-posterior-nuts">Figure 10 (d)</a>). Similarly, CEM immediately became stuck in the
1622 |             suboptimal
1623 |             configuration shown in <a href="#fig:panda-box-posterior-cem">Figure 10 (b)</a>. Nonetheless, after 500
1624 |             iterations, all methods
1625 |             predicted weight positions that were aligned opposite to one another to balance the box.
1626 |         </p>
1627 | 
1628 |         <p>
1629 |             As can be seen in <a href="#fig:panda-box-posterior-svgd">Figure 10 (e)</a>, SVGD achieves a fairly
1630 |             predictive posterior
1631 |             approximation, with many particles aligned close to the true vertical position at $y=0$. With the
1632 |             introduction of the multiple-shooting constraints, Constrained SVGD (CSVGD) converges significantly faster
1633 |             to a posterior distribution that accurately captures the true locations of the weights, while retaining the
1634 |             exploration performance of SVGD that spreads out the particles over multiple modes, as shown in
1635 |             <a href="#fig:panda-box-posterior-csvgd">Figure 10 (f)</a>.
1636 |         </p>
1637 | 
1638 |         <div class="row" id="fig:panda-box-posterior">
1639 |             <div class="col-4" id="fig:panda-box-posterior-emcee">
1640 |                 <img src="img/panda/box_position_emcee.png" alt="Emcee" class="img-fluid" />
1641 |                 <p style="text-align: center;">(a) Emcee</p>
1642 |             </div>
1643 |             <div class="col-4" id="fig:panda-box-posterior-cem">
1644 |                 <img src="img/panda/box_position_cem.png" alt="CEM" class="img-fluid" />
1645 |                 <p style="text-align: center;">(b) CEM</p>
1646 |             </div>
1647 |             <div class="col-4" id="fig:panda-box-posterior-sgld">
1648 |                 <img src="img/panda/box_position_sgld.png" alt="SGLD" class="img-fluid" />
1649 |                 <p style="text-align: center;">(c) SGLD</p>
1650 |             </div>
1651 |             <div class="col-4" id="fig:panda-box-posterior-nuts">
1652 |                 <img src="img/panda/box_position_nuts.png" alt="NUTS" class="img-fluid" />
1653 |                 <p style="text-align: center;">(d) NUTS</p>
1654 |             </div>
1655 |             <div class="col-4" id="fig:panda-box-posterior-svgd">
1656 |                 <img src="img/panda/box_position_svgd_ss.png" alt="SVGD" class="img-fluid" />
1657 |                 <p style="text-align: center;">(e) SVGD</p>
1658 |             </div>
1659 |             <div class="col-4" id="fig:panda-box-posterior-csvgd">
1660 |                 <img src="img/panda/box_position_svgd_ms.png" alt="CSVGD" class="img-fluid" />
1661 |                 <p style="text-align: center;">(f) CSVGD</p>
1662 |             </div>
1663 |         </div>
1664 |         <p>
1665 |             <b>Figure 10.</b> Posterior plots over the 2D weight locations approximated by the estimation algorithms
1666 |             applied to the underactuated mechanism experiment from <a href="#sec:panda-box">Section 2.5</a>. Blue shades
1667 |             indicate a
1668 |             Gaussian kernel density estimate computed over the inferred parameter samples. Since it is an
1669 |             unbounded kernel density estimate, the blue shades cross the parameter boundaries in certain areas (e.g. for
1670 |             CSVGD), while in reality none of the estimated particles violate the parameter limits.
1671 |         </p>
1672 | 
1673 |         <h3 id="sec:references">References</h3>
1674 | 
1675 |         <style>
1676 |             ul.references {
1677 |                 list-style-type: none;
1678 |                 counter-reset: elementcounter;
1679 |                 padding-left: 0;
1680 |                 display: table;
1681 |             }
1682 | 
1683 |             .references li {
1684 |                 display: table-row;
1685 |             }
1686 | 
1687 |             .references li:before {
1688 |                 content: "["counter(elementcounter) "]";
1689 |                 counter-increment: elementcounter;
1690 |                 font-weight: normal;
1691 |                 display: table-cell;
1692 |                 padding-right: 1em;
1693 |             }
1694 |         </style>
1695 | 
1696 |         <ul class="references">
1697 |             <li>
1698 |                 J. Burkardt. Sobol - the sobol quasirandom sequence.
1699 |                 <a target="_blank"
1700 |                     href="https://people.sc.fsu.edu/~jburkardt/cpp_src/sobol/sobol.html">https://people.sc.fsu.edu/~jburkardt/cpp_src/sobol/sobol.html</a>.
1701 |                 Accessed: 2021-06-23.
1702 |             </li>
1703 |             <li>
1704 |                 B. L. Fox. Algorithm 647: Implementation and relative efficiency of quasirandom sequence generators.
1705 |                 <em>ACM Trans. Math. Softw.</em>, 12(4):362–376, Dec. 1986. ISSN 0098-3500.
1706 |                 <a target="_blank" href="http://dx.doi.org/10.1145/22721.356187">doi:10.1145/22721.356187</a>.
1707 |             </li>
1708 |             <li>
1709 |                 R. Chou, Y. Boers, M. Podt, and M. Geist. Performance evaluation for particle filters. In <em>14th
1710 |                     International Conference on Information Fusion</em>, pages 1–7, July 2011.
1711 |             </li>
1712 |             <li>
1713 |                 Q. Wang, S. R. Kulkarni, and S. Verdú. Divergence Estimation for Multidimensional Densities Via
1714 |                 $k$-Nearest-Neighbor Distances. <em>IEEE Transactions on Information Theory</em>,
1715 |                 55(5):2392–2405, May 2009. ISSN 0018-9448. <a target="_blank"
1716 |                     href="http://ieeexplore.ieee.org/document/4839047/">doi:10.1109/TIT.2009.2016060</a>.
1717 |             </li>
1718 |             <li>
1719 |                 E. Heiden, D. Millard, E. Coumans, Y. Sheng, and G. S. Sukhatme.
1720 |                 NeuralSim: Augmenting differentiable simulators with neural networks.
1721 |                 In <em>Proceedings of the IEEE International Conference on Robotics and Automation (ICRA)</em>, 2021.
1722 |                 URL <a target="_blank"
1723 |                     href="https://github.com/google-research/tiny-differentiable-simulator">https://github.com/google-research/tiny-differentiable-simulator</a>.
1724 |             </li>
1725 |             <li>
1726 |                 R. Featherstone. <em>Rigid Body Dynamics Algorithms</em>. Springer-Verlag, Berlin, Heidelberg, 2007.
1727 |                 ISBN 0387743146.
1728 |             </li>
1729 |             <li>
1730 |                 L. S. Pontryagin. <em>Mathematical theory of optimal processes</em>. Routledge, 2018.
1731 |             </li>
1732 |             <li>
1733 |                 A. Asseman, T. Kornuta, and A. Ozcan. Learning beyond simulated physics. In <em>Modeling and
1734 |                     Decision-making in the Spatiotemporal Domain Workshop</em>, 2018.
1735 |                 URL <a target="_blank"
1736 |                     href="https://openreview.net/forum?id=HylajWsRF7">https://openreview.net/forum?id=HylajWsRF7</a>.
1737 |             </li>
1738 |             <li>
1739 |                 F. Ramos, R. Possas, and D. Fox. BayesSim: Adaptive domain randomization via probabilistic inference for
1740 |                 robotics simulators.
1741 |                 In <em>Proceedings of Robotics: Science and Systems</em>, Freiburg im Breisgau, Germany, June 2019.
1742 |                 <a target="_blank" href="http://dx.doi.org/10.15607/RSS.2019.XV.029">doi:10.15607/RSS.2019.XV.029</a>.
1743 |             </li>
1744 |             <li>
1745 |                 C. M. Bishop. Mixture density networks. 1994.
1746 |             </li>
1747 |             <li>
1748 |                 P. Kidger and T. Lyons. Signatory: differentiable computations of the signature and logsignature
1749 |                 transforms, on both CPU and GPU.
1750 |                 In <em>International Conference on Learning Representations</em>, 2021.
1751 |                 <a target="_blank"
1752 |                     href="https://github.com/patrick-kidger/signatory">https://github.com/patrick-kidger/signatory</a>.
1753 |             </li>
1754 |             <li>
1755 |                 C. E. Rasmussen and C. K. I. Williams.
1756 |                 <em>Gaussian Processes for Machine Learning (Adaptive Computation and Machine Learning)</em>.
1757 |                 The MIT Press, 2005. ISBN 026218253X.
1758 |             </li>
1759 |             <li>
1760 |                 D. T. Coleman. Reducing the Barrier to Entry of Complex Robotic Software: a MoveIt! Case Study.
1761 |                 2014. <a target="_blank"
1762 |                     href="http://dx.doi.org/10.6092/JOSER_2014_05_01_P3">doi:10.6092/JOSER_2014_05_01_P3</a>. URL
1763 |                 <a target="_blank" href="https://aisberg.unibg.it/handle/10446/87657">
1764 |                     https://aisberg.unibg.it/handle/10446/87657</a>. Publisher: Università degli Studi di Bergamo.
1765 |             </li>
1766 |             <li>
1767 |                 D. Q. Huynh. Metrics for 3D rotations: Comparison and analysis. <em>Journal of Mathematical Imaging and
1768 |                     Vision</em>, 35(2):155–164, 2009.
1769 |             </li>
1770 |         </ul>
1771 |     </div>
1772 | 
1773 |     <div class="container" id="acknowledgements">
1774 |         <h2>Acknowledgements</h2>
1775 | 
1776 |         <p class="lead">This work was supported by a Google PhD Fellowship and a NASA Space Technology
1777 |             Research
1778 |             Fellowship, grant number 80NSSC19K1182.</p>
1779 |         <p class="lead">G.S. Sukhatme holds concurrent appointments as a Professor at USC and as an Amazon
1780 |             Scholar. This
1781 |             paper describes work performed at USC and is not associated with Amazon.</p>
1782 |     </div>
1783 | 
1784 |     <div class="bg-light">
1785 |         <div class="container" align="right" style="padding:40px 0">
1786 |             Last updated on January 31, 2022
1787 |         </div>
1788 |     </div>
1789 | 
1790 |     <script src="https://cdn.jsdelivr.net/npm/bootstrap@5.0.0-beta3/dist/js/bootstrap.bundle.min.js"
1791 |         integrity="sha384-JEW9xMcG8R+pH31jmWH6WWP0WintQrMb4s7ZOdauHnUtxwoG2vI5DkLtS3qm9Ekf"
1792 |         crossorigin="anonymous"></script>
1793 | </body>
1794 | 
1795 | </html>
1796 | 


--------------------------------------------------------------------------------