├── .gitignore ├── CODE_OF_CONDUCT.md ├── LICENSE ├── README.md ├── SECURITY.md ├── SUPPORT.md ├── docs ├── _config.yml ├── css │ └── styles.css ├── img │ ├── Microsoft-logo-only.svg │ ├── Microsoft-logo.svg │ ├── Microsoft-logo_rgb_c-gray.png │ ├── Microsoft-logo_rgb_c-wht.png │ ├── Microsoft-logo_rgb_wht.png │ ├── dataset_samples.jpg │ ├── favicon.ico │ ├── joints_uncertainty.png │ ├── plot_20_L_Wrist.png │ ├── plot_21_R_Wrist.png │ ├── plot_all_bold.png │ └── results.png └── index.html └── download_data.py /.gitignore: -------------------------------------------------------------------------------- 1 | ## Ignore Visual Studio temporary files, build results, and 2 | ## files generated by popular Visual Studio add-ons. 3 | ## 4 | ## Get latest from https://github.com/github/gitignore/blob/main/VisualStudio.gitignore 5 | 6 | # User-specific files 7 | *.rsuser 8 | *.suo 9 | *.user 10 | *.userosscache 11 | *.sln.docstates 12 | 13 | # User-specific files (MonoDevelop/Xamarin Studio) 14 | *.userprefs 15 | 16 | # Mono auto generated files 17 | mono_crash.* 18 | 19 | # Build results 20 | [Dd]ebug/ 21 | [Dd]ebugPublic/ 22 | [Rr]elease/ 23 | [Rr]eleases/ 24 | x64/ 25 | x86/ 26 | [Ww][Ii][Nn]32/ 27 | [Aa][Rr][Mm]/ 28 | [Aa][Rr][Mm]64/ 29 | bld/ 30 | [Bb]in/ 31 | [Oo]bj/ 32 | [Ll]og/ 33 | [Ll]ogs/ 34 | 35 | # Visual Studio 2015/2017 cache/options directory 36 | .vs/ 37 | # Uncomment if you have tasks that create the project's static files in wwwroot 38 | #wwwroot/ 39 | 40 | # Visual Studio 2017 auto generated files 41 | Generated\ Files/ 42 | 43 | # MSTest test Results 44 | [Tt]est[Rr]esult*/ 45 | [Bb]uild[Ll]og.* 46 | 47 | # NUnit 48 | *.VisualState.xml 49 | TestResult.xml 50 | nunit-*.xml 51 | 52 | # Build Results of an ATL Project 53 | [Dd]ebugPS/ 54 | [Rr]eleasePS/ 55 | dlldata.c 56 | 57 | # Benchmark Results 58 | BenchmarkDotNet.Artifacts/ 59 | 60 | # .NET Core 61 | project.lock.json 62 | project.fragment.lock.json 63 | artifacts/ 64 | 65 | # ASP.NET Scaffolding 66 | ScaffoldingReadMe.txt 67 | 68 | # StyleCop 69 | StyleCopReport.xml 70 | 71 | # Files built by Visual Studio 72 | *_i.c 73 | *_p.c 74 | *_h.h 75 | *.ilk 76 | *.meta 77 | *.obj 78 | *.iobj 79 | *.pch 80 | *.pdb 81 | *.ipdb 82 | *.pgc 83 | *.pgd 84 | *.rsp 85 | *.sbr 86 | *.tlb 87 | *.tli 88 | *.tlh 89 | *.tmp 90 | *.tmp_proj 91 | *_wpftmp.csproj 92 | *.log 93 | *.tlog 94 | *.vspscc 95 | *.vssscc 96 | .builds 97 | *.pidb 98 | *.svclog 99 | *.scc 100 | 101 | # Chutzpah Test files 102 | _Chutzpah* 103 | 104 | # Visual C++ cache files 105 | ipch/ 106 | *.aps 107 | *.ncb 108 | *.opendb 109 | *.opensdf 110 | *.sdf 111 | *.cachefile 112 | *.VC.db 113 | *.VC.VC.opendb 114 | 115 | # Visual Studio profiler 116 | *.psess 117 | *.vsp 118 | *.vspx 119 | *.sap 120 | 121 | # Visual Studio Trace Files 122 | *.e2e 123 | 124 | # TFS 2012 Local Workspace 125 | $tf/ 126 | 127 | # Guidance Automation Toolkit 128 | *.gpState 129 | 130 | # ReSharper is a .NET coding add-in 131 | _ReSharper*/ 132 | *.[Rr]e[Ss]harper 133 | *.DotSettings.user 134 | 135 | # TeamCity is a build add-in 136 | _TeamCity* 137 | 138 | # DotCover is a Code Coverage Tool 139 | *.dotCover 140 | 141 | # AxoCover is a Code Coverage Tool 142 | .axoCover/* 143 | !.axoCover/settings.json 144 | 145 | # Coverlet is a free, cross platform Code Coverage Tool 146 | coverage*.json 147 | coverage*.xml 148 | coverage*.info 149 | 150 | # Visual Studio code coverage results 151 | *.coverage 152 | *.coveragexml 153 | 154 | # NCrunch 155 | _NCrunch_* 156 | .*crunch*.local.xml 157 | nCrunchTemp_* 158 | 
159 | # MightyMoose 160 | *.mm.* 161 | AutoTest.Net/ 162 | 163 | # Web workbench (sass) 164 | .sass-cache/ 165 | 166 | # Installshield output folder 167 | [Ee]xpress/ 168 | 169 | # DocProject is a documentation generator add-in 170 | DocProject/buildhelp/ 171 | DocProject/Help/*.HxT 172 | DocProject/Help/*.HxC 173 | DocProject/Help/*.hhc 174 | DocProject/Help/*.hhk 175 | DocProject/Help/*.hhp 176 | DocProject/Help/Html2 177 | DocProject/Help/html 178 | 179 | # Click-Once directory 180 | publish/ 181 | 182 | # Publish Web Output 183 | *.[Pp]ublish.xml 184 | *.azurePubxml 185 | # Note: Comment the next line if you want to checkin your web deploy settings, 186 | # but database connection strings (with potential passwords) will be unencrypted 187 | *.pubxml 188 | *.publishproj 189 | 190 | # Microsoft Azure Web App publish settings. Comment the next line if you want to 191 | # checkin your Azure Web App publish settings, but sensitive information contained 192 | # in these scripts will be unencrypted 193 | PublishScripts/ 194 | 195 | # NuGet Packages 196 | *.nupkg 197 | # NuGet Symbol Packages 198 | *.snupkg 199 | # The packages folder can be ignored because of Package Restore 200 | **/[Pp]ackages/* 201 | # except build/, which is used as an MSBuild target. 202 | !**/[Pp]ackages/build/ 203 | # Uncomment if necessary however generally it will be regenerated when needed 204 | #!**/[Pp]ackages/repositories.config 205 | # NuGet v3's project.json files produces more ignorable files 206 | *.nuget.props 207 | *.nuget.targets 208 | 209 | # Microsoft Azure Build Output 210 | csx/ 211 | *.build.csdef 212 | 213 | # Microsoft Azure Emulator 214 | ecf/ 215 | rcf/ 216 | 217 | # Windows Store app package directories and files 218 | AppPackages/ 219 | BundleArtifacts/ 220 | Package.StoreAssociation.xml 221 | _pkginfo.txt 222 | *.appx 223 | *.appxbundle 224 | *.appxupload 225 | 226 | # Visual Studio cache files 227 | # files ending in .cache can be ignored 228 | *.[Cc]ache 229 | # but keep track of directories ending in .cache 230 | !?*.[Cc]ache/ 231 | 232 | # Others 233 | ClientBin/ 234 | ~$* 235 | *~ 236 | *.dbmdl 237 | *.dbproj.schemaview 238 | *.jfm 239 | *.pfx 240 | *.publishsettings 241 | orleans.codegen.cs 242 | 243 | # Including strong name files can present a security risk 244 | # (https://github.com/github/gitignore/pull/2483#issue-259490424) 245 | #*.snk 246 | 247 | # Since there are multiple workflows, uncomment next line to ignore bower_components 248 | # (https://github.com/github/gitignore/pull/1529#issuecomment-104372622) 249 | #bower_components/ 250 | 251 | # RIA/Silverlight projects 252 | Generated_Code/ 253 | 254 | # Backup & report files from converting an old project file 255 | # to a newer Visual Studio version. 
Backup files are not needed, 256 | # because we have git ;-) 257 | _UpgradeReport_Files/ 258 | Backup*/ 259 | UpgradeLog*.XML 260 | UpgradeLog*.htm 261 | ServiceFabricBackup/ 262 | *.rptproj.bak 263 | 264 | # SQL Server files 265 | *.mdf 266 | *.ldf 267 | *.ndf 268 | 269 | # Business Intelligence projects 270 | *.rdl.data 271 | *.bim.layout 272 | *.bim_*.settings 273 | *.rptproj.rsuser 274 | *- [Bb]ackup.rdl 275 | *- [Bb]ackup ([0-9]).rdl 276 | *- [Bb]ackup ([0-9][0-9]).rdl 277 | 278 | # Microsoft Fakes 279 | FakesAssemblies/ 280 | 281 | # GhostDoc plugin setting file 282 | *.GhostDoc.xml 283 | 284 | # Node.js Tools for Visual Studio 285 | .ntvs_analysis.dat 286 | node_modules/ 287 | 288 | # Visual Studio 6 build log 289 | *.plg 290 | 291 | # Visual Studio 6 workspace options file 292 | *.opt 293 | 294 | # Visual Studio 6 auto-generated workspace file (contains which files were open etc.) 295 | *.vbw 296 | 297 | # Visual Studio 6 auto-generated project file (contains which files were open etc.) 298 | *.vbp 299 | 300 | # Visual Studio 6 workspace and project file (working project files containing files to include in project) 301 | *.dsw 302 | *.dsp 303 | 304 | # Visual Studio 6 technical files 305 | *.ncb 306 | *.aps 307 | 308 | # Visual Studio LightSwitch build output 309 | **/*.HTMLClient/GeneratedArtifacts 310 | **/*.DesktopClient/GeneratedArtifacts 311 | **/*.DesktopClient/ModelManifest.xml 312 | **/*.Server/GeneratedArtifacts 313 | **/*.Server/ModelManifest.xml 314 | _Pvt_Extensions 315 | 316 | # Paket dependency manager 317 | .paket/paket.exe 318 | paket-files/ 319 | 320 | # FAKE - F# Make 321 | .fake/ 322 | 323 | # CodeRush personal settings 324 | .cr/personal 325 | 326 | # Python Tools for Visual Studio (PTVS) 327 | __pycache__/ 328 | *.pyc 329 | 330 | # Cake - Uncomment if you are using it 331 | # tools/** 332 | # !tools/packages.config 333 | 334 | # Tabs Studio 335 | *.tss 336 | 337 | # Telerik's JustMock configuration file 338 | *.jmconfig 339 | 340 | # BizTalk build output 341 | *.btp.cs 342 | *.btm.cs 343 | *.odx.cs 344 | *.xsd.cs 345 | 346 | # OpenCover UI analysis results 347 | OpenCover/ 348 | 349 | # Azure Stream Analytics local run output 350 | ASALocalRun/ 351 | 352 | # MSBuild Binary and Structured Log 353 | *.binlog 354 | 355 | # NVidia Nsight GPU debugger configuration file 356 | *.nvuser 357 | 358 | # MFractors (Xamarin productivity tool) working folder 359 | .mfractor/ 360 | 361 | # Local History for Visual Studio 362 | .localhistory/ 363 | 364 | # Visual Studio History (VSHistory) files 365 | .vshistory/ 366 | 367 | # BeatPulse healthcheck temp database 368 | healthchecksdb 369 | 370 | # Backup folder for Package Reference Convert tool in Visual Studio 2017 371 | MigrationBackup/ 372 | 373 | # Ionide (cross platform F# VS Code tools) working folder 374 | .ionide/ 375 | 376 | # Fody - auto-generated XML schema 377 | FodyWeavers.xsd 378 | 379 | # VS Code files for those working on multiple tools 380 | .vscode/* 381 | !.vscode/settings.json 382 | !.vscode/tasks.json 383 | !.vscode/launch.json 384 | !.vscode/extensions.json 385 | *.code-workspace 386 | 387 | # Local History for Visual Studio Code 388 | .history/ 389 | 390 | # Windows Installer files from build outputs 391 | *.cab 392 | *.msi 393 | *.msix 394 | *.msm 395 | *.msp 396 | 397 | # JetBrains Rider 398 | *.sln.iml 399 | -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- 1 | # 
Microsoft Open Source Code of Conduct 2 | 3 | This project has adopted the [Microsoft Open Source Code of Conduct](https://opensource.microsoft.com/codeofconduct/). 4 | 5 | Resources: 6 | 7 | - [Microsoft Open Source Code of Conduct](https://opensource.microsoft.com/codeofconduct/) 8 | - [Microsoft Code of Conduct FAQ](https://opensource.microsoft.com/codeofconduct/faq/) 9 | - Contact [opencode@microsoft.com](mailto:opencode@microsoft.com) with questions or concerns 10 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | Research Use of Data Agreement v1.0 2 | 3 | This is the Research Use of Data Agreement, Version 1.0 (the “R-UDA”). Capitalized terms are defined in Section 5. Data Provider and you agree as follows: 4 | 5 | 1. Provision of the Data 6 | 1.1. You may use, modify, and distribute the Data made available to you by the Data Provider under this R-UDA for Research Use if you follow the R-UDA’s terms. 7 | 1.2. Data Provider will not sue you or any Downstream Recipient for any claim arising out of the use, modification, or distribution of the Data provided you meet the terms of the R-UDA. 8 | 1.3. This R-UDA does not restrict your use, modification, or distribution of any portions of the Data that are in the public domain or that may be used, modified, or distributed under any other legal exception or limitation. 9 | 10 | 2. Restrictions 11 | 2.1. You agree that you will use the Data solely for Computational Use for non-commercial research. This restriction means that you may engage in non-commercial research activities (including non-commercial research undertaken by or funded via a commercial entity), but you may not use the Data or any Results in any commercial offering, including as part of a product or service (or to improve any product or service) you use or provide to others. 12 | 2.2. You may not receive money or other consideration in exchange for use or redistribution of Data. 13 | 14 | 3. Redistribution of Data 15 | 3.1. You may redistribute the Data, so long as: 16 | 3.1.1. You include with any Data you redistribute all credit or attribution information that you received with the Data, and your terms require any Downstream Recipient to do the same; and 17 | 3.1.2. You bind each recipient to whom you redistribute the Data to the terms of the R-UDA. 18 | 19 | 4. No Warranty, Limitation of Liability 20 | 4.1. Data Provider does not represent or warrant that it has any rights whatsoever in the Data. 21 | 4.2. THE DATA IS PROVIDED ON AN “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED INCLUDING, WITHOUT LIMITATION, ANY WARRANTIES OR CONDITIONS OF TITLE, NON-INFRINGEMENT, MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE. 22 | 4.3. NEITHER DATA PROVIDER NOR ANY UPSTREAM DATA PROVIDER SHALL HAVE ANY LIABILITY FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING WITHOUT LIMITATION LOST PROFITS), HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE DATA OR RESULTS, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGES. 23 | 24 | 5. Definitions 25 | 5.1. “Computational Use” means activities necessary to enable the use of Data (alone or along with other material) for analysis by a computer. 26 | 5.2. 
Data” means the material you receive under the R-UDA in modified or unmodified form, but not including Results.
5.3. “Data Provider” means the source from which you receive the Data and with whom you enter into the R-UDA.
5.4. “Downstream Recipient” means any person or persons who receives the Data directly or indirectly from you in accordance with the R-UDA.
5.5. “Result” means anything that you develop or improve from your use of Data that does not include more than a de minimis portion of the Data on which the use is based. Results may include de minimis portions of the Data necessary to report on or explain use that has been conducted with the Data, such as figures in scientific papers, but do not include more. Artificial intelligence models trained on Data (and which do not include more than a de minimis portion of Data) are Results.
5.6. “Upstream Data Providers” means the source or sources from which the Data Provider directly or indirectly received, under the terms of the R-UDA, material that is included in the Data.

--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------

# The SynthEgo Dataset

The SynthEgo dataset was introduced in our paper [**SimpleEgo: Predicting probabilistic body pose from egocentric cameras**](https://microsoft.github.io/SimpleEgo/).

The dataset contains:

- 60,000 synthetic stereo-pair RGB images from a head-mounted camera at 1280×720 pixel resolution.
- [SMPL-H](https://mano.is.tue.mpg.de/) pose and identity parameters for each stereo pair.
- 3D joint locations in world and camera space for each image.
- 2D joint locations in image space for each image.
- Camera parameters for each image.

## Downloading the dataset

The license terms for the [MANO](https://mano.is.tue.mpg.de/) dataset and parts of the [AMASS](https://amass.is.tue.mpg.de/) dataset prevent redistribution.
As such, the dataset we distribute includes names and indices for these poses, but not the pose parameters themselves.
**For simplicity, we provide a script to download the MANO, AMASS and SynthEgo datasets and splice in the relevant pose parameters automatically.**
You will need to sign up for MANO and AMASS and provide the relevant credentials when prompted by the script.
The script's only dependencies are numpy and wget; with those installed, simply run `python download_data.py` from the command line.

You can download the dataset in parts (3GB each) directly from the following links, though *this is not recommended*:

- [Part 1](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_01.zip)
- [Part 2](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_02.zip)
- [Part 3](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_03.zip)
- [Part 4](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_04.zip)
- [Part 5](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_05.zip)
- [Part 6](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_06.zip)
- [Part 7](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_07.zip)
- [Part 8](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_08.zip)
- [Part 9](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_09.zip)
- [Part 10](https://facesyntheticspubwedata.z6.web.core.windows.net/3dv-2024/synth_ego_10.zip)

## Dataset layout

Once extracted, the dataset contains files for each sample of the form:

- `metadata_0000000_0000.json`
- `img_L_0000000_0000.jpg`
- `img_R_0000000_0000.jpg`

where the first number is the subject index (0 to 5999) and the second is the frame index (0 to 9).
The metadata files are structured as follows:

```json
{
    "pose": [ "52x3 array of SMPL-H thetas/pose parameters" ],
    "translation": [ "3 element SMPL-H translation vector" ],
    "identity": [ "10 element SMPL-H neutral beta vector" ],
    "cameras": {
        "camera_L": {
            "world_to_camera": [ "4x4 extrinsic matrix" ],
            "camera_to_image": [ "3x3 intrinsic matrix" ],
            "resolution": [1280, 720]
        },
        "camera_R": { "as for camera_L" }
    },
    "landmarks": {
        "3D_world": [ "54x3 joint locations in world space" ],
        "3D_camera_L": [ "54x3 joint locations in camera space for camera_L" ],
        "2D_camera_L": [ "54x2 joint locations in image space for camera_L" ],
        "3D_camera_R": [ "54x3 joint locations in camera space for camera_R" ],
        "2D_camera_R": [ "54x2 joint locations in image space for camera_R" ]
    }
}
```

A short example of reading this metadata is given at the end of this README.

## Citation

If you use the SynthEgo dataset in your research, please cite the following paper:

```bibtex
@inproceedings{cuevas2024simpleego,
  title={{SimpleEgo}: Predicting probabilistic body pose from egocentric cameras},
  author={Cuevas-Velasquez, Hanz and Hewitt, Charlie and Aliakbarian, Sadegh and Baltru{\v{s}}aitis, Tadas},
  booktitle={2024 International Conference on 3D Vision (3DV)},
  pages={1446--1455},
  year={2024},
  organization={IEEE}
}
```
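
## Example: reading a sample

To sanity-check a downloaded sample, the metadata can be read with standard Python tools.
Below is a minimal sketch that re-derives the stored 2D landmarks from the 3D world-space ones; it assumes `world_to_camera` maps world to camera coordinates and that projection follows the usual pinhole convention (plausible from the field names, but stated here as assumptions):

```python
import json

import numpy as np

# Load the metadata for subject 0, frame 0 (path is illustrative).
with open("metadata_0000000_0000.json") as f:
    meta = json.load(f)

cam = meta["cameras"]["camera_L"]
world_to_camera = np.array(cam["world_to_camera"])  # 4x4 extrinsic matrix
camera_to_image = np.array(cam["camera_to_image"])  # 3x3 intrinsic matrix

# Transform world-space joints into camera space, then project to pixels.
joints_world = np.array(meta["landmarks"]["3D_world"])                 # (54, 3)
joints_h = np.hstack([joints_world, np.ones((len(joints_world), 1))])  # homogeneous
joints_cam = (world_to_camera @ joints_h.T).T[:, :3]                   # (54, 3)
projected = (camera_to_image @ joints_cam.T).T                         # (54, 3)
joints_2d = projected[:, :2] / projected[:, 2:]                        # (54, 2) pixels

# If the conventions above are right, this should match the stored landmarks.
error = np.abs(joints_2d - np.array(meta["landmarks"]["2D_camera_L"])).max()
print(f"max reprojection difference: {error:.4f} px")
```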

--------------------------------------------------------------------------------
/SECURITY.md:
--------------------------------------------------------------------------------

## Security

Microsoft takes the security of our software products and services seriously, which includes all source code repositories managed through our GitHub organizations, including [Microsoft](https://github.com/Microsoft), [Azure](https://github.com/Azure), [DotNet](https://github.com/dotnet), [AspNet](https://github.com/aspnet) and [Xamarin](https://github.com/xamarin).

If you believe you have found a security vulnerability in any Microsoft-owned repository that meets [Microsoft's definition of a security vulnerability](https://aka.ms/security.md/definition), please report it to us as described below.

## Reporting Security Issues

**Please do not report security vulnerabilities through public GitHub issues.**

Instead, please report them to the Microsoft Security Response Center (MSRC) at [https://msrc.microsoft.com/create-report](https://aka.ms/security.md/msrc/create-report).

If you prefer to submit without logging in, send email to [secure@microsoft.com](mailto:secure@microsoft.com). If possible, encrypt your message with our PGP key; please download it from the [Microsoft Security Response Center PGP Key page](https://aka.ms/security.md/msrc/pgp).

You should receive a response within 24 hours. If for some reason you do not, please follow up via email to ensure we received your original message. Additional information can be found at [microsoft.com/msrc](https://www.microsoft.com/msrc).

Please include the requested information listed below (as much as you can provide) to help us better understand the nature and scope of the possible issue:

* Type of issue (e.g. buffer overflow, SQL injection, cross-site scripting, etc.)
* Full paths of source file(s) related to the manifestation of the issue
* The location of the affected source code (tag/branch/commit or direct URL)
* Any special configuration required to reproduce the issue
* Step-by-step instructions to reproduce the issue
* Proof-of-concept or exploit code (if possible)
* Impact of the issue, including how an attacker might exploit the issue

This information will help us triage your report more quickly.

If you are reporting for a bug bounty, more complete reports can contribute to a higher bounty award. Please visit our [Microsoft Bug Bounty Program](https://aka.ms/security.md/msrc/bounty) page for more details about our active programs.

## Preferred Languages

We prefer all communications to be in English.

## Policy

Microsoft follows the principle of [Coordinated Vulnerability Disclosure](https://aka.ms/security.md/cvd).

--------------------------------------------------------------------------------
/SUPPORT.md:
--------------------------------------------------------------------------------

# TODO: The maintainer of this repo has not yet edited this file

**REPO OWNER**: Do you want Customer Service & Support (CSS) support for this product/project?

- **No CSS support:** Fill out this template with information about how to file issues and get help.
- **Yes CSS support:** Fill out an intake form at [aka.ms/onboardsupport](https://aka.ms/onboardsupport). CSS will work with/help you to determine next steps.
- **Not sure?** Fill out an intake as though the answer were "Yes". CSS will help you decide.

*Then remove this first heading from this SUPPORT.MD file before publishing your repo.*

# Support

## How to file issues and get help

This project uses GitHub Issues to track bugs and feature requests. Please search the existing issues before filing new issues to avoid duplicates. For new issues, file your bug or feature request as a new Issue.

For help and questions about using this project, please **REPO MAINTAINER: INSERT INSTRUCTIONS HERE FOR HOW TO ENGAGE REPO OWNERS OR COMMUNITY FOR HELP. COULD BE A STACK OVERFLOW TAG OR OTHER CHANNEL. WHERE WILL YOU HELP PEOPLE?**.

## Microsoft Support Policy

Support for this **PROJECT or PRODUCT** is limited to the resources listed above.

--------------------------------------------------------------------------------
/docs/_config.yml:
--------------------------------------------------------------------------------

theme: jekyll-theme-cayman

--------------------------------------------------------------------------------
/docs/css/styles.css:
--------------------------------------------------------------------------------

@import "https://cdn.jsdelivr.net/npm/bulma@0.9.3/css/bulma.min.css";
@import "https://cdn.jsdelivr.net/npm/@creativebulma/bulma-tooltip@1.2.0/dist/bulma-tooltip.min.css";

@media screen and (min-width: 1024px) {
    .container {
        max-width: 860px;
    }
}

.authors>span {
    padding: 0 0.5rem;
    display: inline-block;
}

@media only screen and (max-width: 480px) {
    a.button.is-rounded.is-link.is-light:not(:last-child) {
        margin-bottom: 0.75em;
    }
}

.footer-links a {
    color: inherit !important;
    padding: 0 1em;
}

--------------------------------------------------------------------------------
/docs/img/Microsoft-logo-only.svg:
--------------------------------------------------------------------------------
(SVG markup omitted)
--------------------------------------------------------------------------------
/docs/img/Microsoft-logo.svg:
--------------------------------------------------------------------------------
(SVG markup omitted)
--------------------------------------------------------------------------------
/docs/img/Microsoft-logo_rgb_c-gray.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/Microsoft-logo_rgb_c-gray.png
--------------------------------------------------------------------------------
/docs/img/Microsoft-logo_rgb_c-wht.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/Microsoft-logo_rgb_c-wht.png
--------------------------------------------------------------------------------
/docs/img/Microsoft-logo_rgb_wht.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/Microsoft-logo_rgb_wht.png
--------------------------------------------------------------------------------
/docs/img/dataset_samples.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/dataset_samples.jpg
--------------------------------------------------------------------------------
/docs/img/favicon.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/favicon.ico
--------------------------------------------------------------------------------
/docs/img/joints_uncertainty.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/joints_uncertainty.png
--------------------------------------------------------------------------------
/docs/img/plot_20_L_Wrist.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/plot_20_L_Wrist.png
--------------------------------------------------------------------------------
/docs/img/plot_21_R_Wrist.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/plot_21_R_Wrist.png
--------------------------------------------------------------------------------
/docs/img/plot_all_bold.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/plot_all_bold.png
--------------------------------------------------------------------------------
/docs/img/results.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/microsoft/SimpleEgo/c5b171e5aaabad62ee1f22dbe81f0c9de49168d9/docs/img/results.png
--------------------------------------------------------------------------------
/docs/index.html:
--------------------------------------------------------------------------------
65 |66 | International Conference on 3D Vision 2024 67 |
68 | 69 | 83 |113 | Our work addresses the problem of egocentric human pose estimation from downwards-facing cameras on 114 | head-mounted devices (HMD). 115 | This presents a challenging scenario, as parts of the body often fall outside of the image or are 116 | occluded. 117 | Previous solutions minimize this problem by using fish-eye camera lenses to capture a wider view, 118 | but these can present hardware design issues. 119 | They also predict 2D heat-maps per joint and lift them to 3D space to deal with self-occlusions, but 120 | this requires large network architectures which are impractical to deploy on resource-constrained 121 | HMDs. 122 | We predict pose from images captured with conventional rectilinear camera lenses. 123 | This resolves hardware design issues, but means body parts are often out of frame. 124 | As such, we directly regress probabilistic joint rotations represented as matrix Fisher 125 | distributions for a parameterized body model. 126 | This allows us to quantify pose uncertainties and explain out-of-frame or occluded joints. 127 | This also removes the need to compute 2D heat-maps and allows for simplified DNN architectures which 128 | require less compute. 129 | Given the lack of egocentric datasets using rectilinear camera lenses, we introduce the 130 | SynthEgo dataset, a synthetic dataset with 60K stereo images containing high diversity of 131 | pose, shape, clothing and skin tone. 132 | Our approach achieves state-of-the-art results for this challenging configuration, reducing mean 133 | per-joint position error by 23% overall and 58% for the lower body. 134 | Our architecture also has eight times fewer parameters and runs twice as fast as the current 135 | state-of-the-art. 136 | Experiments show that training on our synthetic dataset leads to good generalization to real world 137 | images without fine-tuning. 138 |
139 |152 | To construct the SynthEgo dataset we render 60K stereo pairs at 1280×720 pixel 153 | resolution, building on the pipeline of Hewitt et al. 154 | This dataset is comprised of 6000 unique identities, each performing 10 different poses in 10 155 | different lighting environments. 156 | Each identity is made up of a randomly sampled body shape, skin textures sampled from a library of 157 | 25 and randomly recolored, and clothing assets sampled from a library of 202. 158 | Lighting environments are sampled from a library of 489 HDRIs, to ensure correct disparity of the 159 | environment between the stereo pair, we project the HDRI background onto the ground plane. 160 | Poses are sampled from a library of over 2 million unique poses and randomly mirrored; sampling is 161 | weighted by the mean absolute joint angle and common poses like T-pose are significantly 162 | down-weighted to increase diversity. 163 |
164 | 165 |168 | | Mo2Cap2 170 | | 171 |xR-EgoPose | 172 |UnrealEgo | 173 |SynthEgo | 174 | 175 | 176 |
---|---|---|---|---|
Unique Identities | 178 |700 | 179 |46 | 180 |17 | 181 |6000 | 182 |
Environments | 185 |Unspecified | 186 |Unspecified | 187 |14 | 188 |489 | 189 |
Body Model | 192 |SMPL | 193 |Unspecified | 194 |UnrealEngine | 195 |SMPL-H | 196 |
Lens Type | 199 |Fisheye | 200 |Fisheye | 201 |Fisheye | 202 |Rectilinear | 203 |
Mono/Stereo | 206 |Mono | 207 |Mono | 208 |Stereo | 209 |Stereo | 210 |
Body Shape GT | 213 |214 | | 215 | | 216 | | ✓ | 217 |
Joint Location GT | 220 |✓ | 221 |✓ | 222 |✓ | 223 |✓ | 224 |
Joint Rotation GT | 227 |228 | | 229 | | 230 | | ✓ | 231 |
Realism | 234 |Low | 235 |Medium | 236 |High | 237 |High | 238 |
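
As a minimal sketch of the pose-sampling weighting described above (the exact scheme beyond "weighted by the mean absolute joint angle" is our assumption, and the pose library here is a stand-in):

```python
import numpy as np

def pose_sampling_weights(poses: np.ndarray) -> np.ndarray:
    """Weight each pose by its mean absolute joint angle so that
    near-neutral poses (e.g. T-pose) are sampled less often.

    poses: (P, 52, 3) axis-angle parameters per joint.
    """
    weights = np.abs(poses).mean(axis=(1, 2))
    return weights / weights.sum()  # normalized sampling probabilities

# Example: weighted sampling from a (stand-in) pose library.
rng = np.random.default_rng(0)
library = rng.normal(scale=0.3, size=(1000, 52, 3))
idx = rng.choice(len(library), size=10, replace=False, p=pose_sampling_weights(library))
```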

We position the camera on the front of the forehead, looking down at the body.
The camera uses a pinhole model approximating the ZED Mini stereo camera.
We add uniform noise within ±1 cm to the location and ±10° around all axes of rotation of the camera to simulate misplacement and movement of the HMD on the head.
The resulting images are typically quite challenging for pose estimation, as many parts of the body are often not seen by the camera.
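
As a concrete illustration of this noise model, a minimal sketch (function and variable names are ours, not from the released pipeline):

```python
import numpy as np

rng = np.random.default_rng(0)

def sample_hmd_noise():
    """Uniform HMD misplacement noise as described above:
    within ±1 cm in position and ±10° about each rotation axis."""
    d_pos = rng.uniform(-0.01, 0.01, size=3)              # metres
    d_rot = np.deg2rad(rng.uniform(-10.0, 10.0, size=3))  # radians, per axis
    return d_pos, d_rot
```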

The goal of our method is to estimate the probability distribution over joint rotations $\mathbf{R} = \{\mathbf{R}_i\}^{N}_{i=1}$ conditioned on input image data $\mathbf{X}$, $p(\mathbf{R}|\mathbf{X})$.
Following Sengupta et al., we train a neural network to regress Fisher parameters $\mathbf{F} = \{\mathbf{F}_i\}^{N}_{i=1}$ given input image data $\mathbf{X}$.
From these predicted parameters we can calculate the expected rotation $\mathbf{\hat{R}}_i$ and the concentration parameters $\kappa_{i,j}$ for each joint $i$; the latter describe the uncertainty of the rotation distribution.
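
In the matrix Fisher literature (e.g. Mohlin et al.), the mode and axis-wise concentrations are typically read off an SVD of $\mathbf{F}_i$; a sketch under that convention (the exact parameterization used in SimpleEgo may differ):

```python
import numpy as np

def fisher_mode_and_concentration(F: np.ndarray):
    """Mode (expected rotation) and per-axis concentrations of a
    matrix Fisher distribution with 3x3 parameter matrix F."""
    U, s, Vt = np.linalg.svd(F)
    d = np.sign(np.linalg.det(U) * np.linalg.det(Vt))  # ensure a proper rotation
    U_p = U @ np.diag([1.0, 1.0, d])
    s_p = np.array([s[0], s[1], d * s[2]])  # "proper" singular values
    R_hat = U_p @ Vt                        # mode of the distribution
    # Concentration about axis j grows with the other two singular values.
    kappa = np.array([s_p[1] + s_p[2], s_p[0] + s_p[2], s_p[0] + s_p[1]])
    return R_hat, kappa
```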

We train the neural network by minimizing the loss $\mathcal{L} = \mathcal{L}_{FNLL} + \mathcal{L}_J$.
$\mathcal{L}_{FNLL}$ is the matrix Fisher negative log-likelihood, promoting accurate local joint rotations:
$$
\mathcal{L}_{FNLL}=\sum_{i=1}^{N}\log(c(\mathbf{F}_i))-\text{tr}(\mathbf{F}_i^\top \mathbf{R}_i)
$$
$\mathcal{L}_J$ supervises the 3D joint positions regressed from the parametric body model, SMPL-H, with shape parameters $\boldsymbol\beta$ and joint regressor $\mathcal{J}$:
$$
\begin{aligned}
J_{3D}(\mathbf{R},\boldsymbol\beta)&=\mathcal{J}(\textit{SMPL-H}(\mathbf{R}, \boldsymbol\beta))\\
\mathcal{L}_{J}&=\left\| J_{3D}(\hat{\mathbf{R}},\boldsymbol\beta)-J_{3D}(\mathbf{R},\boldsymbol\beta) \right\|^2_2
\end{aligned}
$$
This causes the network to consider the effect of the predicted rotations on the final pose, as the positions of child joints are influenced by the rotations of their parents in the kinematic tree of our body model.
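
The normalizing constant $c(\mathbf{F})$ has no simple closed form, and practical implementations use an analytic approximation with custom gradients.
Purely to make the quantity concrete, here is a (slow) Monte Carlo estimate of the per-joint negative log-likelihood; this is an illustration, not the implementation used in the paper:

```python
import numpy as np

def random_rotations(n: int, rng) -> np.ndarray:
    """n rotation matrices drawn uniformly from SO(3), via unit quaternions."""
    q = rng.normal(size=(n, 4))
    q /= np.linalg.norm(q, axis=1, keepdims=True)
    w, x, y, z = q.T
    return np.stack([
        1 - 2*(y*y + z*z), 2*(x*y - w*z),     2*(x*z + w*y),
        2*(x*y + w*z),     1 - 2*(x*x + z*z), 2*(y*z - w*x),
        2*(x*z - w*y),     2*(y*z + w*x),     1 - 2*(x*x + y*y),
    ], axis=1).reshape(n, 3, 3)

def fisher_nll(F: np.ndarray, R_gt: np.ndarray, n_samples: int = 100_000) -> float:
    """Monte Carlo estimate of log c(F) - tr(F^T R_gt) for one joint.
    Numerically sensible only for modest concentrations; illustration only."""
    R = random_rotations(n_samples, np.random.default_rng(0))
    log_c = np.log(np.mean(np.exp(np.einsum("ij,nij->n", F, R))))
    return log_c - np.trace(F.T @ R_gt)
```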

PA-MPJPE (mm), lower is better:

| Input     | Method     | Upper Body | Lower Body | Hands  | All   |
|-----------|------------|------------|------------|--------|-------|
| Monocular | xR-EgoPose | 50.18      | 76.76      | 127.34 | 97.48 |
| Monocular | Ours       | 38.48      | 62.35      | 98.94  | 76.05 |
| Stereo    | UnrealEgo  | 48.06      | 77.06      | 117.85 | 91.67 |
| Stereo    | Ours       | 34.00      | 54.59      | 87.78  | 67.31 |

To evaluate performance on real-world data, we recorded a dataset of 8378 stereo-pair images from 11 different subjects performing actions such as squatting, sitting, stretching, crossing arms, and interacting with small objects.
Overall, our stereo network has the best performance.
We observe that the extra information provided by the right image helps the network to better predict extremities.
We also note that UnrealEgo and xR-EgoPose perform particularly poorly for lower-body joints.
This may be because the legs are not always visible, and 2D heat-maps cannot provide uncertainties for joints outside of the image frame.

Figure: Qualitative results of our method compared to recent work for synthetic and real data.

Figure: Axis-specific concentration for different joints. Concentration is lowest around the primary axis of rotation for a given joint.

Our paper demonstrates that the predicted uncertainty estimates capture extra information and priors about body pose, and shows empirically that the estimated uncertainties are reliable.
While the former allows us to better explain the predictions of the model, the latter is of significant importance when it comes to deploying our method in downstream tasks such as avatar animation, where uncertainty estimates can be used as a measure of how much the predicted poses can be relied upon.

Figure: Correlation of confidence with error; the higher the confidence, the lower the error. Our confidence estimates are therefore reliable for downstream use.
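
As a toy example of such downstream use, a consumer of the predictions might gate joints on their concentration before driving an avatar (the threshold and shapes here are illustrative, not from the paper):

```python
import numpy as np

def trustworthy_joints(kappa: np.ndarray, threshold: float = 10.0) -> np.ndarray:
    """Boolean mask of joints whose smallest axis-wise concentration exceeds
    a threshold; untrusted joints could fall back to a rest pose.

    kappa: (num_joints, 3) per-axis concentrations.
    """
    return np.asarray(kappa).min(axis=-1) > threshold
```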

```bibtex
@inproceedings{cuevas2024simpleego,
  title={{SimpleEgo}: Predicting probabilistic body pose from egocentric cameras},
  author={Cuevas-Velasquez, Hanz and Hewitt, Charlie and Aliakbarian, Sadegh and Baltru{\v{s}}aitis, Tadas},
  booktitle={2024 International Conference on 3D Vision (3DV)},
  pages={1446--1455},
  year={2024},
  organization={IEEE}
}
```