├── docs ├── _static │ └── .gitkeep ├── collections.rst ├── index.rst ├── Makefile ├── api.rst └── conf.py ├── .coveragerc ├── MANIFEST.in ├── eosdis_store ├── version.py ├── __init__.py ├── dmrpp.py └── stores.py ├── presentation ├── requirements.txt ├── images │ ├── summary.png │ ├── output_12_2.png │ ├── output_15_1.png │ ├── output_18_2.png │ ├── output_3_1.png │ ├── output_5_1.png │ ├── output_7_1.png │ ├── output_9_2.png │ └── request-overhead.png ├── tutorial.ipynb └── background.md ├── .flake8 ├── requirements.txt ├── requirements-dev.txt ├── .github ├── release-drafter.yml └── workflows │ ├── draft-release.yml │ ├── tests.yml │ └── publish-release.yml ├── CHANGELOG.md ├── scripts └── mkdmrpp ├── .gitignore ├── Makefile ├── setup.py ├── tests ├── test_dmrpp.py ├── test_stores.py └── fixtures │ ├── 20200911000001-JPL-L2P_GHRSST-SSTskin-MODIS_A-N-v02.0-fv01.0.zarr.json │ ├── 20200911000001-JPL-L2P_GHRSST-SSTskin-MODIS_A-N-v02.0-fv01.0.nc.dmrpp │ └── 3B-HHR.MS.MRG.3IMERG.20051022-S000000-E002959.0000.V06B.zarr.json ├── README.rst └── LICENSE /docs/_static/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /.coveragerc: -------------------------------------------------------------------------------- 1 | [run] 2 | source = . -------------------------------------------------------------------------------- /MANIFEST.in: -------------------------------------------------------------------------------- 1 | include requirements.txt 2 | -------------------------------------------------------------------------------- /eosdis_store/version.py: -------------------------------------------------------------------------------- 1 | __version__ = "0.1.6" 2 | -------------------------------------------------------------------------------- /presentation/requirements.txt: -------------------------------------------------------------------------------- 1 | matplotlib>=3.8.0 2 | h5py>=3.9.0 3 | -------------------------------------------------------------------------------- /.flake8: -------------------------------------------------------------------------------- 1 | [flake8] 2 | max-line-length = 99 3 | ignore = F401, W503 4 | -------------------------------------------------------------------------------- /presentation/images/summary.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/summary.png -------------------------------------------------------------------------------- /presentation/images/output_12_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/output_12_2.png -------------------------------------------------------------------------------- /presentation/images/output_15_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/output_15_1.png -------------------------------------------------------------------------------- /presentation/images/output_18_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/output_18_2.png -------------------------------------------------------------------------------- 
/presentation/images/output_3_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/output_3_1.png -------------------------------------------------------------------------------- /presentation/images/output_5_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/output_5_1.png -------------------------------------------------------------------------------- /presentation/images/output_7_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/output_7_1.png -------------------------------------------------------------------------------- /presentation/images/output_9_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/output_9_2.png -------------------------------------------------------------------------------- /presentation/images/request-overhead.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/nasa/zarr-eosdis-store/HEAD/presentation/images/request-overhead.png -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | CacheControl>=0.12.6 2 | requests>=2.23.0 3 | requests-futures>=1.0.0 4 | zarr>=2.7.1 5 | ipypb~=0.5 6 | xarray>=0.16 7 | numcodecs>=0.8.1 -------------------------------------------------------------------------------- /eosdis_store/__init__.py: -------------------------------------------------------------------------------- 1 | from .stores import EosdisStore, ConsolidatedChunkStore 2 | from .version import __version__ 3 | 4 | __all__ = ['EosdisStore', '__version__', 'version'] 5 | version = __version__ -------------------------------------------------------------------------------- /requirements-dev.txt: -------------------------------------------------------------------------------- 1 | setuptools >= 21.0.0 2 | pytest~=5.4 3 | flake8~=3.8 4 | safety >= 1.8.5 5 | coverage >= 4.5.4 6 | pygments ~= 2.9 7 | sphinx >= 3.2.1 8 | sphinx-rtd-theme >= 0.5.0 9 | recommonmark >= 0.7.1 10 | -------------------------------------------------------------------------------- /docs/collections.rst: -------------------------------------------------------------------------------- 1 | Compatible Collections 2 | ====================== 3 | 4 | Production collections coming soon 5 | 6 | Test Collections 7 | ---------------- 8 | 9 | The following collections are available for user testing and feedback. 10 | 11 | * Coming soon -------------------------------------------------------------------------------- /docs/index.rst: -------------------------------------------------------------------------------- 1 | .. include:: ../README.rst 2 | 3 | .. 
toctree:: 4 | :maxdepth: 2 5 | :caption: Contents: 6 | 7 | api 8 | collections 9 | 10 | Indices and tables 11 | ================== 12 | 13 | * :ref:`genindex` 14 | * :ref:`modindex` 15 | * :ref:`search` 16 | -------------------------------------------------------------------------------- /.github/release-drafter.yml: -------------------------------------------------------------------------------- 1 | version-resolver: 2 | major: 3 | labels: 4 | - 'major' 5 | minor: 6 | labels: 7 | - 'minor' 8 | patch: 9 | labels: 10 | - 'patch' 11 | default: patch 12 | name-template: 'v$RESOLVED_VERSION' 13 | tag-template: 'v$RESOLVED_VERSION' 14 | template: | 15 | $CHANGES 16 | -------------------------------------------------------------------------------- /.github/workflows/draft-release.yml: -------------------------------------------------------------------------------- 1 | name: Draft Release 2 | 3 | on: 4 | push: 5 | branches: 6 | - main 7 | 8 | jobs: 9 | build: 10 | runs-on: ubuntu-latest 11 | steps: 12 | - name: Release Drafter 13 | uses: release-drafter/release-drafter@v5.12.1 14 | env: 15 | GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} 16 | -------------------------------------------------------------------------------- /CHANGELOG.md: -------------------------------------------------------------------------------- 1 | # Changelog 2 | All notable changes to this project will be documented in this file. 3 | 4 | The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/) 5 | and this project adheres to [Semantic Versioning](http://semver.org/spec/v2.0.0.html). 6 | 7 | ## [Unreleased] 8 | 9 | ## [v0.1.0] - 2020-xx-xx 10 | 11 | Initial Release 12 | 13 | [Unreleased]: https://github.com///compare/master...develop 14 | [v0.1.0]: https://github.com///tree/0.1.0 15 | -------------------------------------------------------------------------------- /scripts/mkdmrpp: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | set -ex 4 | 5 | resolve_dir() { 6 | (builtin cd `dirname "${1/#~/$HOME}"`'/'`basename "${1/#~/$HOME}"` 2>/dev/null; if [ $? -eq 0 ]; then pwd; fi) 7 | } 8 | 9 | for var in "$@"; do 10 | filename=$(basename $var) 11 | dir=$(resolve_dir `dirname $var`) 12 | ext=h5 13 | echo $filename 14 | echo $dir 15 | 16 | cp $var $var.$ext 17 | docker run --rm -it -v $dir:/tmp --entrypoint get_dmrpp opendap/hyrax:snapshot -V -o /tmp/$filename.dmrpp /$filename.$ext 18 | rm -rf $dir/conf_* $dir/dmr_* $dir/hyrax_ux 19 | rm $var.$ext 20 | done 21 | -------------------------------------------------------------------------------- /docs/Makefile: -------------------------------------------------------------------------------- 1 | # Minimal makefile for Sphinx documentation 2 | # 3 | 4 | # You can set these variables from the command line, and also 5 | # from the environment for the first two. 6 | SPHINXOPTS ?= 7 | SPHINXBUILD ?= sphinx-build 8 | SOURCEDIR = . 9 | BUILDDIR = _build 10 | 11 | # Put it first so that "make" without argument is like "make help". 12 | help: 13 | @$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) 14 | 15 | .PHONY: help Makefile 16 | 17 | # Catch-all target: route all unknown targets to Sphinx using the new 18 | # "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS). 
19 | %: Makefile 20 | @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) 21 | -------------------------------------------------------------------------------- /docs/api.rst: -------------------------------------------------------------------------------- 1 | API Documentation 2 | ================= 3 | 4 | .. automodule:: eosdis_store 5 | :members: 6 | :special-members: 7 | :show-inheritance: 8 | 9 | 10 | Submodules 11 | ---------- 12 | 13 | eosdis_store.common module 14 | -------------------------- 15 | 16 | .. automodule:: eosdis_store.common 17 | :members: 18 | :undoc-members: 19 | :show-inheritance: 20 | 21 | eosdis_store.dmrpp module 22 | ------------------------- 23 | 24 | .. automodule:: eosdis_store.dmrpp 25 | :members: 26 | :undoc-members: 27 | :show-inheritance: 28 | 29 | eosdis_store.stores module 30 | -------------------------- 31 | 32 | .. automodule:: eosdis_store.stores 33 | :members: 34 | :special-members: 35 | :show-inheritance: 36 | 37 | -------------------------------------------------------------------------------- /.github/workflows/tests.yml: -------------------------------------------------------------------------------- 1 | name: Tests 2 | 3 | # More conservative about duplicate tests due to tests accessing real files 4 | on: [pull_request] 5 | 6 | jobs: 7 | build: 8 | runs-on: ubuntu-latest 9 | strategy: 10 | matrix: 11 | python-version: [3.8] 12 | 13 | steps: 14 | - uses: actions/checkout@v4 15 | 16 | - name: Set up Python ${{ matrix.python-version }} 17 | uses: actions/setup-python@v5 18 | with: 19 | python-version: ${{ matrix.python-version }} 20 | 21 | - uses: extractions/netrc@v1 22 | with: 23 | machine: uat.urs.earthdata.nasa.gov 24 | username: ${{ secrets.EDL_USER }} 25 | password: ${{ secrets.EDL_PASSWORD }} 26 | 27 | - name: Install dependencies 28 | run: | 29 | make install 30 | 31 | - name: Tests 32 | run: | 33 | make ci 34 | 35 | - name: Archive code coverage results 36 | uses: actions/upload-artifact@v4 37 | with: 38 | name: code-coverage-report 39 | path: htmlcov/* 40 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | # General 2 | tmp/ 3 | .DS_Store 4 | 5 | # Byte-compiled / optimized / DLL files 6 | __pycache__/ 7 | *.py[cod] 8 | *$py.class 9 | 10 | # C extensions 11 | *.so 12 | 13 | # Distribution / packaging 14 | .Python 15 | build/ 16 | develop-eggs/ 17 | dist/ 18 | downloads/ 19 | eggs/ 20 | .eggs/ 21 | lib/ 22 | lib64/ 23 | parts/ 24 | sdist/ 25 | var/ 26 | wheels/ 27 | share/python-wheels/ 28 | *.egg-info/ 29 | .installed.cfg 30 | *.egg 31 | MANIFEST 32 | docs/_build 33 | 34 | # PyInstaller 35 | # Usually these files are written by a python script from a template 36 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 
37 | *.manifest 38 | *.spec 39 | 40 | # Installer logs 41 | pip-log.txt 42 | pip-delete-this-directory.txt 43 | 44 | # Unit test / coverage reports 45 | htmlcov/ 46 | .tox/ 47 | .nox/ 48 | .coverage 49 | .coverage.* 50 | .cache 51 | nosetests.xml 52 | coverage.xml 53 | *.cover 54 | *.py,cover 55 | .hypothesis/ 56 | .pytest_cache/ 57 | cover/ 58 | 59 | # Jupyter Notebook 60 | .ipynb_checkpoints 61 | 62 | # IPython 63 | profile_default/ 64 | ipython_config.py 65 | 66 | # pyenv 67 | .python-version 68 | -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- 1 | .PHONY: venv-setup pyenv-setup install install-examples clean examples lint test test-watch ci docs 2 | .SILENT: virtualenv 3 | 4 | VERSION ?= $(shell git describe --tags | sed 's/-/\+/' | sed 's/-/\./g') 5 | REPO ?= https://upload.pypi.org/legacy/ 6 | REPO_USER ?= __token__ 7 | REPO_PASS ?= unset 8 | 9 | venv-setup: 10 | python -m venv .venv 11 | 12 | pyenv-setup: 13 | if ! type pyenv > /dev/null; \ 14 | then \ 15 | echo "\nUnable to create virtualenv: pyenv not found. Please install pyenv & pyenv-virtualenv."; \ 16 | echo " See:"; \ 17 | echo " https://github.com/pyenv/pyenv"; \ 18 | echo " https://github.com/pyenv/pyenv-virtualenv"; \ 19 | exit; \ 20 | else \ 21 | pyenv install 3.9.1; \ 22 | pyenv virtualenv 3.9.1 zarr-eosdis-store; \ 23 | pyenv activate zarr-eosdis-store; \ 24 | fi 25 | 26 | clean: 27 | coverage erase 28 | rm -rf htmlcov 29 | rm -rf build dist *.egg-info || true 30 | 31 | clean-docs: 32 | cd docs && $(MAKE) clean 33 | 34 | install: 35 | python -m pip install --upgrade pip 36 | pip install -r requirements.txt -r requirements-dev.txt 37 | 38 | lint: 39 | flake8 eosdis_store --show-source --statistics 40 | 41 | test: 42 | coverage run -m pytest 43 | 44 | ci: test 45 | coverage html 46 | 47 | build: clean 48 | sed -i.bak "s/__version__ .*/__version__ = \"$(VERSION)\"/" eosdis_store/version.py && rm eosdis_store/version.py.bak 49 | python -m pip install --upgrade --quiet setuptools wheel twine 50 | python setup.py --quiet sdist bdist_wheel 51 | 52 | publish: build 53 | python -m twine check dist/* 54 | python -m twine upload --username "$(REPO_USER)" --password "$(REPO_PASS)" --repository-url "$(REPO)" dist/* 55 | -------------------------------------------------------------------------------- /.github/workflows/publish-release.yml: -------------------------------------------------------------------------------- 1 | name: Publish Release 2 | 3 | on: 4 | release: 5 | types: [published] 6 | 7 | jobs: 8 | build: 9 | runs-on: ubuntu-latest 10 | steps: 11 | - uses: actions/checkout@v4 12 | with: 13 | fetch-depth: '0' 14 | - uses: actions/setup-python@v5 15 | with: 16 | python-version: '3.8' 17 | - shell: bash 18 | env: 19 | VERSION_TAG: ${{ github.event.release.tag_name }} 20 | BRANCH: ${{ github.event.release.target_commitish }} 21 | run: | 22 | make install 23 | VERSION=$(echo "${VERSION_TAG}" | cut -c2-) make build 24 | 25 | # Setup git 26 | # https://api.github.com/users/github-actions%5Bbot%5D 27 | git config --global user.name "github-actions[bot]" 28 | git config --global user.email "41898282+github-actions[bot]@users.noreply.github.com" 29 | 30 | # Commit and push updated release files 31 | git checkout -b "${BRANCH}" 32 | git add . 
33 | git commit -m "Update release version to ${VERSION_TAG}" 34 | git push origin "${BRANCH}" 35 | 36 | git tag --force "${VERSION_TAG}" 37 | git push --force origin "${VERSION_TAG}" 38 | - name: upload dists 39 | uses: actions/upload-artifact@v4 40 | with: 41 | name: release-dists 42 | path: dist/ 43 | 44 | pypi-publish: 45 | runs-on: ubuntu-latest 46 | needs: 47 | - build 48 | permissions: 49 | id-token: write 50 | 51 | steps: 52 | - name: Retrieve release distributions 53 | uses: actions/download-artifact@v4 54 | with: 55 | name: release-dists 56 | path: dist/ 57 | 58 | - name: Publish release distributions to PyPI 59 | uses: pypa/gh-action-pypi-publish@release/v1 60 | -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | from setuptools import setup, find_packages 3 | from imp import load_source 4 | from os import path 5 | import io 6 | 7 | # use README for setup desciption 8 | with open("README.rst", "r") as f: 9 | long_description = f.read() 10 | 11 | # get version of package 12 | __version__ = load_source('eosdis_store.version', 'eosdis_store/version.py').__version__ 13 | 14 | # get the dependencies and installs 15 | with io.open(path.join(path.abspath(path.dirname(__file__)), 'requirements.txt'), encoding='utf-8') as f: 16 | all_reqs = f.read().split('\n') 17 | 18 | # remove direct installs from github 19 | install_requires = [x.strip() for x in all_reqs if 'git+' not in x] 20 | dependency_links = [x.strip().replace('git+', '') for x in all_reqs if 'git+' in x] 21 | 22 | # get dev dependencies 23 | with io.open(path.join(path.abspath(path.dirname(__file__)), 'requirements-dev.txt'), encoding='utf-8') as f: 24 | dev_reqs = f.read().split('\n') 25 | 26 | 27 | setup( 28 | name="zarr-eosdis-store", 29 | version=__version__, 30 | author="Patrick Quinn, Matthew Hanson", 31 | author_email="patrick@patrickquinn.net", 32 | description="Zarr Store class for working with EOSDIS cloud data", 33 | long_description=long_description, 34 | long_description_content_type="text/markdown", 35 | url="https://github.com/nasa/zarr-eosdis-store", 36 | packages=find_packages(exclude=['docs', 'tests*']), 37 | classifiers=[ 38 | 'Development Status :: 7 - Inactive', 39 | 'Intended Audience :: Developers', 40 | 'Intended Audience :: Science/Research', 41 | 'License :: OSI Approved :: Apache Software License', 42 | 'Programming Language :: Python :: 3', 43 | 'Programming Language :: Python :: 3.8', 44 | 'Programming Language :: Python :: 3 :: Only', 45 | ], 46 | python_requires='>=3.8', 47 | install_requires=install_requires, 48 | dependency_links=dependency_links, 49 | extras_require={ 50 | 'dev': dev_reqs # Run `pip install -e .[dev]` to install dev dependencies 51 | }, 52 | ) 53 | -------------------------------------------------------------------------------- /docs/conf.py: -------------------------------------------------------------------------------- 1 | # Configuration file for the Sphinx documentation builder. 2 | # 3 | # This file only contains a selection of the most common options. For a full 4 | # list see the documentation: 5 | # https://www.sphinx-doc.org/en/master/usage/configuration.html 6 | 7 | # -- Path setup -------------------------------------------------------------- 8 | 9 | # If extensions (or modules to document with autodoc) are in another directory, 10 | # add these directories to sys.path here. 
If the directory is relative to the 11 | # documentation root, use os.path.abspath to make it absolute, like shown here. 12 | # 13 | import os 14 | import sys 15 | sys.path.insert(0, os.path.abspath('../')) 16 | 17 | import sphinx_rtd_theme 18 | 19 | from importlib.machinery import SourceFileLoader 20 | 21 | module_path = os.path.abspath('../eosdis_store/version.py') 22 | module = SourceFileLoader('eosdis_store.version', module_path).load_module(None) 23 | 24 | # -- Project information ----------------------------------------------------- 25 | 26 | project = 'zarr-eosdis-store' 27 | copyright = '2020 United States Government as represented by the Administrator of the National Aeronautics and Space Administration. All Rights Reserved.' 28 | author = 'Patrick Quinn, Matthew Hanson' 29 | 30 | # The full version, including alpha/beta/rc tags 31 | release = module.__version__ 32 | 33 | # -- General configuration --------------------------------------------------- 34 | 35 | # Add any Sphinx extension module names here, as strings. They can be 36 | # extensions coming with Sphinx (named 'sphinx.ext.*') or your custom 37 | # ones. 38 | extensions = [ 39 | 'sphinx.ext.autodoc', 40 | 'sphinx_rtd_theme', 41 | 'recommonmark' 42 | ] 43 | 44 | # Add any paths that contain templates here, relative to this directory. 45 | templates_path = ['_templates'] 46 | 47 | # List of patterns, relative to source directory, that match files and 48 | # directories to ignore when looking for source files. 49 | # This pattern also affects html_static_path and html_extra_path. 50 | exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store'] 51 | 52 | source_suffix = { 53 | '.rst': 'restructuredtext', 54 | '.txt': 'markdown', 55 | '.md': 'markdown', 56 | } 57 | 58 | # -- Options for HTML output ------------------------------------------------- 59 | 60 | # The theme to use for HTML and HTML Help pages. See the documentation for 61 | # a list of builtin themes. 62 | # 63 | html_theme = 'sphinx_rtd_theme' 64 | 65 | # Add any paths that contain custom static files (such as style sheets) here, 66 | # relative to this directory. They are copied after the builtin static files, 67 | # so a file named "default.css" will overwrite the builtin "default.css". 
68 | html_static_path = ['_static'] -------------------------------------------------------------------------------- /tests/test_dmrpp.py: -------------------------------------------------------------------------------- 1 | import json 2 | import os 3 | import unittest 4 | from xml.etree import ElementTree 5 | 6 | import requests 7 | 8 | import eosdis_store.dmrpp as dmr 9 | 10 | 11 | testpath = os.path.dirname(__file__) 12 | 13 | s3_folder = 'https://harmony.uat.earthdata.nasa.gov/service-results/harmony-uat-eedtest-data/zarr-store' 14 | 15 | class Test(unittest.TestCase): 16 | 17 | test_files = [ 18 | f'{s3_folder}/f16_ssmis_20051022v7.nc.dmrpp', 19 | f'{s3_folder}/3B-HHR.MS.MRG.3IMERG.20051022-S000000-E002959.0000.V06B.HDF5.dmrpp', 20 | # MODIS data 21 | 'https://archive.podaac.uat.earthdata.nasa.gov/podaac-uat-cumulus-protected/MODIS_A-JPL-L2P-v2019.0/20200911000001-JPL-L2P_GHRSST-SSTskin-MODIS_A-N-v02.0-fv01.0.nc.dmrpp', 22 | ] 23 | 24 | @classmethod 25 | def get_test_xml(cls, idx=0): 26 | dmrpp = requests.get(cls.test_files[idx]).text 27 | tree = ElementTree.fromstring(dmrpp) 28 | return tree 29 | 30 | def test_find_child(self): 31 | tree = self.get_test_xml() 32 | node = dmr.find_child(tree, 'HDF5_GLOBAL') 33 | assert(node.attrib['name'] == 'HDF5_GLOBAL') 34 | 35 | def test_get_attribute_values(self): 36 | xml = 'T' 37 | node = ElementTree.fromstring(xml) 38 | vals = dmr.get_attribute_values(node) 39 | assert(vals == 'T') 40 | # TODO - test lists 41 | 42 | def test_get_attributes(self): 43 | tree = self.get_test_xml() 44 | node = dmr.find_child(tree, 'HDF5_GLOBAL') 45 | arr = dmr.get_attributes(node) 46 | assert(arr['chunksize'] == '90') 47 | assert(arr['Conventions'] == 'CF-1.6') 48 | assert(arr['numberofpasses'] == '2') 49 | 50 | def test_get_dimensions(self): 51 | tree = self.get_test_xml() 52 | dims = dmr.get_dimensions(tree) 53 | assert(len(dims) == 3) 54 | assert('/time' in dims.keys()) 55 | assert('/latitude' in dims.keys()) 56 | assert('/longitude' in dims.keys()) 57 | assert(dims['/latitude']['size'] == 720) 58 | 59 | def test_chunks_to_zarr_single(self): 60 | tree = self.get_test_xml() 61 | node = tree.find(".//d:Float32[@name='latitude']/dpp:chunks", dmr.NS) 62 | chunks = dmr.chunks_to_zarr(node) 63 | assert('zarray' in chunks) 64 | assert('zchunkstore' in chunks) 65 | assert(chunks['zchunkstore']['0']['offset'] == 106784) 66 | assert(chunks['zchunkstore']['0']['size'] == 2880) 67 | 68 | def test_chunks_to_zarr_multi(self): 69 | tree = self.get_test_xml() 70 | node = tree.find(".//d:Int16[@name='sst_dtime']/dpp:chunks", dmr.NS) 71 | chunks = dmr.chunks_to_zarr(node) 72 | assert('zarray' in chunks) 73 | assert('zchunkstore' in chunks) 74 | assert(len(chunks['zchunkstore']) == 128) 75 | assert(chunks['zchunkstore']['0.7.15']['size'] == 4324) 76 | 77 | def test_array_to_zarr(self): 78 | tree = self.get_test_xml() 79 | dims = dmr.get_dimensions(tree) 80 | assert(dims['/longitude']['size'] == 1440) 81 | # test on wind_speed array 82 | node = tree.find(".//d:Int16[@name='wind_speed']", dmr.NS) 83 | arr = dmr.array_to_zarr(node, dims) 84 | assert('wind_speed/.zarray' in arr) 85 | assert('wind_speed/.zattrs' in arr) 86 | assert('wind_speed/.zchunkstore' in arr) 87 | assert(arr['wind_speed/.zattrs']['_ARRAY_DIMENSIONS'] == ['time', 'latitude', 'longitude']) 88 | assert(arr['wind_speed/.zchunkstore']['0.6.11']['size'] == 888) 89 | # test on latitude array 90 | node = tree.find(".//d:Float32[@name='latitude']", dmr.NS) 91 | arr = dmr.array_to_zarr(node, dims) 92 | 
assert('latitude/.zarray' in arr) 93 | assert('latitude/.zattrs' in arr) 94 | assert('latitude/.zchunkstore' in arr) 95 | assert(arr['latitude/.zattrs']['_ARRAY_DIMENSIONS'] == ['latitude']) 96 | assert(arr['latitude/.zchunkstore']['0']['size'] == 2880) 97 | 98 | def test_to_zarr(self): 99 | tree = self.get_test_xml() 100 | zarr = dmr.to_zarr(tree) 101 | with open(os.path.join(testpath, 'fixtures', 'f16_ssmis_20051022v7.zarr.json')) as f: 102 | fixture = json.loads(f.read()) 103 | json1 = json.dumps(fixture, sort_keys=True) 104 | json2 = json.dumps(zarr, sort_keys=True) 105 | assert(json1 == json2) 106 | 107 | def test_to_zarr_more_examples(self): 108 | for i in range(2, len(self.test_files)): 109 | tree = self.get_test_xml(i) 110 | zarr = dmr.to_zarr(tree) 111 | 112 | bname = os.path.splitext(os.path.basename(self.test_files[i].replace('.dmrpp', '')))[0] 113 | with open(os.path.join(testpath, 'fixtures', f"{bname}.zarr.json")) as f: 114 | fixture = json.loads(f.read()) 115 | json1 = json.dumps(fixture, sort_keys=True) 116 | json2 = json.dumps(zarr, sort_keys=True) 117 | assert(json1 == json2) 118 | 119 | def test_deflate_shuffle(self): 120 | filename = '20210715090000-JPL-L4_GHRSST-SSTfnd-MUR-GLOB-v02.0-fv04.1.nc.dmrpp' 121 | with open(os.path.join(testpath, 'fixtures', filename)) as f: 122 | dmrpp = f.read() 123 | tree = ElementTree.fromstring(dmrpp) 124 | zarr = dmr.to_zarr(tree) 125 | attributes = zarr['analysed_sst/.zarray'] 126 | expected = { 127 | 'zarr_format': 2, 128 | 'filters': [{'id': 'shuffle', 'elementsize': 2}], 129 | 'order': 'C', 130 | 'dtype': '`_ instead. 5 | 6 | ---- 7 | 8 | .. image:: https://img.shields.io/badge/maintenance-no--longer--maintained-red 9 | :alt: No Longer Maintained 10 | 11 | zarr-eosdis-store 12 | ================= 13 | 14 | The zarr-eosdis-store library allows NASA EOSDIS Collections to be accessed efficiently 15 | by the `Zarr Python library <https://zarr.readthedocs.io>`_, provided they 16 | have a sidecar DMR++ metadata file generated. 17 | 18 | Installation 19 | ============ 20 | 21 | This module requires Python 3.8 or greater:: 22 | 23 | $ python --version 24 | Python 3.8.2 25 | 26 | Install from PyPI:: 27 | 28 | $ pip install zarr-eosdis-store 29 | 30 | To install the latest development version:: 31 | 32 | $ pip install git+https://github.com/nasa/zarr-eosdis-store.git@main#egg=zarr-eosdis-store 33 | 34 | Earthdata Login 35 | =============== 36 | 37 | To access EOSDIS data, you need to sign in with a free NASA Earthdata Login account, which you can obtain at 38 | `<https://urs.earthdata.nasa.gov>`_. 39 | 40 | Once you have an account, you will need to add your credentials to your ``~/.netrc`` file:: 41 | 42 | machine urs.earthdata.nasa.gov login YOUR_USERNAME password YOUR_PASSWORD 43 | 44 | If you are accessing test data, you will need to use an account from the Earthdata Login test system at 45 | `<https://uat.urs.earthdata.nasa.gov>`_ instead, adding a corresponding line to your ``~/.netrc`` file:: 46 | 47 | machine uat.urs.earthdata.nasa.gov login YOUR_USERNAME password YOUR_PASSWORD 48 | 49 | 50 | Usage 51 | ===== 52 | 53 | To use the library, simply instantiate ``eosdis_store.EosdisStore`` with the URL to the data file you would 54 | like to access, pass it to the Zarr library as you would with any other store, and use the Zarr API as with any 55 | other read-only Zarr file. Note: the URL to the data file will typically end with an HDF5 or NetCDF4 extension, 56 | not .zarr. 57 | 58 | ..
code-block:: python 59 | 60 | from eosdis_store import EosdisStore 61 | import zarr 62 | 63 | # Assumes you have set up .netrc with your Earthdata Login information 64 | f = zarr.open(EosdisStore('https://example.com/your/data/file.nc4')) 65 | 66 | # Read metadata and data from f using the Zarr API 67 | print(f['parameter_name'][0:10]) 68 | 69 | If the data has _FillValue (to flag nodata), scale_factor, or add_offset set (defined in metadata using CF conventions), 70 | they can be retrieved from the parameter attributes. 71 | 72 | .. code-block:: python 73 | 74 | import numpy as np 75 | 76 | scale_factor = f['parameter_name'].attrs['scale_factor'] 77 | add_offset = f['parameter_name'].attrs['add_offset'] 78 | nodata = f['parameter_name'].attrs['_FillValue'] 79 | 80 | arr = f['parameter_name'][:] * scale_factor + add_offset 81 | 82 | nodata_locs = np.where(arr == nodata) 83 | 84 | 85 | A better way to handle these is to use XArray. Rather than reading the data immediately when a slice is requested, XArray 86 | defers the read until the data is actually accessed. With the Zarr backend to XArray, the scale and offset can be recorded so that 87 | they are applied when the data is accessed. This is more efficient if the data is going to be used in other operations. 88 | 89 | The scale_factor and add_offset will be used if specified in the NetCDF/HDF5 file. 90 | 91 | .. code-block:: python 92 | 93 | import xarray 94 | 95 | store = EosdisStore('https://example.com/your/data/file.nc4') 96 | 97 | f = xarray.open_zarr(store) 98 | 99 | # the data is not read yet 100 | xa = f['parameter_name'] 101 | 102 | # convert to numpy array, data is read 103 | arr = xa.values 104 | 105 | The resulting array will have had scale and offset applied, and any element that is equal to the _FillValue attribute will be 106 | set to numpy `nan`. To use XArray without applying the scale and offset or setting the nodata to `nan`, set the `mask_and_scale` 107 | keyword of xarray.open_zarr to False: 108 | 109 | .. code-block:: python 110 | 111 | store = EosdisStore('https://example.com/your/data/file.nc4') 112 | 113 | f = xarray.open_zarr(store, mask_and_scale=False) 114 | 115 | 116 | Technical Summary 117 | ================= 118 | 119 | We make use of a technique to read NetCDF4 and some HDF5 files that was prototyped by The HDF Group and USGS, described 120 | `here <https://medium.com/pangeo/cloud-performant-reading-of-netcdf4-hdf5-data-using-the-zarr-library-1a95c5c92314>`_. 121 | 122 | To allow the technique to work with EOSDIS data, we have extended it and optimized access in the following key ways: 123 | 124 | * The ``EosdisStore`` reads a DMR++ file generated by OPeNDAP to present its metadata and determine byte offsets to the 125 | Zarr library. By reusing these, we avoid needing to generate new metadata sidecar files to support new data. 126 | 127 | * The store uses HTTPS and authenticates with a ``.netrc`` entry, rather than the S3 API, making it compatible with 128 | EOSDIS access patterns and requirements. 129 | 130 | * The store caches redirect URLs for a period of time set by the Cache-Control header. Doing this avoids the overhead 131 | of repeated redirects when accessing parts of files. 132 | 133 | * The store uses a parallel API that allows it to make more efficient access optimizations (sketched below): 134 | 135 | * When the Zarr library accesses data that requires reading multiple near-sequential bytes in the file, the store combines 136 | these smaller requests into a single larger request. 137 | 138 | * After an initial request to cache any authentication and redirect information, the store runs subsequent requests in 139 | parallel.
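The range-combining behavior described in the bullets above can be pictured with a small, self-contained sketch. This is illustrative only, not the library's implementation; the function name ``coalesce_ranges`` and the 10,000-byte gap threshold are assumptions made for the example.

.. code-block:: python

    def coalesce_ranges(chunks, max_gap=10_000):
        """Group (key, offset, size) chunk requests into larger byte ranges.

        Chunks that begin within ``max_gap`` bytes of the end of the previous
        chunk are served by a single HTTP Range request.
        """
        groups = []
        current = None  # (start, end, keys)
        for key, offset, size in sorted(chunks, key=lambda c: c[1]):
            if current and offset - current[1] <= max_gap:
                # Close enough to the previous chunk: extend the current range
                current = (current[0], max(current[1], offset + size), current[2] + [key])
            else:
                # Too far away: finish the current range and start a new one
                if current:
                    groups.append(current)
                current = (offset, offset + size, [key])
        if current:
            groups.append(current)
        return groups

    # Two nearly adjacent chunks collapse into one request; a distant chunk gets its own.
    ranges = [('a/0.0', 0, 100), ('a/0.1', 120, 100), ('a/0.2', 50_000, 100)]
    print(coalesce_ranges(ranges))
    # [(0, 220, ['a/0.0', 'a/0.1']), (50000, 50100, ['a/0.2'])]

The store applies this kind of grouping to the (key, offset, size) tuples it derives from the DMR++ chunk index before issuing its parallel range requests.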
140 | 141 | Development 142 | =========== 143 | 144 | Clone the repository, then ``pip install`` its dependencies:: 145 | 146 | pip install -r requirements.txt 147 | pip install -r requirements-dev.txt 148 | 149 | To check code coverage and run tests:: 150 | 151 | coverage run -m pytest 152 | 153 | To check coding style:: 154 | 155 | flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics 156 | 157 | To build documentation, generated at ``docs/_build/html/index.html``:: 158 | 159 | cd docs && make html 160 | -------------------------------------------------------------------------------- /tests/test_stores.py: -------------------------------------------------------------------------------- 1 | import json 2 | import os 3 | import unittest 4 | from xml.etree import ElementTree 5 | 6 | import numpy as np 7 | import requests 8 | import xarray 9 | import zarr 10 | 11 | from eosdis_store import EosdisStore, ConsolidatedChunkStore 12 | 13 | testpath = os.path.dirname(__file__) 14 | 15 | s3_folder = 'https://harmony.uat.earthdata.nasa.gov/service-results/harmony-uat-eedtest-data/zarr-store' 16 | 17 | fixtures = [ 18 | { 19 | "url": f"{s3_folder}/f16_ssmis_20051022v7.nc", 20 | "aoi": (0, slice(400, 549, None), slice(1040, 1261, None)) 21 | }, 22 | { 23 | "url": f"{s3_folder}/3B-HHR.MS.MRG.3IMERG.20051022-S000000-E002959.0000.V06B.HDF5", 24 | "aoi": (0, slice(800, 1351, None), slice(1000, 1371, None)) 25 | }, 26 | { 27 | "url": "https://archive.podaac.uat.earthdata.nasa.gov/podaac-uat-cumulus-protected/MODIS_A-JPL-L2P-v2019.0/20200911000001-JPL-L2P_GHRSST-SSTskin-MODIS_A-N-v02.0-fv01.0.nc", 28 | "aoi": (0, slice(1800, 2000, None), slice(100, 400, None)) 29 | }, 30 | { 31 | "url": "https://archive.podaac.uat.earthdata.nasa.gov/podaac-uat-cumulus-protected/MODIS_A-JPL-L2P-v2019.0/20200911004001-JPL-L2P_GHRSST-SSTskin-MODIS_A-D-v02.0-fv01.0.nc", 32 | "aoi": (0, slice(1800, 2000, None), slice(100, 400, None)) 33 | } 34 | ] 35 | 36 | 37 | def open_eosdis_store(idx=0): 38 | return EosdisStore(fixtures[idx]["url"], fixtures[idx]["url"] + ".dmrpp") 39 | 40 | 41 | class TestZarr(unittest.TestCase): 42 | 43 | @classmethod 44 | def get_test_xml(cls, idx=0): 45 | url = fixtures[idx]["url"] 46 | dmrpp = requests.get(url + '.dmrpp').text 47 | tree = ElementTree.fromstring(dmrpp) 48 | return tree 49 | 50 | def test_eosdis_store_metadata(self): 51 | store = open_eosdis_store() 52 | keys = list(store.keys()) 53 | assert(len(keys) == 26) 54 | # test default dmr_url 55 | store = EosdisStore(fixtures[0]["url"]) 56 | keys = list(store.keys()) 57 | assert(len(keys) == 26) 58 | 59 | def test_eosdis_store_open(self): 60 | store = zarr.open(open_eosdis_store()) 61 | arrays = list(store.arrays()) 62 | assert(len(arrays) == 8) 63 | assert(arrays[0][0] == 'atmosphere_cloud_liquid_water_content') 64 | arr = arrays[0][1] 65 | assert(type(arr) == zarr.core.Array) 66 | assert(arr.name == '/atmosphere_cloud_liquid_water_content') 67 | assert(arr.shape == (2, 720, 1440)) 68 | 69 | def test_eosdis_store_read(self): 70 | store = zarr.open(open_eosdis_store()) 71 | arr = store['wind_speed'][fixtures[0]["aoi"]] 72 | assert(arr.shape == (149, 221)) 73 | assert(arr[0][0] == 19) 74 | assert(arr.mean() == 169.29050381123022) 75 | 76 | def test_eosdis_store_getranges_combined(self): 77 | store = open_eosdis_store() 78 | ranges = [ 79 | ('wind_speed/0.4.11', 768280, 6830), 80 | ('wind_speed/0.4.12', 775112, 5759) 81 | ] 82 | result = store._getranges(ranges) 83 | assert(len(result) == 2) 84 | assert(len(store.responses) == 1) 85 | 
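# Added commentary, not part of the original test file: in the combined-ranges test
# above, the second chunk ('wind_speed/0.4.12') starts at byte 775112, only 2 bytes
# past the end of the first chunk (768280 + 6830 = 775110), so _getranges is expected
# to coalesce both chunks into a single HTTP range request (one entry in
# store.responses). In the split test below, the second offset (785112) leaves a gap
# of roughly 10,000 bytes, which exceeds the store's maximum-gap threshold, so two
# separate requests are expected.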
86 | def test_eosdis_store_getranges_split(self): 87 | store = open_eosdis_store() 88 | ranges = [ 89 | ('wind_speed/0.4.11', 768280, 6830), 90 | ('wind_speed/0.4.12', 785112, 5759) 91 | ] 92 | result = store._getranges(ranges) 93 | assert(len(result) == 2) 94 | assert(len(store.responses) == 2) 95 | 96 | def test_eosdis_store_parallel_reads(self): 97 | store = zarr.open(open_eosdis_store()) 98 | arr = store['wind_speed'][fixtures[0]["aoi"]] 99 | responses = store.store.responses 100 | end_time = responses[0].start + responses[1].elapsed 101 | for r in responses[1:]: 102 | assert(r.start < end_time) 103 | 104 | 105 | class TestXArray(unittest.TestCase): 106 | 107 | @classmethod 108 | def _setUpClass(cls): 109 | store = open_eosdis_store(2) 110 | # use patched zarr metadata file as workaround to incorrect DMR++ files showing Int8 datasets as Int16 111 | fix = fixtures[2] 112 | bname = f"{os.path.splitext(os.path.basename(fix['url']))[0]}.zarr.json" 113 | with open(os.path.join(testpath, 'fixtures', bname)) as f: 114 | meta = json.loads(f.read()) 115 | 116 | store = ConsolidatedChunkStore(meta, fix["url"]) 117 | 118 | cls.xa_noscale = xarray.open_zarr(store, mask_and_scale=False) 119 | cls.xa = xarray.open_zarr(store, mask_and_scale=True) 120 | 121 | def test_scale_offset(self): 122 | store = open_eosdis_store(0) 123 | var = 'wind_speed' 124 | 125 | xa_noscale = xarray.open_zarr(store, mask_and_scale=False) 126 | xa = xarray.open_zarr(store, mask_and_scale=True) 127 | 128 | # get values without scale and offset 129 | wv = xa_noscale[var] 130 | assert(hasattr(wv, "scale_factor")) 131 | assert(hasattr(wv, "add_offset")) 132 | arr = wv[fixtures[0]["aoi"]] 133 | mean = arr.mean().item() 134 | scale_factor = wv.scale_factor 135 | add_offset = wv.add_offset 136 | 137 | # test with scale and offset 138 | wv = xa[var] 139 | assert(not hasattr(wv, "scale_factor")) 140 | assert(not hasattr(wv, "add_offset")) 141 | arr = wv[fixtures[0]["aoi"]] 142 | 143 | self.assertAlmostEqual(arr.mean().item(), mean * scale_factor + add_offset, places=5) 144 | 145 | def test_fillvalue(self): 146 | # use patched zarr metadata file as workaround to incorrect DMR++ files showing Int8 datasets as Int16 147 | fix = fixtures[2] 148 | bname = f"{os.path.splitext(os.path.basename(fix['url']))[0]}.zarr.json" 149 | with open(os.path.join(testpath, 'fixtures', bname)) as f: 150 | meta = json.loads(f.read()) 151 | 152 | store = ConsolidatedChunkStore(meta, fix["url"]) 153 | 154 | xa = xarray.open_zarr(store, mask_and_scale=True) 155 | 156 | var = 'sea_surface_temperature' 157 | 158 | # do not apply mask - check that fill value exists and calculate mean excluding them 159 | xa_nofill = xarray.open_zarr(store, mask_and_scale=False) 160 | arr = xa_nofill[var][fix["aoi"]].values 161 | locs = np.where(arr == xa_nofill['sea_surface_temperature']._FillValue) 162 | assert(len(locs[0]) > 0) 163 | mean = arr[arr != xa_nofill['sea_surface_temperature']._FillValue].mean() 164 | mean = mean * xa_nofill['sea_surface_temperature'].scale_factor + xa_nofill['sea_surface_temperature'].add_offset 165 | 166 | # apply mask and use numpy nanmean function to calculate mean 167 | arr2 = xa[var][fix["aoi"]].values 168 | mean2 = np.nanmean(arr2) 169 | 170 | self.assertAlmostEqual(mean, mean2, places=4) 171 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | Copyright © 2019-2021 United States Government as represented by the 
Administrator of the National Aeronautics and Space Administration. All Rights Reserved. 2 | 3 | Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. 4 | You may obtain a copy of the License at 5 | 6 | http://www.apache.org/licenses/LICENSE-2.0 7 | 8 | Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, 9 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. 10 | 11 | --- 12 | 13 | TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION 14 | 15 | 1. Definitions. 16 | 17 | "License" shall mean the terms and conditions for use, reproduction, and distribution as defined by Sections 1 through 9 of this document. 18 | 19 | "Licensor" shall mean the copyright owner or entity authorized by the copyright owner that is granting the License. 20 | 21 | "Legal Entity" shall mean the union of the acting entity and all other entities that control, are controlled by, or are under common control with that entity. For the purposes of this definition, "control" means (i) the power, direct or indirect, to cause the direction or management of such entity, whether by contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the outstanding shares, or (iii) beneficial ownership of such entity. 22 | 23 | "You" (or "Your") shall mean an individual or Legal Entity exercising permissions granted by this License. 24 | 25 | "Source" form shall mean the preferred form for making modifications, including but not limited to software source code, documentation source, and configuration files. 26 | 27 | "Object" form shall mean any form resulting from mechanical transformation or translation of a Source form, including but not limited to compiled object code, generated documentation, and conversions to other media types. 28 | 29 | "Work" shall mean the work of authorship, whether in Source or Object form, made available under the License, as indicated by a copyright notice that is included in or attached to the work (an example is provided in the Appendix below). 30 | 31 | "Derivative Works" shall mean any work, whether in Source or Object form, that is based on (or derived from) the Work and for which the editorial revisions, annotations, elaborations, or other modifications represent, as a whole, an original work of authorship. For the purposes of this License, Derivative Works shall not include works that remain separable from, or merely link (or bind by name) to the interfaces of, the Work and Derivative Works thereof. 32 | 33 | "Contribution" shall mean any work of authorship, including the original version of the Work and any modifications or additions to that Work or Derivative Works thereof, that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. 
For the purposes of this definition, "submitted" means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Work, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as "Not a Contribution." 34 | 35 | "Contributor" shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work. 36 | 37 | 2. Grant of Copyright License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare Derivative Works of, publicly display, publicly perform, sublicense, and distribute the Work and such Derivative Works in Source or Object form. 38 | 39 | 3. Grant of Patent License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this section) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Work, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Work to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Work or a Contribution incorporated within the Work constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for that Work shall terminate as of the date such litigation is filed. 40 | 41 | 4. Redistribution. You may reproduce and distribute copies of the Work or Derivative Works thereof in any medium, with or without modifications, and in Source or Object form, provided that You meet the following conditions: 42 | 43 | You must give any other recipients of the Work or Derivative Works a copy of this License; and 44 | You must cause any modified files to carry prominent notices stating that You changed the files; and 45 | You must retain, in the Source form of any Derivative Works that You distribute, all copyright, patent, trademark, and attribution notices from the Source form of the Work, excluding those notices that do not pertain to any part of the Derivative Works; and 46 | If the Work includes a "NOTICE" text file as part of its distribution, then any Derivative Works that You distribute must include a readable copy of the attribution notices contained within such NOTICE file, excluding those notices that do not pertain to any part of the Derivative Works, in at least one of the following places: within a NOTICE text file distributed as part of the Derivative Works; within the Source form or documentation, if provided along with the Derivative Works; or, within a display generated by the Derivative Works, if and wherever such third-party notices normally appear. The contents of the NOTICE file are for informational purposes only and do not modify the License. 
You may add Your own attribution notices within Derivative Works that You distribute, alongside or as an addendum to the NOTICE text from the Work, provided that such additional attribution notices cannot be construed as modifying the License. 47 | 48 | You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions for use, reproduction, or distribution of Your modifications, or for any such Derivative Works as a whole, provided Your use, reproduction, and distribution of the Work otherwise complies with the conditions stated in this License. 49 | 50 | 5. Submission of Contributions. Unless You explicitly state otherwise, any Contribution intentionally submitted for inclusion in the Work by You to the Licensor shall be under the terms and conditions of this License, without any additional terms or conditions. Notwithstanding the above, nothing herein shall supersede or modify the terms of any separate license agreement you may have executed with Licensor regarding such Contributions. 51 | 52 | 6. Trademarks. This License does not grant permission to use the trade names, trademarks, service marks, or product names of the Licensor, except as required for reasonable and customary use in describing the origin of the Work and reproducing the content of the NOTICE file. 53 | 54 | 7. Disclaimer of Warranty. Unless required by applicable law or agreed to in writing, Licensor provides the Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Work and assume any risks associated with Your exercise of permissions under this License. 55 | 56 | 8. Limitation of Liability. In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Work (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages. 57 | 58 | 9. Accepting Warranty or Additional Liability. While redistributing the Work or Derivative Works thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability. 
59 | 60 | END OF TERMS AND CONDITIONS -------------------------------------------------------------------------------- /eosdis_store/dmrpp.py: -------------------------------------------------------------------------------- 1 | __all__ = ['to_zarr'] 2 | 3 | import logging 4 | import os.path as op 5 | import requests 6 | import xml.etree.ElementTree as ElementTree 7 | 8 | logger = logging.getLogger(__name__) 9 | 10 | # Environment variables 11 | 12 | """ Namespaces used in DMRPP XML Files """ 13 | NS = { 14 | 'dpp': 'http://xml.opendap.org/dap/dmrpp/1.0.0#', 15 | 'd': 'http://xml.opendap.org/ns/DAP/4.0#' 16 | } 17 | 18 | """ Default compression level """ 19 | UNKNOWN_COMPRESSION_LEVEL = 4 20 | 21 | """ Data type mappings """ 22 | TYPE_INFO = { 23 | 'Int8': (int, '|i1'), 24 | 'Int16': (int, ' max_gap + 1: 239 | logger.debug("Starting new range due to gap of %d bytes" % (offset - prev_offset,)) 240 | result.append((group_offset, prev_offset - group_offset, group)) 241 | group_offset = offset 242 | group = [] 243 | group.append((key, offset - group_offset, size)) 244 | prev_offset = offset + size 245 | result.append((group_offset, prev_offset - group_offset, group)) 246 | return result 247 | 248 | 249 | class EosdisStore(ConsolidatedChunkStore): 250 | """Store representing a HDF5/NetCDF file accessed over HTTP with zarr metadata derived from a DMR++ file 251 | 252 | Args: 253 | ConsolidatedChunkStore (ConsolidatedChunkStore): Parent class is a store for doing byte range reads 254 | """ 255 | def __init__(self, data_url, dmr_url=None): 256 | """Construct the store 257 | 258 | Args: 259 | data_url (String): The URL of the remote data file which should be accessed through Zarr 260 | dmr_url (String): Optional URL to a DMR++ file describing metadata and byte offsets of the 261 | given file. If not provided, the URL is assumed to be the original file with a .dmrpp suffix 262 | """ 263 | if dmr_url is None: 264 | dmr_url = data_url + '.dmrpp' 265 | dmrpp = requests.get(dmr_url).text 266 | tree = ElementTree.fromstring(dmrpp) 267 | meta_store = to_zarr(tree) 268 | super(EosdisStore, self).__init__(meta_store, data_url) 269 | -------------------------------------------------------------------------------- /presentation/tutorial.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "# EOSDIS Zarr Store: Spatial & Variable Subsetting without Services\n", 8 | "\n", 9 | "## Goal\n", 10 | "\n", 11 | "Produce a library that would let the Zarr Python library read EOSDIS cloud holdings efficiently, without requiring any modifications to our archive. This has the potential to expand use to new communities and tools, allow more efficient access both in place and outside of the cloud, and therefore save money for the archive as well as time for users.\n", 12 | "\n", 13 | "## Background\n", 14 | "\n", 15 | "This is a demo of a data store I've been working on, building off of the work of a few others. Adapting the Zarr library (which is meant to read cloud-optimized data stores) read NetCDF4 / HDF 5 files was discussed as a possibility at Summer ESIP last year. Rich Signell from USGS worked with HDF Group to get [a prototype](https://medium.com/pangeo/cloud-performant-reading-of-netcdf4-hdf5-data-using-the-zarr-library-1a95c5c92314). The resulting code showed no performance degradation over an equivalent native Zarr store. 
This adaptation requires an up-front generation of metadata containing data attributes and byte offsets to allow efficient reads.\n", 16 | "\n", 17 | "## What I did\n", 18 | "\n", 19 | "I recognized that the DMR++ files OPeNDAP / GHRC have started generating on ingest in PI 20.1 contain nearly equivalent information to that required by the Zarr library. Hearing that small chunk sizes (chunks are a region of data that can / must be read all at once) caused issues for some NetCDF files and required re-chunking (i.e. altering the original data file), I further looked at mitigating that issue to avoid having to re-host data. In picking through the Zarr code, I came across a for loop that, if changed, would allow a set of optimizations that would greatly improve performance. I advocated for this in the Zarr tracker and what we need is now being planned.\n", 20 | "![png](summary.png)\n", 21 | "\n", 22 | "In terms of actual code, I produced a Python library, eosdis-zarr-store, that:\n", 23 | "\n", 24 | "1. Implements the Zarr storage API in a natural and familiar way to Zarr developers\n", 25 | "2. Sets up HTTP access to allow EDL credential handshaking and, importantly, caching of redirect URLs\n", 26 | "3. Adapts our underlying data files and DMR++ files generated on ingest to a Zarr-compatible API\n", 27 | "4. Implements optimizations using the API worked out with the Zarr community to make fewer total data reads and do them in parallel where possible\n", 28 | "\n", 29 | "The remainder of this notebook contains results and conclusions.\n", 30 | "\n", 31 | "## How to use it\n", 32 | "\n", 33 | "In the eosdis-zarr-store directory run `pip install -e .`. Obtain or stage an HDF5 (NetCDF4) file along with a DMR++ file with identical URL + \".dmrpp\"; you can run \"mkdmrpp\" in this folder to produce DMR++ files. Then:\n", 34 | "\n", 35 | "```python\n", 36 | "from eosdis_zarr_store import Store\n", 37 | "import zarr\n", 38 | "\n", 39 | "f = zarr.open(Store(data_file_url))\n", 40 | "# Manipulate f as any Zarr store (see examples below)\n", 41 | "```\n", 42 | "\n", 43 | "The URLs in this notebook will not be available for general use, since one example produces 500 MB of egress for benchmarking.\n", 44 | "\n", 45 | "## Helpers and Constants (You can skip this)" 46 | ] 47 | }, 48 | { 49 | "cell_type": "code", 50 | "execution_count": null, 51 | "metadata": {}, 52 | "outputs": [], 53 | "source": [ 54 | "# Helpers to draw stuff, generate URLs, and translate bounding boxes to array indices, \n", 55 | "# wholly ignoring all the helpful attributes present in the HDF and Zarr metadata\n", 56 | "# Please don't judge me on this mess. 
It's not called \"Clean code fest\"\n", 57 | "\n", 58 | "from matplotlib import pyplot as plt\n", 59 | "from matplotlib import colors\n", 60 | "from ipypb import track\n", 61 | "import numpy as np\n", 62 | "\n", 63 | "def show(data, transpose=True):\n", 64 | " plt.rcParams[\"figure.figsize\"] = [16, 8]\n", 65 | " if transpose:\n", 66 | " data = np.transpose(data)\n", 67 | " plt.imshow(data[::-1,:], norm=colors.Normalize(0, 150), cmap='Blues')\n", 68 | "\n", 69 | "def get_aoi(bbox, scale, x0=180, y0=90):\n", 70 | " aoi = (0, \n", 71 | " slice(scale * int(bbox[1] + x0), scale * int(bbox[3] + x0) + 1), \n", 72 | " slice(scale * int(bbox[0] + y0), scale * int(bbox[2] + y0) + 1))\n", 73 | " shape = [d.stop - d.start for d in aoi[1:]]\n", 74 | " return aoi, shape\n", 75 | "\n", 76 | "url_root = 'https://harmony.uat.earthdata.nasa.gov/service-results/harmony-uat-staging/public/demo/zarr-store/'\n", 77 | "# GPM HHR URLs\n", 78 | "filename_template = '3B-HHR.MS.MRG.3IMERG.20051022-S%02d%02d00-E%02d%02d59.%04d.V06B.HDF5'\n", 79 | "data_urls = [ url_root + filename_template % (h, m, h, m + 29, h * 60 + m) for h in range(0, 24) for m in range(0, 60, 30) ]\n", 80 | "\n", 81 | "bbox = [10, -100, 47.5, -45]\n", 82 | "\n", 83 | "# Basic file info (also readable from metadata)\n", 84 | "GPM_NODATA = -9999.9\n", 85 | "gpm_aoi, gpm_shape = get_aoi(bbox, 10)\n", 86 | "RSS_NODATA = 251\n", 87 | "RSS_SCALE_FACTOR = 0.5 # In-file scale factor is 0.1. This increases it solely for the purpose of making it show up in pics\n", 88 | "rss_aoi, rss_shape = get_aoi(bbox, 4, 360)\n", 89 | "rss_aoi = (0, rss_aoi[2], rss_aoi[1])\n" 90 | ] 91 | }, 92 | { 93 | "cell_type": "code", 94 | "execution_count": null, 95 | "metadata": {}, 96 | "outputs": [], 97 | "source": [ 98 | "gpm_aoi" 99 | ] 100 | }, 101 | { 102 | "cell_type": "markdown", 103 | "metadata": {}, 104 | "source": [ 105 | "## Problem 1: Atmospheric water vapor off the East Coast on Patrick's wedding day\n", 106 | "\n", 107 | "It rained a little that day in DC and hurricanes were threatening our honeymoon in the Carribbean.\n", 108 | "\n", 109 | "We have a bounding box defined above. Use data distributed by GHRC derived from the SSMIS sensor of the F16 DMSP satellite to build a picture.\n", 110 | "\n", 111 | "### Without Partial Access\n", 112 | "\n", 113 | "Download 2.6 MB file and subset it" 114 | ] 115 | }, 116 | { 117 | "cell_type": "code", 118 | "execution_count": null, 119 | "metadata": { 120 | "scrolled": false 121 | }, 122 | "outputs": [], 123 | "source": [ 124 | "%%time\n", 125 | "from h5py import File as H5File\n", 126 | "import requests\n", 127 | "from io import BytesIO\n", 128 | "\n", 129 | "response = requests.get(url_root + 'f16_ssmis_20051022v7.nc')\n", 130 | "with H5File(BytesIO(response.content), 'r') as f:\n", 131 | " aoi_data = f['atmosphere_water_vapor_content'][rss_aoi]\n", 132 | " show(np.where(aoi_data < RSS_NODATA, aoi_data * RSS_SCALE_FACTOR, 0), transpose=False)\n" 133 | ] 134 | }, 135 | { 136 | "cell_type": "markdown", 137 | "metadata": {}, 138 | "source": [ 139 | "### Partial Access Step 1 - Make our data readable in Zarr for partial access\n", 140 | "\n", 141 | "Mimick a Zarr store by reading OPeNDAP's DMR++ files and returning their metadata in a Zarr interface. 
DMR++ files are planned to be generated on ingest\n", 142 | "\n", 143 | "Downloads 200 KB of data from the 2.6 MB file with conventional Zarr storage implementation.\n", 144 | "\n", 145 | "Result: 12 data requests, each of which goes through internet services, pre-signs a URL, and redirects to the data range. All sequentially. Slow." 146 | ] 147 | }, 148 | { 149 | "cell_type": "code", 150 | "execution_count": null, 151 | "metadata": {}, 152 | "outputs": [], 153 | "source": [ 154 | "%%time\n", 155 | "from eosdis_store import EosdisStore\n", 156 | "import zarr\n", 157 | "\n", 158 | "f = zarr.open(EosdisStore(url_root + 'f16_ssmis_20051022v7.nc'))\n", 159 | "aoi_data = f['atmosphere_water_vapor_content'][rss_aoi]\n", 160 | "print(aoi_data)\n", 161 | "show(np.where(aoi_data < RSS_NODATA, aoi_data * RSS_SCALE_FACTOR, 0), transpose=False)" 162 | ] 163 | }, 164 | { 165 | "cell_type": "markdown", 166 | "metadata": {}, 167 | "source": [ 168 | "### Partial Access Step 2 - Make Zarr reads fast\n", 169 | "\n", 170 | "Downloads 200 KB of data from the 2.6 MB file with Zarr optimizations: \n", 171 | "1. (Working with Zarr community) Implement \"getitems\" concept, allowing storage to know all of the chunks that will be accessed up front\n", 172 | "2. Combine nearby range requests into single HTTP requests before sending them, allowing fewer requests.\n", 173 | "3. Cache presigned URLs returned by the archive for a short time, as directed by caching headers (TEA has a ticket to add these), allowing reuse and avoiding many round-trips and redirects\n", 174 | "4. Run the first data range request serially to get the presigned URL. Run subsequent requests in parallel.\n", 175 | "\n", 176 | "Result: 3 data requests, one of which goes through internet services, pre-signs a URL, and redirects to the data range. The following two reuse the signed URL and fetch in parallel. Faster!\n", 177 | "\n", 178 | "When more than a couple of chunks are involved, this is expected to be faster than the native Zarr S3 format is capable of, and the more chunks involved in a read the more it improves." 
179 | ] 180 | }, 181 | { 182 | "cell_type": "code", 183 | "execution_count": null, 184 | "metadata": { 185 | "scrolled": true 186 | }, 187 | "outputs": [], 188 | "source": [ 189 | "%%time\n", 190 | "from eosdis_store import EosdisStore\n", 191 | "import zarr\n", 192 | "\n", 193 | "f = zarr.open(EosdisStore(url_root + 'f16_ssmis_20051022v7.nc'))\n", 194 | "aoi_data = f['atmosphere_water_vapor_content'][rss_aoi]\n", 195 | "print(rss_aoi)\n", 196 | "show(np.where(aoi_data < RSS_NODATA, aoi_data * RSS_SCALE_FACTOR, 0), transpose=False)" 197 | ] 198 | }, 199 | { 200 | "cell_type": "code", 201 | "execution_count": null, 202 | "metadata": { 203 | "scrolled": false 204 | }, 205 | "outputs": [], 206 | "source": [ 207 | "f['atmosphere_water_vapor_content'].shape\n" 208 | ] 209 | }, 210 | { 211 | "cell_type": "markdown", 212 | "metadata": {}, 213 | "source": [ 214 | "## Problem 2: Rain along the East Coast on Patrick's wedding day\n", 215 | "\n", 216 | "With the same bounding box above, get half-hourly high-quality precipitation values from GPM and sum them for the entire day (48 L3 global data files)\n", 217 | "\n", 218 | "### Without Partial Access\n", 219 | "\n", 220 | "Download approximately 500 MB of data in whole files and process them" 221 | ] 222 | }, 223 | { 224 | "cell_type": "code", 225 | "execution_count": null, 226 | "metadata": {}, 227 | "outputs": [], 228 | "source": [ 229 | "%%time\n", 230 | "from h5py import File as H5File\n", 231 | "import requests\n", 232 | "from io import BytesIO\n", 233 | "\n", 234 | "result = np.zeros(gpm_shape)\n", 235 | "for url in track(data_urls):\n", 236 | " response = requests.get(url)\n", 237 | " with H5File(BytesIO(response.content), 'r') as f:\n", 238 | " aoi_data = f['Grid/HQprecipitation'][gpm_aoi]\n", 239 | " result = result + np.where(aoi_data != GPM_NODATA, aoi_data / 2, 0)\n", 240 | "show(result)" 241 | ] 242 | }, 243 | { 244 | "cell_type": "markdown", 245 | "metadata": {}, 246 | "source": [ 247 | "### With the EOSDIS Zarr Store" 248 | ] 249 | }, 250 | { 251 | "cell_type": "markdown", 252 | "metadata": {}, 253 | "source": [ 254 | "Downloads approximately 5 MB of data by doing partial reads in fewer lines of code" 255 | ] 256 | }, 257 | { 258 | "cell_type": "code", 259 | "execution_count": null, 260 | "metadata": {}, 261 | "outputs": [], 262 | "source": [ 263 | "%%time\n", 264 | "from eosdis_store import EosdisStore\n", 265 | "import zarr\n", 266 | "\n", 267 | "result = np.zeros(gpm_shape)\n", 268 | "for url in track(data_urls):\n", 269 | " f = zarr.open(EosdisStore(url, quiet=True))\n", 270 | " aoi_data = f['Grid/HQprecipitation'][gpm_aoi]\n", 271 | " result = result + np.where(aoi_data != GPM_NODATA, aoi_data / 2, 0)\n", 272 | "show(result)" 273 | ] 274 | }, 275 | { 276 | "cell_type": "markdown", 277 | "metadata": {}, 278 | "source": [ 279 | "### Comparison to L3 Daily Average Product" 280 | ] 281 | }, 282 | { 283 | "cell_type": "markdown", 284 | "metadata": {}, 285 | "source": [ 286 | "Download a 30 MB file from the daily average collection to produce a similar result, validating the result at 6x egress cost of partial access for all of the half-hourly source files."
287 | ] 288 | }, 289 | { 290 | "cell_type": "code", 291 | "execution_count": null, 292 | "metadata": {}, 293 | "outputs": [], 294 | "source": [ 295 | "%%time\n", 296 | "from h5py import File as H5File\n", 297 | "import requests\n", 298 | "from io import BytesIO\n", 299 | "\n", 300 | "response = requests.get(url_root + '3B-DAY.MS.MRG.3IMERG.20051022-S000000-E235959.V06.nc4')\n", 301 | "with H5File(BytesIO(response.content), 'r') as f:\n", 302 | " show(f['HQprecipitation'][gpm_aoi])" 303 | ] 304 | }, 305 | { 306 | "cell_type": "markdown", 307 | "metadata": {}, 308 | "source": [ 309 | "## I can see my house from here!\n", 310 | "\n", 311 | "Download GEDI L2B data. Use small geolocation arrays to find the area of interest, then download only the data within those chunks. \n", 312 | "\n", 313 | "A full file download is 1.3 GB. The code below downloads approximately 15 MB of data and metadata. This reduces a 15 minute download to about 8s. (Aside: the download is 2/3 metadata, which could be dramatically reduced by using Zarr's default format rather than DMR++)" 314 | ] 315 | }, 316 | { 317 | "cell_type": "code", 318 | "execution_count": null, 319 | "metadata": {}, 320 | "outputs": [], 321 | "source": [ 322 | "from eosdis_zarr_store import Store\n", 323 | "import zarr\n", 324 | "import numpy as np\n", 325 | "\n", 326 | "url = 'http://localhost:4000/data/GEDI02_B_2019182140038_O03117_T05635_02_001_01.h5'\n", 327 | "f = zarr.open(Store(url))\n", 328 | "print(f.tree())" 329 | ] 330 | }, 331 | { 332 | "cell_type": "code", 333 | "execution_count": null, 334 | "metadata": {}, 335 | "outputs": [], 336 | "source": [ 337 | "n, w, s, e = [40.2, -75.25, 40.15, -75.2]\n", 338 | "\n", 339 | "geoloc = f['BEAM0000/geolocation']\n", 340 | "all_lats = geoloc['latitude_bin0'][:]\n", 341 | "all_lons = geoloc['longitude_bin0'][:]\n", 342 | "valid_lat_i = np.where(np.logical_and(all_lats >= s, all_lats <= n))\n", 343 | "valid_lon_i = np.where(np.logical_and(all_lons >= w, all_lons <= e))\n", 344 | "indices = np.intersect1d(valid_lat_i, valid_lon_i)\n", 345 | "\n", 346 | "lats = all_lats[indices]\n", 347 | "lons = all_lons[indices]\n", 348 | "data = f['BEAM0000/cover'][:][indices]\n", 349 | "data_i = np.where(data != -9999)\n", 350 | "data = data[data_i]\n", 351 | "lats = lats[data_i]\n", 352 | "lons = lons[data_i]\n", 353 | "\n", 354 | "ambler = plt.imread('ambler.png')\n", 355 | "fig, ax = plt.subplots(figsize=(10,10))\n", 356 | "ax.scatter(lons, lats, s=50, c=data, cmap='Greens')\n", 357 | "ax.set_xlim(w, e)\n", 358 | "ax.set_ylim(s, n)\n", 359 | "ax.imshow(ambler, zorder=0, extent = [w, e, s, n], aspect='equal')" 360 | ] 361 | }, 362 | { 363 | "cell_type": "markdown", 364 | "metadata": {}, 365 | "source": [ 366 | "## Why is it sometimes slower?\n", 367 | "\n", 368 | "![png](request-overhead.png)\n", 369 | "\n", 370 | "We pay a penalty for every new file we access, needing to go over the Internet, through the Internet services stack, the request signing process, and ultimately get redirected to S3. The Zarr store has to pay this penalty twice to read the metadata and then the file, while a full-file download only pays the penalty once. With current performance, the break-even point in file size is about 10 MB. That is to say, if a user wants to access even a tiny amount of data in each granule from a collection whose granules are under 10 MB in size, he or she is better off downloading the granules. 
While there is some uncontrollable overhead, there is significant room for improvement in areas that are under our control to promote inexpensive access patterns while improving time to science.\n", 371 | "\n", 372 | "## Conclusions\n", 373 | "\n", 374 | "* If providers generate DMR++ on ingest, we can expose our data efficiently using a Python API that is gaining increasing traction, particularly in the Pangeo community, with minimal storage overhead\n", 375 | "* Works out of the cloud, but works even better / faster in the cloud for analysis near data\n", 376 | "* For partial access cases, an overall egress reduction of 90% or more could be possible, as demonstrated\n", 377 | "* Chunking matters. This work makes smaller chunks more desirable, which has not historically been the case with Zarr\n", 378 | "* Overhead in our stack, from EDL to Internet services to redirects, is eating up the potential user savings. At a 90% egress reduction, we struggle to compete with \"Just download everything.\" How do we balance preventing undesirable behavior with encouraging desirable behavior?\n", 379 | "* There are lingering questions about whether DMR++ is the correct format to capture this metadata in. Zarr's native format is in many cases more complete and easier to parse while having mechanisms for more easily working with the 100,000-ish chunks in GEDI granules and for unifying multiple granules into a coherent view.\n", 380 | "\n", 381 | "## Limitations / Needs\n", 382 | "\n", 383 | "* The DMR++ file must be generated on ingest into the cloud, which is currently optional\n", 384 | "* Only works on HDF5 and NetCDF4 files. In principle, it could work on HDF4 / NetCDF Classic files but nothing yet generates the necessary metadata\n", 385 | "* DMR++ does not quite specify everything we could need for some datasets. We assume little endian byte order and column-major ordering.\n", 386 | "\n", 387 | "## Future Work\n", 388 | "\n", 389 | "* Packaging, unit tests, and docs sufficient for publication\n", 390 | "* Open source (relies on a naming decision)\n", 391 | "* Cache repeated calls for the same byte ranges to avoid requerying data we have\n", 392 | "* Implement unknown / undocumented areas of the DMR++ spec, including compression types and data filters\n", 393 | "* Tests with Dask and XArray\n", 394 | "* Implement CF conventions to populate fill values, offsets, scales, etc\n", 395 | "* Extensions to present L3 global collections as a coherent data cube\n", 396 | "\n", 397 | "I strongly believe in this access pattern as a win for our users and ourselves. To the extent it is not fully realized, it suffers from being an early adopter of our cloud access stack. My sincere hope is that we can learn from it to improve partial file access not only here but in other tools and libraries."
398 | ] 399 | } 400 | ], 401 | "metadata": { 402 | "kernelspec": { 403 | "display_name": "Python 3", 404 | "language": "python", 405 | "name": "python3" 406 | }, 407 | "language_info": { 408 | "codemirror_mode": { 409 | "name": "ipython", 410 | "version": 3 411 | }, 412 | "file_extension": ".py", 413 | "mimetype": "text/x-python", 414 | "name": "python", 415 | "nbconvert_exporter": "python", 416 | "pygments_lexer": "ipython3", 417 | "version": "3.8.3" 418 | } 419 | }, 420 | "nbformat": 4, 421 | "nbformat_minor": 4 422 | } 423 | -------------------------------------------------------------------------------- /tests/fixtures/20200911000001-JPL-L2P_GHRSST-SSTskin-MODIS_A-N-v02.0-fv01.0.zarr.json: -------------------------------------------------------------------------------- 1 | { 2 | ".zgroup": { 3 | "zarr_format": 2 4 | }, 5 | "wind_speed/.zarray": { 6 | "zarr_format": 2, 7 | "filters": null, 8 | "order": "C", 9 | "dtype": " 127, please subtract 256 from this reported value", 94 | "scale_factor": 0.07874015719, 95 | "add_offset": 10.0, 96 | "coverage_content_type": "auxiliaryInformation", 97 | "coordinates": "time lat lon", 98 | "_ARRAY_DIMENSIONS": [ 99 | "time", 100 | "nj", 101 | "ni" 102 | ] 103 | }, 104 | "sses_standard_deviation/.zchunkstore": { 105 | "0.0.0": { 106 | "offset": 22317539, 107 | "size": 23320 108 | }, 109 | "0.0.1": { 110 | "offset": 22340859, 111 | "size": 28041 112 | }, 113 | "0.1.0": { 114 | "offset": 22368900, 115 | "size": 13222 116 | }, 117 | "0.1.1": { 118 | "offset": 22382122, 119 | "size": 4287 120 | } 121 | }, 122 | "sst_dtime/.zarray": { 123 | "zarr_format": 2, 124 | "filters": null, 125 | "order": "C", 126 | "dtype": " 127, please subtract 256 from this reported value", 321 | "flag_values": [ 322 | 0, 323 | 1, 324 | 2, 325 | 3, 326 | 4, 327 | 5 328 | ], 329 | "flag_meanings": "no_data bad_data worst_quality low_quality acceptable_quality best_quality", 330 | "coverage_content_type": "qualityInformation", 331 | "coordinates": "time lat lon", 332 | "_ARRAY_DIMENSIONS": [ 333 | "time", 334 | "nj", 335 | "ni" 336 | ] 337 | }, 338 | "quality_level/.zchunkstore": { 339 | "0.0.0": { 340 | "offset": 22162994, 341 | "size": 24444 342 | }, 343 | "0.0.1": { 344 | "offset": 22187438, 345 | "size": 30682 346 | }, 347 | "0.1.0": { 348 | "offset": 22218120, 349 | "size": 13679 350 | }, 351 | "0.1.1": { 352 | "offset": 22231799, 353 | "size": 4661 354 | } 355 | }, 356 | "dt_analysis/.zarray": { 357 | "zarr_format": 2, 358 | "filters": null, 359 | "order": "C", 360 | "dtype": " 127, please subtract 256 from this reported value", 441 | "scale_factor": 0.07874015719, 442 | "add_offset": 10.0, 443 | "coverage_content_type": "auxiliaryInformation", 444 | "coordinates": "time lat lon", 445 | "_ARRAY_DIMENSIONS": [ 446 | "time", 447 | "nj", 448 | "ni" 449 | ] 450 | }, 451 | "sses_standard_deviation_4um/.zchunkstore": { 452 | "0.0.0": { 453 | "offset": 27251747, 454 | "size": 30619 455 | }, 456 | "0.0.1": { 457 | "offset": 27282366, 458 | "size": 39107 459 | }, 460 | "0.1.0": { 461 | "offset": 27321473, 462 | "size": 18171 463 | }, 464 | "0.1.1": { 465 | "offset": 27339644, 466 | "size": 6275 467 | } 468 | }, 469 | "sses_bias_4um/.zarray": { 470 | "zarr_format": 2, 471 | "filters": null, 472 | "order": "C", 473 | "dtype": " 127, please subtract 256 from this reported value", 497 | "scale_factor": 0.1574803144, 498 | "add_offset": 0.0, 499 | "coverage_content_type": "auxiliaryInformation", 500 | "coordinates": "time lat lon", 501 | "_ARRAY_DIMENSIONS": [ 502 | "time", 503 | "nj", 
504 | "ni" 505 | ] 506 | }, 507 | "sses_bias_4um/.zchunkstore": { 508 | "0.0.0": { 509 | "offset": 27160872, 510 | "size": 27847 511 | }, 512 | "0.0.1": { 513 | "offset": 27188719, 514 | "size": 35589 515 | }, 516 | "0.1.0": { 517 | "offset": 27224308, 518 | "size": 14687 519 | }, 520 | "0.1.1": { 521 | "offset": 27238995, 522 | "size": 5623 523 | } 524 | }, 525 | "sses_bias/.zarray": { 526 | "zarr_format": 2, 527 | "filters": null, 528 | "order": "C", 529 | "dtype": " 127, please subtract 256 from this reported value", 553 | "scale_factor": 0.1574803144, 554 | "add_offset": 0.0, 555 | "coverage_content_type": "auxiliaryInformation", 556 | "coordinates": "time lat lon", 557 | "_ARRAY_DIMENSIONS": [ 558 | "time", 559 | "nj", 560 | "ni" 561 | ] 562 | }, 563 | "sses_bias/.zchunkstore": { 564 | "0.0.0": { 565 | "offset": 22244733, 566 | "size": 22729 567 | }, 568 | "0.0.1": { 569 | "offset": 22267462, 570 | "size": 26981 571 | }, 572 | "0.1.0": { 573 | "offset": 22294443, 574 | "size": 12149 575 | }, 576 | "0.1.1": { 577 | "offset": 22306592, 578 | "size": 4272 579 | } 580 | }, 581 | "sea_surface_temperature_4um/.zarray": { 582 | "zarr_format": 2, 583 | "filters": null, 584 | "order": "C", 585 | "dtype": " 127, please subtract 256 from this reported value", 664 | "flag_values": [ 665 | 0, 666 | 1, 667 | 2, 668 | 3, 669 | 4, 670 | 5 671 | ], 672 | "flag_meanings": "no_data bad_data worst_quality low_quality acceptable_quality best_quality", 673 | "coverage_content_type": "qualityInformation", 674 | "coordinates": "time lat lon", 675 | "_ARRAY_DIMENSIONS": [ 676 | "time", 677 | "nj", 678 | "ni" 679 | ] 680 | }, 681 | "quality_level_4um/.zchunkstore": { 682 | "0.0.0": { 683 | "offset": 27076250, 684 | "size": 25483 685 | }, 686 | "0.0.1": { 687 | "offset": 27101733, 688 | "size": 33457 689 | }, 690 | "0.1.0": { 691 | "offset": 27135190, 692 | "size": 13796 693 | }, 694 | "0.1.1": { 695 | "offset": 27148986, 696 | "size": 5147 697 | } 698 | }, 699 | "time/.zarray": { 700 | "zarr_format": 2, 701 | "filters": null, 702 | "order": "C", 703 | "dtype": " 127, please subtract 256 from this reported value; Quicklook", 842 | "license": "GHRSST and PO.DAAC protocol allow data use as free and open.", 843 | "id": "MODIS_A-JPL-L2P-v2019.0", 844 | "naming_authority": "org.ghrsst", 845 | "product_version": "2019.0", 846 | "uuid": "f6e1f61d-c4a4-4c17-8354-0c15e12d688b", 847 | "gds_version_id": "2.0", 848 | "netcdf_version_id": "4.1", 849 | "date_created": "20200911T024514Z", 850 | "file_quality_level": 3, 851 | "spatial_resolution": "1km", 852 | "start_time": "20200911T000001Z", 853 | "time_coverage_start": "20200911T000001Z", 854 | "stop_time": "20200911T000458Z", 855 | "time_coverage_end": "20200911T000458Z", 856 | "northernmost_latitude": -36.22299957, 857 | "southernmost_latitude": -57.91799927, 858 | "easternmost_longitude": 31.05480003, 859 | "westernmost_longitude": -7.165909767, 860 | "source": "MODIS sea surface temperature observations for the OBPG", 861 | "platform": "Aqua", 862 | "sensor": "MODIS", 863 | "metadata_link": "http://podaac.jpl.nasa.gov/ws/metadata/dataset/?format=iso&shortName=MODIS_A-JPL-L2P-v2019.0", 864 | "keywords": "Oceans > Ocean Temperature > Sea Surface Temperature", 865 | "keywords_vocabulary": "NASA Global Change Master Directory (GCMD) Science Keywords", 866 | "standard_name_vocabulary": "NetCDF Climate and Forecast (CF) Metadata Convention", 867 | "geospatial_lat_units": "degrees_north", 868 | "geospatial_lat_resolution": 0.009999999776, 869 | "geospatial_lon_units": 
"degrees_east", 870 | "geospatial_lon_resolution": 0.009999999776, 871 | "acknowledgment": "The MODIS L2P sea surface temperature data are sponsored by NASA", 872 | "creator_name": "Ed Armstrong, JPL PO.DAAC", 873 | "creator_email": "edward.m.armstrong@jpl.nasa.gov", 874 | "creator_url": "http://podaac.jpl.nasa.gov", 875 | "project": "Group for High Resolution Sea Surface Temperature", 876 | "publisher_name": "The GHRSST Project Office", 877 | "publisher_url": "http://www.ghrsst.org", 878 | "publisher_email": "ghrsst-po@nceo.ac.uk", 879 | "processing_level": "L2P", 880 | "cdm_data_type": "swath", 881 | "startDirection": "Descending", 882 | "endDirection": "Descending", 883 | "day_night_flag": "Night" 884 | } 885 | } -------------------------------------------------------------------------------- /presentation/background.md: -------------------------------------------------------------------------------- 1 | # EOSDIS Zarr Store: Spatial & Variable Subsetting without Services 2 | 3 | ## Goal 4 | 5 | Produce a library that would let the Zarr Python library read EOSDIS cloud holdings efficiently, without requiring any modifications to our archive. This has the potential to expand use to new communities and tools, allow more efficient access both in place and outside of the cloud, and therefore save money for the archive as well as time for users. 6 | 7 | ## Background 8 | 9 | This is a demo of a data store I've been working on, building off of the work of a few others. Adapting the Zarr library (which is meant to read cloud-optimized data stores) read NetCDF4 / HDF 5 files was discussed as a possibility at Summer ESIP last year. Rich Signell from USGS worked with HDF Group to get [a prototype](https://medium.com/pangeo/cloud-performant-reading-of-netcdf4-hdf5-data-using-the-zarr-library-1a95c5c92314). The resulting code showed no performance degradation over an equivalent native Zarr store. This adaptation requies an up-front generation of metadata containing data attributes and byte offsets to allow efficient reads. 10 | 11 | ## What I did 12 | 13 | I recognized that the DMR++ files OPeNDAP / GHRC have started generating on ingest in PI 20.1 contain nearly equivalent information to that required by the Zarr library. Hearing that small chunk sizes (chunks are a region of data that can / must be read all at once) caused issues for some NetCDF files and required re-chunking (i.e. altering the original data file), I further looked at mitigating that issue to avoid having to re-host data. In picking through the Zarr code, I came across a for loop that, if changed, would allow a set of optimizations that would greatly improve performance. I advocated for this in the Zarr tracker and what we need is now being planned. 14 | ![png](images/summary.png) 15 | 16 | In terms of actual code, I produced a Python library, eosdis-zarr-store that: 17 | 18 | 1. Implements the Zarr storage API in a natural and familiar way to Zarr developers 19 | 2. Sets up HTTP access to allow EDL credential handshaking and, importantly, caching of redirect URLs 20 | 3. Adapts our underlying data files and DMR++ files generated on ingest to a Zarr-compatible API 21 | 4. Implements optimizations using the API worked out with the Zarr community to make fewer total data reads and do them in parallel where possible 22 | 23 | The remainder of this notebook contains results and conclusions. 24 | 25 | ## How to use it 26 | 27 | In the eosdis-zarr-store directory run `pip install -e .`. 
Obtain or stage an HDF5 (NetCDF4) file along with a DMR++ file at the identical URL + ".dmrpp"; you can run "mkdmrpp" ([scripts/mkdmrpp](scripts/mkdmrpp)) in this folder to produce DMR++ files. Then: 28 | 29 | ```python 30 | from eosdis_zarr_store import Store 31 | import zarr 32 | 33 | f = zarr.open(Store(data_file_url)) 34 | # Manipulate f as any Zarr store (see examples below) 35 | ``` 36 | 37 | The URLs in this notebook have been redacted, since some produce substantial egress for benchmarking and illustration. If you need example data, please reach out. 38 | 39 | ## Helpers and Constants (You can skip this) 40 | 41 | 42 | ```python 43 | # Helpers to draw stuff, generate URLs, and translate bounding boxes to array indices, 44 | # wholly ignoring all the helpful attributes present in the HDF and Zarr metadata 45 | # Please don't judge me on this mess. It's not called "Clean code fest" 46 | 47 | from matplotlib import pyplot as plt 48 | from matplotlib import colors 49 | from ipypb import track 50 | import numpy as np 51 | 52 | def show(data, transpose=True): 53 | plt.rcParams["figure.figsize"] = [16, 8] 54 | if transpose: 55 | data = np.transpose(data) 56 | plt.imshow(data[::-1,:], norm=colors.Normalize(0, 150), cmap='Blues') 57 | 58 | def get_aoi(bbox, scale, x0=180, y0=90): 59 | aoi = (0, 60 | slice(scale * int(bbox[1] + x0), scale * int(bbox[3] + x0) + 1), 61 | slice(scale * int(bbox[0] + y0), scale * int(bbox[2] + y0) + 1)) 62 | shape = [d.stop - d.start for d in aoi[1:]] 63 | return aoi, shape 64 | 65 | url_root = 'https://example.earthdata.nasa.gov/example-staging-url/' 66 | # GPM HHR URLs 67 | filename_template = '3B-HHR.MS.MRG.3IMERG.20051022-S%02d%02d00-E%02d%02d59.%04d.V06B.HDF5' 68 | data_urls = [ url_root + filename_template % (h, m, h, m + 29, h * 60 + m) for h in range(0, 24) for m in range(0, 60, 30) ] 69 | 70 | bbox = [10, -100, 47.5, -45] 71 | 72 | # Basic file info (also readable from metadata) 73 | GPM_NODATA = -9999.9 74 | gpm_aoi, gpm_shape = get_aoi(bbox, 10) 75 | RSS_NODATA = 251 76 | RSS_SCALE_FACTOR = 0.5 # In-file scale factor is 0.1. This increases it solely for the purpose of making it show up in pics 77 | rss_aoi, rss_shape = get_aoi(bbox, 4, 360) 78 | rss_aoi = (0, rss_aoi[2], rss_aoi[1]) 79 | 80 | ``` 81 | 82 | ## Problem 1: Atmospheric water vapor off the East Coast on Patrick's wedding day 83 | 84 | It rained a little that day in DC and hurricanes were threatening our honeymoon in the Caribbean. 85 | 86 | We have a bounding box defined above. Use data distributed by GHRC derived from the SSMIS sensor of the F16 DMSP satellite to build a picture. 87 | 88 | ### Without Partial Access 89 | 90 | Download a 2.6 MB file and subset it 91 | 92 | 93 | ```python 94 | %%time 95 | from h5py import File as H5File 96 | import requests 97 | from io import BytesIO 98 | 99 | response = requests.get(url_root + 'f16_ssmis_20051022v7.nc') 100 | with H5File(BytesIO(response.content), 'r') as f: 101 | aoi_data = f['atmosphere_water_vapor_content'][rss_aoi] 102 | show(np.where(aoi_data < RSS_NODATA, aoi_data * RSS_SCALE_FACTOR, 0), transpose=False) 103 | 104 | ``` 105 | 106 | CPU times: user 206 ms, sys: 43.1 ms, total: 249 ms 107 | Wall time: 8.32 s 108 | 109 | 110 | 111 | ![png](images/output_3_1.png) 112 | 113 | 114 | ### Partial Access Step 1 - Make our data readable in Zarr for partial access 115 | 116 | Mimic a Zarr store by reading OPeNDAP's DMR++ files and returning their metadata in a Zarr interface.
DMR++ files are planned to be generated on ingest 117 | 118 | Downloads 200 KB of data from the 2.6 MB file with conventional Zarr storage implementation. 119 | 120 | Result: 12 data requests, each of which goes through internet services, pre-signs a URL, and redirects to the data range. All sequentially. Slow. 121 | 122 | 123 | ```python 124 | %%time 125 | from unoptimized_zarr_store import Store 126 | import zarr 127 | 128 | f = zarr.open(Store(url_root + 'f16_ssmis_20051022v7.nc')) 129 | aoi_data = f['atmosphere_water_vapor_content'][rss_aoi] 130 | show(np.where(aoi_data < RSS_NODATA, aoi_data * RSS_SCALE_FACTOR, 0), transpose=False) 131 | ``` 132 | 133 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1455912:1465233] (9321 bytes) 134 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1465240:1472085] (6845 bytes) 135 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1472088:1479515] (7427 bytes) 136 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1479520:1488808] (9288 bytes) 137 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1562808:1564995] (2187 bytes) 138 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1565000:1572245] (7245 bytes) 139 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1572248:1582809] (10561 bytes) 140 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1582816:1593902] (11086 bytes) 141 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1635624:1636392] (768 bytes) 142 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1636392:1639400] (3008 bytes) 143 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1639400:1645720] (6320 bytes) 144 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1645720:1654949] (9229 bytes) 145 | CPU times: user 246 ms, sys: 45.5 ms, total: 292 ms 146 | Wall time: 39.3 s 147 | 148 | 149 | 150 | ![png](images/output_5_1.png) 151 | 152 | 153 | ### Partial Access Step 2 - Make Zarr reads fast 154 | 155 | Downloads 200 KB of data from the 2.6 MB file with Zarr optimizations: 156 | 1. (Working with Zarr community) Implement "getitems" concept, allowing storage to know all of the chunks that will be accessed up front 157 | 2. Combine nearby range requests into single HTTP requests before sending them, allowing fewer requests. 158 | 3. Cache presigned URLs returned by the archive for a short time, as directed by caching headers (TEA has a ticket to add these), allowing reuse and avoiding many round-trips and redirects 159 | 4. Run the first data range request serially to get the presigned URL. Run subsequent requests in parallel. 160 | 161 | Result: 3 data requests, one of which goes through internet services, pre-signs a URL, and redirects to the data range. The following two reuse the signed URL and fetch in parallel. Faster! 162 | 163 | When more than a couple of chunks are involved, this is expected to be faster than the native Zarr S3 format is capable of, and the more chunks involved in a read the more it improves. 
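
To make optimization 2 above concrete, here is a minimal, self-contained sketch of coalescing nearby byte ranges into fewer HTTP range requests. It is illustrative only: the `merge_ranges` name and the 10 KB gap threshold are assumptions rather than the actual eosdis-zarr-store API, and the sample ranges are simply the twelve chunk reads printed in Step 1 above.

```python
# Hypothetical sketch of optimization 2: coalescing nearby byte ranges so that
# several chunk reads can be served by a single HTTP range request. The function
# name and the 10 KB gap threshold are illustrative assumptions.

def merge_ranges(ranges, max_gap=10_000):
    """Merge (start, end) byte ranges whose gaps are at most max_gap bytes."""
    merged = []
    for start, end in sorted(ranges):
        if merged and start - merged[-1][1] <= max_gap:
            # Close enough to the previous range: extend it rather than
            # issuing a separate request.
            merged[-1] = (merged[-1][0], max(merged[-1][1], end))
        else:
            merged.append((start, end))
    return merged

# The twelve individual chunk reads from Step 1 collapse into three requests,
# matching the "Merged 12 requests into 3" output shown below.
step1_reads = [
    (1455912, 1465233), (1465240, 1472085), (1472088, 1479515), (1479520, 1488808),
    (1562808, 1564995), (1565000, 1572245), (1572248, 1582809), (1582816, 1593902),
    (1635624, 1636392), (1636392, 1639400), (1639400, 1645720), (1645720, 1654949),
]
print(merge_ranges(step1_reads))
# [(1455912, 1488808), (1562808, 1593902), (1635624, 1654949)]
```

Each merged range can then be fetched with a single `Range` request, and all but the first can reuse the cached presigned URL and run in parallel (optimizations 3 and 4).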
164 | 165 | 166 | ```python 167 | %%time 168 | from eosdis_zarr_store import Store 169 | import zarr 170 | 171 | f = zarr.open(Store(url_root + 'f16_ssmis_20051022v7.nc')) 172 | aoi_data = f['atmosphere_water_vapor_content'][rss_aoi] 173 | show(np.where(aoi_data < RSS_NODATA, aoi_data * RSS_SCALE_FACTOR, 0), transpose=False) 174 | ``` 175 | 176 | Starting new range due to gap of 74000 bytes 177 | Starting new range due to gap of 41722 bytes 178 | Merged 12 requests into 3 179 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1455912:1488808] (32896 bytes) 180 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1562808:1593902] (31094 bytes) 181 | Reading https://example.earthdata.nasa.gov/example-staging-url/f16_ssmis_20051022v7.nc [1635624:1654949] (19325 bytes) 182 | CPU times: user 137 ms, sys: 19.9 ms, total: 156 ms 183 | Wall time: 17.3 s 184 | 185 | 186 | 187 | ![png](images/output_7_1.png) 188 | 189 | 190 | ## Problem 2: Rain along the East Coast on Patrick's wedding day 191 | 192 | With the same bounding box above, get half-hourly high-quality precipitation values from GPM and sum them for the entire day (48 L3 global data files) 193 | 194 | ### Without Partial Access 195 | 196 | Download approximately 500 MB of data in whole files and process them 197 | 198 | 199 | ```python 200 | %%time 201 | from h5py import File as H5File 202 | import requests 203 | from io import BytesIO 204 | 205 | result = np.zeros(gpm_shape) 206 | for url in track(data_urls): 207 | response = requests.get(url) 208 | with H5File(BytesIO(response.content), 'r') as f: 209 | aoi_data = f['Grid/HQprecipitation'][gpm_aoi] 210 | result = result + np.where(aoi_data != GPM_NODATA, aoi_data / 2, 0) 211 | show(result) 212 | ``` 213 | 214 | 215 |
216 | 217 | 100% 218 | 48/48 219 | [05:55<00:06, 7.39s/it]
220 | 221 | 222 | CPU times: user 8.51 s, sys: 3 s, total: 11.5 s 223 | Wall time: 5min 54s 224 | 225 | 226 | 227 | ![png](images/output_9_2.png) 228 | 229 | 230 | ### With the EOSDIS Zarr Store 231 | 232 | Downloads approximately 5 MB of data by doing partial reads in fewer lines of code 233 | 234 | 235 | ```python 236 | %%time 237 | from eosdis_zarr_store import Store 238 | import zarr 239 | 240 | result = np.zeros(gpm_shape) 241 | for url in track(data_urls): 242 | f = zarr.open(Store(url, quiet=True)) 243 | aoi_data = f['Grid/HQprecipitation'][gpm_aoi] 244 | result = result + np.where(aoi_data != GPM_NODATA, aoi_data / 2, 0) 245 | show(result) 246 | ``` 247 | 248 | 249 |
250 | 251 | 100% 252 | 48/48 253 | [03:58<00:05, 4.96s/it]
254 | 255 | 256 | CPU times: user 1.72 s, sys: 185 ms, total: 1.91 s 257 | Wall time: 3min 57s 258 | 259 | 260 | 261 | ![png](images/output_12_2.png) 262 | 263 | 264 | ### Comparison to L3 Daily Average Product 265 | 266 | Download a 30 MB file from the daily average collection to produce a similar result, validating the result at 6x egress cost of partial access for all of the half-hourly source files. 267 | 268 | 269 | ```python 270 | %%time 271 | from h5py import File as H5File 272 | import requests 273 | from io import BytesIO 274 | 275 | response = requests.get(url_root + '3B-DAY.MS.MRG.3IMERG.20051022-S000000-E235959.V06.nc4') 276 | with H5File(BytesIO(response.content), 'r') as f: 277 | show(f['HQprecipitation'][gpm_aoi]) 278 | ``` 279 | 280 | CPU times: user 415 ms, sys: 187 ms, total: 602 ms 281 | Wall time: 11.2 s 282 | 283 | 284 | 285 | ![png](images/output_15_1.png) 286 | 287 | 288 | ## I can see my house from here! 289 | 290 | Download GEDI L2B data. Use small geolocation arrays to find the area of interest, then download only the data within those chunks. 291 | 292 | A full file download is 1.3 GB. The code below downloads approximately 15 MB of data and metadata. This reduces a 15 minute download to about 8s. (Aside: the download is 2/3 metadata, which could be dramatically reduced by using Zarr's default format rather than DMR++) 293 | 294 | 295 | ```python 296 | from eosdis_zarr_store import Store 297 | import zarr 298 | import numpy as np 299 | 300 | url = 'https://example.earthdata.nasa.gov/example-staging-url/GEDI02_B_2019182140038_O03117_T05635_02_001_01.h5' 301 | f = zarr.open(Store(url)) 302 | print(f.tree()) 303 | ``` 304 | 305 | / 306 | ├── BEAM0000 307 | │ ├── algorithmrun_flag (238914,) uint8 308 | │ ├── ancillary 309 | │ │ ├── dz (1,) float64 310 | │ │ ├── maxheight_cuttoff (1,) float64 311 | │ │ ├── rg_eg_constraint_center_buffer (1,) int32 312 | │ │ ├── rg_eg_mpfit_max_func_evals (1,) uint16 313 | │ │ ├── rg_eg_mpfit_maxiters (1,) uint16 314 | │ │ ├── rg_eg_mpfit_tolerance (1,) float64 315 | │ │ ├── signal_search_buff (1,) float64 316 | │ │ └── tx_noise_stddev_multiplier (1,) float64 317 | │ ├── beam (238914,) uint16 318 | │ ├── channel (238914,) uint8 319 | │ ├── cover (238914,) float32 320 | │ ├── cover_z (238914, 30) float32 321 | │ ├── fhd_normal (238914,) float32 322 | │ ├── geolocation 323 | │ │ ├── degrade_flag (238914,) int16 324 | │ │ ├── delta_time (238914,) float64 325 | │ │ ├── digital_elevation_model (238914,) float32 326 | │ │ ├── elev_highestreturn (238914,) float32 327 | │ │ ├── elev_lowestmode (238914,) float32 328 | │ │ ├── elevation_bin0 (238914,) float64 329 | │ │ ├── elevation_bin0_error (238914,) float32 330 | │ │ ├── elevation_lastbin (238914,) float64 331 | │ │ ├── elevation_lastbin_error (238914,) float32 332 | │ │ ├── height_bin0 (238914,) float32 333 | │ │ ├── height_lastbin (238914,) float32 334 | │ │ ├── lat_highestreturn (238914,) float64 335 | │ │ ├── lat_lowestmode (238914,) float64 336 | │ │ ├── latitude_bin0 (238914,) float64 337 | │ │ ├── latitude_bin0_error (238914,) float32 338 | │ │ ├── latitude_lastbin (238914,) float64 339 | │ │ ├── latitude_lastbin_error (238914,) float32 340 | │ │ ├── local_beam_azimuth (238914,) float32 341 | │ │ ├── local_beam_elevation (238914,) float32 342 | │ │ ├── lon_highestreturn (238914,) float64 343 | │ │ ├── lon_lowestmode (238914,) float64 344 | │ │ ├── longitude_bin0 (238914,) float64 345 | │ │ ├── longitude_bin0_error (238914,) float32 346 | │ │ ├── longitude_lastbin (238914,) float64 347 
| │ │ ├── longitude_lastbin_error (238914,) float32 348 | │ │ ├── solar_azimuth (238914,) float32 349 | │ │ └── solar_elevation (238914,) float32 350 | │ ├── l2a_quality_flag (238914,) uint8 351 | │ ├── l2b_quality_flag (238914,) uint8 352 | │ ├── land_cover_data 353 | │ │ ├── landsat_treecover (238914,) float64 354 | │ │ ├── modis_nonvegetated (238914,) float64 355 | │ │ ├── modis_nonvegetated_sd (238914,) float64 356 | │ │ ├── modis_treecover (238914,) float64 357 | │ │ └── modis_treecover_sd (238914,) float64 358 | │ ├── master_frac (238914,) float64 359 | │ ├── master_int (238914,) uint32 360 | │ ├── num_detectedmodes (238914,) uint8 361 | │ ├── omega (238914,) float32 362 | │ ├── pai (238914,) float32 363 | │ ├── pai_z (238914, 30) float32 364 | │ ├── pavd_z (238914, 30) float32 365 | │ ├── pgap_theta (238914,) float32 366 | │ ├── pgap_theta_error (238914,) float32 367 | │ ├── pgap_theta_z (7926559,) float32 368 | │ ├── rg (238914,) float32 369 | │ ├── rh100 (238914,) int16 370 | │ ├── rhog (238914,) float32 371 | │ ├── rhog_error (238914,) float32 372 | │ ├── rhov (238914,) float32 373 | │ ├── rhov_error (238914,) float32 374 | │ ├── rossg (238914,) float32 375 | │ ├── rv (238914,) float32 376 | │ ├── rx_processing 377 | │ │ ├── algorithmrun_flag_a1 (238914,) uint8 378 | │ │ ├── algorithmrun_flag_a2 (238914,) uint8 379 | │ │ ├── algorithmrun_flag_a3 (238914,) uint8 380 | │ │ ├── algorithmrun_flag_a4 (238914,) uint8 381 | │ │ ├── algorithmrun_flag_a5 (238914,) uint8 382 | │ │ ├── algorithmrun_flag_a6 (238914,) uint8 383 | │ │ ├── pgap_theta_a1 (238914,) float32 384 | │ │ ├── pgap_theta_a2 (238914,) float32 385 | │ │ ├── pgap_theta_a3 (238914,) float32 386 | │ │ ├── pgap_theta_a4 (238914,) float32 387 | │ │ ├── pgap_theta_a5 (238914,) float32 388 | │ │ ├── pgap_theta_a6 (238914,) float32 389 | │ │ ├── pgap_theta_error_a1 (238914,) float32 390 | │ │ ├── pgap_theta_error_a2 (238914,) float32 391 | │ │ ├── pgap_theta_error_a3 (238914,) float32 392 | │ │ ├── pgap_theta_error_a4 (238914,) float32 393 | │ │ ├── pgap_theta_error_a5 (238914,) float32 394 | │ │ ├── pgap_theta_error_a6 (238914,) float32 395 | │ │ ├── rg_a1 (238914,) float32 396 | │ │ ├── rg_a2 (238914,) float32 397 | │ │ ├── rg_a3 (238914,) float32 398 | │ │ ├── rg_a4 (238914,) float32 399 | │ │ ├── rg_a5 (238914,) float32 400 | │ │ ├── rg_a6 (238914,) float32 401 | │ │ ├── rg_eg_amplitude_a1 (238914,) float32 402 | │ │ ├── rg_eg_amplitude_a2 (238914,) float32 403 | │ │ ├── rg_eg_amplitude_a3 (238914,) float32 404 | │ │ ├── rg_eg_amplitude_a4 (238914,) float32 405 | │ │ ├── rg_eg_amplitude_a5 (238914,) float32 406 | │ │ ├── rg_eg_amplitude_a6 (238914,) float32 407 | │ │ ├── rg_eg_amplitude_error_a1 (238914,) float32 408 | │ │ ├── rg_eg_amplitude_error_a2 (238914,) float32 409 | │ │ ├── rg_eg_amplitude_error_a3 (238914,) float32 410 | │ │ ├── rg_eg_amplitude_error_a4 (238914,) float32 411 | │ │ ├── rg_eg_amplitude_error_a5 (238914,) float32 412 | │ │ ├── rg_eg_amplitude_error_a6 (238914,) float32 413 | │ │ ├── rg_eg_center_a1 (238914,) float32 414 | │ │ ├── rg_eg_center_a2 (238914,) float32 415 | │ │ ├── rg_eg_center_a3 (238914,) float32 416 | │ │ ├── rg_eg_center_a4 (238914,) float32 417 | │ │ ├── rg_eg_center_a5 (238914,) float32 418 | │ │ ├── rg_eg_center_a6 (238914,) float32 419 | │ │ ├── rg_eg_center_error_a1 (238914,) float32 420 | │ │ ├── rg_eg_center_error_a2 (238914,) float32 421 | │ │ ├── rg_eg_center_error_a3 (238914,) float32 422 | │ │ ├── rg_eg_center_error_a4 (238914,) float32 423 | │ │ ├── rg_eg_center_error_a5 
(238914,) float32 424 | │ │ ├── rg_eg_center_error_a6 (238914,) float32 425 | │ │ ├── rg_eg_chisq_a1 (238914,) float32 426 | │ │ ├── rg_eg_chisq_a2 (238914,) float32 427 | │ │ ├── rg_eg_chisq_a3 (238914,) float32 428 | │ │ ├── rg_eg_chisq_a4 (238914,) float32 429 | │ │ ├── rg_eg_chisq_a5 (238914,) float32 430 | │ │ ├── rg_eg_chisq_a6 (238914,) float32 431 | │ │ ├── rg_eg_flag_a1 (238914,) int16 432 | │ │ ├── rg_eg_flag_a2 (238914,) int16 433 | │ │ ├── rg_eg_flag_a3 (238914,) int16 434 | │ │ ├── rg_eg_flag_a4 (238914,) int16 435 | │ │ ├── rg_eg_flag_a5 (238914,) int16 436 | │ │ ├── rg_eg_flag_a6 (238914,) int16 437 | │ │ ├── rg_eg_gamma_a1 (238914,) float32 438 | │ │ ├── rg_eg_gamma_a2 (238914,) float32 439 | │ │ ├── rg_eg_gamma_a3 (238914,) float32 440 | │ │ ├── rg_eg_gamma_a4 (238914,) float32 441 | │ │ ├── rg_eg_gamma_a5 (238914,) float32 442 | │ │ ├── rg_eg_gamma_a6 (238914,) float32 443 | │ │ ├── rg_eg_gamma_error_a1 (238914,) float32 444 | │ │ ├── rg_eg_gamma_error_a2 (238914,) float32 445 | │ │ ├── rg_eg_gamma_error_a3 (238914,) float32 446 | │ │ ├── rg_eg_gamma_error_a4 (238914,) float32 447 | │ │ ├── rg_eg_gamma_error_a5 (238914,) float32 448 | │ │ ├── rg_eg_gamma_error_a6 (238914,) float32 449 | │ │ ├── rg_eg_niter_a1 (238914,) uint8 450 | │ │ ├── rg_eg_niter_a2 (238914,) uint8 451 | │ │ ├── rg_eg_niter_a3 (238914,) uint8 452 | │ │ ├── rg_eg_niter_a4 (238914,) uint8 453 | │ │ ├── rg_eg_niter_a5 (238914,) uint8 454 | │ │ ├── rg_eg_niter_a6 (238914,) uint8 455 | │ │ ├── rg_eg_sigma_a1 (238914,) float32 456 | │ │ ├── rg_eg_sigma_a2 (238914,) float32 457 | │ │ ├── rg_eg_sigma_a3 (238914,) float32 458 | │ │ ├── rg_eg_sigma_a4 (238914,) float32 459 | │ │ ├── rg_eg_sigma_a5 (238914,) float32 460 | │ │ ├── rg_eg_sigma_a6 (238914,) float32 461 | │ │ ├── rg_eg_sigma_error_a1 (238914,) float32 462 | │ │ ├── rg_eg_sigma_error_a2 (238914,) float32 463 | │ │ ├── rg_eg_sigma_error_a3 (238914,) float32 464 | │ │ ├── rg_eg_sigma_error_a4 (238914,) float32 465 | │ │ ├── rg_eg_sigma_error_a5 (238914,) float32 466 | │ │ ├── rg_eg_sigma_error_a6 (238914,) float32 467 | │ │ ├── rg_error_a1 (238914,) float32 468 | │ │ ├── rg_error_a2 (238914,) float32 469 | │ │ ├── rg_error_a3 (238914,) float32 470 | │ │ ├── rg_error_a4 (238914,) float32 471 | │ │ ├── rg_error_a5 (238914,) float32 472 | │ │ ├── rg_error_a6 (238914,) float32 473 | │ │ ├── rv_a1 (238914,) float32 474 | │ │ ├── rv_a2 (238914,) float32 475 | │ │ ├── rv_a3 (238914,) float32 476 | │ │ ├── rv_a4 (238914,) float32 477 | │ │ ├── rv_a5 (238914,) float32 478 | │ │ ├── rv_a6 (238914,) float32 479 | │ │ ├── rx_energy_a1 (238914,) float32 480 | │ │ ├── rx_energy_a2 (238914,) float32 481 | │ │ ├── rx_energy_a3 (238914,) float32 482 | │ │ ├── rx_energy_a4 (238914,) float32 483 | │ │ ├── rx_energy_a5 (238914,) float32 484 | │ │ └── rx_energy_a6 (238914,) float32 485 | │ ├── rx_range_highestreturn (238914,) float64 486 | │ ├── selected_l2a_algorithm (238914,) uint8 487 | │ ├── selected_rg_algorithm (238914,) uint8 488 | │ ├── sensitivity (238914,) float32 489 | │ ├── stale_return_flag (238914,) uint8 490 | │ └── surface_flag (238914,) uint8 491 | ==== 1000 lines removed for brevity, see commit history ==== 492 | └── METADATA 493 | 494 | 495 | 496 | ```python 497 | n, w, s, e = [40.2, -75.25, 40.15, -75.2] 498 | 499 | geoloc = f['BEAM0000/geolocation'] 500 | all_lats = geoloc['latitude_bin0'][:] 501 | all_lons = geoloc['longitude_bin0'][:] 502 | valid_lat_i = np.where(np.logical_and(all_lats >= s, all_lats <= n)) 503 | valid_lon_i = 
np.where(np.logical_and(all_lons >= w, all_lons <= e)) 504 | indices = np.intersect1d(valid_lat_i, valid_lon_i) 505 | 506 | lats = all_lats[indices] 507 | lons = all_lons[indices] 508 | data = f['BEAM0000/cover'][:][indices] 509 | data_i = np.where(data != -9999) 510 | data = data[data_i] 511 | lats = lats[data_i] 512 | lons = lons[data_i] 513 | 514 | ambler = plt.imread('ambler.png') 515 | fig, ax = plt.subplots(figsize=(10,10)) 516 | ax.scatter(lons, lats, s=50, c=data, cmap='Greens') 517 | ax.set_xlim(w, e) 518 | ax.set_ylim(s, n) 519 | ax.imshow(ambler, zorder=0, extent = [w, e, s, n], aspect='equal') 520 | ``` 521 | 522 | Merged 17 requests into 1 523 | Reading https://example.earthdata.nasa.gov/example-staging-url/GEDI02_B_2019182140038_O03117_T05635_02_001_01.h5 [35434732:36859543] (1424811 bytes) 524 | Merged 17 requests into 1 525 | Reading https://example.earthdata.nasa.gov/example-staging-url/GEDI02_B_2019182140038_O03117_T05635_02_001_01.h5 [43931476:45340903] (1409427 bytes) 526 | Merged 17 requests into 1 527 | Reading https://example.earthdata.nasa.gov/example-staging-url/GEDI02_B_2019182140038_O03117_T05635_02_001_01.h5 [12035:442316] (430281 bytes) 528 | 529 | 530 | 531 | 532 | 533 | 534 | 535 | 536 | 537 | 538 | ![png](images/output_18_2.png) 539 | 540 | 541 | ## Why is it sometimes slower? 542 | 543 | ![png](images/request-overhead.png) 544 | 545 | We pay a penalty for every new file we access, needing to go over the Internet, through the Internet services stack, the request signing process, and ultimately get redirected to S3. The Zarr store has to pay this penalty twice to read the metadata and then the file, while a full-file download only pays the penalty once. With current performance, the break-even point in file size is about 10 MB. That is to say, if a user wants to access even a tiny amount of data in each granule from a collection whose granules are under 10 MB in size, he or she is better off downloading the granules. While there is some uncontrollable overhead, there is significant room for improvement in areas that are under our control to promote inexpensive access patterns while improving time to science. 546 | 547 | ## Conclusions 548 | 549 | * If providers generate DMR++ on ingest, we can expose our data efficiently using a Python API that is gaining increasing traction, particularly in the Pangeo community, with minimal storage overhead 550 | * Works out of the cloud, but works even better / faster in the cloud for analysis near data 551 | * For partial access cases, an overall egress reduction of 90% or more could be possible, as demonstrated 552 | * Chunking matters. This work makes smaller chunks more desirable, which has not historically been the case with Zarr 553 | * Overhead in our stack, from EDL to Internet services to redirects, is eating up the potential user savings. At a 90% egress reduction, we struggle to compete with "Just download everything." How do we balance preventing undesirable behavior with encouraging desirable behavior? 554 | * There are lingering questions about whether DMR++ is the correct format to capture this metadata in. Zarr's native format is in many cases more complete and easier to parse while having mechanisms for more easily working with the 100,000-ish chunks in GEDI granules and for unifying multiple granules into a coherent view. 555 | 556 | ## Limitations / Needs 557 | 558 | * The DMR++ file must be generated on ingest into the cloud, which is currently optional 559 | * Only works on HDF5 and NetCDF4 files.
In principle, it could work on HDF4 / NetCDF Classic files but nothing yet generates the necessary metadata 560 | * DMR++ does not quite specify everything we could need for some datasets. We assume little endian byte order and column-major ordering. 561 | 562 | ## Future Work 563 | 564 | * Packaging, unit tests, and docs sufficient for publication 565 | * Open source (relies on a naming decision) 566 | * Cache repeated calls for the same byte ranges to avoid requerying data we have 567 | * Implement unknown / undocumented areas of the DMR++ spec, including compression types and data filters 568 | * Tests with Dask and XArray 569 | * Implement CF conventions to populate fill values, offsets, scales, etc 570 | * Extensions to present L3 global collections as a coherent data cube 571 | 572 | I strongly believe in this access pattern as a win for our users and ourselves. To the extent it is not fully realized, it suffers from being an early adopter of our cloud access stack. My sincere hope is that we can learn from it to improve partial file access not only here but in other tools and libraries. 573 | -------------------------------------------------------------------------------- /tests/fixtures/20200911000001-JPL-L2P_GHRSST-SSTskin-MODIS_A-N-v02.0-fv01.0.nc.dmrpp: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 10m wind speed 12 | 13 | 14 | wind_speed 15 | 16 | 17 | m s-1 18 | 19 | 20 | -128 21 | 22 | 23 | -127 24 | 25 | 26 | 127 27 | 28 | 29 | Wind at 10 meters above the sea surface 30 | 31 | 32 | 0.2000000030 33 | 34 | 35 | 25.00000000 36 | 37 | 38 | TBD. Placeholder. Currently empty 39 | 40 | 41 | TBD 42 | 43 | 44 | 2.000000000 45 | 46 | 47 | 10 m 48 | 49 | 50 | auxiliaryInformation 51 | 52 | 53 | wind_speed 54 | 55 | 56 | /wind_speed 57 | 58 | 59 | time lat lon 60 | 61 | 62 | 1 1015 677 63 | 64 | 65 | 66 | 67 | 68 | 69 | 70 | 71 | 72 | 73 | 74 | SSES standard deviation error based on proximity confidence flags 75 | 76 | 77 | kelvin 78 | 79 | 80 | -128 81 | 82 | 83 | -127 84 | 85 | 86 | 127 87 | 88 | 89 | thermal IR SST standard deviation error; signed byte array: WARNING Some applications are unable to properly handle signed byte values. 
If values are encountered > 127, please subtract 256 from this reported value 90 | 91 | 92 | 0.07874015719 93 | 94 | 95 | 10.00000000 96 | 97 | 98 | auxiliaryInformation 99 | 100 | 101 | sses_standard_deviation 102 | 103 | 104 | /sses_standard_deviation 105 | 106 | 107 | time lat lon 108 | 109 | 110 | 1 1015 677 111 | 112 | 113 | 114 | 115 | 116 | 117 | 118 | 119 | 120 | 121 | 122 | time difference from reference time 123 | 124 | 125 | seconds 126 | 127 | 128 | -32768 129 | 130 | 131 | -32767 132 | 133 | 134 | 32767 135 | 136 | 137 | time plus sst_dtime gives seconds after 00:00:00 UTC January 1, 1981 138 | 139 | 140 | referenceInformation 141 | 142 | 143 | sst_dtime 144 | 145 | 146 | /sst_dtime 147 | 148 | 149 | time lat lon 150 | 151 | 152 | 1 1015 677 153 | 154 | 155 | 156 | 157 | 158 | 159 | 160 | 161 | 162 | 163 | 164 | L2P flags 165 | 166 | 167 | 0 168 | 169 | 170 | 16 171 | 172 | 173 | These flags can be used to further filter data variables 174 | 175 | 176 | microwave land ice lake river 177 | 178 | 179 | 1 180 | 2 181 | 4 182 | 8 183 | 16 184 | 185 | 186 | qualityInformation 187 | 188 | 189 | l2p_flags 190 | 191 | 192 | /l2p_flags 193 | 194 | 195 | time lat lon 196 | 197 | 198 | 1 1015 677 199 | 200 | 201 | 202 | 203 | 204 | 205 | 206 | 207 | 208 | 209 | 210 | sea surface temperature 211 | 212 | 213 | sea_surface_skin_temperature 214 | 215 | 216 | kelvin 217 | 218 | 219 | -32767 220 | 221 | 222 | -1000 223 | 224 | 225 | 10000 226 | 227 | 228 | sea surface temperature from thermal IR (11 um) channels 229 | 230 | 231 | 0.004999999888 232 | 233 | 234 | 273.1499939 235 | 236 | 237 | NASA and University of Miami 238 | 239 | 240 | physicalMeasurement 241 | 242 | 243 | sea_surface_temperature 244 | 245 | 246 | /sea_surface_temperature 247 | 248 | 249 | time lat lon 250 | 251 | 252 | 1 1015 677 253 | 254 | 255 | 256 | 257 | 258 | 259 | 260 | 261 | 262 | 263 | 264 | quality level of SST pixel 265 | 266 | 267 | -128 268 | 269 | 270 | 0 271 | 272 | 273 | 5 274 | 275 | 276 | thermal IR SST proximity confidence value; signed byte array: WARNING Some applications are unable to properly handle signed byte values. If values are encountered > 127, please subtract 256 from this reported value 277 | 278 | 279 | 0 280 | 1 281 | 2 282 | 3 283 | 4 284 | 5 285 | 286 | 287 | no_data bad_data worst_quality low_quality acceptable_quality best_quality 288 | 289 | 290 | qualityInformation 291 | 292 | 293 | quality_level 294 | 295 | 296 | /quality_level 297 | 298 | 299 | time lat lon 300 | 301 | 302 | 1 1015 677 303 | 304 | 305 | 306 | 307 | 308 | 309 | 310 | 311 | 312 | 313 | 314 | deviation from SST reference climatology 315 | 316 | 317 | kelvin 318 | 319 | 320 | -128 321 | 322 | 323 | -127 324 | 325 | 326 | 127 327 | 328 | 329 | TBD 330 | 331 | 332 | 0.1000000015 333 | 334 | 335 | 0.000000000 336 | 337 | 338 | TBD. Placeholder. Currently empty 339 | 340 | 341 | auxiliaryInformation 342 | 343 | 344 | dt_analysis 345 | 346 | 347 | /dt_analysis 348 | 349 | 350 | time lat lon 351 | 352 | 353 | 1 1015 677 354 | 355 | 356 | 357 | 358 | 359 | 360 | 361 | 362 | 363 | 364 | 365 | SSES standard deviation error based on proximity confidence flags 366 | 367 | 368 | kelvin 369 | 370 | 371 | -128 372 | 373 | 374 | -127 375 | 376 | 377 | 127 378 | 379 | 380 | mid-IR SST standard deviation error; non L2P core field; signed byte array: WARNING Some applications are unable to properly handle signed byte values. 
If values are encountered > 127, please subtract 256 from this reported value 381 | 382 | 383 | 0.07874015719 384 | 385 | 386 | 10.00000000 387 | 388 | 389 | auxiliaryInformation 390 | 391 | 392 | sses_standard_deviation_4um 393 | 394 | 395 | /sses_standard_deviation_4um 396 | 397 | 398 | time lat lon 399 | 400 | 401 | 1 1015 677 402 | 403 | 404 | 405 | 406 | 407 | 408 | 409 | 410 | 411 | 412 | 413 | SSES bias error based on proximity confidence flags 414 | 415 | 416 | kelvin 417 | 418 | 419 | -128 420 | 421 | 422 | -127 423 | 424 | 425 | 127 426 | 427 | 428 | mid-IR SST bias error; non L2P core field; signed byte array: WARNING Some applications are unable to properly handle signed byte values. If values are encountered > 127, please subtract 256 from this reported value 429 | 430 | 431 | 0.1574803144 432 | 433 | 434 | 0.000000000 435 | 436 | 437 | auxiliaryInformation 438 | 439 | 440 | sses_bias_4um 441 | 442 | 443 | /sses_bias_4um 444 | 445 | 446 | time lat lon 447 | 448 | 449 | 1 1015 677 450 | 451 | 452 | 453 | 454 | 455 | 456 | 457 | 458 | 459 | 460 | 461 | SSES bias error based on proximity confidence flags 462 | 463 | 464 | kelvin 465 | 466 | 467 | -128 468 | 469 | 470 | -127 471 | 472 | 473 | 127 474 | 475 | 476 | thermal IR SST bias error; signed byte array: WARNING Some applications are unable to properly handle signed byte values. If values are encountered > 127, please subtract 256 from this reported value 477 | 478 | 479 | 0.1574803144 480 | 481 | 482 | 0.000000000 483 | 484 | 485 | auxiliaryInformation 486 | 487 | 488 | sses_bias 489 | 490 | 491 | /sses_bias 492 | 493 | 494 | time lat lon 495 | 496 | 497 | 1 1015 677 498 | 499 | 500 | 501 | 502 | 503 | 504 | 505 | 506 | 507 | 508 | 509 | sea surface temperature 510 | 511 | 512 | kelvin 513 | 514 | 515 | -32767 516 | 517 | 518 | -1000 519 | 520 | 521 | 10000 522 | 523 | 524 | sea surface temperature from mid-IR (4 um) channels; non L2P core field 525 | 526 | 527 | 0.004999999888 528 | 529 | 530 | 273.1499939 531 | 532 | 533 | physicalMeasurement 534 | 535 | 536 | sea_surface_temperature_4um 537 | 538 | 539 | /sea_surface_temperature_4um 540 | 541 | 542 | time lat lon 543 | 544 | 545 | 1 1015 677 546 | 547 | 548 | 549 | 550 | 551 | 552 | 553 | 554 | 555 | 556 | 557 | quality level of SST pixel 558 | 559 | 560 | -128 561 | 562 | 563 | 0 564 | 565 | 566 | 5 567 | 568 | 569 | mid-IR SST proximity confidence value; non L2P core field; signed byte array: WARNING Some applications are unable to properly handle signed byte values. 
If values are encountered > 127, please subtract 256 from this reported value 570 | 571 | 572 | 0 573 | 1 574 | 2 575 | 3 576 | 4 577 | 5 578 | 579 | 580 | no_data bad_data worst_quality low_quality acceptable_quality best_quality 581 | 582 | 583 | qualityInformation 584 | 585 | 586 | quality_level_4um 587 | 588 | 589 | /quality_level_4um 590 | 591 | 592 | time lat lon 593 | 594 | 595 | 1 1015 677 596 | 597 | 598 | 599 | 600 | 601 | 602 | 603 | 604 | 605 | reference time of sst file 606 | 607 | 608 | time 609 | 610 | 611 | seconds since 1981-01-01 00:00:00 612 | 613 | 614 | time of first sensor observation 615 | 616 | 617 | coordinate 618 | 619 | 620 | time 621 | 622 | 623 | /time 624 | 625 | 626 | 1 627 | 628 | 629 | 630 | 631 | 632 | 633 | 634 | latitude 635 | 636 | 637 | latitude 638 | 639 | 640 | degrees_north 641 | 642 | 643 | -999.0000000 644 | 645 | 646 | -90.00000000 647 | 648 | 649 | 90.00000000 650 | 651 | 652 | geographical coordinates, WGS84 projection 653 | 654 | 655 | coordinate 656 | 657 | 658 | lat 659 | 660 | 661 | /lat 662 | 663 | 664 | 1015 677 665 | 666 | 667 | 668 | 669 | 670 | 671 | 672 | 673 | 674 | 675 | longitude 676 | 677 | 678 | longitude 679 | 680 | 681 | degrees_east 682 | 683 | 684 | -999.0000000 685 | 686 | 687 | -180.0000000 688 | 689 | 690 | 180.0000000 691 | 692 | 693 | geographical coordinates, WGS84 projection 694 | 695 | 696 | coordinate 697 | 698 | 699 | lon 700 | 701 | 702 | /lon 703 | 704 | 705 | 1015 677 706 | 707 | 708 | 709 | 710 | 711 | 712 | 713 | 714 | CF-1.7, ACDD-1.3 715 | 716 | 717 | MODIS Aqua L2P SST 718 | 719 | 720 | Sea surface temperature retrievals produced at the NASA OBPG for the MODIS Aqua sensor. These have been reformatted to GHRSST GDS specifications by the JPL PO.DAAC 721 | 722 | 723 | GHRSST Data Processing Specification v2r5 724 | 725 | 726 | NASA/JPL/OBPG/RSMAS 727 | 728 | 729 | MODIS L2P created at JPL PO.DAAC 730 | 731 | 732 | L2P Core without DT analysis or other ancillary fields; Night, Start Node:Descending, End Node:Descending; WARNING Some applications are unable to properly handle signed byte values. If values are encountered > 127, please subtract 256 from this reported value; Quicklook 733 | 734 | 735 | GHRSST and PO.DAAC protocol allow data use as free and open. 
736 | 737 | 738 | MODIS_A-JPL-L2P-v2019.0 739 | 740 | 741 | org.ghrsst 742 | 743 | 744 | 2019.0 745 | 746 | 747 | f6e1f61d-c4a4-4c17-8354-0c15e12d688b 748 | 749 | 750 | 2.0 751 | 752 | 753 | 4.1 754 | 755 | 756 | 20200911T024514Z 757 | 758 | 759 | 3 760 | 761 | 762 | 1km 763 | 764 | 765 | 20200911T000001Z 766 | 767 | 768 | 20200911T000001Z 769 | 770 | 771 | 20200911T000458Z 772 | 773 | 774 | 20200911T000458Z 775 | 776 | 777 | -36.22299957 778 | 779 | 780 | -57.91799927 781 | 782 | 783 | 31.05480003 784 | 785 | 786 | -7.165909767 787 | 788 | 789 | MODIS sea surface temperature observations for the OBPG 790 | 791 | 792 | Aqua 793 | 794 | 795 | MODIS 796 | 797 | 798 | http://podaac.jpl.nasa.gov/ws/metadata/dataset/?format=iso&shortName=MODIS_A-JPL-L2P-v2019.0 799 | 800 | 801 | Oceans > Ocean Temperature > Sea Surface Temperature 802 | 803 | 804 | NASA Global Change Master Directory (GCMD) Science Keywords 805 | 806 | 807 | NetCDF Climate and Forecast (CF) Metadata Convention 808 | 809 | 810 | degrees_north 811 | 812 | 813 | 0.009999999776 814 | 815 | 816 | degrees_east 817 | 818 | 819 | 0.009999999776 820 | 821 | 822 | The MODIS L2P sea surface temperature data are sponsored by NASA 823 | 824 | 825 | Ed Armstrong, JPL PO.DAAC 826 | 827 | 828 | edward.m.armstrong@jpl.nasa.gov 829 | 830 | 831 | http://podaac.jpl.nasa.gov 832 | 833 | 834 | Group for High Resolution Sea Surface Temperature 835 | 836 | 837 | The GHRSST Project Office 838 | 839 | 840 | http://www.ghrsst.org 841 | 842 | 843 | ghrsst-po@nceo.ac.uk 844 | 845 | 846 | L2P 847 | 848 | 849 | swath 850 | 851 | 852 | Descending 853 | 854 | 855 | Descending 856 | 857 | 858 | Night 859 | 860 | 861 | 862 | -------------------------------------------------------------------------------- /tests/fixtures/3B-HHR.MS.MRG.3IMERG.20051022-S000000-E002959.0000.V06B.zarr.json: -------------------------------------------------------------------------------- 1 | { 2 | ".zgroup": { 3 | "zarr_format": 2 4 | }, 5 | "Grid/precipitationQualityIndex/.zarray": { 6 | "zarr_format": 2, 7 | "filters": null, 8 | "order": "C", 9 | "dtype": "