├── .github └── workflows │ └── ci-test.yaml ├── .gitignore ├── LICENSE ├── README.md ├── docs ├── Makefile ├── make.bat ├── requirements.txt └── source │ ├── code.rst │ ├── conf.py │ ├── index.rst │ ├── logo-1.png │ ├── logo-1.svg │ ├── logo-2-dark.svg │ ├── logo-2-gray.svg │ ├── logo-2-white.svg │ ├── logo-2.png │ └── logo-2.svg ├── requirements.txt ├── setup.py ├── tests ├── __init__.py ├── test_pandas_typedframe.py └── test_polars_typedframe.py └── typedframe ├── __init__.py ├── base.py ├── pandas_.py └── polars_.py /.github/workflows/ci-test.yaml: -------------------------------------------------------------------------------- 1 | name: Tests 2 | 3 | on: [push] 4 | 5 | jobs: 6 | test_pandas: 7 | 8 | runs-on: ubuntu-latest 9 | strategy: 10 | fail-fast: false 11 | matrix: 12 | python-version: ["3.9"] 13 | pandas-version: ["1.2", "1.3", "1.4"] 14 | numpy-version: ["1.20", "1.21", "1.22"] 15 | 16 | steps: 17 | - uses: actions/checkout@v2 18 | - name: Set up Python ${{ matrix.python-version }} 19 | uses: actions/setup-python@v2 20 | with: 21 | python-version: ${{ matrix.python-version }} 22 | - name: Install dependencies 23 | run: | 24 | python -m pip install --upgrade pip 25 | python -m pip install numpy==${{ matrix.numpy-version }} 26 | python -m pip install pandas==${{ matrix.pandas-version }} 27 | python -m pip install flake8 pytest==6.2.4 28 | - name: Lint with flake8 29 | run: | 30 | # stop the build if there are Python syntax errors or undefined names 31 | flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics 32 | # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide 33 | flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics 34 | - name: Test with pytest 35 | run: | 36 | pytest tests/test_pandas_typedframe.py 37 | 38 | test_polars: 39 | 40 | runs-on: ubuntu-latest 41 | strategy: 42 | fail-fast: false 43 | matrix: 44 | python-version: [ "3.9" ] 45 | polars-version: [ "0.15"] 46 | pyarrow-version: [ "10.0" ] 47 | 48 | steps: 49 | - uses: actions/checkout@v2 50 | - name: Set up Python ${{ matrix.python-version }} 51 | uses: actions/setup-python@v2 52 | with: 53 | python-version: ${{ matrix.python-version }} 54 | - name: Install dependencies 55 | run: | 56 | python -m pip install --upgrade pip 57 | python -m pip install polars==${{ matrix.polars-version }} 58 | python -m pip install pyarrow==${{ matrix.pyarrow-version }} 59 | python -m pip install pytest==6.2.4 60 | - name: Test with pytest 61 | run: | 62 | pytest tests/test_polars_typedframe.py -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | build/ 12 | develop-eggs/ 13 | dist/ 14 | downloads/ 15 | eggs/ 16 | .eggs/ 17 | lib/ 18 | lib64/ 19 | parts/ 20 | sdist/ 21 | var/ 22 | wheels/ 23 | pip-wheel-metadata/ 24 | share/python-wheels/ 25 | *.egg-info/ 26 | .installed.cfg 27 | *.egg 28 | MANIFEST 29 | 30 | # PyInstaller 31 | # Usually these files are written by a python script from a template 32 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 
33 | *.manifest 34 | *.spec 35 | 36 | # Installer logs 37 | pip-log.txt 38 | pip-delete-this-directory.txt 39 | 40 | # Unit test / coverage reports 41 | htmlcov/ 42 | .tox/ 43 | .nox/ 44 | .coverage 45 | .coverage.* 46 | .cache 47 | nosetests.xml 48 | coverage.xml 49 | *.cover 50 | *.py,cover 51 | .hypothesis/ 52 | .pytest_cache/ 53 | 54 | # Translations 55 | *.mo 56 | *.pot 57 | 58 | # Django stuff: 59 | *.log 60 | local_settings.py 61 | db.sqlite3 62 | db.sqlite3-journal 63 | 64 | # Flask stuff: 65 | instance/ 66 | .webassets-cache 67 | 68 | # Scrapy stuff: 69 | .scrapy 70 | 71 | # Sphinx documentation 72 | docs/_build/ 73 | 74 | # PyBuilder 75 | target/ 76 | 77 | # Jupyter Notebook 78 | .ipynb_checkpoints 79 | 80 | # IPython 81 | profile_default/ 82 | ipython_config.py 83 | 84 | # pyenv 85 | .python-version 86 | 87 | # pipenv 88 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 89 | # However, in case of collaboration, if having platform-specific dependencies or dependencies 90 | # having no cross-platform support, pipenv may install dependencies that don't work, or not 91 | # install all needed dependencies. 92 | #Pipfile.lock 93 | 94 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow 95 | __pypackages__/ 96 | 97 | # Celery stuff 98 | celerybeat-schedule 99 | celerybeat.pid 100 | 101 | # SageMath parsed files 102 | *.sage.py 103 | 104 | # VS Code 105 | .vscode 106 | 107 | # Idea 108 | .idea 109 | 110 | # Environments 111 | .env 112 | .venv 113 | env/ 114 | venv/ 115 | ENV/ 116 | env.bak/ 117 | venv.bak/ 118 | 119 | # Spyder project settings 120 | .spyderproject 121 | .spyproject 122 | 123 | # Rope project settings 124 | .ropeproject 125 | 126 | # mkdocs documentation 127 | /site 128 | 129 | # mypy 130 | .mypy_cache/ 131 | .dmypy.json 132 | dmypy.json 133 | 134 | # Pyre type checker 135 | .pyre/ 136 | 137 | # Mac 138 | .DS_Store -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2021 Alexander Reshytko 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 
22 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | 2 | ![logo](./docs/source/logo-2-dark.svg#gh-dark-mode-only)![logo](./docs/source/logo-2.svg#gh-light-mode-only) 3 | 4 | --- 5 | 6 | # typedframe 7 | 8 | **Typed wrappers over pandas DataFrames with schema validation.** 9 | 10 | [![Tests](https://github.com/areshytko/typedframe/actions/workflows/ci-test.yaml/badge.svg)](https://github.com/areshytko/typedframe/actions/workflows/ci-test.yaml) 11 | 12 | `TypedDataFrame` is a lightweight wrapper over pandas `DataFrame` that provides runtime schema validation and can be used to establish strong data contracts between interfaces in your Python code. 13 | 14 | The goal of the library is to reveal and make explicit all unclear or forgotten assumptions about your DataFrame. 15 | 16 | Check [the Official Documentation](https://typedframe.readthedocs.io/en/latest/). 17 | 18 | ### Quickstart 19 | 20 | Install the typedframe library: 21 | ``` 22 | pip install typedframe 23 | ``` 24 | Assume an overly simplified preprocessing function like this: 25 | ```python 26 | def preprocess(df: pd.DataFrame) -> pd.DataFrame: 27 | df = df.copy() 28 | c1_min, c1_max = df['col1'].min(), df['col1'].max() 29 | df['col1'] = 0 if c1_min == c1_max else (df['col1'] - c1_min) / (c1_max - c1_min) 30 | df['month'] = df['date'].dt.month 31 | df['comment'] = df['comment'].str.lower() 32 | return df 33 | ``` 34 | To add `typedframe` schema support for this transformation we will define two schema classes - one for the input and one for the output: 35 | ```python 36 | import numpy as np 37 | from typedframe import TypedDataFrame, DATE_TIME_DTYPE 38 | 39 | class MyRawData(TypedDataFrame): 40 | schema = { 41 | 'col1': np.float64, 42 | 'date': DATE_TIME_DTYPE, 43 | 'comment': str, 44 | } 45 | 46 | 47 | class PreprocessedData(MyRawData): 48 | schema = { 49 | 'month': np.int8 50 | } 51 | ``` 52 | 53 | Then let's modify the `preprocess` function to take the typed wrapper `MyRawData` as input and return `PreprocessedData`: 54 | ```python 55 | def preprocess(data: MyRawData) -> PreprocessedData: 56 | df = data.df.copy() 57 | c1_min, c1_max = df['col1'].min(), df['col1'].max() 58 | df['col1'] = 0 if c1_min == c1_max else (df['col1'] - c1_min) / (c1_max - c1_min) 59 | df['month'] = df['date'].dt.month 60 | df['comment'] = df['comment'].str.lower() 61 | return PreprocessedData.convert(df) 62 | ``` 63 | 64 | As you can see, the actual DataFrame can be accessed via the `.df` attribute of the Typed DataFrame. 65 | 66 | Now clients of the `preprocess` function can easily see what the inputs and outputs are without looking at its internals. 67 | And if there are unforeseen changes in the data, an exception will be thrown before the actual function is invoked. 68 | 69 | Let's check: 70 | 71 | ```python 72 | import pandas as pd 73 | 74 | df = pd.DataFrame({ 75 | 'col1': [0.1, 0.2], 76 | 'date': ['2021-01-01', '2022-01-01'], 77 | 'comment': ['foo', 'bar'] 78 | }) 79 | df.date = pd.to_datetime(df.date) 80 | 81 | bad_df = pd.DataFrame({ 82 | 'col1': [1, 2], 83 | 'comment': ['foo', 'bar'] 84 | }) 85 | 86 | df2 = preprocess(MyRawData(df)) 87 | df3 = preprocess(MyRawData(bad_df)) 88 | ``` 89 | 90 | The first call was successful.
91 | But when we tried to pass a wrong dataframe as input, we got the following error: 92 | 93 | ``` 94 | AssertionError: Dataframe doesn't match schema 95 | Actual: {'col1': dtype('int64'), 'comment': dtype('O')} 96 | Expected: {'col1': <class 'numpy.float64'>, 'date': dtype('<M8[ns]'), 'comment': <class 'str'>} 97 | Difference: {('col1', <class 'numpy.float64'>), ('date', dtype('<M8[ns]'))} 98 | ``` -------------------------------------------------------------------------------- /docs/Makefile: -------------------------------------------------------------------------------- 1 | # Minimal makefile for Sphinx documentation 2 | # 3 | 4 | # You can set these variables from the command line, and also 5 | # from the environment for the first two. 6 | SPHINXOPTS    ?= 7 | SPHINXBUILD   ?= sphinx-build 8 | SOURCEDIR     = source 9 | BUILDDIR      = build 10 | 11 | # Put it first so that "make" without argument is like "make help". 12 | help: 13 | @$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) 14 | 15 | .PHONY: help Makefile 16 | 17 | # Catch-all target: route all unknown targets to Sphinx using the new 18 | # "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS). 19 | %: Makefile 20 | @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) -------------------------------------------------------------------------------- /docs/make.bat: -------------------------------------------------------------------------------- 1 | @ECHO OFF 2 | 3 | pushd %~dp0 4 | 5 | REM Command file for Sphinx documentation 6 | 7 | if "%SPHINXBUILD%" == "" ( 8 | set SPHINXBUILD=sphinx-build 9 | ) 10 | set SOURCEDIR=source 11 | set BUILDDIR=build 12 | 13 | if "%1" == "" goto help 14 | 15 | %SPHINXBUILD% >NUL 2>NUL 16 | if errorlevel 9009 ( 17 | echo. 18 | echo.The 'sphinx-build' command was not found. Make sure you have Sphinx 19 | echo.installed, then set the SPHINXBUILD environment variable to point 20 | echo.to the full path of the 'sphinx-build' executable. Alternatively you 21 | echo.may add the Sphinx directory to PATH. 22 | echo. 23 | echo.If you don't have Sphinx installed, grab it from 24 | echo.https://www.sphinx-doc.org/ 25 | exit /b 1 26 | ) 27 | 28 | %SPHINXBUILD% -M %1 %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O% 29 | goto end 30 | 31 | :help 32 | %SPHINXBUILD% -M help %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O% 33 | 34 | :end 35 | popd 36 | -------------------------------------------------------------------------------- /docs/requirements.txt: -------------------------------------------------------------------------------- 1 | sphinx-rtd-theme==1.0.0 2 | sphinx==4.4.0 -------------------------------------------------------------------------------- /docs/source/code.rst: -------------------------------------------------------------------------------- 1 | 2 | Docstrings 3 | ============ 4 | 5 | .. automodule:: typedframe.base 6 | :members: 7 | 8 | .. automodule:: typedframe.pandas_ 9 | :members: 10 | 11 | .. automodule:: typedframe.polars_ 12 | :members: -------------------------------------------------------------------------------- /docs/source/conf.py: -------------------------------------------------------------------------------- 1 | # Configuration file for the Sphinx documentation builder. 2 | # 3 | # This file only contains a selection of the most common options. For a full 4 | # list see the documentation: 5 | # https://www.sphinx-doc.org/en/master/usage/configuration.html 6 | 7 | # -- Path setup -------------------------------------------------------------- 8 | 9 | # If extensions (or modules to document with autodoc) are in another directory, 10 | # add these directories to sys.path here. If the directory is relative to the 11 | # documentation root, use os.path.abspath to make it absolute, like shown here. 12 | # 13 | import os 14 | import sys 15 | sys.path.insert(0, os.path.abspath(os.path.join('..', '..'))) 16 | 17 | 18 | # -- Project information ----------------------------------------------------- 19 | 20 | project = 'Typedframe' 21 | copyright = '2022, Alexander Reshytko' 22 | author = 'Alexander Reshytko' 23 | 24 | 25 | # -- General configuration --------------------------------------------------- 26 | 27 | # Add any Sphinx extension module names here, as strings. They can be 28 | # extensions coming with Sphinx (named 'sphinx.ext.*') or your custom 29 | # ones. 30 | extensions = ['sphinx.ext.autodoc', 'sphinx.ext.coverage', 'sphinx.ext.napoleon' 31 | ] 32 | 33 | # Add any paths that contain templates here, relative to this directory. 34 | templates_path = ['_templates'] 35 | 36 | # List of patterns, relative to source directory, that match files and 37 | # directories to ignore when looking for source files. 38 | # This pattern also affects html_static_path and html_extra_path. 39 | exclude_patterns = [] 40 | 41 | 42 | # -- Options for HTML output ------------------------------------------------- 43 | 44 | # The theme to use for HTML and HTML Help pages. See the documentation for 45 | # a list of builtin themes.
46 | # 47 | html_theme = 'sphinx_rtd_theme' 48 | 49 | # Add any paths that contain custom static files (such as style sheets) here, 50 | # relative to this directory. They are copied after the builtin static files, 51 | # so a file named "default.css" will overwrite the builtin "default.css". 52 | html_static_path = ['_static'] 53 | 54 | html_logo = "logo-2-white.svg" 55 | html_theme_options = { 56 | 'logo_only': True, 57 | 'display_version': False, 58 | } -------------------------------------------------------------------------------- /docs/source/index.rst: -------------------------------------------------------------------------------- 1 | .. Typedframe documentation master file, created by 2 | sphinx-quickstart on Sat Mar 5 19:33:48 2022. 3 | You can adapt this file completely to your liking, but it should at least 4 | contain the root `toctree` directive. 5 | 6 | .. image:: logo-2.svg 7 | :alt: logo 8 | 9 | ---- 10 | 11 | Typedframe 12 | ============ 13 | 14 | **Typed wrappers over pandas DataFrames with schema validation.** 15 | 16 | .. toctree:: 17 | :maxdepth: 2 18 | :caption: Contents: 19 | 20 | ``TypedDataFrame`` is a lightweight wrapper over pandas ``DataFrame`` 21 | that provides runtime schema validation and can be used to establish 22 | strong data contracts between interfaces in your Python code. 23 | 24 | The goal of the library is to reveal and make explicit all unclear or 25 | forgotten assumptions about your DataFrame. 26 | 27 | Quickstart 28 | ~~~~~~~~~~ 29 | 30 | Install the typedframe library: 31 | 32 | :: 33 | 34 | pip install typedframe 35 | 36 | Assume an overly simplified preprocessing function like this: 37 | 38 | .. code:: python 39 | 40 | def preprocess(df: pd.DataFrame) -> pd.DataFrame: 41 | df = df.copy() 42 | c1_min, c1_max = df['col1'].min(), df['col1'].max() 43 | df['col1'] = 0 if c1_min == c1_max else (df['col1'] - c1_min) / (c1_max - c1_min) 44 | df['month'] = df['date'].dt.month 45 | df['comment'] = df['comment'].str.lower() 46 | return df 47 | 48 | To add ``typedframe`` schema support for this transformation we will 49 | define two schema classes - one for the input and one for the output: 50 | 51 | .. code:: python 52 | 53 | import numpy as np 54 | from typedframe import TypedDataFrame, DATE_TIME_DTYPE 55 | 56 | class MyRawData(TypedDataFrame): 57 | schema = { 58 | 'col1': np.float64, 59 | 'date': DATE_TIME_DTYPE, 60 | 'comment': str, 61 | } 62 | 63 | 64 | class PreprocessedData(MyRawData): 65 | schema = { 66 | 'month': np.int8 67 | } 68 | 69 | Then let's modify the ``preprocess`` function to take the typed wrapper 70 | ``MyRawData`` as input and return ``PreprocessedData``: 71 | 72 | .. code:: python 73 | 74 | def preprocess(data: MyRawData) -> PreprocessedData: 75 | df = data.df.copy() 76 | c1_min, c1_max = df['col1'].min(), df['col1'].max() 77 | df['col1'] = 0 if c1_min == c1_max else (df['col1'] - c1_min) / (c1_max - c1_min) 78 | df['month'] = df['date'].dt.month 79 | df['comment'] = df['comment'].str.lower() 80 | return PreprocessedData.convert(df) 81 | 82 | As you can see, the actual DataFrame can be accessed via the ``.df`` 83 | attribute of the Typed DataFrame. 84 | 85 | Now clients of the ``preprocess`` function can easily see what the 86 | inputs and outputs are without looking at its internals. And if 87 | there are unforeseen changes in the data, an exception will be thrown 88 | before the actual function is invoked. 89 | 90 | Let's check: 91 | 92 | ..
code:: python 93 | 94 | import pandas as pd 95 | 96 | df = pd.DataFrame({ 97 | 'col1': [0.1, 0.2], 98 | 'date': ['2021-01-01', '2022-01-01'], 99 | 'comment': ['foo', 'bar'] 100 | }) 101 | df.date = pd.to_datetime(df.date) 102 | 103 | bad_df = pd.DataFrame({ 104 | 'col1': [1, 2], 105 | 'comment': ['foo', 'bar'] 106 | }) 107 | 108 | df2 = preprocess(MyRawData(df)) 109 | df3 = preprocess(MyRawData(bad_df)) 110 | 111 | The first call was successful. But when we tried to pass a wrong 112 | dataframe as input, we got the following error: 113 | 114 | :: 115 | 116 | AssertionError: Dataframe doesn't match schema 117 | Actual: {'col1': dtype('int64'), 'comment': dtype('O')} 118 | Expected: {'col1': <class 'numpy.float64'>, 'date': dtype('<M8[ns]'), 'comment': <class 'str'>} 119 | Difference: {('col1', <class 'numpy.float64'>), ('date', dtype('<M8[ns]'))} 120 | 121 | Motivation 122 | ~~~~~~~~~~ 123 | 124 | Consider a function with the following signature: 125 | 126 | .. code:: python 127 | 128 | def preprocess(df: pd.DataFrame) -> pd.DataFrame: 129 | 130 | Even when we have added type hints to our function, the user doesn't 131 | really know how to use it. They must dig inside the code of the 132 | function to find out things like expected columns and their types. This 133 | violates one of the core software development principles - 134 | encapsulation. 135 | 136 | Pandas DataFrame is an open data type. It introduces a lot of implicit 137 | assumptions about the data. Let's explore some examples where one can 138 | easily overlook these implicit assumptions: 139 | 140 | Required columns and data types: 141 | ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ 142 | 143 | .. code:: python 144 | 145 | df.groupby('state')['income'].mean() 146 | 147 | The dataframe is expected to have ``state`` and ``income`` columns. The 148 | ``income`` column must have a numeric type. 149 | 150 | Index name and type 151 | ^^^^^^^^^^^^^^^^^^^ 152 | 153 | .. code:: python 154 | 155 | df.reset_index(inplace=True) 156 | x = df['my_index'] 157 | 158 | It is expected that the dataframe has an index with the name 159 | ``my_index``. 160 | 161 | Categorical columns 162 | ^^^^^^^^^^^^^^^^^^^ 163 | 164 | .. code:: python 165 | 166 | df3 = pd.merge(df1, df2, on='categorical_col') 167 | 168 | The result above will differ based on whether ``categorical_col`` in 169 | ``df1`` and ``df2`` has exactly the same set of categories or not. 170 | 171 | All these scenarios can lead to a variety of subtle bugs in our 172 | pipeline. 173 | 174 | The concept of Typed DataFrame 175 | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 176 | 177 | A Typed DataFrame is a minimalistic wrapper on top of your pandas 178 | DataFrame. You create it by creating a subclass of ``TypedDataFrame`` 179 | and defining a ``schema`` static variable. Then you can wrap your 180 | DataFrame in it by passing it to your Typed DataFrame constructor. The 181 | constructor will perform runtime schema validation, and the original 182 | dataframe can be accessed through the ``df`` attribute of the wrapper. 183 | 184 | This wrapper serves two purposes: 185 | 186 | - Formal explicit documentation about dataframe assumptions. 187 | You can use your Typed DataFrame schema definition as a form 188 | of documentation to communicate your data interfaces to others. 189 | This works especially well in combination with Python type hints. 190 | 191 | - Runtime schema validation. In case of any data contract violation 192 | you'll get an exception explaining the exact reason. If you guard 193 | your pipeline with such Typed DataFrames you'll be able to catch 194 | errors early - closer to the root causes.
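For example, a minimal sketch of wrapping a frame (reusing the ``MyRawData``
schema from the Quickstart above; the column values here are arbitrary):

.. code:: python

    import pandas as pd

    df = pd.DataFrame({
        'col1': [0.1, 0.2],
        'date': pd.to_datetime(['2021-01-01', '2022-01-01']),
        'comment': ['foo', 'bar']
    })

    data = MyRawData(df)   # runtime schema validation happens here
    assert data.df is df   # the original DataFrame is accessible via .df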
195 | 196 | Features 197 | ~~~~~~~~ 198 | 199 | Required Schema 200 | ^^^^^^^^^^^^^^^ 201 | 202 | You can define the required schema by passing a dictionary to a static 203 | variable ``schema`` of a ``TypedDataFrame`` subclass. The dictionary defines 204 | the mapping from a column name to a dtype: 205 | 206 | .. code:: python 207 | 208 | class MyTable(TypedDataFrame): 209 | schema = { 210 | "col1": str, 211 | "col2": np.int32, 212 | "col3": ('foo', 'bar') 213 | } 214 | 215 | Schema Inheritance 216 | ^^^^^^^^^^^^^^^^^^ 217 | 218 | You can inherit one Typed DataFrame from another one. 219 | 220 | The semantics of the inheritance relation is the same as with class 221 | methods and attributes in classic OOP. I.e. if Typed DataFrame A is a 222 | subclass of Typed DataFrame B, all the schema requirements for B must 223 | also hold for A. In case of any conflicts, the schema defined in A 224 | takes precedence. 225 | 226 | .. code:: python 227 | 228 | class MyDataFrame(TypedDataFrame): 229 | schema = { 230 | 'int_field': np.int16, 231 | 'float_field': np.float64, 232 | 'bool_field': bool, 233 | 'str_field': str, 234 | 'obj_field': object 235 | } 236 | 237 | 238 | class InheritedDataFrame(MyDataFrame): 239 | schema = { 240 | 'new_field': np.int64 241 | } 242 | 243 | Multiple Inheritance 244 | '''''''''''''''''''' 245 | 246 | Multiple inheritance is allowed. It has "union" semantics. 247 | 248 | .. code:: python 249 | 250 | class Root(TypedDataFrame): 251 | 252 | schema = { 253 | 'root': bool 254 | } 255 | 256 | 257 | class Left(Root): 258 | schema = { 259 | 'left': bool 260 | } 261 | 262 | 263 | class Right(Root): 264 | schema = { 265 | 'root': object, 266 | 'right': bool 267 | } 268 | 269 | 270 | class Down(Left, Right): 271 | pass 272 | 273 | Index Schema 274 | ^^^^^^^^^^^^ 275 | 276 | You can specify a schema for the index of the DataFrame. It's defined as a 277 | tuple of a name and a dtype which you assign to an ``index_schema`` 278 | static variable: 279 | 280 | .. code:: python 281 | 282 | class IndexDataFrame(TypedDataFrame): 283 | schema = { 284 | 'foo': bool 285 | } 286 | 287 | index_schema = ('bar', np.int32) 288 | 289 | Optional Schema 290 | ^^^^^^^^^^^^^^^ 291 | 292 | You can specify optional columns in a schema definition. Optional column 293 | types will be checked only if present in a DataFrame. If some 294 | optional columns (or even all of them) are missing, no validation error 295 | will be raised. Besides that, the ``convert`` method will add all optional 296 | columns that are missing in a dataframe, filled with NaN values. 297 | 298 | .. code:: python 299 | 300 | class DataFrameWithOptional(TypedDataFrame): 301 | schema = { 302 | 'required': bool 303 | } 304 | optional = { 305 | 'optional': bool 306 | } 307 | 308 | Convert Method 309 | ^^^^^^^^^^^^^^ 310 | 311 | ``TypedDataFrame`` provides a convenient ``convert`` classmethod that 312 | tries to convert a given DataFrame to be compliant with a schema. 313 | 314 | .. code:: python 315 | 316 | class IndexDataFrame(TypedDataFrame): 317 | schema = { 318 | 'foo': bool 319 | } 320 | 321 | index_schema = ('bar', DATE_TIME_DTYPE) 322 | 323 | df = pd.DataFrame({'foo': [True, False]}, 324 | index=pd.Series(['2021-06-03', '2021-05-31'])) 325 | data = IndexDataFrame.convert(df) 326 | 327 | Supported types 328 | ~~~~~~~~~~~~~~~ 329 | 330 | Integers 331 | ^^^^^^^^ 332 | 333 | ``np.int16``, ``np.int32``, ``np.int64``, etc. 334 | 335 | Floats 336 | ^^^^^^ 337 | 338 | ``np.float16``, ``np.float32``, ``np.float64``, etc.
339 | 340 | Boolean 341 | ^^^^^^^ 342 | 343 | ``bool`` 344 | 345 | Python objects 346 | ^^^^^^^^^^^^^^ 347 | 348 | ``str``, ``dict``, ``list``, ``object`` 349 | 350 | WARNING: no actual check is performed for Python objects. They are all 351 | considered to be of the same type ``object``. 352 | 353 | Categorical 354 | ^^^^^^^^^^^ 355 | 356 | Categorical dtype is specified as a tuple of categories. To avoid common 357 | categorical pitfalls, categorical types are required to have an exact 358 | schema with all categories enumerated in the exact order. 359 | 360 | .. code:: python 361 | 362 | class MyTable(TypedDataFrame): 363 | schema = { 364 | "col": ('foo', 'bar') 365 | } 366 | 367 | df = pd.DataFrame({"col": ['foo', 'foo', 'bar']}) 368 | df.col = pd.Categorical(df.col, categories=('foo', 'bar'), ordered=True) 369 | data = MyTable(df) 370 | 371 | DateTime 372 | ^^^^^^^^ 373 | 374 | ``np.dtype('datetime64[ns]')`` 375 | 376 | The ``typedframe`` library also provides an alias for it: 377 | ``DATE_TIME_DTYPE`` 378 | 379 | UTC DateTime 380 | '''''''''''' 381 | 382 | ``pd.DatetimeTZDtype('ns', pytz.UTC)`` 383 | 384 | The ``typedframe`` library also provides an alias for it: 385 | ``UTC_DATE_TIME_DTYPE`` 386 | 387 | Best practices to use Typed DataFrame 388 | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 389 | 390 | What are the best places to use Typed DataFrame wrappers in your 391 | codebase? 392 | 393 | Our experience with the ``typedframe`` library in a number of projects has 394 | shown the following scenarios where its use was most justified: 395 | 396 | Team Borders 397 | ^^^^^^^^^^^^ 398 | 399 | Typed DataFrames help to establish data contracts between teams. They also 400 | help to spot errors caused by miscommunication or inconsistent 401 | system evolution early. Whenever some dataset is passed between 402 | teams it makes sense to define a Typed DataFrame class with its 403 | specification. 404 | 405 | Public Functions and Methods 406 | ^^^^^^^^^^^^^^^^^^^^^^^^^^^^ 407 | 408 | Typed DataFrames work especially well in combination with Python type 409 | hints. So a good place to use them is a public function or 410 | method that takes or returns a pandas DataFrame. 411 | 412 | Sources and Sinks of Data Pipelines 413 | ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ 414 | 415 | It is a good practice to provide schema definitions and runtime 416 | validation at the beginning and at the end of data pipelines, i.e. right 417 | after you read from external storage and before you write to it. 418 | This is another place where Typed DataFrames can be used (see the sketch at the end of this page). 419 | 420 | Similar Projects 421 | ~~~~~~~~~~~~~~~~ 422 | 423 | - `Great Expectations <https://greatexpectations.io/>`__. It's a much 424 | more feature-rich library which allows data teams to do a lot of 425 | assertions about the data. ``typedframe`` is a more lightweight 426 | library which can be considered as a thin extension layer on top of 427 | pandas DataFrame. 428 | 429 | - `Marshmallow <https://marshmallow.readthedocs.io/>`__. A library for 430 | Python object serialization and deserialization with schema 431 | validation. It's not integrated with pandas or numpy and focuses only 432 | on Python classes and builtin objects.
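A minimal sketch of the source/sink guard described above (the file names
and the ``MyRawData`` / ``PreprocessedData`` schemas from the Quickstart are
illustrative, not part of the library):

.. code:: python

    import pandas as pd

    # validate right after reading from external storage ...
    raw = MyRawData.convert(pd.read_csv('input.csv', parse_dates=['date']))

    # ... run the pipeline on validated data ...
    result = preprocess(raw)

    # ... and the output is validated by its own schema before writing
    result.df.to_csv('output.csv', index=False)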
433 | 434 | 435 | 436 | Indices and tables 437 | ================== 438 | 439 | * :ref:`genindex` 440 | * :ref:`modindex` 441 | * :ref:`search` 442 | -------------------------------------------------------------------------------- /docs/source/logo-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/areshytko/typedframe/dcb5daed3f84296247633840b61d6cd217704b56/docs/source/logo-1.png -------------------------------------------------------------------------------- /docs/source/logo-1.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | -------------------------------------------------------------------------------- /docs/source/logo-2-dark.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | 21 | -------------------------------------------------------------------------------- /docs/source/logo-2-gray.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | -------------------------------------------------------------------------------- /docs/source/logo-2-white.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | -------------------------------------------------------------------------------- /docs/source/logo-2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/areshytko/typedframe/dcb5daed3f84296247633840b61d6cd217704b56/docs/source/logo-2.png -------------------------------------------------------------------------------- /docs/source/logo-2.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | numpy 2 | pandas 3 | polars 4 | pyarrow 5 | pytest==6.2.4 -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- 1 | import pathlib 2 | from setuptools import setup 3 | 4 | HERE = pathlib.Path(__file__).parent 5 | README = (HERE / "README.md").read_text() 6 | 7 | 8 | setup( 9 | name="typedframe", 10 | version='0.11.0', 11 | description="Typed Wrappers over Pandas and Polars DataFrames with schema validation", 12 | long_description=README, 13 | long_description_content_type="text/markdown", 14 | url="https://github.com/areshytko/typedframe", 15 | author="Alexander Reshytko", 16 | author_email="alexander@reshytko.com", 17 | license="MIT", 18 | classifiers=[ 19 | "License :: OSI Approved :: MIT License", 20 | "Programming Language :: Python :: 3", 21 | "Programming Language :: Python :: 3.8", 22 | ], 23 | packages=["typedframe"], 24 | install_requires=[ 25 | ], 26 | extras_require={ 27 | "pandas": ["pandas", "numpy"], 28 | "polars": ["polars", "pyarrow"], 29 | }, 30 | setup_requires=['pytest-runner'], 31 | tests_require=['pytest'] 32 | ) 
-------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/areshytko/typedframe/dcb5daed3f84296247633840b61d6cd217704b56/tests/__init__.py -------------------------------------------------------------------------------- /tests/test_pandas_typedframe.py: -------------------------------------------------------------------------------- 1 | 2 | import abc 3 | import datetime 4 | 5 | import pandas as pd 6 | import numpy as np 7 | import pytest 8 | 9 | from typedframe.pandas_ import UTC_DATE_TIME_DTYPE, DATE_TIME_DTYPE, PandasTypedFrame as TypedDataFrame 10 | 11 | 12 | class MyDataFrame(TypedDataFrame): 13 | schema = { 14 | 'int_field': np.int16, 15 | 'float_field': np.float64, 16 | 'bool_field': bool, 17 | 'str_field': str, 18 | 'obj_field': object 19 | } 20 | 21 | 22 | class InheritedDataFrame(MyDataFrame): 23 | schema = { 24 | 'new_field': np.int64 25 | } 26 | 27 | 28 | class DataFrameWithOptional(TypedDataFrame): 29 | schema = { 30 | 'required': bool 31 | } 32 | optional = { 33 | 'optional': bool 34 | } 35 | 36 | 37 | class IndexDataFrame(TypedDataFrame): 38 | schema = { 39 | 'foo': bool 40 | } 41 | 42 | index_schema = ('bar', DATE_TIME_DTYPE) 43 | 44 | 45 | class ChildIndexDataFrame(IndexDataFrame): 46 | pass 47 | 48 | 49 | class UTCDateTimeDataframe(TypedDataFrame): 50 | schema = { 51 | 'date_field': UTC_DATE_TIME_DTYPE 52 | } 53 | 54 | 55 | def test_utc_datetime_success_case(): 56 | df = pd.DataFrame({'date_field': [datetime.date.today(), datetime.date(2021, 5, 31)]}) 57 | df.date_field = pd.to_datetime(df.date_field, utc=True) 58 | _ = UTCDateTimeDataframe(df) 59 | 60 | 61 | def test_utc_datetime_error_case(): 62 | df = pd.DataFrame({'date_field': [datetime.date.today(), datetime.date(2021, 5, 31)]}) 63 | df.date_field = pd.to_datetime(df.date_field) 64 | with pytest.raises(AssertionError): 65 | _ = UTCDateTimeDataframe(df) 66 | 67 | 68 | def test_utc_datetime_convert_case(): 69 | df = pd.DataFrame({'date_field': [datetime.date.today(), datetime.date(2021, 5, 31)]}) 70 | _ = UTCDateTimeDataframe.convert(df) 71 | 72 | 73 | def test_index_success_case(): 74 | df = pd.DataFrame({'foo': [True, False]}) 75 | df.index = pd.to_datetime(pd.Series([datetime.date.today(), datetime.date(2021, 5, 31)], name='bar')) 76 | _ = IndexDataFrame(df) 77 | _ = ChildIndexDataFrame(df) 78 | 79 | 80 | def test_index_fail_case(): 81 | df = pd.DataFrame({'foo': [True, False]}) 82 | with pytest.raises(AssertionError): 83 | _ = IndexDataFrame(df) 84 | 85 | 86 | def test_index_convert_success_case(): 87 | df = pd.DataFrame({'foo': [True, False]}) 88 | df.index = pd.Series(['2021-06-03', '2021-05-31']) 89 | _ = IndexDataFrame.convert(df) 90 | 91 | 92 | def test_base_success_case(): 93 | df = pd.DataFrame({ 94 | 'int_field': np.int16([1, 2]), 95 | 'float_field': np.float64([0.1, 0.2]), 96 | 'bool_field': [True, False], 97 | 'str_field': ["one", "two"], 98 | 'obj_field': ["", ""], 99 | 'new_field': np.int64([10, 20]) 100 | }) 101 | _ = InheritedDataFrame(df) 102 | 103 | 104 | class CategoricalFrame(TypedDataFrame): 105 | schema = { 106 | 'col': ('foo', 'bar') 107 | } 108 | 109 | 110 | def test_categorical_success_1(): 111 | df = pd.DataFrame({'col': ['foo', 'foo', 'bar']}) 112 | df.col = pd.Categorical(df.col, categories=('foo', 'bar'), ordered=True) 113 | _ = CategoricalFrame(df) 114 | 115 | 116 | def test_categorical_success_2(): 117 | df = pd.DataFrame({'col': 
['foo', 'foo']}) 118 | df.col = pd.Categorical(df.col, categories=('foo', 'bar'), ordered=True) 119 | _ = CategoricalFrame(df) 120 | 121 | 122 | def test_categorical_failure_1(): 123 | df = pd.DataFrame({'col': ['foo', 'foo']}) 124 | df.col = pd.Categorical(df.col, categories=('foo', 'bar', 'buzz'), ordered=True) 125 | with pytest.raises(AssertionError): 126 | _ = CategoricalFrame(df) 127 | 128 | 129 | def test_categorical_failure_3(): 130 | df = pd.DataFrame({'col': ['foo', 'foo']}) 131 | with pytest.raises(AssertionError): 132 | _ = CategoricalFrame(df) 133 | 134 | 135 | def test_convert_categorical(): 136 | df = pd.DataFrame({'col': ['foo', 'foo']}) 137 | _ = CategoricalFrame.convert(df) 138 | 139 | 140 | def test_convert_optional(): 141 | df = pd.DataFrame({'required': [True]}) 142 | data = DataFrameWithOptional.convert(df, add_optional_cols=True) 143 | assert all(col in data.df.columns for col in DataFrameWithOptional.dtype().keys()) 144 | 145 | 146 | def test_convert_categorical_failure(): 147 | df = pd.DataFrame({'col': ['foo', 'buzz']}) 148 | with pytest.raises(AssertionError): 149 | _ = CategoricalFrame.convert(df) 150 | 151 | 152 | def test_categorical_with_nans_failure(): 153 | df = pd.DataFrame({'col': ['foo', 'buzz']}) 154 | df.col = pd.Categorical(df.col, categories=CategoricalFrame.schema['col'], ordered=True) 155 | with pytest.raises(AssertionError): 156 | _ = CategoricalFrame(df) 157 | 158 | 159 | class PingInterface(metaclass=abc.ABCMeta): 160 | 161 | @abc.abstractmethod 162 | def ping(self): 163 | pass 164 | 165 | 166 | class Parent(TypedDataFrame): 167 | schema = { 168 | 'foo': bool 169 | } 170 | 171 | 172 | class Child(Parent, PingInterface): 173 | 174 | schema = { 175 | 'bar': bool 176 | } 177 | 178 | def ping(self): 179 | print("ping") 180 | 181 | 182 | def test_multiple_inheritance_1_success(): 183 | _ = Child(pd.DataFrame({'foo': [True], 'bar': [False]})) 184 | 185 | 186 | def test_multiple_inheritance_1_failure(): 187 | with pytest.raises(AssertionError): 188 | _ = Child(pd.DataFrame({'bar': [False]})) 189 | 190 | 191 | class Root(TypedDataFrame): 192 | 193 | schema = { 194 | 'root': bool 195 | } 196 | 197 | 198 | class Left(Root): 199 | schema = { 200 | 'left': bool 201 | } 202 | 203 | 204 | class Right(Root): 205 | schema = { 206 | 'root': object, 207 | 'right': bool 208 | } 209 | 210 | 211 | class Down(Left, Right): 212 | pass 213 | 214 | 215 | def test_multiple_inheritance_2_success(): 216 | _ = Down(pd.DataFrame({'root': [True], 'left': [True], 'right': [True]})) 217 | 218 | 219 | def test_multiple_inheritance_2_failure(): 220 | with pytest.raises(AssertionError): 221 | _ = Down(pd.DataFrame({'root': [True], 'left': [True]})) 222 | 223 | 224 | def test_multiple_inheritance_2_failure_with_root_overwrite(): 225 | with pytest.raises(AssertionError): 226 | _ = Down(pd.DataFrame({'root': [True], 'left': [True], 'right': ['string']})) 227 | -------------------------------------------------------------------------------- /tests/test_polars_typedframe.py: -------------------------------------------------------------------------------- 1 | import datetime 2 | 3 | import polars as pl 4 | import pytest 5 | 6 | from typedframe.polars_ import PolarsTypedFrame as TypedDataFrame 7 | 8 | 9 | class ParentDataFrame(TypedDataFrame): 10 | schema = { 11 | 'int_field': pl.Int16, 12 | 'float_field': pl.Float64, 13 | 'bool_field': pl.Boolean, 14 | 'str_field': pl.Utf8, 15 | 'date_field': pl.Date, 16 | 'datetime_field': pl.Datetime 17 | } 18 | 19 | 20 | class 
MixinDataFrame(TypedDataFrame): 21 | schema = { 22 | 'mixin_field': pl.Int64 23 | } 24 | 25 | 26 | class ChildDataFrame(ParentDataFrame, MixinDataFrame): 27 | schema = { 28 | 'new_field': pl.Int64 29 | } 30 | 31 | 32 | class OptionalDataFrame(TypedDataFrame): 33 | schema = { 34 | 'required': pl.Boolean 35 | } 36 | optional = { 37 | 'optional': pl.Boolean 38 | } 39 | 40 | 41 | def test_base_success_case(): 42 | df = pl.DataFrame({'int_field': [1, 2, 3], 43 | 'float_field': [1.0, 2.0, 3.0], 44 | 'bool_field': [True, False, True], 45 | 'str_field': ['a', 'b', 'c'], 46 | 'date_field': [datetime.date(2021, 5, 31), datetime.date(2021, 6, 1), datetime.date(2021, 6, 2)], 47 | 'datetime_field': [datetime.datetime(2021, 5, 31, 12, 0, 0), datetime.datetime(2021, 6, 1, 12, 0, 0), datetime.datetime(2021, 6, 2, 12, 0, 0)], 48 | 'mixin_field': [1, 2, 3], 49 | 'new_field': [1, 2, 3]}) 50 | df = df.with_column(pl.col('int_field').cast(pl.Int16)) 51 | _ = ChildDataFrame(df) 52 | 53 | 54 | def test_base_error_case(): 55 | df = pl.DataFrame({'int_field': [1, 2, 3], 56 | 'float_field': [1.0, 2.0, 3.0], 57 | 'bool_field': [True, False, True], 58 | 'str_field': ['a', 'b', 'c'], 59 | 'new_field': [1, 2, 3]}) 60 | with pytest.raises(AssertionError): 61 | _ = ChildDataFrame(df) 62 | 63 | 64 | def test_convert_success_case(): 65 | df = pl.DataFrame({'int_field': [1, 2, 3], 66 | 'float_field': [1.0, 2.0, 3.0], 67 | 'bool_field': [True, False, True], 68 | 'str_field': ['a', 'b', 'c'], 69 | 'date_field': [datetime.date(2021, 5, 31), datetime.date(2021, 6, 1), datetime.date(2021, 6, 2)], 70 | 'datetime_field': [datetime.datetime(2021, 5, 31, 12, 0, 0), 71 | datetime.datetime(2021, 6, 1, 12, 0, 0), 72 | datetime.datetime(2021, 6, 2, 12, 0, 0)]}) 73 | _ = ParentDataFrame.convert(df) 74 | 75 | 76 | def test_convert_error_case(): 77 | df = pl.DataFrame({'int_field': [1, 2, 3], 78 | 'float_field': [1.0, 2.0, 3.0], 79 | 'bool_field': [True, False, True], 80 | 'str_field': ['a', 'b', 'c']}) 81 | with pytest.raises(AssertionError): 82 | _ = ParentDataFrame.convert(df) 83 | 84 | 85 | def test_optional_success_case(): 86 | df = pl.DataFrame({'required': [True, False, True]}) 87 | _ = OptionalDataFrame(df) 88 | 89 | 90 | def test_optional_success_case_2(): 91 | df = pl.DataFrame({'required': [True, False, True], 92 | 'optional': [True, False, True]}) 93 | _ = OptionalDataFrame(df) 94 | 95 | 96 | def test_optional_error_case(): 97 | df = pl.DataFrame({'required': [True, False, True], 98 | 'optional': [2, 3, 1]}) 99 | with pytest.raises(AssertionError): 100 | _ = OptionalDataFrame(df) 101 | 102 | 103 | def test_convert_optional(): 104 | df = pl.DataFrame({'required': [True]}) 105 | data = OptionalDataFrame.convert(df, add_optional_cols=True) 106 | assert all(col in data.df.columns for col in OptionalDataFrame.dtype().keys()) 107 | -------------------------------------------------------------------------------- /typedframe/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | try: 3 | import pandas 4 | except ImportError: 5 | pass 6 | else: 7 | from typedframe.pandas_ import PandasTypedFrame as TypedDataFrame, DATE_TIME_DTYPE, UTC_DATE_TIME_DTYPE 8 | 9 | try: 10 | import polars 11 | except ImportError: 12 | pass 13 | else: 14 | from typedframe.polars_ import PolarsTypedFrame 15 | 16 | __version__ = '0.11.0' 17 | -------------------------------------------------------------------------------- /typedframe/base.py: 
-------------------------------------------------------------------------------- 1 | """ 2 | Basic classes for typed wrappers over dataframes 3 | """ 4 | from abc import abstractmethod 5 | from itertools import chain 6 | from typing import Type, TypeVar, Any 7 | 8 | 9 | T = TypeVar("T", bound="TypedDataFrameBase") 10 | 11 | 12 | class TypedDataFrameBase: 13 | """ 14 | Wrapper class over DataFrame to provide explicit schema specs. 15 | 16 | Provide the expected dataframe schema in the schema static variable. 17 | Provide optional columns in the optional static variable. 18 | All columns from the optional schema that are missing in a dataframe will be added (filled with NaN values) by the convert method. 19 | 20 | Schemas can be inherited via Python class inheritance. The semantics is the following: 21 | all columns of the parent are also included in the child schema. 22 | """ 23 | 24 | schema = {} 25 | 26 | optional = {} 27 | 28 | @classmethod 29 | @abstractmethod 30 | def convert(cls: Type[T], df, add_optional_cols: bool = True) -> T: 31 | pass 32 | 33 | @classmethod 34 | def dtype(cls: Type[T], with_optional: bool = True) -> dict: 35 | """ 36 | Combines schema of a current class and all super classes 37 | """ 38 | return dict(chain(*(chain(cls.schema.items(), cls.optional.items()) 39 | if with_optional else cls.schema.items() 40 | for cls in cls.__mro__[:-1] if hasattr(cls, 'schema')))) 41 | 42 | @classmethod 43 | @abstractmethod 44 | def _extract_actual_dtypes(cls: Type[T], df) -> dict: 45 | pass 46 | 47 | @classmethod 48 | @abstractmethod 49 | def _normalize_actual_dtype(cls: Type[T], dtype: Any) -> Any: 50 | pass 51 | 52 | @classmethod 53 | @abstractmethod 54 | def _normalize_expected_dtype(cls: Type[T], dtype: Any) -> Any: 55 | pass 56 | 57 | @classmethod 58 | def _dtypes_mismatch(cls: Type[T], actual: Any, expected: Any) -> bool: 59 | actual = cls._normalize_actual_dtype(actual) 60 | expected = cls._normalize_expected_dtype(expected) 61 | return actual != expected 62 | 63 | def __init__(self, df): 64 | 65 | actual_dtypes = self._extract_actual_dtypes(df) 66 | expected = self.dtype(with_optional=False).items() 67 | 68 | diff = set() 69 | for col, dtype in expected: 70 | try: 71 | if col not in actual_dtypes or self._dtypes_mismatch(actual_dtypes[col], dtype): 72 | diff.add((col, dtype)) 73 | except TypeError: 74 | diff.add((col, dtype)) 75 | 76 | optional = self.dtype().items() 77 | for col, dtype in optional: 78 | try: 79 | if col in actual_dtypes and self._dtypes_mismatch(actual_dtypes[col], dtype): 80 | diff.add((col, dtype)) 81 | except TypeError: 82 | diff.add((col, dtype)) 83 | 84 | if diff: 85 | actual = {key: self._normalize_actual_dtype(value) for key, value in actual_dtypes.items()} 86 | expected = {key: self._normalize_expected_dtype(value) for key, value in self.dtype().items()} 87 | raise AssertionError( 88 | "Dataframe doesn't match schema\n" 89 | f"Actual: {actual}\nExpected: {expected}\nDifference: {diff}" 90 | ) 91 | -------------------------------------------------------------------------------- /typedframe/pandas_.py: -------------------------------------------------------------------------------- 1 | 2 | from typing import Type, TypeVar, Any 3 | import pytz 4 | 5 | import pandas as pd 6 | import numpy as np 7 | 8 | from typedframe.base import TypedDataFrameBase 9 | 10 | try: 11 | from pandas.api.types import CategoricalDtype 12 | except ImportError: 13 | from pandas.types.dtypes import CategoricalDtype 14 | 15 | # 16 | # dtype for datetime column 17 | # 18 | DATE_TIME_DTYPE = 
np.dtype('datetime64[ns]') 19 | UTC_DATE_TIME_DTYPE = pd.DatetimeTZDtype('ns', pytz.UTC) 20 | 21 | T = TypeVar("T", bound="PandasTypedFrame") 22 | 23 | _OBJECT_TYPES = {list, str, dict} 24 | 25 | 26 | class PandasTypedFrame(TypedDataFrameBase): 27 | """ 28 | Wrapper class over pandas 29 | """ 30 | 31 | index_schema = (None, None) # (name, dtype) 32 | 33 | @classmethod 34 | def convert(cls: Type[T], df: pd.DataFrame, add_optional_cols: bool = True) -> T: 35 | """ 36 | Tries to convert a given dataframe and wrap in a typed dataframe. 37 | 38 | Examples 39 | -------- 40 | 41 | >>> from typedframe.pandas_ import PandasTypedFrame, DATE_TIME_DTYPE 42 | >>> class MyTable(PandasTypedFrame): 43 | ... schema = { 44 | ... "col1": str, 45 | ... "col2": np.int32, 46 | ... "col3": ('foo', 'bar') 47 | ... } 48 | ... optional = { 49 | ... "col4": bool, 50 | ... "col5": DATE_TIME_DTYPE 51 | ... } 52 | 53 | >>> df = pd.DataFrame({"col1": ['foo'], "col2": np.array([1], dtype=np.int32), "col3": ['bar']}) 54 | >>> df.col3 = pd.Categorical(df.col3, categories=('foo', 'bar'), ordered=True) 55 | >>> print(MyTable.convert(df).df) 56 | """ 57 | df = df.copy() 58 | 59 | if add_optional_cols: 60 | required = cls.dtype(with_optional=False) 61 | addon = {col: dtype for col, dtype in cls.dtype().items() if col not in df.columns and col not in required} 62 | df: pd.DataFrame = df if len(addon) == 0 else pd.concat( 63 | [df, pd.DataFrame(columns=addon.keys()).astype(addon)], axis=1) 64 | 65 | expected = cls.dtype() 66 | for col in df.columns: 67 | try: 68 | if col in expected: 69 | if isinstance(expected[col], tuple): 70 | actual_cats = set(df[col].unique()) 71 | categories_diff = actual_cats.difference(set(expected[col])) 72 | if categories_diff: 73 | raise AssertionError(f"For column: {col} there are unknown categories: {categories_diff}") 74 | df[col] = pd.Categorical(df[col], categories=expected[col], ordered=True) 75 | elif expected[col] == DATE_TIME_DTYPE: 76 | df[col] = pd.to_datetime(df[col]) 77 | elif expected[col] == UTC_DATE_TIME_DTYPE: 78 | df[col] = pd.to_datetime(df[col], utc=True) 79 | else: 80 | df[col] = df[col].astype(expected[col]) 81 | except Exception as e: 82 | raise AssertionError(f"Failed to convert column: {col}") from e 83 | 84 | if cls.index_schema[1]: 85 | df.index = df.index.astype(cls.index_schema[1]) 86 | df.index.name = cls.index_schema[0] 87 | 88 | return cls(df) 89 | 90 | @classmethod 91 | def _extract_actual_dtypes(cls: Type[T], df: pd.DataFrame) -> dict: 92 | return df.dtypes.to_dict() 93 | 94 | @classmethod 95 | def _normalize_actual_dtype(cls: Type[T], dtype: Any) -> Any: 96 | if isinstance(dtype, CategoricalDtype): 97 | return tuple(dtype.categories) 98 | else: 99 | return dtype 100 | 101 | @classmethod 102 | def _normalize_expected_dtype(cls: Type[T], dtype: Any) -> Any: 103 | try: 104 | if dtype in _OBJECT_TYPES: 105 | return object 106 | else: 107 | return dtype 108 | except TypeError: 109 | return dtype 110 | 111 | def __init__(self, df: pd.DataFrame): 112 | 113 | if not isinstance(df, pd.DataFrame): 114 | raise AssertionError(f"Input argument of type {type(df)} is not an instance of pandas DataFrame") 115 | 116 | super().__init__(df) 117 | 118 | if self.index_schema[1]: 119 | if df.index.name != self.index_schema[0]: 120 | raise AssertionError(f"expected index name {self.index_schema[0]}, actual index name {df.index.name}") 121 | try: 122 | if self._dtypes_mismatch(df.index.dtype, self.index_schema[1]): 123 | raise AssertionError(f"expected index dtype {self.index_schema[1]}, 
actual index dtype {df.index.dtype}") 124 | except TypeError: 125 | raise AssertionError(f"expected index dtype {self.index_schema[1]}, actual index dtype {df.index.dtype}") 126 | 127 | categoricals = [df[c] for c in df.columns if isinstance(df[c].dtype, CategoricalDtype)] 128 | for col in categoricals: 129 | if object != col.values.categories.dtype: 130 | raise AssertionError("Categoricals must have str categories") 131 | if np.nan in col.unique(): 132 | raise AssertionError("Categoricals must not have NaNs") 133 | 134 | self.df = df 135 | -------------------------------------------------------------------------------- /typedframe/polars_.py: -------------------------------------------------------------------------------- 1 | from typing import Type, TypeVar, Any 2 | 3 | import polars as pl 4 | 5 | from typedframe.base import TypedDataFrameBase 6 | 7 | T = TypeVar("T", bound="PolarsTypedFrame") 8 | 9 | 10 | class PolarsTypedFrame(TypedDataFrameBase): 11 | """Wrapper class over polars DataFrame to provide explicit schema specs.""" 12 | 13 | @classmethod 14 | def convert(cls: Type[T], df: pl.DataFrame, add_optional_cols: bool = True) -> T: 15 | 16 | addon = {} 17 | if add_optional_cols: 18 | required = cls.dtype(with_optional=False) 19 | addon = {col: dtype for col, dtype in cls.dtype().items() if col not in df.columns and col not in required} 20 | 21 | expected = cls.dtype() 22 | df = df.with_columns([ 23 | pl.col(col).cast(expected[col]) for col in df.columns if col in expected 24 | ] + [ 25 | pl.lit(None, dtype=dtype).alias(col) for col, dtype in addon.items() 26 | ]) 27 | return cls(df) 28 | 29 | @classmethod 30 | def _extract_actual_dtypes(cls, df: pl.DataFrame) -> dict: 31 | return dict(zip(df.columns, df.dtypes)) 32 | 33 | @classmethod 34 | def _normalize_actual_dtype(cls, dtype: Any) -> Any: 35 | return dtype 36 | 37 | @classmethod 38 | def _normalize_expected_dtype(cls, dtype: Any) -> Any: 39 | return dtype 40 | 41 | def __init__(self, df: pl.DataFrame): 42 | 43 | if not isinstance(df, pl.DataFrame): 44 | raise AssertionError(f"Input argument of type {type(df)} is not an instance of polars DataFrame") 45 | 46 | super().__init__(df) 47 | self.df = df 48 | --------------------------------------------------------------------------------