├── .flake8 ├── .github └── workflows │ ├── docs.yml │ └── tests.yml ├── .gitignore ├── LICENSE ├── README.md ├── docs ├── CNAME ├── assets │ ├── api.png │ ├── cover.png │ ├── favicon.ico │ └── logo-white.png ├── index.md ├── models │ ├── image-classification.md │ ├── object-detection.md │ └── text-classification.md ├── requirements.txt ├── stylesheets │ ├── extra.css │ └── extra.js └── tutorial │ ├── deployment.md │ ├── experiment-tracking.md │ ├── intro.md │ ├── quickstart.ipynb │ ├── raw-models.md │ └── training.md ├── examples └── mnist-cnn-example.py ├── mkdocs.yml ├── requirements.txt ├── setup.py ├── tests ├── conftest.py ├── image_classification │ ├── test_preprocessing.py │ ├── test_sklearn_models.py │ └── test_torch_models.py ├── test_main.py └── test_model_wrapper.py └── traintool ├── __init__.py ├── _version.txt ├── image_classification ├── __init__.py ├── preprocessing.py ├── sklearn_models.py ├── torch_models.py └── visualization.py ├── main.py ├── model_wrapper.py └── utils.py /.flake8: -------------------------------------------------------------------------------- 1 | [flake8] 2 | max-line-length = 88 3 | extend-ignore = E203,W291,W293 4 | -------------------------------------------------------------------------------- /.github/workflows/docs.yml: -------------------------------------------------------------------------------- 1 | name: docs 2 | 3 | on: 4 | push: 5 | branches: 6 | - master 7 | 8 | jobs: 9 | deploy: 10 | runs-on: ubuntu-latest 11 | steps: 12 | - uses: actions/checkout@v2 13 | - name: Set up Python 3.7 14 | uses: actions/setup-python@v2 15 | with: 16 | python-version: 3.7 17 | - name: Install dependencies for docs 18 | run: pip install -r docs/requirements.txt 19 | - name: Deploy to gh-pages 20 | run: mkdocs gh-deploy --force -------------------------------------------------------------------------------- /.github/workflows/tests.yml: -------------------------------------------------------------------------------- 1 | name: tests 2 | 3 | on: [push] 4 | 5 | jobs: 6 | build: 7 | 8 | runs-on: ubuntu-latest 9 | strategy: 10 | matrix: 11 | python-version: [3.6, 3.7, 3.8] 12 | # <3.6 is not possible because we use f-strings and type annotations 13 | # 3.9 gives an error right now because pytorch doesn't support it yet apparently. 14 | 15 | steps: 16 | - uses: actions/checkout@v2 17 | - name: Set up Python 18 | uses: actions/setup-python@v2 19 | with: 20 | python-version: ${{ matrix.python-version }} 21 | - name: Install dependencies 22 | run: | 23 | python -m pip install --upgrade pip 24 | pip install pytest pytest-cov 25 | if [ -f requirements.txt ]; then pip install -r requirements.txt; fi 26 | # - name: Lint with flake8 27 | # run: | 28 | # # stop the build if there are Python syntax errors or undefined names 29 | # flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics 30 | # # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide 31 | # flake8 . 
--count --exit-zero --max-complexity=10 --max-line-length=127 --statistics 32 | - name: Test with pytest 33 | run: | 34 | pytest --cov=./ --cov-report=xml 35 | - name: Upload coverage to Codecov 36 | uses: codecov/codecov-action@v1 37 | with: 38 | token: ${{ secrets.CODECOV_TOKEN }} # not required for public repos 39 | file: ./coverage.xml # optional 40 | files: ./coverage1.xml,./coverage2.xml # optional 41 | flags: unittests # optional 42 | name: codecov-umbrella # optional 43 | fail_ci_if_error: true # optional (default = false) -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | data 2 | settings.json 3 | .vscode 4 | traintool-experiments 5 | .VSCodeCounter 6 | 7 | 8 | # Byte-compiled / optimized / DLL files 9 | __pycache__/ 10 | *.py[cod] 11 | *$py.class 12 | 13 | # C extensions 14 | *.so 15 | 16 | # Distribution / packaging 17 | .Python 18 | build/ 19 | develop-eggs/ 20 | dist/ 21 | downloads/ 22 | eggs/ 23 | .eggs/ 24 | lib/ 25 | lib64/ 26 | parts/ 27 | sdist/ 28 | var/ 29 | wheels/ 30 | pip-wheel-metadata/ 31 | share/python-wheels/ 32 | *.egg-info/ 33 | .installed.cfg 34 | *.egg 35 | MANIFEST 36 | 37 | # PyInstaller 38 | # Usually these files are written by a python script from a template 39 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 40 | *.manifest 41 | *.spec 42 | 43 | # Installer logs 44 | pip-log.txt 45 | pip-delete-this-directory.txt 46 | 47 | # Unit test / coverage reports 48 | htmlcov/ 49 | .tox/ 50 | .nox/ 51 | .coverage 52 | .coverage.* 53 | .cache 54 | nosetests.xml 55 | coverage.xml 56 | *.cover 57 | *.py,cover 58 | .hypothesis/ 59 | .pytest_cache/ 60 | 61 | # Translations 62 | *.mo 63 | *.pot 64 | 65 | # Django stuff: 66 | *.log 67 | local_settings.py 68 | db.sqlite3 69 | db.sqlite3-journal 70 | 71 | # Flask stuff: 72 | instance/ 73 | .webassets-cache 74 | 75 | # Scrapy stuff: 76 | .scrapy 77 | 78 | # Sphinx documentation 79 | docs/_build/ 80 | 81 | # PyBuilder 82 | target/ 83 | 84 | # Jupyter Notebook 85 | .ipynb_checkpoints 86 | 87 | # IPython 88 | profile_default/ 89 | ipython_config.py 90 | 91 | # pyenv 92 | .python-version 93 | 94 | # pipenv 95 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 96 | # However, in case of collaboration, if having platform-specific dependencies or dependencies 97 | # having no cross-platform support, pipenv may install dependencies that don't work, or not 98 | # install all needed dependencies. 99 | #Pipfile.lock 100 | 101 | # PEP 582; used by e.g. 
github.com/David-OConnor/pyflow 102 | __pypackages__/ 103 | 104 | # Celery stuff 105 | celerybeat-schedule 106 | celerybeat.pid 107 | 108 | # SageMath parsed files 109 | *.sage.py 110 | 111 | # Environments 112 | .env 113 | .venv 114 | env/ 115 | venv/ 116 | ENV/ 117 | env.bak/ 118 | venv.bak/ 119 | 120 | # Spyder project settings 121 | .spyderproject 122 | .spyproject 123 | 124 | # Rope project settings 125 | .ropeproject 126 | 127 | # mkdocs documentation 128 | /site 129 | 130 | # mypy 131 | .mypy_cache/ 132 | .dmypy.json 133 | dmypy.json 134 | 135 | # Pyre type checker 136 | .pyre/ 137 | .pheasant_cache 138 | 139 | config.json 140 | *config.json 141 | */tmp/* 142 | 143 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | Apache License 2 | Version 2.0, January 2004 3 | http://www.apache.org/licenses/ 4 | 5 | TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION 6 | 7 | 1. Definitions. 8 | 9 | "License" shall mean the terms and conditions for use, reproduction, 10 | and distribution as defined by Sections 1 through 9 of this document. 11 | 12 | "Licensor" shall mean the copyright owner or entity authorized by 13 | the copyright owner that is granting the License. 14 | 15 | "Legal Entity" shall mean the union of the acting entity and all 16 | other entities that control, are controlled by, or are under common 17 | control with that entity. For the purposes of this definition, 18 | "control" means (i) the power, direct or indirect, to cause the 19 | direction or management of such entity, whether by contract or 20 | otherwise, or (ii) ownership of fifty percent (50%) or more of the 21 | outstanding shares, or (iii) beneficial ownership of such entity. 22 | 23 | "You" (or "Your") shall mean an individual or Legal Entity 24 | exercising permissions granted by this License. 25 | 26 | "Source" form shall mean the preferred form for making modifications, 27 | including but not limited to software source code, documentation 28 | source, and configuration files. 29 | 30 | "Object" form shall mean any form resulting from mechanical 31 | transformation or translation of a Source form, including but 32 | not limited to compiled object code, generated documentation, 33 | and conversions to other media types. 34 | 35 | "Work" shall mean the work of authorship, whether in Source or 36 | Object form, made available under the License, as indicated by a 37 | copyright notice that is included in or attached to the work 38 | (an example is provided in the Appendix below). 39 | 40 | "Derivative Works" shall mean any work, whether in Source or Object 41 | form, that is based on (or derived from) the Work and for which the 42 | editorial revisions, annotations, elaborations, or other modifications 43 | represent, as a whole, an original work of authorship. For the purposes 44 | of this License, Derivative Works shall not include works that remain 45 | separable from, or merely link (or bind by name) to the interfaces of, 46 | the Work and Derivative Works thereof. 47 | 48 | "Contribution" shall mean any work of authorship, including 49 | the original version of the Work and any modifications or additions 50 | to that Work or Derivative Works thereof, that is intentionally 51 | submitted to Licensor for inclusion in the Work by the copyright owner 52 | or by an individual or Legal Entity authorized to submit on behalf of 53 | the copyright owner. 
For the purposes of this definition, "submitted" 54 | means any form of electronic, verbal, or written communication sent 55 | to the Licensor or its representatives, including but not limited to 56 | communication on electronic mailing lists, source code control systems, 57 | and issue tracking systems that are managed by, or on behalf of, the 58 | Licensor for the purpose of discussing and improving the Work, but 59 | excluding communication that is conspicuously marked or otherwise 60 | designated in writing by the copyright owner as "Not a Contribution." 61 | 62 | "Contributor" shall mean Licensor and any individual or Legal Entity 63 | on behalf of whom a Contribution has been received by Licensor and 64 | subsequently incorporated within the Work. 65 | 66 | 2. Grant of Copyright License. Subject to the terms and conditions of 67 | this License, each Contributor hereby grants to You a perpetual, 68 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable 69 | copyright license to reproduce, prepare Derivative Works of, 70 | publicly display, publicly perform, sublicense, and distribute the 71 | Work and such Derivative Works in Source or Object form. 72 | 73 | 3. Grant of Patent License. Subject to the terms and conditions of 74 | this License, each Contributor hereby grants to You a perpetual, 75 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable 76 | (except as stated in this section) patent license to make, have made, 77 | use, offer to sell, sell, import, and otherwise transfer the Work, 78 | where such license applies only to those patent claims licensable 79 | by such Contributor that are necessarily infringed by their 80 | Contribution(s) alone or by combination of their Contribution(s) 81 | with the Work to which such Contribution(s) was submitted. If You 82 | institute patent litigation against any entity (including a 83 | cross-claim or counterclaim in a lawsuit) alleging that the Work 84 | or a Contribution incorporated within the Work constitutes direct 85 | or contributory patent infringement, then any patent licenses 86 | granted to You under this License for that Work shall terminate 87 | as of the date such litigation is filed. 88 | 89 | 4. Redistribution. 
You may reproduce and distribute copies of the 90 | Work or Derivative Works thereof in any medium, with or without 91 | modifications, and in Source or Object form, provided that You 92 | meet the following conditions: 93 | 94 | (a) You must give any other recipients of the Work or 95 | Derivative Works a copy of this License; and 96 | 97 | (b) You must cause any modified files to carry prominent notices 98 | stating that You changed the files; and 99 | 100 | (c) You must retain, in the Source form of any Derivative Works 101 | that You distribute, all copyright, patent, trademark, and 102 | attribution notices from the Source form of the Work, 103 | excluding those notices that do not pertain to any part of 104 | the Derivative Works; and 105 | 106 | (d) If the Work includes a "NOTICE" text file as part of its 107 | distribution, then any Derivative Works that You distribute must 108 | include a readable copy of the attribution notices contained 109 | within such NOTICE file, excluding those notices that do not 110 | pertain to any part of the Derivative Works, in at least one 111 | of the following places: within a NOTICE text file distributed 112 | as part of the Derivative Works; within the Source form or 113 | documentation, if provided along with the Derivative Works; or, 114 | within a display generated by the Derivative Works, if and 115 | wherever such third-party notices normally appear. The contents 116 | of the NOTICE file are for informational purposes only and 117 | do not modify the License. You may add Your own attribution 118 | notices within Derivative Works that You distribute, alongside 119 | or as an addendum to the NOTICE text from the Work, provided 120 | that such additional attribution notices cannot be construed 121 | as modifying the License. 122 | 123 | You may add Your own copyright statement to Your modifications and 124 | may provide additional or different license terms and conditions 125 | for use, reproduction, or distribution of Your modifications, or 126 | for any such Derivative Works as a whole, provided Your use, 127 | reproduction, and distribution of the Work otherwise complies with 128 | the conditions stated in this License. 129 | 130 | 5. Submission of Contributions. Unless You explicitly state otherwise, 131 | any Contribution intentionally submitted for inclusion in the Work 132 | by You to the Licensor shall be under the terms and conditions of 133 | this License, without any additional terms or conditions. 134 | Notwithstanding the above, nothing herein shall supersede or modify 135 | the terms of any separate license agreement you may have executed 136 | with Licensor regarding such Contributions. 137 | 138 | 6. Trademarks. This License does not grant permission to use the trade 139 | names, trademarks, service marks, or product names of the Licensor, 140 | except as required for reasonable and customary use in describing the 141 | origin of the Work and reproducing the content of the NOTICE file. 142 | 143 | 7. Disclaimer of Warranty. Unless required by applicable law or 144 | agreed to in writing, Licensor provides the Work (and each 145 | Contributor provides its Contributions) on an "AS IS" BASIS, 146 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or 147 | implied, including, without limitation, any warranties or conditions 148 | of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A 149 | PARTICULAR PURPOSE. 
You are solely responsible for determining the 150 | appropriateness of using or redistributing the Work and assume any 151 | risks associated with Your exercise of permissions under this License. 152 | 153 | 8. Limitation of Liability. In no event and under no legal theory, 154 | whether in tort (including negligence), contract, or otherwise, 155 | unless required by applicable law (such as deliberate and grossly 156 | negligent acts) or agreed to in writing, shall any Contributor be 157 | liable to You for damages, including any direct, indirect, special, 158 | incidental, or consequential damages of any character arising as a 159 | result of this License or out of the use or inability to use the 160 | Work (including but not limited to damages for loss of goodwill, 161 | work stoppage, computer failure or malfunction, or any and all 162 | other commercial damages or losses), even if such Contributor 163 | has been advised of the possibility of such damages. 164 | 165 | 9. Accepting Warranty or Additional Liability. While redistributing 166 | the Work or Derivative Works thereof, You may choose to offer, 167 | and charge a fee for, acceptance of support, warranty, indemnity, 168 | or other liability obligations and/or rights consistent with this 169 | License. However, in accepting such obligations, You may act only 170 | on Your own behalf and on Your sole responsibility, not on behalf 171 | of any other Contributor, and only if You agree to indemnify, 172 | defend, and hold each Contributor harmless for any liability 173 | incurred by, or claims asserted against, such Contributor by reason 174 | of your accepting any such warranty or additional liability. 175 | 176 | END OF TERMS AND CONDITIONS 177 | 178 | APPENDIX: How to apply the Apache License to your work. 179 | 180 | To apply the Apache License to your work, attach the following 181 | boilerplate notice, with the fields enclosed by brackets "[]" 182 | replaced with your own identifying information. (Don't include 183 | the brackets!) The text should be enclosed in the appropriate 184 | comment syntax for the file format. We also recommend that a 185 | file or class name and description of purpose be included on the 186 | same "printed page" as the copyright notice for easier 187 | identification within third-party archives. 188 | 189 | Copyright 2020 Johannes Rieke 190 | 191 | Licensed under the Apache License, Version 2.0 (the "License"); 192 | you may not use this file except in compliance with the License. 193 | You may obtain a copy of the License at 194 | 195 | http://www.apache.org/licenses/LICENSE-2.0 196 | 197 | Unless required by applicable law or agreed to in writing, software 198 | distributed under the License is distributed on an "AS IS" BASIS, 199 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 200 | See the License for the specific language governing permissions and 201 | limitations under the License. -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 |
14 | Train off-the-shelf machine learning models in one line of code 15 |
25 | Try it out in Google Colab • Documentation 26 | 
27 | 28 | --- 29 | 30 | traintool is the easiest Python library for **applied machine learning**. It allows you 31 | to train off-the-shelf models with minimal code: just give your data 32 | and the model name, and traintool takes care of the rest. It combines **pre-implemented 33 | models** (built on top of sklearn & pytorch) with powerful **utilities** that get you 34 | started in seconds (automatic visualizations, experiment tracking, intelligent data 35 | preprocessing, API deployment). 36 | 37 | 38 | Alpha Release: traintool is in an early alpha release. The API can and will change 39 | without notice. If you find a bug, please file an issue on 40 | [Github](https://github.com/jrieke/traintool) or 41 | [write me](mailto:johannes.rieke@gmail.com). 42 | 43 | 44 | 45 | 50 | 51 | 69 | 70 | 71 | ## Installation 72 | 73 | ```bash 74 | pip install traintool 75 | ``` 76 | 77 | 78 | ## Features 79 | 80 | - **Minimum coding —** traintool is designed to require as few lines of code as 81 | possible. It offers a sleek and intuitive interface that gets you started in seconds. 82 | Training a model just takes a single line: 83 | 84 | ```python 85 | traintool.train("resnet18", train_data, test_data, config={"optimizer": "adam", "lr": 0.1}) 86 | ``` 87 | 88 | - **Pre-implemented models —** At the heart of traintool are fully implemented and tested 89 | models – from simple classifiers to deep neural networks; built on sklearn, pytorch, 90 | or tensorflow. Here are just a few of the models you can use: 91 | 92 | ```python 93 | "svc", "random-forest", "alexnet", "resnet50", "inception_v3", ... 94 | ``` 95 | 96 | - **Automatic visualizations & experiment tracking —** traintool automatically 97 | calculates metrics, creates beautiful visualizations (in 98 | [tensorboard](https://www.tensorflow.org/tensorboard) or 99 | [comet.ml](https://www.comet.ml/)), and stores experiment data and 100 | model checkpoints – without needing a single additional line of code. 101 | 102 | - **Ready for your data —** traintool understands numpy arrays, pytorch datasets, 103 | and files. It automatically converts and preprocesses everything based on the model you 104 | use. 105 | 106 | - **Instant deployment —** In one line of code, you can deploy your model to a REST 107 | API that you can query from anywhere. Just call: 108 | 109 | ```python 110 | model.deploy() 111 | ``` 112 | 113 | 114 | 123 | 124 | 125 | 126 | 127 | ## Example: Image classification on MNIST 128 | 129 | Run this example interactively in Google Colab: 130 | 131 | [](https://colab.research.google.com/github/jrieke/traintool/blob/master/docs/tutorial/quickstart.ipynb) 132 | 133 | ```python 134 | import mnist 135 | import traintool 136 | 137 | # Load MNIST data as numpy 138 | train_data = [mnist.train_images(), mnist.train_labels()] 139 | test_data = [mnist.test_images(), mnist.test_labels()] 140 | 141 | # Train SVM classifier 142 | svc = traintool.train("svc", train_data=train_data, test_data=test_data) 143 | 144 | # Train ResNet with custom hyperparameters 145 | resnet = traintool.train("resnet18", train_data=train_data, test_data=test_data, 146 | config={"lr": 0.1, "optimizer": "adam"}) 147 | 148 | # Make prediction 149 | result = resnet.predict(test_data[0][0]) 150 | print(result["predicted_class"]) 151 | 152 | # Deploy to REST API 153 | resnet.deploy() 154 | 155 | # Get underlying pytorch model (e.g. 
for custom analysis) 156 | pytorch_model = resnet.raw()["model"] 157 | ``` 158 | 159 | For more information, check out the 160 | [complete tutorial](https://traintool.jrieke.com/tutorial/quickstart/). 161 | 162 | 163 | ## Get in touch! 164 | 165 | You have a question on traintool, want to use it in production, or miss a feature? I'm 166 | happy to hear from you! Write me at [johannes.rieke@gmail.com](mailto:johannes.rieke@gmail.com). 167 | -------------------------------------------------------------------------------- /docs/CNAME: -------------------------------------------------------------------------------- 1 | traintool.jrieke.com -------------------------------------------------------------------------------- /docs/assets/api.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jrieke/traintool/0ada1ff20a9a570be5cfb4ac21f3f914604c9833/docs/assets/api.png -------------------------------------------------------------------------------- /docs/assets/cover.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jrieke/traintool/0ada1ff20a9a570be5cfb4ac21f3f914604c9833/docs/assets/cover.png -------------------------------------------------------------------------------- /docs/assets/favicon.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jrieke/traintool/0ada1ff20a9a570be5cfb4ac21f3f914604c9833/docs/assets/favicon.ico -------------------------------------------------------------------------------- /docs/assets/logo-white.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jrieke/traintool/0ada1ff20a9a570be5cfb4ac21f3f914604c9833/docs/assets/logo-white.png -------------------------------------------------------------------------------- /docs/index.md: -------------------------------------------------------------------------------- 1 |
14 | Train off-the-shelf machine learning models in one line of code 15 |
25 | Try it out in Google Colab • Documentation 26 | 
27 | 28 | --- 29 | 30 | traintool is the easiest Python library for **applied machine learning**. It allows you 31 | to train off-the-shelf models with minimal code: just give your data 32 | and the model name, and traintool takes care of the rest. It combines **pre-implemented 33 | models** (built on top of sklearn & pytorch) with powerful **utilities** that get you 34 | started in seconds (automatic visualizations, experiment tracking, intelligent data 35 | preprocessing, API deployment). 36 | 37 | 38 | !!! warning "Alpha Release" 39 | traintool is in an early alpha release. The API can and will change 40 | without notice. If you find a bug, please file an issue on 41 | [Github](https://github.com/jrieke/traintool) or [write me](mailto:johannes.rieke@gmail.com). 42 | 43 | 44 | 45 | 50 | 51 | 69 | 70 | 71 | ## Installation 72 | 73 | ```bash 74 | pip install traintool 75 | ``` 76 | 77 | 78 | 79 | ## Features 80 | 81 | - **Minimum coding —** traintool is designed to require as few lines of code as 82 | possible. It offers a sleek and intuitive interface that gets you started in seconds. 83 | Training a model just takes a single line: 84 | 85 | traintool.train("resnet18", train_data, test_data, config={"optimizer": "adam", "lr": 0.1}) 86 | 87 | 88 | - **Pre-implemented models —** At the heart of traintool are fully implemented and tested 89 | models – from simple classifiers to deep neural networks; built on sklearn, pytorch, 90 | or tensorflow. Here are just a few of the models you can use: 91 | 92 | "svc", "random-forest", "alexnet", "resnet50", "inception_v3", ... 93 | 94 | - **Automatic visualizations & experiment tracking —** traintool automatically 95 | calculates metrics, creates beautiful visualizations (in 96 | [tensorboard](https://www.tensorflow.org/tensorboard) or 97 | [comet.ml](https://www.comet.ml/)), and stores experiment data and 98 | model checkpoints – without needing a single additional line of code. 99 | 100 | - **Ready for your data —** traintool understands numpy arrays, pytorch datasets, 101 | and files. It automatically converts and preprocesses everything based on the model you 102 | use. 103 | 104 | - **Instant deployment —** In one line of code, you can deploy your model to a REST 105 | API that you can query from anywhere. Just call: 106 | 107 | model.deploy() 108 | 109 | 110 | 119 | 120 | 121 | ## Example: Image classification on MNIST 122 | 123 | Run this example interactively in Google Colab: 124 | 125 | [](https://colab.research.google.com/github/jrieke/traintool/blob/master/docs/tutorial/quickstart.ipynb) 126 | 127 | ```python 128 | import mnist 129 | import traintool 130 | 131 | # Load MNIST data as numpy 132 | train_data = [mnist.train_images(), mnist.train_labels()] 133 | test_data = [mnist.test_images(), mnist.test_labels()] 134 | 135 | # Train SVM classifier 136 | svc = traintool.train("svc", train_data=train_data, test_data=test_data) 137 | 138 | # Train ResNet with custom hyperparameters 139 | resnet = traintool.train("resnet18", train_data=train_data, test_data=test_data, 140 | config={"lr": 0.1, "optimizer": "adam"}) 141 | 142 | # Make prediction 143 | result = resnet.predict(test_data[0][0]) 144 | print(result["predicted_class"]) 145 | 146 | # Deploy to REST API 147 | resnet.deploy() 148 | 149 | # Get underlying pytorch model (e.g. for custom analysis) 150 | pytorch_model = resnet.raw()["model"] 151 | ``` 152 | 153 | For more information, check out the 154 | [complete tutorial](https://traintool.jrieke.com/tutorial/quickstart/). 
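Saved models can be loaded again later via `traintool.load`. Here is a minimal sketch (the experiment ID below is a hypothetical placeholder; the real ID and the exact load command are printed to the console during training):

```python
# Load a saved model by its experiment ID or directory path (placeholder ID)
resnet = traintool.load("2021-01-01_12-00-00")

# The loaded model behaves like the freshly trained one
result = resnet.predict(test_data[0][0])
```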
155 | 156 | 157 | ## Get in touch! 158 | 159 | You have a question on traintool, want to use it in production, or miss a feature? I'm 160 | happy to hear from you! Write me at [johannes.rieke@gmail.com](mailto:johannes.rieke@gmail.com). 161 | -------------------------------------------------------------------------------- /docs/models/image-classification.md: -------------------------------------------------------------------------------- 1 | # Image classification 2 | 3 |  4 | 5 | Image classification models classify an image into one of several categories or 6 | classes, based on the image content (e.g. "cat" or "dog"). 7 | 8 | ## Input formats 9 | 10 | ### Numpy arrays 11 | 12 | Each dataset should be a list of two elements: The first element is a numpy array 13 | of all images of shape `(number of images, color channels (1 or 3), height, width)`. The second 14 | element is an array of labels (as integer indices). 15 | 16 | Example: 17 | 18 | ```python 19 | train_images = np.zeros((32, 3, 256, 256)) # 32 images with 3 color channels and size 256x256 20 | train_labels = np.zeros(32, dtype=int) 21 | 22 | traintool.train(..., train_data=[train_images, train_labels]) 23 | ``` 24 | 25 | 33 | 34 | ### Files 35 | 36 | Image files should be arranged in one folder per class, similar to this: 37 | 38 | ``` 39 | train 40 | +-- dogs 41 | | +-- funny-dog.jpg 42 | | +-- another-dog.png 43 | +-- cats 44 | | +-- brown-cat.png 45 | | +-- black-cat.png 46 | ... 47 | ``` 48 | 49 | Then simply pass the directory path to the `train` function: 50 | 51 | ```python 52 | traintool.train(..., train_data="./train") 53 | ``` 54 | 55 | 56 | ## Scikit-learn models 57 | 58 | These models implement simple classification algorithms that should train in a 59 | reasonable amount of time. Note that they are not GPU-accelerated, so they can still 60 | take quite long on large datasets. 61 | 62 | **Preprocessing:** Image files are first loaded and resized to 28 x 28 pixels. All images (numpy 63 | or files) are then flattened and scaled to mean 0, standard deviation 1 (based on the 64 | train set). 65 | 66 | **Config parameters:** 67 | 68 | - `num_samples`: Set the number of samples to train on. This can be used to train on a 69 | subset of the data. Defaults to None (i.e. train on all data). 70 | - `num_samples_to_plot`: Set the number of samples to plot to tensorboard for each 71 | dataset. Defaults to 5. 72 | - All other config parameters are forwarded to the constructor of the underlying sklearn object. 73 | 74 | **Models:** 75 | 76 | - `random-forest`: A random forest classifier, from [sklearn.ensemble.RandomForestClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.ensemble.RandomForestClassifier.html) 77 | - `gradient-boosting`: Gradient boosting for classification, from [sklearn.ensemble.GradientBoostingClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.ensemble.GradientBoostingClassifier.html) 78 | - `gaussian-process`: Gaussian process classification based on Laplace approximation, from [sklearn.gaussian_process.GaussianProcessClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.gaussian_process.GaussianProcessClassifier.html#sklearn.gaussian_process.GaussianProcessClassifier) 79 | - `logistic-regression`: Logistic Regression (aka logit, MaxEnt) classifier, from [sklearn.linear_model.LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) 80 | - `sgd`: Linear classifiers (SVM, logistic regression, etc.) 
with SGD training, from [sklearn.linear_model.SGDClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.SGDClassifier.html) 81 | - `perceptron`: A perceptron classifier, from [sklearn.linear_model.Perceptron](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.Perceptron.html) 82 | - `passive-aggressive`: Passive aggressive classifier, from [sklearn.linear_model.PassiveAggressiveClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.PassiveAggressiveClassifier.html) 83 | - `gaussian-nb`: Gaussian Naive Bayes, from [sklearn.naive_bayes.GaussianNB](https://scikit-learn.org/stable/modules/generated/sklearn.naive_bayes.GaussianNB.html) 84 | - `k-neighbors`: Classifier implementing the k-nearest neighbors vote, from [sklearn.neighbors.KNeighborsClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.neighbors.KNeighborsClassifier.html) 85 | - `mlp`: Multi-layer Perceptron classifier, from [sklearn.neural_network.MLPClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.neural_network.MLPClassifier.html) 86 | - `svc`: C-Support Vector Classification, from [sklearn.svm.SVC](https://scikit-learn.org/stable/modules/generated/sklearn.svm.SVC.html) 87 | - `linear-svc`: Linear Support Vector Classification, from [sklearn.svm.LinearSVC](https://scikit-learn.org/stable/modules/generated/sklearn.svm.LinearSVC.html) 88 | - `decision-tree`: A decision tree classifier, from [sklearn.tree.DecisionTreeClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.tree.DecisionTreeClassifier.html) 89 | - `extra-tree`: An extra-trees classifier, from [sklearn.ensemble.ExtraTreesClassifier](https://scikit-learn.org/stable/modules/generated/sklearn.ensemble.ExtraTreesClassifier.html) 90 | 91 | 92 | 93 | ## PyTorch models 94 | 95 | These models implement deep neural networks that can give better results on complex 96 | datasets. They are GPU-accelerated if run on a machine with a GPU. 97 | 98 | **Preprocessing:** All images (numpy or files) are rescaled to 256 x 256, then 99 | center-cropped to 224 x 224, and normalized with the ImageNet channel means and standard deviations (the standard preprocessing for the torchvision models). 100 | 101 | **Config parameters:** 102 | 103 | - `num_classes`: The number of classes/different output labels (and therefore number of 104 | output neurons of the network). Defaults to None, in which case it will be automatically 105 | inferred from the data. 106 | - `num_samples`: Set the number of samples to train on. This can be used to train on a 107 | subset of the data. Defaults to None (i.e. train on all data). 108 | - `num_samples_to_plot`: Set the number of samples to plot to tensorboard for each 109 | dataset. Defaults to 5. 110 | - `pretrained`: Whether to use pretrained weights for the models (trained on ImageNet). 111 | Note that this requires that there are 1000 classes (the ImageNet classes). Defaults to 112 | False. 113 | 114 | **Models:** 115 | 116 | More information in the [torchvision docs](https://pytorch.org/docs/stable/torchvision/models.html). 
117 | 118 | - `alexnet`: AlexNet model architecture from the [“One weird trick…”](https://arxiv.org/abs/1404.5997) paper 119 | - `vgg11`, `vgg11_bn`, `vgg13`, `vgg13_bn`, `vgg16`, `vgg16_bn`, `vgg19`, or `vgg19_bn`: VGG model variants from [“Very Deep Convolutional Networks For Large-Scale Image Recognition”](https://arxiv.org/pdf/1409.1556.pdf) 120 | - `resnet18`, `resnet34`, `resnet50`, `resnet101`, or `resnet152`: ResNet model variants from [“Deep Residual Learning for Image Recognition”](https://arxiv.org/pdf/1512.03385.pdf) 121 | - `squeezenet1_0`, or `squeezenet1_1`: SqueezeNet model variants from the [“SqueezeNet: AlexNet-level accuracy with 50x fewer parameters and <0.5MB model size”](https://arxiv.org/abs/1602.07360) paper. 122 | - `densenet121`, `densenet169`, `densenet161`, or `densenet201`: Densenet model variants from [“Densely Connected Convolutional Networks”](https://arxiv.org/pdf/1608.06993.pdf) 123 | - `inception_v3`: Inception v3 model architecture from [“Rethinking the Inception Architecture for Computer Vision”](http://arxiv.org/abs/1512.00567) 124 | - `googlenet`: GoogLeNet (Inception v1) model architecture from [“Going Deeper with Convolutions”](http://arxiv.org/abs/1409.4842) 125 | - `shufflenet_v2_x0_5`, `shufflenet_v2_x1_0`, `shufflenet_v2_x1_5`, or `shufflenet_v2_x2_0`: ShuffleNetV2 variants, as described in [“ShuffleNet V2: Practical Guidelines for Efficient CNN Architecture Design”](https://arxiv.org/abs/1807.11164) 126 | - `mobilenet_v2`: MobileNetV2 architecture from [“MobileNetV2: Inverted Residuals and Linear Bottlenecks”](https://arxiv.org/abs/1801.04381) 127 | - `resnext50_32x4d` or `resnext101_32x8d`: ResNeXt model variants from [“Aggregated Residual Transformation for Deep Neural Networks”](https://arxiv.org/pdf/1611.05431.pdf) 128 | - `wide_resnet50_2` or `wide_resnet101_2`: Wide ResNet-50-2 model variants from [“Wide Residual Networks”](https://arxiv.org/pdf/1605.07146.pdf) 129 | - `mnasnet0_5`, `mnasnet0_75`, `mnasnet1_0`, or `mnasnet1_3`: MNASNet variants from [“MnasNet: Platform-Aware Neural Architecture Search for Mobile”](https://arxiv.org/pdf/1807.11626.pdf) 130 | 131 | 132 | -------------------------------------------------------------------------------- /docs/models/object-detection.md: -------------------------------------------------------------------------------- 1 | # Object detection 2 | 3 | Coming soon! -------------------------------------------------------------------------------- /docs/models/text-classification.md: -------------------------------------------------------------------------------- 1 | # Text classification 2 | 3 | Coming soon! 
-------------------------------------------------------------------------------- /docs/requirements.txt: -------------------------------------------------------------------------------- 1 | mkdocs 2 | mkdocs-material 3 | pygments 4 | pymdown-extensions 5 | mkdocs-autolinks-plugin 6 | mknotebooks 7 | #mkdocs-table-reader-plugin 8 | #mkdocs-jupyter # NOTE: this requires nbconvert==5.6.1 9 | #mkdocs-exclude 10 | #mkdocs-click 11 | #mkdocstrings 12 | -------------------------------------------------------------------------------- /docs/stylesheets/extra.css: -------------------------------------------------------------------------------- 1 | /* header different color*/ 2 | /* 3 | .md-header { 4 | background-color: #232f3e !important; 5 | border-bottom: 1px solid #1b2532 !important; 6 | } 7 | */ 8 | 9 | 10 | /* Active tab bold & color */ 11 | .md-tabs__link { 12 | font-size: .75rem !important; 13 | } 14 | .md-tabs__link--active { 15 | font-weight: bold !important; 16 | color: var(--md-accent-fg-color); 17 | } 18 | .md-tabs__link:hover { 19 | color: var(--md-accent-fg-color); 20 | } 21 | 22 | /* navigation bar active color*/ 23 | .md-nav__item .md-nav__link--active { 24 | font-weight: bold !important; 25 | color: var(--md-accent-fg-color); 26 | } 27 | .md-nav__item .md-nav__link--active { 28 | font-weight: bold !important; 29 | font-size: .75rem !important; 30 | color: var(--md-accent-fg-color); 31 | } 32 | 33 | /* frontpage elements */ 34 | .tx-hero h1 { 35 | font-size: 2.41rem !important; 36 | } 37 | a.md-button.md-button--primary { 38 | background-color: var(--md-accent-fg-color); 39 | border-color: var(--md-accent-fg-color); 40 | color: #ffffff; 41 | } 42 | a.md-button.md-button--primary:hover { 43 | color: #000000; 44 | } 45 | a.md-button.md-button:hover { 46 | color: #000000; 47 | } 48 | 49 | 50 | /* More visible headings*/ 51 | .md-main h1 { 52 | margin: 0.5em 0 1.0em 0; 53 | color: #333; 54 | font-weight: bold; 55 | font-size: 36px; 56 | line-height: 40px; 57 | /* 58 | counter-increment: section-1; 59 | counter-reset: section-2 section-3 section-4; 60 | */ 61 | } 62 | .md-main h2 { 63 | margin: 1.5em 0 0.4em 0; 64 | color: #595959; 65 | font-weight: normal; 66 | font-size: 30px; 67 | line-height: 36px; 68 | border-bottom: 1px solid #fff; 69 | box-shadow: 0 1px 0 rgba(0,0,0,0.1); 70 | padding-bottom: 10px; 71 | /* 72 | counter-increment: section-2; 73 | counter-reset: section-3 section-4; 74 | */ 75 | } 76 | .md-main h3 { 77 | margin: 1.2em 0 0.4em 0; 78 | color: #595959; 79 | font-weight: normal; 80 | font-size: 26px; 81 | line-height: 40px; 82 | /* 83 | counter-increment: section-3; 84 | counter-reset: section-4; 85 | */ 86 | } 87 | .md-main h4 { 88 | margin: 1.0em 0 0.4em 0; 89 | color: #333; 90 | font-weight: normal; 91 | font-size: 20px; 92 | line-height: 20px; 93 | /* counter-increment: section-4; */ 94 | } 95 | 96 | 97 | /* Define class for block image in block documentation trimmed*/ 98 | .blockimage { 99 | width: 200px; 100 | margin-right: 20px; 101 | margin-top: 7px; 102 | position:relative; 103 | float:left; 104 | } 105 | .blockimage img { 106 | width:100%; 107 | max-width:100%; 108 | float:left; 109 | } 110 | 111 | 112 | /*Table styling*/ 113 | table { 114 | padding: 0; } 115 | table tr { 116 | border-top: 1px solid #cccccc; 117 | background-color: white; 118 | margin: 0; 119 | padding: 0; } 120 | table tr:nth-child(2n) { 121 | background-color: #f8f8f8; } 122 | table tr th { 123 | font-weight: bold; 124 | border: 0px solid #cccccc; 125 | text-align: centre; 126 | margin: 0; 
127 | padding: 6px 13px; } 128 | table tr td { 129 | border: 0px solid #cccccc; 130 | text-align: center; 131 | margin: 0; 132 | padding: 6px 13px; } 133 | table tr th :first-child, table tr td :first-child { 134 | margin-top: 0; } 135 | table tr th :last-child, table tr td :last-child { 136 | margin-bottom: 0; } 137 | 138 | /* Necessary CSS for tabbed extension */ 139 | .tabbed-set { 140 | display: flex; 141 | position: relative; 142 | flex-wrap: wrap; 143 | } 144 | .tabbed-set .highlight { 145 | background: #ddd; 146 | } 147 | .tabbed-set .tabbed-content { 148 | display: none; 149 | order: 99; 150 | width: 100%; 151 | } 152 | .tabbed-set label { 153 | width: auto; 154 | margin: 0 0.5em; 155 | padding: 0.25em; 156 | font-size: 120%; 157 | cursor: pointer; 158 | } 159 | .tabbed-set input { 160 | position: absolute; 161 | opacity: 0; 162 | } 163 | .tabbed-set input:nth-child(n+1) { 164 | color: #333333; 165 | } 166 | .tabbed-set input:nth-child(n+1):checked + label { 167 | color: #FF5252; 168 | } 169 | .tabbed-set input:nth-child(n+1):checked + label + .tabbed-content { 170 | display: block; 171 | } 172 | 173 | 174 | /* Admonition settings option*/ 175 | .md-typeset .admonition.settings, .md-typeset details.settings { 176 | border-left: .22rem solid #448aff; 177 | } 178 | .md-typeset .admonition.settings>.admonition-title, .md-typeset details.settings>.admonition-title, .md-typeset details.settings>summary { 179 | border-bottom: .1rem solid rgba(236, 243, 255, .1); 180 | background-color: rgba(236, 243, 255, .1); 181 | } 182 | .md-typeset .admonition.settings>.admonition-title:before, .md-typeset details.settings>.admonition-title:before, .md-typeset details.settings>summary:before { 183 | color: #448aff; 184 | content: "settings"} 185 | 186 | 187 | /* Code block size, but then too small in blocks*/ 188 | /*code { font-size: 0.75em !important; }*/ 189 | 190 | 191 | /* Site width etc.*/ 192 | .md-grid { 193 | max-width: 64rem !important; 194 | } 195 | /* 196 | .framed-python{ 197 | margin-top:-70px; 198 | overflow:hidden; 199 | } 200 | .framed-r{ 201 | margin-top:0px; 202 | overflow:hidden; 203 | } 204 | .framed-r-api{ 205 | margin-top:-50px; 206 | overflow:hidden; 207 | } 208 | .framed-github{ 209 | height:100vh !important; 210 | width:100% !important; 211 | } 212 | */ 213 | 214 | 215 | /*Toc right margins*/ 216 | /* 217 | @media only screen and (min-width: 76.25em){ 218 | .framed-python{ 219 | margin-left:-45px; 220 | } 221 | .framed-r-api{ 222 | margin-left:-45px; 223 | } 224 | .md-sidebar--secondary { 225 | margin-left: 100% !important; 226 | } 227 | } 228 | */ 229 | 230 | 231 | /* mkdocstrings styling */ 232 | /* Indentation of function doc */ 233 | div.doc-contents:not(.first) { 234 | padding-left: 25px; 235 | border-left: 4px solid rgb(230, 230, 230); 236 | margin-bottom: 80px; 237 | } 238 | /* Don't capitalize names. */ 239 | h5.doc-heading { 240 | text-transform: none !important; 241 | } 242 | /* Don't use vertical space on hidden ToC entries. */ 243 | h6.hidden-toc { 244 | margin: 0 !important; 245 | position: relative; 246 | top: -70px; 247 | } 248 | h6.hidden-toc::before { 249 | margin-top: 0 !important; 250 | padding-top: 0 !important; 251 | } 252 | /* Don't show permalink of hidden ToC entries. */ 253 | h6.hidden-toc a.headerlink { 254 | display: none; 255 | } 256 | /* Avoid breaking parameters name, etc. in table cells. */ 257 | td code { 258 | word-break: normal !important; 259 | } 260 | /* For pieces of Markdown rendered in table cells. 
*/ 261 | td p { 262 | margin-top: 0; 263 | margin-bottom: 0; 264 | } 265 | 266 | -------------------------------------------------------------------------------- /docs/stylesheets/extra.js: -------------------------------------------------------------------------------- 1 | 2 | /** 3 | 4 | // Table of contents always expanded 5 | document.addEventListener("DOMContentLoaded", function() { 6 | load_navpane(); 7 | }); 8 | 9 | function load_navpane() { 10 | var width = window.innerWidth; 11 | if (width <= 1200) { 12 | return; 13 | } 14 | 15 | var nav = document.getElementsByClassName("md-nav"); 16 | for(var i = 0; i < nav.length; i++) { 17 | if (typeof nav.item(i).style === "undefined") { 18 | continue; 19 | } 20 | 21 | if (nav.item(i).getAttribute("data-md-level") && nav.item(i).getAttribute("data-md-component")) { 22 | nav.item(i).style.display = 'block'; 23 | nav.item(i).style.overflow = 'visible'; 24 | } 25 | } 26 | 27 | var nav = document.getElementsByClassName("md-nav__toggle"); 28 | for(var i = 0; i < nav.length; i++) { 29 | nav.item(i).checked = true; 30 | } 31 | } 32 | **/ 33 | 34 | 35 | // Open links externally. 36 | var links = document.links; 37 | 38 | for (var i = 0, linksLength = links.length; i < linksLength; i++) { 39 | if (links[i].hostname != window.location.hostname) { 40 | links[i].target = '_blank'; 41 | } 42 | } -------------------------------------------------------------------------------- /docs/tutorial/deployment.md: -------------------------------------------------------------------------------- 1 | # Deployment 2 | 3 | traintool can easily deploy your model through a REST API. This allows you to access the model from a website or application without shipping it with your code. 4 | 5 | Deployment uses [FastAPI](https://fastapi.tiangolo.com/) under the hood, which makes the API fully compatible with [OpenAPI/Swagger](https://github.com/OAI/OpenAPI-Specification) and [JSON Schema](http://json-schema.org/). 6 | 7 | 8 | ## Deploying a model 9 | 10 | To deploy a model after training or loading, simply run: 11 | 12 | ```python 13 | model.deploy() 14 | ``` 15 | 16 | Note that the call to `deploy` is blocking, i.e. it should be run in a separate script. Also, it might not work well with Jupyter notebooks. 17 | 18 | !!! tip 19 | By default, the API will run on 127.0.0.1 at port 8000, but you can modify this, e.g. `model.deploy(host="0.0.0.0", port=8001)`. 20 | 21 | 22 | ## Accessing the API 23 | 24 | To access the API, navigate your browser to http://127.0.0.1:8000/. If everything worked out, you should see some basic information about the deployed model like below: 25 | 26 |  27 | 28 | To find out more about the API, check out the API docs at http://127.0.0.1:8000/docs. They contain information about all endpoints and required data types. 29 | 30 | 31 | ## Making predictions 32 | 33 | If you want to make a prediction with the API, you need to make a POST request to the `/predict` endpoint (http://127.0.0.1:8000/predict). The request body should look like this: 34 | 35 | ```json 36 | { 37 | "image": [[[0, 0.5, 0, 1], [0, 1, 0, 0.5]]] 38 | } 39 | ``` 40 | 41 | 42 | `"image"` is a list of lists with shape `color channels x height x width` (here: a grayscale image with 1 channel, height 2, and width 4). You can easily get this list format from a numpy array with [numpy.ndarray.tolist](https://numpy.org/doc/stable/reference/generated/numpy.ndarray.tolist.html). Note that you cannot pass raw numpy arrays into the request because they are not JSON serializable. 
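For example, you can send such a request from Python with the [requests](https://requests.readthedocs.io/) library. This is a minimal sketch; it assumes the API runs at the default address and that the model was trained on grayscale 28 x 28 images (adjust the array shape to your data):

```python
import numpy as np
import requests

# Hypothetical example image: 1 color channel, 28 x 28 pixels
image = np.random.rand(1, 28, 28)

# tolist() turns the numpy array into nested lists, which are JSON serializable
response = requests.post(
    "http://127.0.0.1:8000/predict",
    json={"image": image.tolist()},
)
response.raise_for_status()
print(response.json()["predicted_class"])
```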
43 | 44 | As in training, images can be RGB (3 color channels) or grayscale (1 color channel). They will be automatically preprocessed in the same way as the train data. If you used numpy images for training, make sure the image here has the same size and pixel range. If you used files, everything should be converted to the correct format automatically. 45 | 46 | !!! tip 47 | You can easily try out the `/predict` endpoint if you go to the API docs (http://127.0.0.1:8000/docs), click on `/predict` and then on the "Try it out" button on the right. 48 | 49 | The endpoint will return a JSON object which is very similar to the dictionary returned by `model.predict(...)`. Numpy arrays are again converted to lists of lists (convert back with [numpy.asarray](https://numpy.org/doc/stable/reference/generated/numpy.asarray.html)). The JSON should look like this: 50 | 51 | ```json 52 | { 53 | "predicted_class": 2, 54 | "probabilities": [ 55 | 0.1, 56 | 0.8, 57 | 0.1 58 | ], 59 | "runtime": "0:00:00.088831" 60 | } 61 | ``` 62 | 63 | 64 | 65 | 66 | -------------------------------------------------------------------------------- /docs/tutorial/experiment-tracking.md: -------------------------------------------------------------------------------- 1 | # Experiment tracking 2 | 3 | traintool tracks common metrics automatically (e.g. accuracy on train and test set) 4 | and has different options to store and visualize them. 5 | 6 | 7 | ## Tensorboard 8 | 9 | [Tensorboard](https://www.tensorflow.org/tensorboard) is a popular visualization toolkit from Google's tensorflow framework. By default, traintool automatically stores logs for tensorboard along with the model, so that you can visualize the metrics of your experiments. 10 | 11 | To start tensorboard, run this in your terminal (from the project directory): 12 | 13 | ```bash 14 | tensorboard --logdir traintool-experiments 15 | ``` 16 | 17 | Navigate your browser to [http://localhost:6006/](http://localhost:6006/) and you should see the tensorboard window. 18 | 19 | 20 | 21 | On the bottom left, you can select all the different runs (same names as the directories in `traintool-experiments`); on the right side, you can view the metrics. 22 | 23 | 24 | 25 | ## Comet.ml 26 | 27 | You can store these metrics in [comet.ml](https://www.comet.ml/), a popular platform 28 | for experiment tracking. They offer free accounts (you can sign up with your Github 29 | account), and free premium for students & academia. 30 | 31 | Once you have your account, log in to comet.ml, click on your profile in the upper 32 | right corner, go to Settings, and click "Generate API Key". Pass this API key along to the 33 | `train` function like this: 34 | 35 | ```python 36 | traintool.train("resnet18", train_data=train_data, test_data=test_data, 37 | comet_config={"api_key": YOUR_API_KEY, "project_name": OPTIONAL_PROJECT_NAME}) 38 | ``` 39 | 40 | Now you can head on over to [comet.ml](https://www.comet.ml/) and follow the metrics in 41 | real time! 42 | -------------------------------------------------------------------------------- /docs/tutorial/intro.md: -------------------------------------------------------------------------------- 1 | # Intro 2 | 3 | This tutorial shows you everything that **traintool** can do. 4 | 5 | We will train a few different models on MNIST, use automated experiment tracking, deploy 6 | the models via REST APIs, and get access to the underlying, raw models. 
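As a quick preview, the whole workflow looks roughly like this sketch (each step is explained in its own section; `train_data`, `test_data`, and `test_image` are placeholders for your data):

```python
import traintool

# Train an off-the-shelf model, here a support vector classifier
model = traintool.train("svc", train_data=train_data, test_data=test_data)

# Make a prediction, deploy a REST API (blocking call), or access the raw model
result = model.predict(test_image)
model.deploy()
raw_objects = model.raw()
```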
7 | 8 | 9 | ## Installation 10 | 11 | If you haven't installed traintool yet, now is a good time: 12 | 13 | ```bash 14 | pip install git+https://github.com/jrieke/traintool 15 | ``` 16 | 17 | 18 | ## Dataset 19 | 20 | We will use the MNIST dataset throughout this tutorial. Just in case you never heard of 21 | it: MNIST is a popular dataset for image classification. It contains images of 22 | handwritten digits and the task is to predict which digit is shown on a given image. 23 | Below are some examples. 24 | 25 |  26 | -------------------------------------------------------------------------------- /docs/tutorial/quickstart.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "name": "quickstart.ipynb", 7 | "provenance": [], 8 | "collapsed_sections": [] 9 | }, 10 | "kernelspec": { 11 | "name": "python3", 12 | "display_name": "Python 3" 13 | } 14 | }, 15 | "cells": [ 16 | { 17 | "cell_type": "markdown", 18 | "metadata": { 19 | "id": "ak4L7hONDZdx" 20 | }, 21 | "source": [ 22 | "# Quickstart\n", 23 | "\n", 24 | "Welcome to **traintool**!\n", 25 | "\n", 26 | "In this quickstart, we will train a few models on MNIST. This should give you a rough overview of what traintool can do. \n", 27 | "\n", 28 | "You can follow along interactively in **Google Colab** (a free Jupyter notebook service):\n", 29 | "\n", 30 | "[](https://colab.research.google.com/github/jrieke/traintool/blob/master/docs/tutorial/quickstart.ipynb)\n", 31 | "\n", 32 | "*We highly recommend to use Colab for this tutorial because it gives you free GPU access, which makes training much faster. Important: To enable GPU support, click on \"Runtime\" -> \"Change runtime type\", select \"GPU\" and hit \"Save\".*\n", 33 | "\n", 34 | "---\n" 35 | ] 36 | }, 37 | { 38 | "cell_type": "markdown", 39 | "metadata": { 40 | "id": "ZHmp7C-GEpLH" 41 | }, 42 | "source": [ 43 | "First, let's install traintool:" 44 | ] 45 | }, 46 | { 47 | "cell_type": "code", 48 | "metadata": { 49 | "id": "sBitaippDXMG" 50 | }, 51 | "source": [ 52 | "!pip install -U git+https://github.com/jrieke/traintool" 53 | ], 54 | "execution_count": null, 55 | "outputs": [] 56 | }, 57 | { 58 | "cell_type": "markdown", 59 | "metadata": { 60 | "id": "IJunE3-NEuCW" 61 | }, 62 | "source": [ 63 | "Next, we import traintool and load the mnist dataset (installed with traintool):" 64 | ] 65 | }, 66 | { 67 | "cell_type": "code", 68 | "metadata": { 69 | "id": "1-dX_WnO1j08" 70 | }, 71 | "source": [ 72 | "import traintool\n", 73 | "import mnist" 74 | ], 75 | "execution_count": null, 76 | "outputs": [] 77 | }, 78 | { 79 | "cell_type": "code", 80 | "metadata": { 81 | "id": "IagipCnO1wfi" 82 | }, 83 | "source": [ 84 | "train_images = mnist.train_images()[:, None] # add color dimension\n", 85 | "train_labels = mnist.train_labels()\n", 86 | "test_images = mnist.test_images()[:, None]\n", 87 | "test_labels = mnist.test_labels()\n", 88 | "\n", 89 | "print(\"Images shape:\", train_images.shape)\n", 90 | "print(\"Labels shape:\", train_labels.shape)" 91 | ], 92 | "execution_count": null, 93 | "outputs": [] 94 | }, 95 | { 96 | "cell_type": "markdown", 97 | "metadata": { 98 | "id": "NWfMdByHE5qM" 99 | }, 100 | "source": [ 101 | "As you can see, all data from the `mnist` package comes as numpy arrays. Images have the shape `num samples x color channels x height x width`. Note that traintool can handle numpy arrays like here as well as image files on your machine (see here)." 
102 | ] 103 | }, 104 | { 105 | "cell_type": "markdown", 106 | "metadata": { 107 | "id": "BTyAJVPGMOgs" 108 | }, 109 | "source": [ 110 | "## Your first model" 111 | ] 112 | }, 113 | { 114 | "cell_type": "markdown", 115 | "metadata": { 116 | "id": "x6mlF9hTGaEr" 117 | }, 118 | "source": [ 119 | "Let's train our first model! We will use a very simple model, a support vector classifier (called `svc` in traintool). Training it requires only one line of code:\n", 120 | "\n", 121 | "*Note: We use the config parameter `num_samples` here to train only on a subset of the data to make it faster.*" 122 | ] 123 | }, 124 | { 125 | "cell_type": "code", 126 | "metadata": { 127 | "id": "1OZvJ2kT2CVO" 128 | }, 129 | "source": [ 130 | "svc = traintool.train(\"svc\", \n", 131 | " train_data=[train_images, train_labels], \n", 132 | " test_data=[test_images, test_labels], \n", 133 | " config={\"num_samples\": 500})" 134 | ], 135 | "execution_count": null, 136 | "outputs": [] 137 | }, 138 | { 139 | "cell_type": "markdown", 140 | "metadata": { 141 | "id": "rBm1LQJnGnHl" 142 | }, 143 | "source": [ 144 | "That looks very simple – but under the hood, a lot of stuff happened:\n", 145 | "\n", 146 | "1) traintool printed some **general information** about the experiment: Its ID, which model and configuration was used, where the model is saved and how you can load it later. \n", 147 | "\n", 148 | "2) Then, it **preprocessed** the data. It automatically converted all data to the correct format and applied some light preprocessing that makes sense with this model. \n", 149 | "\n", 150 | "3) It created and **trained** the model. Under the hood, traintool uses different frameworks for this step (e.g. scikit-learn or pytorch) but as a user, you don't have to worry about any of this. After training, traintool printed the resulting accuracies (should be 80-85 % here).\n", 151 | "\n", 152 | "4) traintool automatically **saved** the model, console output and tensorboard logs into a time-stamped folder (see below)." 153 | ] 154 | }, 155 | { 156 | "source": [], 157 | "cell_type": "markdown", 158 | "metadata": {} 159 | }, 160 | { 161 | "source": [ 162 | "## Making predictions" 163 | ], 164 | "cell_type": "markdown", 165 | "metadata": {} 166 | }, 167 | { 168 | "cell_type": "markdown", 169 | "metadata": { 170 | "id": "Mt2auldciv1f" 171 | }, 172 | "source": [ 173 | "To make a prediction with this model, simply use its `predict` function:" 174 | ] 175 | }, 176 | { 177 | "cell_type": "code", 178 | "metadata": { 179 | "id": "dQ6woUskinsi" 180 | }, 181 | "source": [ 182 | "svc.predict(test_images[0])" 183 | ], 184 | "execution_count": null, 185 | "outputs": [] 186 | }, 187 | { 188 | "cell_type": "markdown", 189 | "metadata": { 190 | "id": "XVhM_hkLjAUF" 191 | }, 192 | "source": [ 193 | "This gives you a dictionary with the predicted class and probabilities for each class. Note that for now, `predict` can only process a single image at a time. As the `train` method, it works with numpy arrays and image files (see here)." 194 | ] 195 | }, 196 | { 197 | "cell_type": "markdown", 198 | "metadata": { 199 | "id": "zNhKQxCdMQ9G" 200 | }, 201 | "source": [ 202 | "## Using other models" 203 | ] 204 | }, 205 | { 206 | "cell_type": "markdown", 207 | "metadata": { 208 | "id": "BPamL3DbJ72B" 209 | }, 210 | "source": [ 211 | "\n", 212 | "Ok, now what if you want to train a different model? 
196 | { 197 | "cell_type": "markdown", 198 | "metadata": { 199 | "id": "zNhKQxCdMQ9G" 200 | }, 201 | "source": [ 202 | "## Using other models" 203 | ] 204 | }, 205 | { 206 | "cell_type": "markdown", 207 | "metadata": { 208 | "id": "BPamL3DbJ72B" 209 | }, 210 | "source": [ 211 | "\n", 212 | "Ok, now what if you want to train a different model? traintool makes this very easy: You only have to call the `train` function with a different model name – no need to rewrite the implementation or change the data just because you use a model from a different framework!\n", 213 | "\n", 214 | "Let's train a residual network (`resnet18`), a deep neural network from pytorch (make sure to use a GPU!):" 215 | ] 216 | }, 217 | { 218 | "cell_type": "code", 219 | "metadata": { 220 | "id": "lskB7rhw2E37" 221 | }, 222 | "source": [ 223 | "resnet = traintool.train(\"resnet18\", \n", 224 | " train_data=[train_images, train_labels],\n", 225 | " test_data=[test_images, test_labels],\n", 226 | " config={\"batch_size\": 128, \"print_every\": 10, \"num_epochs\": 2, \"num_samples\": 10000})" 227 | ], 228 | "execution_count": null, 229 | "outputs": [] 230 | }, 231 | { 232 | "cell_type": "markdown", 233 | "metadata": { 234 | "id": "rYUNQIAEUSu3" 235 | }, 236 | "source": [ 237 | "And with this same simple command, you can train any model supported by traintool! See [here](https://traintool.jrieke.com/models/image-classification/) for a list of models. \n", 238 | "\n", 239 | "As you may have noticed, we set some parameters with the `config` argument above. `config` is the central place to define hyperparameters for training. The supported hyperparameters vary from model to model – it's best to have a look at the overview page linked above. \n", 240 | "\n" 241 | ] 242 | }, 243 | { 244 | "cell_type": "markdown", 245 | "metadata": { 246 | "id": "j8Mdq6AXcomF" 247 | }, 248 | "source": [ 249 | "## Experiment tracking" 250 | ] 251 | }, 252 | { 253 | "cell_type": "markdown", 254 | "metadata": { 255 | "id": "BlkMmxlZctbs" 256 | }, 257 | "source": [ 258 | "traintool automatically keeps track of all experiments you run. Each experiment is stored in a time-stamped folder in `./traintool-experiments`. Have a look at this folder now to see the experiments you ran above! (If you are on Colab, click on the folder icon on the top left.)\n", 259 | "\n", 260 | "*Tip: You can disable saving with `save=False`.*" 261 | ] 262 | }, 263 | { 264 | "cell_type": "markdown", 265 | "metadata": { 266 | "id": "cyngzaQteHQ0" 267 | }, 268 | "source": [ 269 | "Each experiment folder contains:\n", 270 | "\n", 271 | "- `info.yml`: General information about the experiment\n", 272 | "- `stdout.log`: The entire console output\n", 273 | "- model files and possibly checkpoints (e.g. the pytorch binary `model.pt` for resnet18)\n", 274 | "- tensorboard logs (see below)" 275 | ] 276 | },
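{
"cell_type": "markdown",
"metadata": {},
"source": [
"You can also list the experiment folders straight from the notebook. This is a plain shell command and assumes you ran the training cells above, so the folder exists:"
]
},
{
"cell_type": "code",
"metadata": {},
"source": [
"!ls traintool-experiments"
],
"execution_count": null,
"outputs": []
},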
277 | { 278 | "source": [ 279 | "## Visualizations" 280 | ], 281 | "cell_type": "markdown", 282 | "metadata": {} 283 | }, 284 | { 285 | "cell_type": "markdown", 286 | "metadata": { 287 | "id": "tl41Bq9teL-Y" 288 | }, 289 | "source": [ 290 | "traintool writes all metrics and evaluations to [tensorboard](https://www.tensorflow.org/tensorboard), a powerful visualization platform from tensorflow. Let's start tensorboard now: If you are on a local machine, open a terminal in this directory and type `tensorboard --logdir traintool-experiments`. If you are on Colab, just run the cell below:" 291 | ] 292 | }, 293 | { 294 | "cell_type": "code", 295 | "metadata": { 296 | "id": "Wk2eD-9mCeRn" 297 | }, 298 | "source": [ 299 | "%load_ext tensorboard\n", 300 | "%tensorboard --logdir traintool-experiments/" 301 | ], 302 | "execution_count": null, 303 | "outputs": [] 304 | }, 305 | { 306 | "cell_type": "markdown", 307 | "metadata": { 308 | "id": "Ldx4CtPHe5jC" 309 | }, 310 | "source": [ 311 | "Let's see what's going on here: On the bottom left, you can select individual experiments. On the right, you should by default see scalar metrics: the loss and accuracy for train and test set. You can also click on `Images` at the top to see some sample images from both datasets along with classification results (use the sliders to look at different epochs!).\n", 312 | "\n", 313 | "*Tip: You can also store metrics in comet.ml, see here.*" 314 | ] 315 | }, 316 | { 317 | "cell_type": "markdown", 318 | "metadata": { 319 | "id": "1bzWx_7Lh3Zn" 320 | }, 321 | "source": [ 322 | "## Other functions" 323 | ] 324 | }, 325 | { 326 | "cell_type": "markdown", 327 | "metadata": { 328 | "id": "Z66dv-Rnh6-D" 329 | }, 330 | "source": [ 331 | "Before we end this quickstart, let's look at three other important functions:\n", 332 | "\n", 333 | "- **Loading:** To load a saved model, just pass its ID (or directory path) to `traintool.load(...)`. Check out the line starting with `Load via:` in the console output above – it shows you directly which command to call.\n", 334 | "- **Deployment:** traintool can easily deploy your trained model through a REST API. Simply call `model.deploy()` to start the server (note that this call is blocking!). More information here.\n", 335 | "- **Raw models:** traintool models are implemented in different frameworks, e.g. scikit-learn or pytorch. You can get access to the raw models by calling `model.raw()`. " 336 | ] 337 | }, 338 | { 339 | "cell_type": "markdown", 340 | "metadata": { 341 | "id": "abU5z1zVkWRS" 342 | }, 343 | "source": [ 344 | "\n", 345 | "---" 346 | ] 347 | }, 348 | { 349 | "cell_type": "markdown", 350 | "metadata": { 351 | "id": "D8FUSxzjj6pu" 352 | }, 353 | "source": [ 354 | "That's it! You should now be able to start using traintool. Make sure to read the complete tutorial and documentation to learn more! \n", 355 | "\n", 356 | "Please also consider leaving a ⭐ on our [GitHub](https://github.com/jrieke/traintool)." 357 | ] 358 | } 359 | ] 360 | } -------------------------------------------------------------------------------- /docs/tutorial/raw-models.md: -------------------------------------------------------------------------------- 1 | # Accessing raw models 2 | 3 | traintool is built on top of powerful machine learning libraries like scikit-learn or 4 | pytorch. After training, it gives you full access to the raw models with: 5 | 6 | ```python 7 | model.raw() 8 | ``` 9 | 10 | This returns a dict of all underlying model objects. It usually contains the model 11 | itself (`model.raw()["model"]`) but might also contain some other 12 | objects, e.g. data scalers (`model.raw()["scaler"]`). 13 |
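For example, for a model that is implemented in scikit-learn (such as `svc`), you could
grab the fitted estimator out of this dict and inspect it directly. This is only a
sketch; the exact object type depends on which model you trained:

```python
raw = model.raw()  # dict of underlying objects
sklearn_model = raw["model"]  # e.g. the fitted scikit-learn estimator for "svc"
print(type(sklearn_model))
```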
-------------------------------------------------------------------------------- /docs/tutorial/training.md: -------------------------------------------------------------------------------- 1 | # Training and Prediction 2 | 3 | ## Your first model 4 | 5 | As a first example, we'll train a very simple model: A 6 | [Support Vector Machine](https://en.wikipedia.org/wiki/Support_vector_machine) or SVM. 7 | We will use the image classification dataset MNIST throughout this tutorial, so let's 8 | load it now (the `mnist` package was installed along with traintool): 9 | 10 | ```python 11 | import mnist 12 | train_data = [mnist.train_images(), mnist.train_labels()] 13 | test_data = [mnist.test_images(), mnist.test_labels()] 14 | ``` 15 | 16 | !!! tip 17 | The code above loads the data as numpy arrays, but traintool can also deal with 18 | files and pytorch datasets (see here). More data formats will be added soon. 19 | 20 | Training the SVM classifier is now very simple: 21 | 22 | ```python 23 | import traintool 24 | svc = traintool.train("svc", train_data=train_data, test_data=test_data) 25 | ``` 26 | 27 | That's it! traintool will take care of reading and converting the data, applying some 28 | light preprocessing, training and saving the model, and tracking all metrics. It will 29 | also print out the final loss and accuracy (the test accuracy should be around XX % 30 | here). 31 | 32 | 33 | ## Making predictions 34 | 35 | Of course, you can make predictions with the trained model. Let's run it on an image from 36 | the test set: 37 | 38 | ```python 39 | pred = svc.predict(test_data[0][0]) 40 | print("Predicted:", pred["predicted_class"], " - Is:", test_data[1][0]) 41 | ``` 42 | 43 | This should print out the predicted class and the ground truth. Note that `pred` is a 44 | dictionary with the predicted class (`pred["predicted_class"]`) and the probabilities 45 | for each class (`pred["probabilities"]`). 46 | 47 | !!! tip 48 | Again, we use a numpy array for the test image here, but traintool can also handle 49 | pytorch tensors and files. You can even pass in a whole batch of images 50 | (e.g. `test_data[0][0:2]`). 51 | 52 | 53 | ## Using other models 54 | 55 | Now, let's try a more advanced model. We will train a [Residual Network](https://arxiv.org/abs/1512.03385) 56 | (ResNet), a modern deep neural network. Usually, switching to this model from an SVM 57 | would require you to use an advanced framework like pytorch or tensorflow and rewrite 58 | most of your codebase. With traintool, it's as simple as replacing the model name in the `train` method: 59 | 60 | ```python 61 | resnet = traintool.train("resnet", train_data=train_data, test_data=test_data) 62 | ``` 63 | 64 | And this syntax stays the same for every other model that traintool supports! This makes 65 | it really easy to compare a bunch of different models on your dataset and see what 66 | performs best. 67 | 68 | 69 | ## Custom hyperparameters 70 | 71 | In machine learning, most models have some hyperparameters that control the training 72 | process (e.g. the learning rate). traintool uses sensible defaults specific to each 73 | model, but gives you the flexibility to fully customize everything. 74 | 75 | First, let's find out which hyperparameters the model supports and what their defaults 76 | are: 77 | 78 | ```python 79 | print(traintool.default_hyperparameters("resnet")) 80 | ``` 81 | 82 | This should print out a dictionary of hyperparameters and their defaults. Now, we want to 83 | change the learning rate and use a different optimizer. To do this, simply pass a 84 | `config` dict to the train method: 85 | 86 | ```python 87 | config = {"lr": 0.1, "optimizer": "adam"} 88 | better_resnet = traintool.train("resnet", config=config, train_data=train_data, test_data=test_data) 89 | ``` 90 | 91 |
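If you only want to tweak a few values, one handy pattern is to copy the defaults and
override selected keys. This is a sketch and assumes that the defaults are returned as a
plain dict containing the `lr` and `optimizer` keys used above:

```python
defaults = traintool.default_hyperparameters("resnet")
config = dict(defaults, lr=0.1, optimizer="adam")  # override only what you need
custom_resnet = traintool.train("resnet", config=config, train_data=train_data, test_data=test_data)
```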
92 | ## Saving and loading models 93 | 94 | There are two options to save a model to disk. Either use the `save` method after 95 | training like this: 96 | 97 | ```python 98 | model = traintool.train("...") 99 | model.save("path/to/dir") 100 | ``` 101 | 102 | Or you can specify an output directory directly during training. This makes sense for 103 | long-running processes, so you don't lose all progress if your machine is 104 | interrupted: 105 | 106 | ```python 107 | model = traintool.train("...", save="path/to/dir") 108 | ``` 109 | 110 | In both cases, loading a model works via: 111 | 112 | ```python 113 | model = traintool.load("path/to/dir") 114 | ``` 115 | 116 | 117 |
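To make the round trip concrete, here is a short sketch that saves the SVM from above,
loads it back, and runs a prediction. The directory name is just an example:

```python
svc.save("my-models/svc-mnist")  # save the trained model
restored = traintool.load("my-models/svc-mnist")  # load it back
print(restored.predict(test_data[0][0])["predicted_class"])
```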