├── .gitignore
├── .travis.yml
├── LICENSE.md
├── Makefile
├── Pioneer.ipynb
├── README.md
├── cython
    └── dali
    │   ├── .gitignore
    │   ├── core.pyx.pre
    │   └── core
    │       ├── .gitignore
    │       ├── data_processing
    │           └── Batch.pyx
    │       ├── layers
    │           ├── GRU.pyx.pre
    │           ├── LSTM.pyx.pre
    │           └── Layers.pyx.pre
    │       ├── math
    │           ├── TensorInternal.pyx
    │           ├── memory_bank
    │           │   ├── MemoryBankWrapper.cpp
    │           │   └── MemoryBankWrapper.h
    │           ├── memory_status.cpp
    │           └── memory_status.h
    │       ├── tensor
    │           ├── Mat.pyx.pre
    │           ├── MatOps.pyx.pre
    │           ├── Solver.pyx.pre
    │           ├── Tape.pyx
    │           ├── matrix_initializations.cpp
    │           ├── matrix_initializations.h
    │           ├── python_tape.cpp
    │           ├── python_tape.h
    │           └── random.pyx.pre
    │       └── utils
    │           ├── config.pyx
    │           ├── core_utils.pyx
    │           ├── cpp_utils.cpp
    │           └── cpp_utils.h
├── dali
    ├── __init__.py
    ├── activation.py
    ├── beam_search.py
    ├── data
    │   ├── __init__.py
    │   ├── batch.py
    │   ├── process.py
    │   ├── translation.py
    │   └── utils.py
    ├── models
    │   ├── __init__.py
    │   └── mlp.py
    └── utils
    │   ├── __init__.py
    │   ├── capture.py
    │   ├── misc.py
    │   ├── scoring.py
    │   ├── solver.py
    │   ├── throttled.py
    │   └── vocab.py
├── examples
    ├── mlbasics_learn_to_add.py
    ├── mlbasics_rnn_binary_addition.py
    └── translation
    │   ├── predict.py
    │   ├── train.py
    │   └── translation.py
├── libcpp11
    ├── __init__.pxd
    ├── memory.pxd
    ├── stringstream.pxd
    ├── unordered_map.pxd
    └── vector.pxd
├── modern_numpy
    └── __init__.pxd
├── notebooks
    ├── LSTM.ipynb
    ├── Machine Translation.ipynb
    ├── NTM.ipynb
    └── language_model.ipynb
├── preprocessor_utils.py
├── requirements.txt
├── setup.py
└── tests
    ├── __init__.py
    ├── test.txt
    ├── tests_beam_search.py
    ├── tests_data.py
    └── tests_vocab.py


/.gitignore:
--------------------------------------------------------------------------------
 1 | # Compiled source #
 2 | ###################
 3 | *.com
 4 | *.class
 5 | *.dll
 6 | *.exe
 7 | *.o
 8 | *.so
 9 | *.dali
10 | MANIFEST
11 | 
12 | # Compiled protobufs #
13 | *.pb.cc
14 | *.pb.h
15 | *_pb2.py
16 | 
17 | # Outputs of Cython
18 | cython/dali/core.cpp
19 | cython/dali/layers/Layer.pyx
20 | cython/dali/layers/LSTM.pyx
21 | cython/dali/tensor/Mat.pyx
22 | cython/dali/tensor/Solver.pyx
23 | cython/dali/tensor/random.pyx
24 | 
25 | # Packages #
26 | ############
27 | # it's better to unpack these files and commit the raw source
28 | # git has its own built in compression methods
29 | *.7z
30 | *.dmg
31 | *.gz
32 | *.iso
33 | *.jar
34 | *.rar
35 | *.tar
36 | *.zip
37 | *.gem
38 | *.pem
39 | 
40 | # Special redis file (???)
41 | *.rdb
42 | 
43 | .ipynb_checkpoints/
44 | 
45 | # Saves #
46 | #########
47 | *.npy
48 | *.mat
49 | *.vocab
50 | *.svocab
51 | text8
52 | __pycache__/*
53 | *.pyc
54 | *.egg-info
55 | 
56 | # NPM modules
57 | node_modules
58 | 
59 | # Logs and databases #
60 | ######################
61 | *.log
62 | *.sql
63 | *.sqlite
64 | 
65 | # OS generated files #
66 | ######################
67 | .DS_Store
68 | .DS_Store?
69 | ._*
70 | .Spotlight-V100
71 | .Trashes
72 | ehthumbs.db
73 | Thumbs.db
74 | .DS_Store
75 | build/
76 | 
77 | # file manifest is auto-generated by setup.py
78 | MANIFEST.in
79 | MANIFEST
80 | 


--------------------------------------------------------------------------------
/.travis.yml:
--------------------------------------------------------------------------------
 1 | language: python
 2 | dist: trusty
 3 | sudo: required
 4 | python:
 5 | - '3.3'
 6 | - '3.4'
 7 | - '3.5'
 8 | os:
 9 | - linux
10 | before_install:
11 |     - sudo add-apt-repository ppa:ubuntu-toolchain-r/test -y
12 |     - sudo apt-get update
13 |     - sudo apt-get install -y git
14 |     - sudo apt-get install -y cmake
15 |     - sudo apt-get install -y gcc
16 |     - sudo apt-get install -y zlib1g-dev
17 |     - sudo apt-get install -y libgflags2 libgflags-dev
18 |     - sudo apt-get install -y build-essential
19 |     - sudo apt-get install -y libblas-dev
20 |     - sudo apt-get install -y gcc-4.9 g++-4.9 cpp-4.9
21 |     - sudo apt-get install -y libgtest-dev
22 |     - export URL='https://github.com/JonathanRaiman/Dali/releases/download/v1.0.0/dali-1.0.0-Linux-x86_64-cpu.deb'
23 |     - export FILE=`mktemp`
24 |     - wget "$URL" -qO $FILE
25 |     - sudo dpkg -i $FILE
26 |     - rm $FILE
27 | install:
28 |     - pip3 install -r requirements.txt
29 |     - python3 setup.py install
30 |     - pip3 install nose2
31 |     - cp $(find . -name "core*.so") dali/
32 | script: nose2
33 | notifications:
34 |     email:
35 |         recipients:
36 |         - szymon.sidor@gmail.com
37 |         - jonathanraiman@gmail.com
38 |         on_success: change
39 |         on_failure: always
40 |     slack:
41 |         secure: UEkhyrjDPiwRYwLJ9yRNfH8iq57YdUKrQ2kY/trSaZTRv5cPGiUfoLYo1Vj65d8aGwyPeyWd/1/z4KOJ1+qWCIcqTLDrdrjig64v3qVfJt/054eEEUSGjMQgR9ureQ2DjR3fzbyJJLxt7IZJl8ytZtXLp13LpWBPJJOhKHcK1OLG70jUqPRj/cQ2RSFVLfcpvls+uJ8NHSJpM1434ML8DI/0Ucifp8j3NMi71odrTMcRl5AAouFgG5U5A9FvIKIIGAomArwaEKIIr+O/i10Gy6vKZxb82Hq+VQx6yow6mNEkvV40w9QZUmmTgXgsEgILcdMMeOw5iifPBg7wD1dEIBTN3PO+l+JXSv+CTx3sQdSWZb66ZSybWc6m8z5LnEGa1+ygagWBPs5CgzAXkmLQSkIdgocPCAMBSPxuxj2Hi+7s7SF8INut/aeP5/mCVxKRfcJo4Za56QTExXYqQPTQobdAKgoNOcwzK7nh2K2JDfh0qA8kaE59AZaQKnyZBLnFrQ4wSXHzcZ3kjF+nlQx/oFwQetFgu5ocNZQ5OFzToV+iLKBz+seoU0L1/e4Eweds+EjYtBHfqVB1hHmk4piFHgzQ8mC9WuL3Z9LZVRp4vykUb8yZrxbGB5Xc5WQfiAzXzsDYWDia4ZLKqcnPYq5fFw86gSf0gWCVZidVK33Yj3g=
42 | 


--------------------------------------------------------------------------------
/LICENSE.md:
--------------------------------------------------------------------------------
 1 | The MIT License (MIT)
 2 | 
 3 | Copyright (c) 2015 Jonathan Raiman, Szymon Sidor
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/Makefile:
--------------------------------------------------------------------------------
 1 | default:
 2 | 	python3 setup.py clean
 3 | 	python3 setup.py build_ext --inplace
 4 | 
 5 | cuda:
 6 | 	python3 setup.py clean cuda
 7 | 	python3 setup.py build_ext --inplace cuda
 8 | 
 9 | test:
10 | 	nose2
11 | 
12 | clean:
13 | 	python3 setup.py clean
14 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # Dali in Python
 2 | 
 3 | [![PyPI version](https://badge.fury.io/py/dali.svg)](https://badge.fury.io/py/dali)
 4 | [![Build Status](https://travis-ci.org/dali-ml/dali-cython.svg?branch=master)](https://travis-ci.org/dali-ml/dali-cython)
 5 | [![License](https://img.shields.io/badge/license-MIT-blue.svg)](LICENSE.md)
 6 | 
 7 | This repository contains an early version of Python bindings to [Dali](https://github.com/dali-ml/Dali), the automatic differentiation framework.
 8 | 
 9 | With this module you can construct arbitrary mathematical models, including differentiating through control code and loops, optimize and run them using your GPU or CPU.
10 | 
11 | The bindings are light-weight, and the resulting module retains about 90%-95% of the C++ performance in most use-cases (with this performance going up for larger models and GPU intensive computations).
12 | 
13 | [![Jonathan Raiman, author](https://img.shields.io/badge/Author-Jonathan%20Raiman%20-blue.svg)](https://github.com/JonathanRaiman/) [![Szymon Sidor, author](https://img.shields.io/badge/Author-Szymon%20Sidor%20-blue.svg)](https://github.com/nivwusquorum)
14 | 
15 | ### Installation
16 | 
17 | 1. Install [Dali](https://github.com/dali-ml/Dali#installation) using `homebrew`, `yum`, or `apt-get`.
18 | 
19 | 2. `pip3 install dali`
20 | 
21 | ### Usage
22 | 
23 | See examples under notebooks.
24 | 


--------------------------------------------------------------------------------
/cython/dali/.gitignore:
--------------------------------------------------------------------------------
1 | core.pyx
2 | 


--------------------------------------------------------------------------------
/cython/dali/core.pyx.pre:
--------------------------------------------------------------------------------
 1 | pyp
 2 | from preprocessor_utils import (
 3 |     type_repeat,
 4 | )
 5 | ypy
 6 | 
 7 | 
 8 | from libcpp.string   cimport string
 9 | from libcpp11.vector cimport vector
10 | from libcpp11.memory cimport shared_ptr
11 | # Import the Python-level symbols of numpy
12 | import numpy as np
13 | # Import the C-level symbols of numpy
14 | cimport modern_numpy as np
15 | 
16 | cdef string normalize_s(s):
17 |     if type(s) is str:
18 |         return s.encode("utf-8")
19 |     elif type(s) is bytes:
20 |         return s
21 |     else:
22 |         raise TypeError("Must pass a str or bytes object.")
23 | 
24 | cdef bint is_fdtype(np.NPY_TYPES type_id) nogil:
25 |     return type_id == np.NPY_FLOAT32 or \
26 |            type_id == np.NPY_FLOAT64
27 | 
28 | cdef inline void ensure_fdtype(np.NPY_TYPES type_id):
29 |     if not is_fdtype(type_id):
30 |         raise ValueError(
31 |             "Invalid dtype: " +
32 |             str(np.PyArray_DescrFromType(type_id)) +
33 |             " (should be one of float32, float64)")
34 | 
35 | include "core/utils/config.pyx"
36 | 
37 | # File IO, save / load, etc...
38 | include "core/utils/core_utils.pyx"
39 | 
40 | # Used for storing Tensor buffers
41 | include "core/math/TensorInternal.pyx"
42 | 
43 | # Matrix class
44 | include "core/tensor/Mat.pyx"
45 | 
46 | pypinline type_repeat(pyp,
47 | cdef TYPED(copy_name)(const CMat[TYPE_NAME]& source, const CMat[TYPE_NAME]& dest):
48 |     if source.name == NULL:
49 |         (<CMat[TYPE_NAME]&>source).set_name('')
50 |     (<CMat[TYPE_NAME]&>dest).name = source.name
51 | ypy
52 | 
53 | # Matrix initialization with random numbers.
54 | include "core/tensor/random.pyx"
55 | 
56 | # Softmax, crossentropy etc....
57 | include "core/tensor/MatOps.pyx"
58 | 
59 | # Related to backpropagation.
60 | include "core/tensor/Tape.pyx"
61 | 
62 | # Layer, RNN, StackedInputLayer, etc...
63 | include "core/layers/Layers.pyx"
64 | 
65 | include "core/layers/GRU.pyx"
66 | 
67 | include "core/layers/LSTM.pyx"
68 | 
69 | # Batch container (data, target, mask)
70 | include "core/data_processing/Batch.pyx"
71 | 
72 | # SGD, Adagrad, Adadelta, etc...
73 | include "core/tensor/Solver.pyx"
74 | 


--------------------------------------------------------------------------------
/cython/dali/core/.gitignore:
--------------------------------------------------------------------------------
 1 | tensor/Mat.pyx
 2 | tensor/MatOps.pyx
 3 | tensor/random.pyx
 4 | 
 5 | layers/Layers.pyx
 6 | layers/LSTM.pyx
 7 | layers/GRU.pyx
 8 | 
 9 | tensor/Solver.pyx
10 | layers/Layers.pyx
11 | 


--------------------------------------------------------------------------------
/cython/dali/core/data_processing/Batch.pyx:
--------------------------------------------------------------------------------
 1 | cdef extern from "dali/data_processing/Batch.h":
 2 | 	cdef cppclass CBatch "Batch" [T]:
 3 | 		CMat[int] data
 4 | 		CMat[int] target
 5 | 		CMat[T]   mask
 6 | 		vector[int] code_lengths
 7 | 		int total_codes
 8 | 		CBatch()
 9 | 		size_t size() const
10 | 		size_t max_length() const
11 | 		void insert_example(
12 | 			const vector[string]& example,
13 | 			const CVocab& vocab,
14 | 			size_t example_idx,
15 | 			int offset)
16 | 		int example_length(const int& idx) const
17 | 


--------------------------------------------------------------------------------
/cython/dali/core/layers/GRU.pyx.pre:
--------------------------------------------------------------------------------
  1 | pyp
  2 | from preprocessor_utils import (
  3 |     typed_fexpression,
  4 |     typed_fexpression_args,
  5 |     typed_fexpression_list,
  6 |     type_frepeat
  7 | )
  8 | ypy
  9 | 
 10 | cdef extern from "dali/layers/GRU.h" nogil:
 11 |     cdef cppclass CGRU "GRU" [T]:
 12 |         CStackedInputLayer[T] reset_layer
 13 |         CStackedInputLayer[T] memory_interpolation_layer
 14 |         CStackedInputLayer[T] memory_to_memory_layer
 15 |         int input_size
 16 |         int hidden_size
 17 | 
 18 |         CGRU()
 19 |         CGRU(int _input_size, int _hidden_size)
 20 |         CGRU(const CGRU[T]&, bint copy_w, bint copy_dw)
 21 | 
 22 |         CGRU[T] shallow_copy() const
 23 |         CMat[T] activate(CMat[T] input_vector, CMat[T] previous_state) except +
 24 |         CMat[T] activate_sequence(
 25 |             const vector[CMat[T]]& input_sequence) except +
 26 |         CMat[T] activate_sequence(
 27 |             const vector[CMat[T]]& input_sequence,
 28 |             CMat[T] state) except +
 29 | 
 30 |         vector[CMat[T]] parameters() const
 31 |         CMat[T] initial_states() const
 32 | 
 33 | cdef class GRU:
 34 |     cdef void* layerinternal
 35 |     cdef np.NPY_TYPES dtypeinternal
 36 | 
 37 |     def __cinit__(GRU self, int input_size, int hidden_size, dtype=np.float32):
 38 |         self.layerinternal = NULL
 39 |         self.dtypeinternal = np.NPY_NOTYPE
 40 |         self.dtypeinternal = np.dtype(dtype).num
 41 |         ensure_fdtype(self.dtypeinternal)
 42 | 
 43 |         pypinline typed_fexpression(pyp,
 44 |             self.layerinternal = new CGRU[TYPE_NAME](input_size, hidden_size)
 45 |         ypy
 46 | 
 47 |     def __dealloc__(GRU self):
 48 |         self.free_internal()
 49 | 
 50 |     cdef free_internal(GRU self):
 51 |         pypinline type_frepeat(pyp,
 52 |         cdef CGRU[TYPE_NAME]* TYPED(ptr_internal)
 53 |         ypy
 54 |         if self.layerinternal != NULL:
 55 |             pypinline typed_fexpression(pyp,
 56 |                 TYPED(ptr_internal) = PTR_GRU(self)
 57 |                 with nogil:
 58 |                     del TYPED(ptr_internal)
 59 |             ypy
 60 |             self.layerinternal = NULL
 61 | 
 62 |     property dtype:
 63 |         def __get__(GRU self):
 64 |             return np.PyArray_DescrFromType(self.dtypeinternal)
 65 | 
 66 | pyprepeat PROPERTY_NAME in ['input_size', 'hidden_size',]
 67 |     property PROPERTY_NAME:
 68 |         def __get__(GRU self):
 69 |             pypinline typed_fexpression(pyp,
 70 |                 return DEREF_GRU(self).PROPERTY_NAME
 71 |             ypy
 72 | ypyrepeat
 73 | 
 74 | pyprepeat INTERNAL_LAYER_NAME in ['reset_layer', 'memory_interpolation_layer', 'memory_to_memory_layer']
 75 |     property INTERNAL_LAYER_NAME:
 76 |         def __get__(GRU self):
 77 |             pypinline typed_fexpression(pyp,
 78 |                 return WRAP_STACKEDLAYER(DEREF_GRU(self).INTERNAL_LAYER_NAME)
 79 |             ypy
 80 | ypyrepeat
 81 | 
 82 |     def activate(GRU self, Mat input_vector, Mat previous_state):
 83 |         """
 84 |         Activate
 85 |         --------
 86 | 
 87 |         Inputs
 88 |         ------
 89 | 
 90 |         Mat input_vector
 91 |         Mat previous_state
 92 | 
 93 |         Outputs
 94 |         -------
 95 | 
 96 |         Mat next_state
 97 |         """
 98 |         assert(
 99 |             (self.dtypeinternal == input_vector.dtypeinternal) and
100 |             (previous_state.dtypeinternal == self.dtypeinternal)
101 |         ), "All arguments must be of the same type"
102 | 
103 |         pypinline type_frepeat(pyp,
104 |         cdef CMat[TYPE_NAME] TYPED(out)
105 |         ypy
106 | 
107 |         pypinline typed_fexpression(pyp,
108 |             with nogil:
109 |                 TYPED(out) = DEREF_GRU(self).activate(DEREF_MAT(input_vector), DEREF_MAT(previous_state))
110 |             return WRAP_MAT(TYPED(out))
111 |         ypy
112 | 
113 |     def initial_states(GRU self):
114 |         pypinline typed_fexpression(pyp,
115 |             return WRAP_MAT(DEREF_GRU(self).initial_states())
116 |         ypy
117 | 
118 |     def parameters(GRU self):
119 |         params = []
120 |         pypinline type_frepeat(pyp,
121 |         cdef CMat[TYPE_NAME]         TYPED(param)
122 |         cdef vector[CMat[TYPE_NAME]] TYPED(param_vec)
123 | 
124 |         ypy
125 |         pypinline typed_fexpression(pyp,
126 |             TYPED(param_vec) = DEREF_GRU(self).parameters()
127 |             for TYPED(param) in TYPED(param_vec):
128 |                 params.append(WRAP_MAT(TYPED(param)))
129 |         ypy
130 |         return params
131 | 
132 |     def __setstate__(GRU self, state):  # restore weights and dtype from a __getstate__ dict
133 |         for param, saved_param in zip(self.parameters(), state["parameters"]):
134 |             param.w = saved_param.w  # copy each saved weight buffer into the live parameter
135 |         self.dtypeinternal = state["dtype"].num  # set once, after the loop, as Layer and RNN do
136 | 
137 |     def __getstate__(self):
138 |         return {
139 |             "parameters" : self.parameters(),
140 |             "dtype" : self.dtype
141 |         }
142 | 
143 |     def __reduce__(self):
144 |         # Pickle as (constructor, constructor args, state). dtype is passed to
145 |         # the constructor so the C++ layer is rebuilt with the original dtype.
146 |         return (
147 |             self.__class__,
148 |             (self.input_size, self.hidden_size, self.dtype),
149 |             self.__getstate__(),
150 |         )
151 | 
152 |     def activate_sequence(GRU self, list input_sequence, initial_state = None):
153 |         pypinline type_frepeat(pyp,
154 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_input_sequence)
155 |         cdef CMat[TYPE_NAME] TYPED(out)
156 |         ypy
157 | 
158 |         if initial_state is None:
159 |             pypinline typed_fexpression_list(pyp, "input_sequence", "Mat",
160 |                 TYPED(c_input_sequence) = TYPED(mats_to_vec)(input_sequence)
161 |                 if self.dtypeinternal != TYPE_NPYINTERNAL:
162 |                     raise ValueError("Invalid dtype for input_sequence: " + str(input_sequence[0].dtype) + ", when GRU is " + str(self.dtype))
163 |                 with nogil:
164 |                     TYPED(out) = DEREF_GRU(self).activate_sequence(TYPED(c_input_sequence))
165 |                 return WRAP_MAT(TYPED(out))
166 |             ypy
167 |         else:
168 |             if type(initial_state) is not Mat:
169 |                 raise ValueError("initial_state must be a Mat")
170 |             pypinline typed_fexpression_list(pyp, "input_sequence", "Mat",
171 |                 TYPED(c_input_sequence) = TYPED(mats_to_vec)(input_sequence)
172 |                 if self.dtypeinternal != TYPE_NPYINTERNAL:
173 |                     raise ValueError("Invalid dtype for input_sequence: " + str(input_sequence[0].dtype) + ", when GRU is " + str(self.dtype))
174 |                 if (<Mat>initial_state).dtypeinternal != self.dtypeinternal:
175 |                     raise ValueError("Invalid dtype for initial_state: " + str(initial_state.dtype) + ", when GRU is " + str(self.dtype))
176 |                 with nogil:
177 |                     TYPED(out) = DEREF_GRU(self).activate_sequence(TYPED(c_input_sequence), DEREF_MAT(initial_state))
178 |                 return WRAP_MAT(TYPED(out))
179 |             ypy
180 | 
181 |     def __str__(GRU self):
182 |         return "<GRU in=%d, hidden=%d>" % (self.input_size, self.hidden_size)
183 | 
184 |     def __repr__(GRU self):
185 |         return str(self)
186 | 
187 | pypinline type_frepeat(pyp,
188 | cdef inline GRU TYPED(WrapGRU)(const CGRU[TYPE_NAME]& internal):
189 |     cdef GRU output = GRU(0,0)
190 |     output.free_internal()
191 |     output.layerinternal = new CGRU[TYPE_NAME](internal, False, False)
192 |     output.dtypeinternal = TYPE_NPYINTERNAL
193 |     return output
194 | ypy
195 | 


--------------------------------------------------------------------------------
/cython/dali/core/layers/Layers.pyx.pre:
--------------------------------------------------------------------------------
  1 | pyp
  2 | from preprocessor_utils import (
  3 |     typed_expression,
  4 |     typed_fexpression,
  5 |     typed_expression_args,
  6 |     typed_fexpression_args,
  7 |     typed_expression_args_with_types,
  8 |     typed_expression_list,
  9 |     type_repeat,
 10 |     type_frepeat,
 11 |     type_repeat_with_types,
 12 | )
 13 | ypy
 14 | 
 15 | 
 16 | cdef extern from "dali/layers/Layers.h" nogil:
 17 |     cdef cppclass CLayer "Layer" [T]:
 18 |         int hidden_size
 19 |         int input_size
 20 |         CMat[T] W
 21 |         CMat[T] b
 22 | 
 23 |         vector[CMat[T]] parameters() const
 24 |         # constructors
 25 |         CLayer()
 26 |         CLayer(int input_size, int hidden_size)
 27 |         CLayer(const CLayer& other, bint copy_w, bint copy_dw)
 28 | 
 29 |         CMat[T] activate(CMat[T]) except +
 30 |         CLayer[T] shallow_copy() const
 31 | 
 32 |     cdef cppclass CRNN "RNN" [T] nogil:
 33 |         int input_size
 34 |         int hidden_size
 35 |         int output_size
 36 | 
 37 |         CMat[T] Wx
 38 |         CMat[T] Wh
 39 |         CMat[T] b
 40 | 
 41 |         CRNN()
 42 |         CRNN(int input_size, int hidden_size)
 43 |         CRNN(int input_size, int hidden_size, int output_size)
 44 |         CRNN(CRNN[T]&, bool, bool)
 45 |         CMat[T] activate(CMat[T] input_vector, CMat[T] prev_hidden) except +
 46 |         CRNN[T] shallow_copy() const
 47 |         vector[CMat[T]] parameters() const
 48 | 
 49 |     cdef cppclass CStackedInputLayer "StackedInputLayer" [T] nogil:
 50 |         vector[int] input_sizes() const
 51 |         int hidden_size
 52 |         vector[CMat[T]] matrices
 53 |         CMat[T] b
 54 | 
 55 |         vector[CMat[T]] parameters() const
 56 |         CStackedInputLayer()
 57 |         CStackedInputLayer(vector[int] input_sizes, int output_size)
 58 |         CStackedInputLayer(const CStackedInputLayer& other, bint copy_w, bint copy_dw)
 59 | 
 60 |         CMat[T] activate(const vector[CMat[T]]&) except +
 61 |         CMat[T] activate(CMat[T]) except +
 62 |         CMat[T] activate(CMat[T], const vector[CMat[T]]&) except +
 63 | 
 64 |         CStackedInputLayer[T] shallow_copy() const
 65 | 
 66 | 
 67 | cdef class Layer:
 68 |     cdef void* layerinternal
 69 |     cdef np.NPY_TYPES dtypeinternal
 70 | 
 71 |     property dtype:
 72 |         def __get__(Layer self):
 73 |             return np.PyArray_DescrFromType(self.dtypeinternal)
 74 | 
 75 | 
 76 | 
 77 | pyprepeat PROPERTY_NAME in ['input_size', 'hidden_size',]
 78 |     property PROPERTY_NAME:
 79 |         def __get__(Layer self):
 80 |             pypinline typed_fexpression_args(pyp, ["self"],
 81 |                 return DEREF_LAYER(self).PROPERTY_NAME
 82 |             ypy
 83 | ypyrepeat
 84 | 
 85 | pyprepeat PARAM_NAME in ['W', 'b']
 86 | 
 87 |     property PARAM_NAME:
 88 |         def __get__(Layer self):
 89 |             pypinline typed_fexpression_args(pyp, ["self"],
 90 |                 return WRAP_MAT(DEREF_LAYER(self).PARAM_NAME)
 91 |             ypy
 92 | ypyrepeat
 93 | 
 94 |     def name_parameters(self, prefix):
 95 |         self.W.name = prefix + ".W"
 96 |         self.b.name = prefix + ".b"
 97 | 
 98 |     def __cinit__(Layer self, int input_size, int hidden_size, dtype=np.float32):
 99 |         self.layerinternal = NULL
100 |         self.dtypeinternal = np.NPY_NOTYPE
101 | 
102 | 
103 |         self.dtypeinternal = np.dtype(dtype).num
104 |         pypinline typed_fexpression_args(pyp, ["self"],
105 |             self.layerinternal = new CLayer[TYPE_NAME](input_size, hidden_size)
106 |         ypy
107 | 
108 |     def __dealloc__(Layer self):
109 |         self.free_internal()
110 | 
111 |     cdef free_internal(Layer self):
112 |         pypinline type_frepeat(pyp,
113 |         cdef CLayer[TYPE_NAME]* TYPED(ptr_internal)
114 |         ypy
115 |         if self.layerinternal != NULL:
116 |             pypinline typed_fexpression_args(pyp, ["self"],
117 |                 TYPED(ptr_internal) = PTR_LAYER(self)
118 |                 with nogil:
119 |                     del TYPED(ptr_internal)
120 |             ypy
121 |             self.layerinternal = NULL
122 | 
123 |     def activate(Layer self, Mat input_vector):
124 |         assert self.dtypeinternal == input_vector.dtypeinternal, \
125 |                "All arguments must be of the same type"
126 |         pypinline type_frepeat(pyp,
127 |         cdef CMat[TYPE_NAME] TYPED(out)
128 |         ypy
129 | 
130 |         pypinline typed_fexpression(pyp,
131 |             with nogil:
132 |                 TYPED(out) = DEREF_LAYER(self).activate(DEREF_MAT(input_vector))
133 |             return WRAP_MAT(TYPED(out))
134 |         ypy
135 | 
136 | 
137 |     def shallow_copy(Layer self):  # new Layer built through the C++ copy constructor
138 |         cdef Layer copy = Layer(0, 0, dtype=self.dtype)  # placeholder must carry self's dtype
139 |         copy.free_internal()  # drop the placeholder C++ object before swapping in the real one
140 |         pypinline typed_fexpression(pyp,
141 |             copy.layerinternal = new CLayer[TYPE_NAME](DEREF_LAYER(self), False, True)
142 |         ypy
143 |         return copy
144 | 
145 |     def parameters(Layer self):
146 |         params = []
147 |         pypinline type_frepeat(pyp,
148 |         cdef CMat[TYPE_NAME]         TYPED(param)
149 |         cdef vector[CMat[TYPE_NAME]] TYPED(param_vec)
150 |         ypy
151 |         pypinline typed_fexpression_args(pyp, ["self"],
152 |             TYPED(param_vec) = DEREF_LAYER(self).parameters()
153 |             for TYPED(param) in TYPED(param_vec):
154 |                 params.append(WRAP_MAT(TYPED(param)))
155 |         ypy
156 |         return params
157 | 
158 |     def __setstate__(Layer self, state):
159 |         for param, saved_param in zip(self.parameters(), state["parameters"]):
160 |             param.w = saved_param.w
161 |         self.dtypeinternal = state["dtype"].num
162 | 
163 |     def __getstate__(Layer self):
164 |         return {
165 |             "parameters" : self.parameters(),
166 |             "dtype" : self.dtype
167 |         }
168 | 
169 |     def __reduce__(Layer self):
170 |         # Pickle as (constructor, constructor args, state). dtype is passed to
171 |         # the constructor so the C++ layer is rebuilt with the original dtype.
172 |         return (
173 |             self.__class__,
174 |             (self.input_size, self.hidden_size, self.dtype),
175 |             self.__getstate__(),
176 |         )
177 | 
178 |     def __str__(self):
179 |         return "<Layer in=%d, hidden=%d>" % (self.input_size, self.hidden_size)
180 | 
181 |     def __repr__(Layer self):
182 |         return str(self)
183 | 
184 | pypinline type_repeat(pyp,
185 | cdef void TYPED(copy_name_layer)(const CLayer[TYPE_NAME]& internal, const CLayer[TYPE_NAME]& output):
186 |     TYPED(copy_name)(internal.W, output.W)
187 |     TYPED(copy_name)(internal.b, output.b)
188 | ypy
189 | 
190 | pypinline type_repeat(pyp,
191 | cdef inline Layer TYPED(WrapLayer)(const CLayer[TYPE_NAME]& internal):
192 |     cdef Layer output = Layer(0,0)
193 |     output.free_internal()
194 |     output.layerinternal = new CLayer[TYPE_NAME](internal, False, False)
195 |     output.dtypeinternal = TYPE_NPYINTERNAL
196 | 
197 |     TYPED(copy_name_layer)(internal, DEREF_LAYER(output))
198 | 
199 |     return output
200 | ypy
201 | 
202 | 
203 | cdef class RNN:
204 |     cdef void*        layerinternal
205 |     cdef np.NPY_TYPES dtypeinternal
206 | 
207 |     property dtype:
208 |         def __get__(RNN self):
209 |             return np.PyArray_DescrFromType(self.dtypeinternal)
210 | 
211 | pyprepeat PROPERTY_NAME in ['input_size', 'hidden_size', 'output_size']
212 |     property PROPERTY_NAME:
213 |         def __get__(RNN self):
214 |             pypinline typed_fexpression(pyp,
215 |                 return DEREF_RNN(self).PROPERTY_NAME
216 |             ypy
217 | ypyrepeat
218 | 
219 | pyprepeat PARAM_NAME in ['Wx', 'Wh', 'b']
220 | 
221 |     property PARAM_NAME:
222 |         def __get__(RNN self):
223 |             pypinline typed_fexpression(pyp,
224 |                 return WRAP_MAT(DEREF_RNN(self).PARAM_NAME)
225 |             ypy
226 | ypyrepeat
227 | 
228 |     def name_parameters(self, prefix):
229 |         self.Wx.name = prefix + ".Wx"
230 |         self.Wh.name = prefix + ".Wh"
231 |         self.b.name = prefix + ".b"
232 | 
233 | 
234 |     def __cinit__(self, int input_size, int hidden_size, output_size = None, dtype=np.float32):
235 |         self.layerinternal = NULL
236 |         self.dtypeinternal = np.NPY_NOTYPE
237 | 
238 |         if output_size is None:
239 |             output_size = hidden_size
240 |         assert(input_size > -1 and hidden_size > -1 and output_size > -1), "Only positive dimensions may be used."
241 |         cdef int out_size = output_size
242 | 
243 |         self.dtypeinternal = np.dtype(dtype).num
244 | 
245 |         pypinline typed_fexpression_args(pyp, ["<RNN>self"],
246 |             self.layerinternal = new CRNN[TYPE_NAME](input_size, hidden_size, out_size)
247 |         ypy
248 | 
249 |     def __dealloc__(RNN self):
250 |         self.free_internal()
251 | 
252 |     cdef free_internal(RNN self):
253 |         pypinline type_frepeat(pyp,
254 |         cdef CRNN[TYPE_NAME]* TYPED(ptr_internal)
255 |         ypy
256 |         if self.layerinternal != NULL:
257 |             pypinline typed_fexpression(pyp,
258 |                 TYPED(ptr_internal) = PTR_RNN(self)
259 |                 with nogil:
260 |                     del TYPED(ptr_internal)
261 |             ypy
262 |             self.layerinternal = NULL
263 | 
264 | 
265 | 
266 |     def __setstate__(RNN self, state):
267 |         for param, saved_param in zip(self.parameters(), state["parameters"]):
268 |             param.w = saved_param.w
269 |         self.dtypeinternal = state["dtype"].num
270 | 
271 | 
272 |     def __getstate__(self):
273 |         return {
274 |             "parameters" : self.parameters(),
275 |             "dtype" : self.dtype
276 |         }
277 | 
278 |     def __reduce__(self):
279 |         # Pickle as (constructor, constructor args, state). dtype is passed to
280 |         # the constructor so the C++ layer is rebuilt with the original dtype.
281 |         return (
282 |             self.__class__,
283 |             (self.input_size, self.hidden_size,
284 |              self.output_size, self.dtype),
285 |             self.__getstate__(),
286 |         )
287 | 
288 | 
289 |     def activate(RNN self, Mat input_vector,  Mat prev_hidden):
290 |         assert self.dtypeinternal == input_vector.dtypeinternal and \
291 |                self.dtypeinternal == prev_hidden.dtypeinternal, \
292 |                "All arguments must be of the same type"
293 |         pypinline type_frepeat(pyp,
294 |         cdef CMat[TYPE_NAME] TYPED(out)
295 |         ypy
296 | 
297 |         pypinline typed_fexpression(pyp,
298 |             with nogil:
299 |                 TYPED(out) = DEREF_RNN(self).activate(DEREF_MAT(input_vector), DEREF_MAT(prev_hidden))
300 |             return WRAP_MAT(TYPED(out))
301 |         ypy
302 | 
303 | 
304 |     def shallow_copy(RNN self):  # new RNN built through the C++ copy constructor
305 |         cdef RNN copy = RNN(0, 0, dtype=self.dtype)  # placeholder must carry self's dtype
306 |         copy.free_internal()  # drop the placeholder C++ object before swapping in the real one
307 |         pypinline typed_fexpression(pyp,
308 |             copy.layerinternal = new CRNN[TYPE_NAME](DEREF_RNN(self), False, True)
309 |         ypy
310 |         return copy
311 | 
312 |     def parameters(RNN self):  # list of wrapped Mats, in the order returned by the C++ parameters()
313 |         params = []
314 |         pypinline type_frepeat(pyp,
315 |         cdef CMat[TYPE_NAME]         TYPED(param)
316 |         cdef vector[CMat[TYPE_NAME]] TYPED(param_vec)
317 | 
318 |         ypy
319 |         pypinline typed_fexpression(pyp,
320 |             TYPED(param_vec) = DEREF_RNN(self).parameters()
321 |             for TYPED(param) in TYPED(param_vec):
322 |                 params.append(WRAP_MAT(TYPED(param)))
323 |         ypy
324 |         return params
325 | 
326 | 
327 |     def __str__(self):  # one-line summary showing the three layer sizes
328 |         return "<RNN in=%d, hidden=%d out=%d>" % (self.input_size, self.hidden_size, self.output_size)
329 | 
330 |     def __repr__(RNN self):  # same text as __str__; self is typed as RNN like the other methods of this class
331 |         return str(self)
332 | 
333 | 
334 | cdef class StackedInputLayer:  # wrapper around a C++ CStackedInputLayer[T]; T is tracked through dtypeinternal
335 |     cdef void* layerinternal  # type-erased pointer to the C++ layer (NULL once freed)
336 |     cdef np.NPY_TYPES dtypeinternal  # numpy type number matching the element type of layerinternal
337 | 
338 |     property dtype:
339 |         def __get__(StackedInputLayer self):
340 |             return np.PyArray_DescrFromType(self.dtypeinternal)
341 | 
342 | 
343 |     property input_sizes:
344 |         def __get__(StackedInputLayer self):
345 |             pypinline typed_fexpression(pyp,
346 |                 return DEREF_STACKEDLAYER(self).input_sizes()
347 |             ypy
348 | 
349 |     property hidden_size:
350 |         def __get__(StackedInputLayer self):
351 |             pypinline typed_fexpression(pyp,
352 |                 return DEREF_STACKEDLAYER(self).hidden_size
353 |             ypy
354 | 
355 |     property matrices:
356 |         def __get__(StackedInputLayer self):
357 |             cdef int i
358 |             params = []
359 |             pypinline typed_fexpression(pyp,
360 |                 for i in range(DEREF_STACKEDLAYER(self).matrices.size()):
361 |                     params.append(WRAP_MAT(DEREF_STACKEDLAYER(self).matrices[i]))
362 |             ypy
363 |             return params
364 | 
365 |     property b:
366 |         def __get__(StackedInputLayer self):
367 |             pypinline typed_fexpression(pyp,
368 |                 return WRAP_MAT(DEREF_STACKEDLAYER(self).b)
369 |             ypy
370 | 
371 |     def name_parameters(self, prefix):  # name each matrix "<prefix>.matrices[i]" and the bias "<prefix>.b"
372 |         for matidx, matrix in enumerate(self.matrices):
373 |             matrix.name = prefix + ".matrices[%d]" % (matidx,)
374 |         self.b.name = prefix + ".b"
375 | 
376 |     def __cinit__(StackedInputLayer self, list input_sizes, int hidden_size, dtype=np.float32):
377 |         self.layerinternal = NULL  # defined state first, so free_internal is safe if a later line raises
378 |         self.dtypeinternal = np.NPY_NOTYPE
379 | 
380 |         self.dtypeinternal = np.dtype(dtype).num
381 | 
382 |         pypinline typed_fexpression(pyp,
383 |             self.layerinternal = new CStackedInputLayer[TYPE_NAME](<vector[int]>input_sizes, hidden_size)
384 |         ypy
385 | 
386 |     def __dealloc__(StackedInputLayer self):
387 |         self.free_internal()
388 | 
389 |     cdef free_internal(StackedInputLayer self):  # delete the C++ layer (if any) and null the pointer
390 |         pypinline type_frepeat(pyp,
391 |         cdef CStackedInputLayer[TYPE_NAME]* TYPED(ptr_internal)
392 |         ypy
393 |         if self.layerinternal != NULL:
394 |             pypinline typed_fexpression(pyp,
395 |                 TYPED(ptr_internal) = PTR_STACKEDLAYER(self)
396 |                 with nogil:
397 |                     del TYPED(ptr_internal)
398 |             ypy
399 |             self.layerinternal = NULL
400 | 
401 |     def __setstate__(StackedInputLayer self, state):  # restore from the dict produced by __getstate__
402 |         for param, saved_param in zip(self.parameters(), state["parameters"]):
403 |             param.w = saved_param.w
404 |         self.dtypeinternal = state["dtype"].num  # set once, after the loop, even when there are no parameters
405 | 
406 |     def __getstate__(self):
407 |         return {
408 |             "parameters" : self.parameters(),
409 |             "dtype" : self.dtype,
410 |         }
411 | 
412 |     def __reduce__(self):  # pickle recipe: (callable, constructor args, state for __setstate__)
413 |         return (
414 |             self.__class__,
415 |             (
416 |                 self.input_sizes,
417 |                 self.hidden_size, self.dtype  # dtype is passed so the rebuilt C++ layer has the pickled element type
418 |             ), self.__getstate__(),
419 |         )
420 | 
421 |     def activate(StackedInputLayer self, input_vectors):  # accepts one Mat or a list of Mats; anything else raises TypeError
422 |         pypinline type_frepeat(pyp,
423 |         cdef vector[CMat[TYPE_NAME]]  TYPED(input_vec)
424 |         cdef CMat[TYPE_NAME]          TYPED(input_mat)
425 |         cdef CMat[TYPE_NAME]          TYPED(out)
426 |         ypy
427 | 
428 |         if type(input_vectors) is Mat:
429 |             assert (<Mat>input_vectors).dtypeinternal == self.dtypeinternal, \
430 |                     "input mat must be of the same type as StackedInputLayer"
431 | 
432 |             pypinline typed_fexpression_args(pyp, ["self"],
433 |                 TYPED(input_mat) = DEREF_MAT(input_vectors)
434 |                 with nogil:
435 |                     TYPED(out) = DEREF_STACKEDLAYER(self).activate(TYPED(input_mat))
436 |                 return WRAP_MAT(TYPED(out))
437 |             ypy
438 |         elif type(input_vectors) == list:
439 |             for v in input_vectors:
440 |                 assert type(v) == Mat, "Matrices required for Stacked Input Layer"
441 |                 assert (<Mat>v).dtypeinternal == self.dtypeinternal, "All arguments must have the same type."
442 | 
443 | 
444 |             pypinline typed_fexpression_args(pyp, ["self"],
445 |                 TYPED(input_vec).clear()
446 |                 for inpt in input_vectors:
447 |                     TYPED(input_vec).push_back(DEREF_MAT(inpt))
448 |                 with nogil:
449 |                     TYPED(out) = DEREF_STACKEDLAYER(self).activate(TYPED(input_vec))
450 |                 return WRAP_MAT(TYPED(out))
451 |             ypy
452 |         else:
453 |             raise TypeError("activate takes a list of Mat or single Mat as input.")
454 | 
455 |     def shallow_copy(StackedInputLayer self):  # new wrapper built via the C++ copy constructor, called with flags (False, True)
456 |         cdef StackedInputLayer copy = StackedInputLayer([0], 0, dtype=self.dtype)  # placeholder with a valid list and self's dtype
457 |         copy.free_internal()
458 |         pypinline typed_fexpression_args(pyp, ["self"],
459 |             copy.layerinternal = new CStackedInputLayer[TYPE_NAME](DEREF_STACKEDLAYER(self), False, True)
460 |         ypy
461 |         return copy
462 | 
463 | 
464 |     def parameters(StackedInputLayer self):  # list of wrapped Mats, in the order returned by the C++ parameters()
465 |         params = []
466 |         pypinline type_frepeat(pyp,
467 |         cdef CMat[TYPE_NAME]         TYPED(param)
468 |         cdef vector[CMat[TYPE_NAME]] TYPED(param_vec)
469 | 
470 |         ypy
471 |         pypinline typed_fexpression_args(pyp, ["self"],
472 |             TYPED(param_vec) = DEREF_STACKEDLAYER(self).parameters()
473 |             for TYPED(param) in TYPED(param_vec):
474 |                 params.append(WRAP_MAT(TYPED(param)))
475 |         ypy
476 |         return params
477 | 
478 |     def __str__(self):
479 |         return "<StackedInputLayer in=%s, out=%d>" % (str(self.input_sizes), self.hidden_size)
480 | 
481 |     def __repr__(StackedInputLayer self):
482 |         return str(self)
483 | # Per-type helper: applies the per-type copy_name helper to each matrices[i] pair and to b, from `internal` to `output`.
484 | pypinline type_repeat(pyp,
485 | cdef void TYPED(copy_name_stackedlayer)(const CStackedInputLayer[TYPE_NAME]& internal, const CStackedInputLayer[TYPE_NAME]& output):
486 |     for i in range(internal.matrices.size()):
487 |         TYPED(copy_name)(internal.matrices[i], output.matrices[i])
488 |     TYPED(copy_name)(internal.b, output.b)
489 | ypy
490 | 
491 | # Per-type helper: builds a StackedInputLayer around a new C++ layer copy-constructed from `internal` with flags (False, False).
492 | pypinline type_repeat(pyp,
493 | cdef inline StackedInputLayer TYPED(WrapStackedLayer)(const CStackedInputLayer[TYPE_NAME]& internal):
494 |     cdef StackedInputLayer output = StackedInputLayer([0],0)
495 |     output.free_internal()
496 |     output.layerinternal = new CStackedInputLayer[TYPE_NAME](internal, False, False)
497 |     output.dtypeinternal = TYPE_NPYINTERNAL
498 | 
499 |     TYPED(copy_name_stackedlayer)(internal, DEREF_STACKEDLAYER(output))
500 | 
501 |     return output
502 | ypy
503 | 


--------------------------------------------------------------------------------
/cython/dali/core/math/TensorInternal.pyx:
--------------------------------------------------------------------------------
1 | # Cython-side declaration of the C++ TensorInternal<T> template from dali/math/TensorInternal.h.
2 | # Only the members listed here are visible to Cython code.
3 | cdef extern from "dali/math/TensorInternal.h":
4 |     cdef cppclass TensorInternal [T]:
5 |         T* data() const  # pointer returned by the C++ data() accessor
6 |         TensorInternal(const TensorInternal[T]& other)  # copy constructor
7 | 


--------------------------------------------------------------------------------
/cython/dali/core/math/memory_bank/MemoryBankWrapper.cpp:
--------------------------------------------------------------------------------
 1 | #include "MemoryBankWrapper.h"
 2 | #include <dali/math/SynchronizedMemory.h>
 3 | #include <stdexcept>  // std::runtime_error, thrown by clear_gpu() in builds without CUDA
 4 | 
 5 | // Forwards to SynchronizedMemory<R>::clear_cpu().
 6 | template<typename R>
 7 | void MemoryBankWrapper<R>::clear_cpu() {
 8 | 	SynchronizedMemory<R>::clear_cpu();
 9 | }
10 | 
11 | // Forwards to SynchronizedMemory<R>::clear_gpu() when DALI_USE_CUDA is defined;
12 | // otherwise throws std::runtime_error.
13 | template<typename R>
14 | void MemoryBankWrapper<R>::clear_gpu() {
15 | 	#ifdef DALI_USE_CUDA
16 | 		SynchronizedMemory<R>::clear_gpu();
17 | 	#else
18 | 		throw std::runtime_error("Dali when compiled without cuda cannot clear GPU.");
19 | 	#endif
20 | }
21 | 
22 | // Explicit instantiations for the element types used by the bindings.
23 | template class MemoryBankWrapper<float>;
24 | template class MemoryBankWrapper<double>;
25 | template class MemoryBankWrapper<int>;
26 | 


--------------------------------------------------------------------------------
/cython/dali/core/math/memory_bank/MemoryBankWrapper.h:
--------------------------------------------------------------------------------
 1 | #ifndef DALI_CORE_MATH_MEMORY_BANK_MEMORY_BANK_WRAPPER_H
 2 | #define DALI_CORE_MATH_MEMORY_BANK_MEMORY_BANK_WRAPPER_H
 3 | // Static-only helper exposing the memory-bank clearing calls for element type R.
 4 | // The definitions and the explicit instantiations live in MemoryBankWrapper.cpp.
 5 | template<typename R>
 6 | class MemoryBankWrapper {
 7 | 	public:
 8 | 		// Throws std::runtime_error when built without DALI_USE_CUDA.
 9 | 		static void clear_gpu();
10 | 		static void clear_cpu();
11 | };
12 | 
13 | #endif
14 | 


--------------------------------------------------------------------------------
/cython/dali/core/math/memory_status.cpp:
--------------------------------------------------------------------------------
 1 | #include "memory_status.h"
 2 | #include <stdexcept>  // std::runtime_error, thrown by to_gpu() in builds without CUDA
 3 | 
 4 | // gpu_fresh flag of the matrix memory; false for an empty Mat or a build without CUDA.
 5 | template<typename R>
 6 | bool is_gpu_fresh(const Mat<R>& mat) {
 7 |     #ifdef DALI_USE_CUDA
 8 |         if (!mat.empty()) {
 9 |             return mat.w().memory().gpu_fresh;
10 |         } else {
11 |             return false;
12 |         }
13 |     #else
14 |         return false;
15 |     #endif
16 | }
17 | 
18 | // cpu_fresh flag of the matrix memory; false for an empty Mat.
19 | template<typename R>
20 | bool is_cpu_fresh(const Mat<R>& mat) {
21 |     if (!mat.empty()) {
22 |         return mat.w().memory().cpu_fresh;
23 |     } else {
24 |         return false;
25 |     }
26 | }
27 | 
28 | // allocated_gpu flag of the matrix memory; false for an empty Mat or a build without CUDA.
29 | template<typename R>
30 | bool is_gpu_allocated(const Mat<R>& mat) {
31 |     #ifdef DALI_USE_CUDA
32 |         if (!mat.empty()) {
33 |             return mat.w().memory().allocated_gpu;
34 |         } else {
35 |             return false;
36 |         }
37 |     #else
38 |         return false;
39 |     #endif
40 | }
41 | 
42 | // allocated_cpu flag of the matrix memory; false for an empty Mat.
43 | template<typename R>
44 | bool is_cpu_allocated(const Mat<R>& mat) {
45 |     if (!mat.empty()) {
46 |         return mat.w().memory().allocated_cpu;
47 |     } else {
48 |         return false;
49 |     }
50 | }
51 | 
52 | // Forwards to Mat<R>::to_cpu().
53 | template<typename R>
54 | void to_cpu(const Mat<R>& mat) {
55 |     mat.to_cpu();
56 | }
57 | 
58 | // Forwards to Mat<R>::to_gpu() when DALI_USE_CUDA is defined; otherwise throws std::runtime_error.
59 | template<typename R>
60 | void to_gpu(const Mat<R>& mat) {
61 |     #ifdef DALI_USE_CUDA
62 |         mat.to_gpu();
63 |     #else
64 |         throw std::runtime_error("Dali compiled without CUDA. Cannot move to GPU.");
65 |     #endif
66 | }
67 | 
68 | // Explicit instantiations for int, float and double.
69 | template bool is_gpu_fresh(const Mat<int>& mat);
70 | template bool is_gpu_fresh(const Mat<float>& mat);
71 | template bool is_gpu_fresh(const Mat<double>& mat);
72 | 
73 | template bool is_cpu_fresh(const Mat<int>& mat);
74 | template bool is_cpu_fresh(const Mat<float>& mat);
75 | template bool is_cpu_fresh(const Mat<double>& mat);
76 | 
77 | template bool is_gpu_allocated(const Mat<int>& mat);
78 | template bool is_gpu_allocated(const Mat<float>& mat);
79 | template bool is_gpu_allocated(const Mat<double>& mat);
80 | 
81 | template bool is_cpu_allocated(const Mat<int>& mat);
82 | template bool is_cpu_allocated(const Mat<float>& mat);
83 | template bool is_cpu_allocated(const Mat<double>& mat);
84 | 
85 | template void to_cpu(const Mat<int>& mat);
86 | template void to_cpu(const Mat<float>& mat);
87 | template void to_cpu(const Mat<double>& mat);
88 | 
89 | template void to_gpu(const Mat<int>& mat);
90 | template void to_gpu(const Mat<float>& mat);
91 | template void to_gpu(const Mat<double>& mat);
92 | 


--------------------------------------------------------------------------------
/cython/dali/core/math/memory_status.h:
--------------------------------------------------------------------------------
 1 | #ifndef DALI_MATH_MEMORY_STATUS_H
 2 | #define DALI_MATH_MEMORY_STATUS_H
 3 | 
 4 | // Free-function helpers over Mat<R> memory state; defined and explicitly
 5 | // instantiated (int, float, double) in memory_status.cpp.
 6 | #include "dali/tensor/Mat.h"
 7 | 
 8 | // The four queries below return false for an empty Mat; the GPU ones also
 9 | // return false when built without DALI_USE_CUDA.
10 | template<typename R>
11 | bool is_gpu_fresh(const Mat<R>& mat);
12 | 
13 | template<typename R>
14 | bool is_cpu_fresh(const Mat<R>& mat);
15 | 
16 | template<typename R>
17 | bool is_gpu_allocated(const Mat<R>& mat);
18 | 
19 | template<typename R>
20 | bool is_cpu_allocated(const Mat<R>& mat);
21 | 
22 | // Calls mat.to_cpu().
23 | template<typename R>
24 | void to_cpu(const Mat<R>& mat);
25 | 
26 | // Calls mat.to_gpu(); throws std::runtime_error when built without DALI_USE_CUDA.
27 | template<typename R>
28 | void to_gpu(const Mat<R>& mat);
29 | 
30 | #endif
31 | 


--------------------------------------------------------------------------------
/cython/dali/core/tensor/Solver.pyx.pre:
--------------------------------------------------------------------------------
  1 | pyp
  2 | from preprocessor_utils import (
  3 |     typed_fexpression_args,
  4 |     typed_fexpression,
  5 |     type_frepeat,
  6 |     typed_fexpression_list)
  7 | ypy
  8 | 
  9 | cdef extern from "dali/tensor/Solver.h" nogil:  # C++ solver templates; "except +" turns C++ exceptions into Python ones
 10 |     cdef cppclass CSGD "Solver::SGD" [T]:
 11 |         T clip_abs
 12 |         T clip_norm
 13 |         T smooth_eps
 14 |         T regc
 15 |         T step_size
 16 |         # default parameters look like overloaded
 17 |         # functions to cython:
 18 |         CSGD(T clip_norm, T smooth_eps, T regc)
 19 |         CSGD(T clip_norm, T regc)
 20 |         CSGD(T clip_norm)
 21 |         CSGD()
 22 |         CSGD(vector[CMat[T]]&, T clip_norm, T regc)
 23 |         void step(vector[CMat[T]]&) except +
 24 |         void step(vector[CMat[T]]&, T step_size) except +
 25 |         void reset_caches(vector[CMat[T]]&) except +
 26 | 
 27 |     cdef cppclass CAdaGrad "Solver::AdaGrad" [T]:
 28 |         T clip_abs
 29 |         T clip_norm
 30 |         T smooth_eps
 31 |         T regc
 32 |         T step_size
 33 |         CAdaGrad()
 34 |         CAdaGrad(T smooth_eps, T clip_norm, T regc)
 35 |         CAdaGrad(vector[CMat[T]]&, T smooth_eps, T clip_norm, T regc)
 36 |         void step(vector[CMat[T]]&) except +
 37 |         void step(vector[CMat[T]]&, T step_size) except +
 38 |         void reset_caches(vector[CMat[T]]&) except +
 39 |         void create_gradient_caches(vector[CMat[T]]&) except +
 40 | 
 41 |     cdef cppclass CRMSProp "Solver::RMSProp" [T]:
 42 |         T clip_abs
 43 |         T clip_norm
 44 |         T smooth_eps
 45 |         T regc
 46 |         T step_size
 47 |         T decay_rate
 48 |         CRMSProp()
 49 |         CRMSProp(T decay_rate, T smooth_eps, T clip_norm, T regc)
 50 |         CRMSProp(vector[CMat[T]]&, T decay_rate, T smooth_eps, T clip_norm, T regc)
 51 |         void step(vector[CMat[T]]&) except +
 52 |         void step(vector[CMat[T]]&, T step_size) except +
 53 |         void reset_caches(vector[CMat[T]]&) except +
 54 |         void create_gradient_caches(vector[CMat[T]]&) except +
 55 | 
 56 |     cdef cppclass CAdaDelta "Solver::AdaDelta" [T]:
 57 |         T clip_abs
 58 |         T clip_norm
 59 |         T smooth_eps
 60 |         T regc
 61 |         T rho
 62 |         CAdaDelta()
 63 |         CAdaDelta(T rho, T smooth_eps, T clip_norm, T regc)
 64 |         CAdaDelta(vector[CMat[T]]&, T rho, T smooth_eps, T clip_norm, T regc)
 65 |         void step(vector[CMat[T]]&) except +
 66 |         void reset_caches(vector[CMat[T]]&) except +
 67 |         void create_gradient_caches(vector[CMat[T]]&) except +
 68 | 
 69 |     cdef cppclass CAdam "Solver::Adam" [T]:
 70 |         T clip_abs
 71 |         T clip_norm
 72 |         T smooth_eps
 73 |         T regc
 74 |         T step_size
 75 |         T b1
 76 |         T b2
 77 |         unsigned long long epoch
 78 |         CAdam()
 79 |         CAdam(T step_size, T b1, T b2, T smooth_eps, T clip_norm, T regc)
 80 |         CAdam(vector[CMat[T]]&, T step_size, T b1, T b2, T smooth_eps, T clip_norm, T regc)
 81 |         void step(vector[CMat[T]]&) except +
 82 |         void step(vector[CMat[T]]&, T step_size) except +
 83 |         void reset_caches(vector[CMat[T]]&) except +
 84 |         void create_gradient_caches(vector[CMat[T]]&) except +
 85 | 
 86 | cdef class SGD:  # wrapper around the C++ Solver::SGD template (declared to Cython as CSGD)
 87 |     cdef void * solverinternal  # type-erased pointer to the C++ solver
 88 |     cdef np.NPY_TYPES dtypeinternal  # numpy type number matching the element type of solverinternal
 89 | 
 90 |     property dtype:
 91 |         def __get__(SGD self):
 92 |             return np.PyArray_DescrFromType(self.dtypeinternal)
 93 | 
 94 | pyprepeat PROP_NAME in ['step_size', 'clip_norm', 'clip_abs', 'regc', 'smooth_eps']
 95 |     property PROP_NAME:
 96 |         def __get__(SGD self):
 97 |             pypinline typed_fexpression(pyp,
 98 |                 return DEREF_SGD(self).PROP_NAME
 99 |             ypy
100 | 
101 |         def __set__(SGD self, float val):
102 |             pypinline typed_fexpression(pyp,
103 |                 DEREF_SGD(self).PROP_NAME = val
104 |             ypy
105 | ypyrepeat
106 | 
107 |     def __dealloc__(SGD self):  # delete the C++ solver (if one exists) and null the pointer
108 |         pypinline type_frepeat(pyp,
109 |         cdef CSGD[TYPE_NAME]* TYPED(ptr_internal)
110 |         ypy
111 |         if self.solverinternal != NULL:
112 |             pypinline typed_fexpression(pyp,
113 |                 TYPED(ptr_internal) = PTR_SGD(self)
114 |                 with nogil:
115 |                     del TYPED(ptr_internal)
116 |             ypy
117 |             self.solverinternal = NULL
118 | 
119 |     def __cinit__(SGD self, params = None, float clip_abs = 0.0, float clip_norm = 5.0, float regc = 0.0, float step_size = 0.01, dtype = None):
120 |         pypinline type_frepeat(pyp,
121 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
122 |         ypy
123 |         self.dtypeinternal = np.NPY_NOTYPE  # "not decided yet" marker, resolved below
124 |         # get the dtype from kwargs
125 |         if dtype is not None:
126 |             self.dtypeinternal = np.dtype(dtype).num
127 |             ensure_fdtype(self.dtypeinternal)
128 | 
129 |         if params is not None and len(params) > 0:  # take the dtype from params, or check it against the explicit one
130 |             pypinline typed_fexpression_list(pyp, "params", "Mat",
131 |                 TYPED(c_params) = TYPED(mats_to_vec)(params)
132 |                 if TYPED(c_params).size() > 0:
133 |                     if self.dtypeinternal == np.NPY_NOTYPE:
134 |                         self.dtypeinternal = TYPE_NPYINTERNAL
135 |                     else:
136 |                         if self.dtypeinternal != TYPE_NPYINTERNAL:
137 |                             raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
138 |             ypy
139 |         if self.dtypeinternal == np.NPY_NOTYPE:  # neither dtype nor params decided it: fall back to float32
140 |             self.dtypeinternal = np.NPY_FLOAT32
141 | 
142 |         pypinline typed_fexpression(pyp,
143 |             self.solverinternal = new CSGD[TYPE_NAME](
144 |                 TYPED(c_params), clip_norm, regc)
145 |             DEREF_SGD(self).step_size = step_size
146 |             DEREF_SGD(self).clip_abs = clip_abs
147 |         ypy
148 | 
149 |     def reset_caches(SGD self, list params):  # dtype-check params, then call the C++ reset_caches without the GIL
150 |         pypinline type_frepeat(pyp,
151 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
152 |         ypy
153 | 
154 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
155 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
156 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
157 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
158 |             with nogil:
159 |                 DEREF_SGD(self).reset_caches(TYPED(c_params))
160 |         ypy
161 | 
162 |     def step(SGD self, list params, step_size = None):  # one update over params; step_size=None uses the solver's stored step_size
163 |         pypinline type_frepeat(pyp,
164 |         cdef TYPE_NAME TYPED(cstep_size)
165 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
166 |         ypy
167 | 
168 |         if step_size is not None:
169 |             pypinline typed_fexpression(pyp,
170 |                 TYPED(cstep_size) = step_size
171 |             ypy
172 |         else:
173 |             pypinline typed_fexpression(pyp,
174 |                 TYPED(cstep_size) = DEREF_SGD(self).step_size
175 |             ypy
176 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
177 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
178 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
179 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
180 |             with nogil:
181 |                 DEREF_SGD(self).step(TYPED(c_params), TYPED(cstep_size))
182 |         ypy
183 | 
184 | cdef class AdaGrad:  # wrapper around the C++ Solver::AdaGrad template (declared to Cython as CAdaGrad)
185 |     cdef void * solverinternal  # type-erased pointer to the C++ solver
186 |     cdef np.NPY_TYPES dtypeinternal  # numpy type number matching the element type of solverinternal
187 | 
188 |     property dtype:
189 |         def __get__(AdaGrad self):
190 |             return np.PyArray_DescrFromType(self.dtypeinternal)
191 | 
192 | pyprepeat PROP_NAME in ['step_size', 'clip_abs', 'clip_norm', 'regc', 'smooth_eps']
193 |     property PROP_NAME:
194 |         def __get__(AdaGrad self):
195 |             pypinline typed_fexpression(pyp,
196 |                 return DEREF_ADAGRAD(self).PROP_NAME
197 |             ypy
198 | 
199 |         def __set__(AdaGrad self, float val):
200 |             pypinline typed_fexpression(pyp,
201 |                 DEREF_ADAGRAD(self).PROP_NAME = val
202 |             ypy
203 | ypyrepeat
204 | 
205 |     def __dealloc__(AdaGrad self):  # delete the C++ solver (if one exists) and null the pointer
206 |         pypinline type_frepeat(pyp,
207 |         cdef CAdaGrad[TYPE_NAME]* TYPED(ptr_internal)
208 |         ypy
209 |         if self.solverinternal != NULL:
210 |             pypinline typed_fexpression(pyp,
211 |                 TYPED(ptr_internal) = PTR_ADAGRAD(self)
212 |                 with nogil:
213 |                     del TYPED(ptr_internal)
214 |             ypy
215 |             self.solverinternal = NULL
216 | 
217 |     def __cinit__(AdaGrad self, params = None, float eps = 1e-6, float clip_norm = 5.0, float clip_abs = 0.0, float regc = 0.0, float step_size = 0.01, dtype = None):
218 |         pypinline type_frepeat(pyp,
219 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
220 |         ypy
221 |         self.dtypeinternal = np.NPY_NOTYPE  # "not decided yet" marker, resolved below
222 |         # get the dtype from kwargs
223 |         if dtype is not None:
224 |             self.dtypeinternal = np.dtype(dtype).num
225 |             ensure_fdtype(self.dtypeinternal)
226 | 
227 |         if params is not None and len(params) > 0:  # take the dtype from params, or check it against the explicit one
228 |             pypinline typed_fexpression_list(pyp, "params", "Mat",
229 |                 TYPED(c_params) = TYPED(mats_to_vec)(params)
230 |                 if TYPED(c_params).size() > 0:
231 |                     if self.dtypeinternal == np.NPY_NOTYPE:
232 |                         self.dtypeinternal = TYPE_NPYINTERNAL
233 |                     else:
234 |                         if self.dtypeinternal != TYPE_NPYINTERNAL:
235 |                             raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
236 |             ypy
237 |         if self.dtypeinternal == np.NPY_NOTYPE:  # neither dtype nor params decided it: fall back to float32
238 |             self.dtypeinternal = np.NPY_FLOAT32
239 | 
240 |         pypinline typed_fexpression(pyp,
241 |             self.solverinternal = new CAdaGrad[TYPE_NAME](
242 |                 TYPED(c_params), eps, clip_norm, regc)
243 |             DEREF_ADAGRAD(self).step_size = step_size
244 |             DEREF_ADAGRAD(self).clip_abs = clip_abs
245 |         ypy
246 | 
247 |     def reset_caches(AdaGrad self, list params):  # dtype-check params, then call the C++ reset_caches without the GIL
248 |         pypinline type_frepeat(pyp,
249 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
250 |         ypy
251 | 
252 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
253 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
254 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
255 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
256 |             with nogil:
257 |                 DEREF_ADAGRAD(self).reset_caches(TYPED(c_params))
258 |         ypy
259 | 
260 |     def create_gradient_caches(AdaGrad self, list params):  # dtype-check params, then call the C++ create_gradient_caches without the GIL
261 |         pypinline type_frepeat(pyp,
262 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
263 |         ypy
264 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
265 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
266 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
267 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
268 |             with nogil:
269 |                 DEREF_ADAGRAD(self).create_gradient_caches(TYPED(c_params))
270 |         ypy
271 | 
272 |     def step(AdaGrad self, list params, step_size = None):  # one update over params; step_size=None uses the solver's stored step_size
273 |         pypinline type_frepeat(pyp,
274 |         cdef TYPE_NAME TYPED(cstep_size)
275 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
276 |         ypy
277 | 
278 |         if step_size is not None:
279 |             pypinline typed_fexpression(pyp,
280 |                 TYPED(cstep_size) = step_size
281 |             ypy
282 |         else:
283 |             pypinline typed_fexpression(pyp,
284 |                 TYPED(cstep_size) = DEREF_ADAGRAD(self).step_size
285 |             ypy
286 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
287 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
288 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
289 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
290 |             with nogil:
291 |                 DEREF_ADAGRAD(self).step(TYPED(c_params), TYPED(cstep_size))
292 |         ypy
293 | 
294 | 
295 | cdef class RMSProp:  # wrapper around the C++ Solver::RMSProp template (declared to Cython as CRMSProp)
296 |     cdef void * solverinternal  # type-erased pointer to the C++ solver
297 |     cdef np.NPY_TYPES dtypeinternal  # numpy type number matching the element type of solverinternal
298 | 
299 |     property dtype:
300 |         def __get__(RMSProp self):
301 |             return np.PyArray_DescrFromType(self.dtypeinternal)
302 | 
303 | pyprepeat PROP_NAME in ['step_size', 'clip_abs', 'clip_norm', 'regc', 'smooth_eps', 'decay_rate']
304 |     property PROP_NAME:
305 |         def __get__(RMSProp self):
306 |             pypinline typed_fexpression(pyp,
307 |                 return DEREF_RMSPROP(self).PROP_NAME
308 |             ypy
309 | 
310 |         def __set__(RMSProp self, float val):
311 |             pypinline typed_fexpression(pyp,
312 |                 DEREF_RMSPROP(self).PROP_NAME = val
313 |             ypy
314 | ypyrepeat
315 | 
316 |     def __dealloc__(RMSProp self):  # delete the C++ solver (if one exists) and null the pointer
317 |         pypinline type_frepeat(pyp,
318 |         cdef CRMSProp[TYPE_NAME]* TYPED(ptr_internal)
319 |         ypy
320 |         if self.solverinternal != NULL:
321 |             pypinline typed_fexpression(pyp,
322 |                 TYPED(ptr_internal) = PTR_RMSPROP(self)
323 |                 with nogil:
324 |                     del TYPED(ptr_internal)
325 |             ypy
326 |             self.solverinternal = NULL
327 | 
328 |     def __cinit__(RMSProp self, params = None, float decay_rate = 0.999, float eps = 1e-6, float clip_norm = 5.0, float clip_abs = 0.0, float regc = 0.0, float step_size = 0.01, dtype = None):
329 |         pypinline type_frepeat(pyp,
330 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
331 |         ypy
332 |         self.dtypeinternal = np.NPY_NOTYPE  # "not decided yet" marker, resolved below
333 |         # get the dtype from kwargs
334 |         if dtype is not None:
335 |             self.dtypeinternal = np.dtype(dtype).num
336 |             ensure_fdtype(self.dtypeinternal)
337 | 
338 |         if params is not None and len(params) > 0:  # take the dtype from params, or check it against the explicit one
339 |             pypinline typed_fexpression_list(pyp, "params", "Mat",
340 |                 TYPED(c_params) = TYPED(mats_to_vec)(params)
341 |                 if TYPED(c_params).size() > 0:
342 |                     if self.dtypeinternal == np.NPY_NOTYPE:
343 |                         self.dtypeinternal = TYPE_NPYINTERNAL
344 |                     else:
345 |                         if self.dtypeinternal != TYPE_NPYINTERNAL:
346 |                             raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
347 |             ypy
348 |         if self.dtypeinternal == np.NPY_NOTYPE:  # neither dtype nor params decided it: fall back to float32
349 |             self.dtypeinternal = np.NPY_FLOAT32
350 | 
351 |         pypinline typed_fexpression(pyp,
352 |             self.solverinternal = new CRMSProp[TYPE_NAME](
353 |                 TYPED(c_params), decay_rate, eps, clip_norm, regc)
354 |             DEREF_RMSPROP(self).step_size = step_size
355 |             DEREF_RMSPROP(self).clip_abs = clip_abs
356 |         ypy
357 | 
358 |     def reset_caches(RMSProp self, list params):  # dtype-check params, then call the C++ reset_caches without the GIL
359 |         pypinline type_frepeat(pyp,
360 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
361 |         ypy
362 | 
363 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
364 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
365 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
366 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
367 |             with nogil:
368 |                 DEREF_RMSPROP(self).reset_caches(TYPED(c_params))
369 |         ypy
370 | 
371 |     def create_gradient_caches(RMSProp self, list params):  # dtype-check params, then call the C++ create_gradient_caches without the GIL
372 |         pypinline type_frepeat(pyp,
373 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
374 |         ypy
375 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
376 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
377 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
378 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
379 |             with nogil:
380 |                 DEREF_RMSPROP(self).create_gradient_caches(TYPED(c_params))
381 |         ypy
382 | 
383 |     def step(RMSProp self, list params, step_size = None):  # one update over params; step_size=None uses the solver's stored step_size
384 |         pypinline type_frepeat(pyp,
385 |         cdef TYPE_NAME TYPED(cstep_size)
386 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
387 |         ypy
388 | 
389 |         if step_size is not None:
390 |             pypinline typed_fexpression(pyp,
391 |                 TYPED(cstep_size) = step_size
392 |             ypy
393 |         else:
394 |             pypinline typed_fexpression(pyp,
395 |                 TYPED(cstep_size) = DEREF_RMSPROP(self).step_size
396 |             ypy
397 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
398 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
399 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
400 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
401 |             with nogil:
402 |                 DEREF_RMSPROP(self).step(TYPED(c_params), TYPED(cstep_size))
403 |         ypy
404 | 
405 | # Python wrapper around a heap-allocated C++ CAdaDelta[T] solver held through a void pointer; dtypeinternal records which T was instantiated.
406 | cdef class AdaDelta:
407 |     cdef void * solverinternal
408 |     cdef np.NPY_TYPES dtypeinternal
409 | 
410 |     property dtype:
411 |         def __get__(AdaDelta self):
412 |             return np.PyArray_DescrFromType(self.dtypeinternal)
413 |     # One read/write property per listed name, forwarding to the same-named field of the C++ solver. NOTE(review): the setters take a C float, so values are rounded to single precision before assignment -- confirm this is acceptable for non-float32 solvers.
414 | pyprepeat PROP_NAME in ['clip_abs', 'clip_norm', 'regc', 'smooth_eps', 'rho']
415 |     property PROP_NAME:
416 |         def __get__(AdaDelta self):
417 |             pypinline typed_fexpression(pyp,
418 |                 return DEREF_ADADELTA(self).PROP_NAME
419 |             ypy
420 | 
421 |         def __set__(AdaDelta self, float val):
422 |             pypinline typed_fexpression(pyp,
423 |                 DEREF_ADADELTA(self).PROP_NAME = val
424 |             ypy
425 | ypyrepeat
426 |     # Deletes the C++ solver with the GIL released, then nulls the pointer; a NULL pointer is skipped.
427 |     def __dealloc__(AdaDelta self):
428 |         pypinline type_frepeat(pyp,
429 |         cdef CAdaDelta[TYPE_NAME]* TYPED(ptr_internal)
430 |         ypy
431 |         if self.solverinternal != NULL:
432 |             pypinline typed_fexpression(pyp,
433 |                 TYPED(ptr_internal) = PTR_ADADELTA(self)
434 |                 with nogil:
435 |                     del TYPED(ptr_internal)
436 |             ypy
437 |             self.solverinternal = NULL
438 |     # Builds the C++ solver. The dtype comes from the dtype argument if given, else from params, else float32; a dtype argument that disagrees with params raises ValueError.
439 |     def __cinit__(AdaDelta self, params = None, float rho = 0.95, float eps = 1e-4, float clip_norm = 5.0, float clip_abs = 0.0, float regc = 0.0, dtype = None):
440 | 
441 |         pypinline type_frepeat(pyp,
442 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
443 |         ypy
444 |         self.dtypeinternal = np.NPY_NOTYPE
445 |         # get the dtype from kwargs
446 |         if dtype is not None:
447 |             self.dtypeinternal = np.dtype(dtype).num
448 |             ensure_fdtype(self.dtypeinternal)
449 | 
450 |         if params is not None and len(params) > 0:
451 |             pypinline typed_fexpression_list(pyp, "params", "Mat",
452 |                 TYPED(c_params) = TYPED(mats_to_vec)(params)
453 |                 if TYPED(c_params).size() > 0:
454 |                     if self.dtypeinternal == np.NPY_NOTYPE:
455 |                         self.dtypeinternal = TYPE_NPYINTERNAL
456 |                     else:
457 |                         if self.dtypeinternal != TYPE_NPYINTERNAL:
458 |                             raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
459 |             ypy
460 |         if self.dtypeinternal == np.NPY_NOTYPE:
461 |             self.dtypeinternal = np.NPY_FLOAT32
462 |         # Instantiate the typed solver; clip_abs is not passed to the constructor and is assigned on the new object afterwards.
463 |         pypinline typed_fexpression(pyp,
464 |             self.solverinternal = new CAdaDelta[TYPE_NAME](
465 |                 TYPED(c_params), rho, eps, clip_norm, regc)
466 |             DEREF_ADADELTA(self).clip_abs = clip_abs
467 |         ypy
468 |     # Calls the C++ solver's reset_caches on params (GIL released); raises ValueError if the parameter dtype differs from the solver's.
469 |     def reset_caches(AdaDelta self, list params):
470 |         pypinline type_frepeat(pyp,
471 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
472 |         ypy
473 | 
474 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
475 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
476 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
477 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
478 |             with nogil:
479 |                 DEREF_ADADELTA(self).reset_caches(TYPED(c_params))
480 |         ypy
481 |     # Calls the C++ solver's create_gradient_caches on params (GIL released); raises ValueError on a dtype mismatch.
482 |     def create_gradient_caches(AdaDelta self, list params):
483 |         pypinline type_frepeat(pyp,
484 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
485 |         ypy
486 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
487 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
488 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
489 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
490 |             with nogil:
491 |                 DEREF_ADADELTA(self).create_gradient_caches(TYPED(c_params))
492 |         ypy
493 |     # Calls the C++ solver's step on params (GIL released); raises ValueError on a dtype mismatch.
494 |     def step(AdaDelta self, list params):
495 |         pypinline type_frepeat(pyp,
496 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
497 |         ypy
498 | 
499 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
500 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
501 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
502 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
503 |             with nogil:
504 |                 DEREF_ADADELTA(self).step(TYPED(c_params))
505 |         ypy
506 | 
507 | # Python wrapper around a heap-allocated C++ CAdam[T] solver held through a void pointer; dtypeinternal records which T was instantiated.
508 | cdef class Adam:
509 |     cdef void * solverinternal
510 |     cdef np.NPY_TYPES dtypeinternal
511 | 
512 |     property dtype:
513 |         def __get__(Adam self):
514 |             return np.PyArray_DescrFromType(self.dtypeinternal)
515 |     # One read/write property per listed name, forwarding to the same-named field of the C++ solver. NOTE(review): the setters take a C float, so values are rounded to single precision before assignment -- confirm this is acceptable for non-float32 solvers.
516 | pyprepeat PROP_NAME in ['clip_abs', 'clip_norm', 'regc', 'smooth_eps', 'b1', 'b2', 'step_size']
517 |     property PROP_NAME:
518 |         def __get__(Adam self):
519 |             pypinline typed_fexpression(pyp,
520 |                 return DEREF_ADAM(self).PROP_NAME
521 |             ypy
522 | 
523 |         def __set__(Adam self, float val):
524 |             pypinline typed_fexpression(pyp,
525 |                 DEREF_ADAM(self).PROP_NAME = val
526 |             ypy
527 | ypyrepeat
528 |     # The C++ solver's epoch field; the setter accepts an unsigned long long.
529 |     property epoch:
530 |         def __get__(Adam self):
531 |             pypinline typed_fexpression(pyp,
532 |                 return DEREF_ADAM(self).epoch
533 |             ypy
534 | 
535 |         def __set__(Adam self, unsigned long long val):
536 |             pypinline typed_fexpression(pyp,
537 |                 DEREF_ADAM(self).epoch = val
538 |             ypy
539 |     # Deletes the C++ solver with the GIL released, then nulls the pointer; a NULL pointer is skipped.
540 |     def __dealloc__(Adam self):
541 |         pypinline type_frepeat(pyp,
542 |         cdef CAdam[TYPE_NAME]* TYPED(ptr_internal)
543 |         ypy
544 |         if self.solverinternal != NULL:
545 |             pypinline typed_fexpression(pyp,
546 |                 TYPED(ptr_internal) = PTR_ADAM(self)
547 |                 with nogil:
548 |                     del TYPED(ptr_internal)
549 |             ypy
550 |             self.solverinternal = NULL
551 |     # Builds the C++ solver. The dtype comes from the dtype argument if given, else from params, else float32; a dtype argument that disagrees with params raises ValueError.
552 |     def __cinit__(Adam self, params = None, float step_size = 0.0002, float b1 = 0.5, float b2 = 1e-6, float eps = 1e-4, float clip_norm = 5.0, float clip_abs = 0.0, float regc = 0.0, dtype = None):
553 |         pypinline type_frepeat(pyp,
554 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
555 |         ypy
556 |         self.dtypeinternal = np.NPY_NOTYPE
557 |         # get the dtype from kwargs
558 |         if dtype is not None:
559 |             self.dtypeinternal = np.dtype(dtype).num
560 |             ensure_fdtype(self.dtypeinternal)
561 | 
562 |         if params is not None and len(params) > 0:
563 |             pypinline typed_fexpression_list(pyp, "params", "Mat",
564 |                 TYPED(c_params) = TYPED(mats_to_vec)(params)
565 |                 if TYPED(c_params).size() > 0:
566 |                     if self.dtypeinternal == np.NPY_NOTYPE:
567 |                         self.dtypeinternal = TYPE_NPYINTERNAL
568 |                     else:
569 |                         if self.dtypeinternal != TYPE_NPYINTERNAL:
570 |                             raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
571 |             ypy
572 |         if self.dtypeinternal == np.NPY_NOTYPE:
573 |             self.dtypeinternal = np.NPY_FLOAT32
574 |         # Instantiate the typed solver; clip_abs is not passed to the constructor and is assigned on the new object afterwards.
575 |         pypinline typed_fexpression(pyp,
576 |             self.solverinternal = new CAdam[TYPE_NAME](
577 |                 TYPED(c_params), step_size, b1, b2, eps, clip_norm, regc)
578 |             DEREF_ADAM(self).clip_abs = clip_abs
579 |         ypy
580 |     # Calls the C++ solver's reset_caches on params (GIL released); raises ValueError if the parameter dtype differs from the solver's.
581 |     def reset_caches(Adam self, list params):
582 |         pypinline type_frepeat(pyp,
583 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
584 |         ypy
585 | 
586 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
587 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
588 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
589 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
590 |             with nogil:
591 |                 DEREF_ADAM(self).reset_caches(TYPED(c_params))
592 |         ypy
593 |     # Calls the C++ solver's create_gradient_caches on params (GIL released); raises ValueError on a dtype mismatch.
594 |     def create_gradient_caches(Adam self, list params):
595 |         pypinline type_frepeat(pyp,
596 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
597 |         ypy
598 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
599 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
600 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
601 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
602 |             with nogil:
603 |                 DEREF_ADAM(self).create_gradient_caches(TYPED(c_params))
604 |         ypy
605 |     # Calls the C++ solver's step on params (GIL released); raises ValueError on a dtype mismatch.
606 |     def step(Adam self, list params):
607 |         pypinline type_frepeat(pyp,
608 |         cdef vector[CMat[TYPE_NAME]] TYPED(c_params)
609 |         ypy
610 | 
611 |         pypinline typed_fexpression_list(pyp, "params", "Mat",
612 |             TYPED(c_params) = TYPED(mats_to_vec)(params)
613 |             if self.dtypeinternal != TYPE_NPYINTERNAL:
614 |                 raise ValueError("Invalid dtype for parameters: " + str(params[0].dtype) + ", when solver is " + str(self.dtype))
615 |             with nogil:
616 |                 DEREF_ADAM(self).step(TYPED(c_params))
617 |         ypy
618 | 
619 | 


--------------------------------------------------------------------------------
/cython/dali/core/tensor/Tape.pyx:
--------------------------------------------------------------------------------
 1 | from cpython.ref cimport PyObject
 2 | 
 3 | cdef extern from "core/tensor/python_tape.h" nogil:
 4 |     void emplace_back(PyObject* callback)
 5 | 
 6 | cdef extern from "dali/tensor/Tape.h" namespace "graph" nogil:
 7 |     void backward() except+
 8 |     bint backprop_enabled()
 9 |     void clear()
10 |     void _set_backprop_enabled(bint value);
11 |     size_t size();
12 | # Static-method facade over the C++ tape functions of namespace "graph" and the Python-callback hook from python_tape.h.
13 | class Graph:
14 |     @staticmethod
15 |     def emplace_back(backprop):
16 |         # Appends the Python callable `backprop` to the tape. The C++ helper takes a new reference
17 |         # to it (Py_XINCREF), so the call is made with the GIL held rather than under `with nogil`.
18 |         emplace_back(<PyObject*>backprop)
19 |     # Calls graph::backward(); C++ exceptions are translated into Python exceptions (declared except+).
20 |     @staticmethod
21 |     def backward():
22 |         backward()
23 |     # Calls graph::clear() on the C++ tape.
24 |     @staticmethod
25 |     def clear():
26 |         clear()
27 |     # Returns the flag reported by graph::backprop_enabled().
28 |     @staticmethod
29 |     def backprop_enabled():
30 |         return backprop_enabled()
31 |     # Returns graph::size() (presumably the number of recorded tape entries -- confirm against Tape.h).
32 |     @staticmethod
33 |     def size():
34 |         return size()
35 | 
36 | 
37 | cdef class NoBackprop:
38 |     """Context manager that turns backprop off for the duration of a ``with`` block.
39 | 
40 |     Constructed with ``enabled=False`` it does nothing at all. Otherwise the
41 |     backprop flag seen on entry is saved and written back on exit.
42 |     """
43 |     cdef bint old_value
44 |     cdef bint _enabled
45 | 
46 |     def __cinit__(NoBackprop self, enabled=True):
47 |         self._enabled = enabled
48 | 
49 |     def __enter__(NoBackprop self):
50 |         # Inactive manager: leave the global flag untouched.
51 |         if not self._enabled:
52 |             return
53 |         self.old_value = Graph.backprop_enabled()
54 |         _set_backprop_enabled(False)
55 | 
56 |     def __exit__(NoBackprop self, *exc_info, **extra):
57 |         # Only restore what __enter__ actually saved.
58 |         if not self._enabled:
59 |             return
60 |         _set_backprop_enabled(self.old_value)
61 | 
62 | 


--------------------------------------------------------------------------------
/cython/dali/core/tensor/matrix_initializations.cpp:
--------------------------------------------------------------------------------
 1 | #include "dali/tensor/Weights.h"
 2 | 
 3 | #include "matrix_initializations.h"
 4 | 
 5 | // Factory functions returning Mat<R> objects allocated with `new`; the caller
 6 | // receives the raw pointer. Each initializer-based factory pairs the requested
 7 | // shape with the matching weights<R> initializer.
 8 | 
 9 | // rows x cols matrix built with weights<R>::uniform(low, high).
10 | template<typename R>
11 | Mat<R>* matrix_initializations<R>::uniform(R low, R high, int rows, int cols) {
12 |     return new Mat<R>(rows, cols, weights<R>::uniform(low, high));
13 | }
14 | 
15 | // rows x cols matrix built with weights<R>::gaussian(mean, std).
16 | template<typename R>
17 | Mat<R>* matrix_initializations<R>::gaussian(R mean, R std, int rows, int cols) {
18 |     return new Mat<R>(rows, cols, weights<R>::gaussian(mean, std));
19 | }
20 | 
21 | // rows x cols matrix built with weights<R>::bernoulli(prob).
22 | template<typename R>
23 | Mat<R>* matrix_initializations<R>::bernoulli(R prob, int rows, int cols) {
24 |     return new Mat<R>(rows, cols, weights<R>::bernoulli(prob));
25 | }
26 | 
27 | // rows x cols matrix built with weights<R>::bernoulli_normalized(prob).
28 | template<typename R>
29 | Mat<R>* matrix_initializations<R>::bernoulli_normalized(R prob, int rows, int cols) {
30 |     return new Mat<R>(rows, cols, weights<R>::bernoulli_normalized(prob));
31 | }
32 | 
33 | // width x width matrix built with weights<R>::eye(diag).
34 | template<typename R>
35 | Mat<R>* matrix_initializations<R>::eye(R diag, int width) {
36 |     return new Mat<R>(width, width, weights<R>::eye(diag));
37 | }
38 | 
39 | // rows x cols matrix built with weights<R>::empty().
40 | template<typename R>
41 | Mat<R>* matrix_initializations<R>::empty(int rows, int cols) {
42 |     return new Mat<R>(rows, cols, weights<R>::empty());
43 | }
44 | 
45 | // rows x cols matrix built with weights<R>::ones().
46 | template<typename R>
47 | Mat<R>* matrix_initializations<R>::ones(int rows, int cols) {
48 |     return new Mat<R>(rows, cols, weights<R>::ones());
49 | }
50 | 
51 | // rows x cols matrix built with weights<R>::zeros().
52 | template<typename R>
53 | Mat<R>* matrix_initializations<R>::zeros(int rows, int cols) {
54 |     return new Mat<R>(rows, cols, weights<R>::zeros());
55 | }
56 | 
57 | // rows x cols matrix whose CPU storage pointer is set to `ptr` (no copy is
58 | // made here). NOTE(review): who owns and frees `ptr` is not visible in this
59 | // file -- confirm against the SynchronizedMemory implementation.
60 | template<typename R>
61 | Mat<R>* matrix_initializations<R>::from_pointer(R* ptr, int rows, int cols) {
62 |     Mat<R>* wrapped = new Mat<R>(rows, cols);
63 |     if ((rows * cols) <= 0) {
64 |         // Nothing to point at: return the freshly constructed matrix as is.
65 |         return wrapped;
66 |     }
67 |     // Not actually allocated memory: the storage is redirected to the
68 |     // caller's buffer and flagged as allocated and fresh on the CPU.
69 |     wrapped->w().memory().cpu_ptr       = ptr;
70 |     wrapped->w().memory().allocated_cpu = true;
71 |     wrapped->w().memory().cpu_fresh     = true;
72 |     wrapped->w().memory().total_memory  = rows * cols;
73 |     return wrapped;
74 | }
75 | 
76 | // Heap-allocated Mat copy-constructed from `matrix`.
77 | template<typename R>
78 | Mat<R>* matrix_initializations<R>::as_pointer(const Mat<R>& matrix) {
79 |     return new Mat<R>(matrix);
80 | }
81 | 
82 | 
83 | // Explicit instantiations for the element types used by the bindings.
84 | template struct matrix_initializations<float>;
85 | template struct matrix_initializations<double>;
86 | template struct matrix_initializations<int>;
87 | 


--------------------------------------------------------------------------------
/cython/dali/core/tensor/matrix_initializations.h:
--------------------------------------------------------------------------------
 1 | #ifndef DALI_TENSOR_MATRIX_INITIALIZATIONS_H
 2 | #define DALI_TENSOR_MATRIX_INITIALIZATIONS_H
 3 | 
 4 | #include "dali/tensor/Mat.h"
 5 | 
 6 | // Static factories that return Mat<R> objects allocated with `new`
 7 | // (definitions and explicit instantiations live in matrix_initializations.cpp).
 8 | template<typename R>
 9 | struct matrix_initializations {
10 |     // Initializer-based factories.
11 |     static Mat<R>* uniform(R low, R high, int rows, int cols);
12 |     static Mat<R>* gaussian(R mean, R std, int rows, int cols);
13 |     static Mat<R>* bernoulli(R prob, int rows, int cols);
14 |     static Mat<R>* bernoulli_normalized(R prob, int rows, int cols);
15 |     static Mat<R>* eye(R diag, int width);
16 |     static Mat<R>* empty(int rows, int cols);
17 |     static Mat<R>* ones(int rows, int cols);
18 |     static Mat<R>* zeros(int rows, int cols);
19 | 
20 |     // Factories built from existing data: an external buffer, or another Mat.
21 |     static Mat<R>* from_pointer(R* ptr, int rows, int cols);
22 |     static Mat<R>* as_pointer(const Mat<R>& matrix);
23 | };
24 | 
25 | #endif
26 | 
27 | 


--------------------------------------------------------------------------------
/cython/dali/core/tensor/python_tape.cpp:
--------------------------------------------------------------------------------
 1 | #include "python_tape.h"
 2 | 
 3 | #include <memory>
 4 | #include <stdexcept>
 5 | #include "dali/tensor/Tape.h"
 6 | 
 7 | // Scoped GIL acquisition. PyGILState_Ensure may be called whether or not the
 8 | // current thread already holds the GIL, so this is safe on every call path.
 9 | class GilGuard {
10 |     public:
11 |         GilGuard() : state(PyGILState_Ensure()) {}
12 |         ~GilGuard() { PyGILState_Release(state); }
13 |         GilGuard(const GilGuard&) = delete;
14 |         GilGuard& operator=(const GilGuard&) = delete;
15 |     private:
16 |         PyGILState_STATE state;
17 | };
18 | 
19 | // Owns one strong reference to a Python object for as long as the holder lives.
20 | // Reference counts are only touched while the GIL is held.
21 | class PyObjectHolder {
22 |     public:
23 |         PyObject * pyobject;
24 |         PyObjectHolder(PyObject* _pyobject) : pyobject(_pyobject) {
25 |             GilGuard gil;
26 |             Py_XINCREF(pyobject);
27 |         }
28 |         ~PyObjectHolder() {
29 |             // After interpreter shutdown the object can no longer be released
30 |             // safely; leaking the reference is preferable to crashing at exit.
31 |             if (!Py_IsInitialized()) {
32 |                 return;
33 |             }
34 |             GilGuard gil;
35 |             Py_XDECREF(pyobject);
36 |         }
37 |         // A copy would release the same reference twice.
38 |         PyObjectHolder(const PyObjectHolder&) = delete;
39 |         PyObjectHolder& operator=(const PyObjectHolder&) = delete;
40 | };
41 | 
42 | // Appends a tape entry that calls `callback` with no arguments.
43 | // The callable is kept alive by a shared holder captured in the tape entry.
44 | // If the call raises, the Python error indicator is left set and a
45 | // std::runtime_error("Error in callback") is thrown to unwind the C++ caller.
46 | void emplace_back(PyObject * callback) {
47 |     auto callback_holder = std::make_shared<PyObjectHolder>(callback);
48 | 
49 |     graph::emplace_back([callback_holder]() {
50 |         GilGuard gil;
51 |         // A NULL argument tuple means "call with no arguments".
52 |         PyObject* result = PyObject_CallObject(callback_holder->pyobject, NULL);
53 |         if (result == NULL) {
54 |             throw std::runtime_error("Error in callback");
55 |         }
56 |         Py_DECREF(result);
57 |     });
58 | }
59 | 


--------------------------------------------------------------------------------
/cython/dali/core/tensor/python_tape.h:
--------------------------------------------------------------------------------
 1 | #ifndef DALI_TENSOR_PYTHON_TAPE_H
 2 | #define DALI_TENSOR_PYTHON_TAPE_H
 3 | 
 4 | #include "Python.h"
 5 | #include <functional>
 6 | // Appends a tape entry that calls the Python callable `callback` with no arguments; a reference to it is held by that entry (see python_tape.cpp).
 7 | void emplace_back(PyObject * callback);
 8 | 
 9 | #endif
10 | 


--------------------------------------------------------------------------------
/cython/dali/core/tensor/random.pyx.pre:
--------------------------------------------------------------------------------
  1 | pyp
  2 | from preprocessor_utils import typed_expression, typed_expression_args
  3 | ypy
  4 | 
  5 | cdef extern from "core/tensor/matrix_initializations.h" nogil:
  6 |     cdef cppclass matrix_initializations [T]:
  7 |         @staticmethod
  8 |         CMat[T] uniform(T low, T high, int rows, int cols)
  9 |         @staticmethod
 10 |         CMat[T] gaussian(T mean, T std, int rows, int cols)
 11 |         @staticmethod
 12 |         CMat[T] eye(T diag, int width)
 13 |         @staticmethod
 14 |         CMat[T] bernoulli(T prob, int rows, int cols)
 15 |         @staticmethod
 16 |         CMat[T] bernoulli_normalized(T prob, int rows, int cols)
 17 |         @staticmethod
 18 |         CMat[T] empty(int rows, int cols)
 19 | 
 20 | 
 21 | class random:
 22 |     """Factories for randomly initialised Mat objects.
 23 | 
 24 |     ``size`` is either an int, giving a ``size x 1`` matrix, or a list/tuple of
 25 |     exactly two entries ``(rows, cols)``. The length check applies to lists and
 26 |     tuples alike; any other ``size`` raises ValueError. ``dtype`` is forwarded
 27 |     to the Mat constructor and selects the typed initializer that is used.
 28 |     """
 29 |     @staticmethod
 30 |     def uniform(low = 0, high = 1, size=None, dtype=None):
 31 |         """Mat initialised by matrix_initializations.uniform(low, high, ...)."""
 32 |         cdef Mat output = Mat(0,0, dtype=dtype)
 33 |         cdef bint error = False
 34 |         pypinline typed_expression_args(pyp, ["output"],
 35 |             if (type(size) == list or type(size) == tuple) and len(size) == 2:
 36 |                 output.matinternal = matrix_initializations[TYPE_NAME].uniform(low, high, size[0], size[1])
 37 |             elif type(size) == int:
 38 |                 output.matinternal = matrix_initializations[TYPE_NAME].uniform(low, high, size, 1)
 39 |             else:
 40 |                 error = True
 41 |         ypy
 42 |         if error:
 43 |             raise ValueError("size must be of type int, tuple, or list")
 44 |         return output
 45 | 
 46 |     @staticmethod
 47 |     def normal(loc=0, scale=1, size=None, dtype=None):
 48 |         """Mat initialised by matrix_initializations.gaussian(loc, scale, ...)."""
 49 |         cdef Mat output = Mat(0,0, dtype=dtype)
 50 |         cdef bint error = False
 51 |         pypinline typed_expression_args(pyp, ["output"],
 52 |             if (type(size) == list or type(size) == tuple) and len(size) == 2:
 53 |                 output.matinternal = matrix_initializations[TYPE_NAME].gaussian(loc, scale, size[0], size[1])
 54 |             elif type(size) == int:
 55 |                 output.matinternal = matrix_initializations[TYPE_NAME].gaussian(loc, scale, size, 1)
 56 |             else:
 57 |                 error = True
 58 |         ypy
 59 |         if error:
 60 |             raise ValueError("size must be of type int, tuple, or list")
 61 |         return output
 62 | 
 63 |     @staticmethod
 64 |     def standard_normal(size=None, dtype=None):
 65 |         """Mat initialised by matrix_initializations.gaussian(0, 1, ...)."""
 66 |         cdef Mat output = Mat(0,0, dtype=dtype)
 67 |         cdef bint error = False
 68 |         pypinline typed_expression_args(pyp, ["output"],
 69 |             if (type(size) == list or type(size) == tuple) and len(size) == 2:
 70 |                 output.matinternal = matrix_initializations[TYPE_NAME].gaussian(0, 1, size[0], size[1])
 71 |             elif type(size) == int:
 72 |                 output.matinternal = matrix_initializations[TYPE_NAME].gaussian(0, 1, size, 1)
 73 |             else:
 74 |                 error = True
 75 |         ypy
 76 |         if error:
 77 |             raise ValueError("size must be of type int, tuple, or list")
 78 |         return output
 79 | 
 80 |     @staticmethod
 81 |     def bernoulli(prob, size=None, dtype=None):
 82 |         """Mat initialised by matrix_initializations.bernoulli(prob, ...)."""
 83 |         cdef Mat output = Mat(0,0, dtype=dtype)
 84 |         cdef bint error = False
 85 |         pypinline typed_expression_args(pyp, ["output"],
 86 |             if (type(size) == list or type(size) == tuple) and len(size) == 2:
 87 |                 output.matinternal = matrix_initializations[TYPE_NAME].bernoulli(prob, size[0], size[1])
 88 |             elif type(size) == int:
 89 |                 output.matinternal = matrix_initializations[TYPE_NAME].bernoulli(prob, size, 1)
 90 |             else:
 91 |                 error = True
 92 |         ypy
 93 |         if error:
 94 |             raise ValueError("size must be of type int, tuple, or list")
 95 |         return output
 96 | 
 97 |     @staticmethod
 98 |     def bernoulli_normalized(prob, size=None, dtype=None):
 99 |         """Mat initialised by matrix_initializations.bernoulli_normalized(prob, ...)."""
100 |         cdef Mat output = Mat(0,0, dtype=dtype)
101 |         cdef bint error = False
102 |         pypinline typed_expression_args(pyp, ["output"],
103 |             if (type(size) == list or type(size) == tuple) and len(size) == 2:
104 |                 output.matinternal = matrix_initializations[TYPE_NAME].bernoulli_normalized(prob, size[0], size[1])
105 |             elif type(size) == int:
106 |                 output.matinternal = matrix_initializations[TYPE_NAME].bernoulli_normalized(prob, size, 1)
107 |             else:
108 |                 error = True
109 |         ypy
110 |         if error:
111 |             raise ValueError("size must be of type int, tuple, or list")
112 |         return output
113 | 


--------------------------------------------------------------------------------
/cython/dali/core/utils/config.pyx:
--------------------------------------------------------------------------------
 1 | cdef extern from "dali/math/SynchronizedMemory.h":
 2 |     cdef enum Device:
 3 |         DEVICE_GPU,
 4 |         DEVICE_CPU
 5 |     Device default_preferred_device
 6 | 
 7 | cdef extern from "core/math/memory_bank/MemoryBankWrapper.h":
 8 |     cdef cppclass MemoryBankWrapper [T]:
 9 |         @staticmethod
10 |         void clear_cpu()
11 | 
12 |         @staticmethod
13 |         void clear_gpu() except +
14 | 
15 | cdef extern from "core/utils/cpp_utils.h" nogil:
16 |     void set_default_gpu(int) except +
17 |     string get_gpu_name(int device) except +
18 |     int num_gpus() except +
19 | # Settings object for Dali: GPU selection, default device and memory-bank clearing. A single instance is created below as `config`.
20 | cdef class Config:
21 |     property num_gpus:  # value returned by the C++ num_gpus()
22 |         def __get__(self):
23 |             return num_gpus()
24 |     # Write-only property: passes the device index to the C++ set_default_gpu().
25 |     property default_gpu:
26 |         def __set__(self, int device):
27 |             set_default_gpu(device)
28 |     # Returns the result of the C++ get_gpu_name() for the given device index.
29 |     def gpu_id_to_name(self, int device_id):
30 |         return get_gpu_name(device_id)
31 |     # The C++ global default_preferred_device, exposed as the string 'cpu' or 'gpu'.
32 |     property default_device:
33 |         def __get__(self):
34 |             global default_preferred_device
35 |             if default_preferred_device == DEVICE_CPU:
36 |                 return 'cpu'
37 |             elif default_preferred_device == DEVICE_GPU:
38 |                 return 'gpu'
39 |             else:
40 |                 raise ValueError("default_preferred_device is not set correctly.")
41 |         # Accepts 'cpu' or 'gpu' in any letter case; other strings raise ValueError and non-str values fail the assertion.
42 |         def __set__(self, device):
43 |             assert(type(device) == str), "Device must be a string (gpu, cpu)."
44 |             global default_preferred_device
45 |             if device.lower() == 'cpu':
46 |                 default_preferred_device = DEVICE_CPU
47 |             elif device.lower() == 'gpu':
48 |                 default_preferred_device = DEVICE_GPU
49 |             else:
50 |                 raise ValueError("Device must be one of cpu, gpu.")
51 |     # Calls MemoryBankWrapper<T>::clear_gpu() for the T matching dtype (float32, float64 or int32); any other dtype raises ValueError.
52 |     def clear_gpu(self, dtype=np.float32):
53 |         if dtype == np.float32:
54 |             MemoryBankWrapper["float"].clear_gpu()
55 |         elif dtype == np.float64:
56 |             MemoryBankWrapper["double"].clear_gpu()
57 |         elif dtype == np.int32:
58 |             MemoryBankWrapper["int"].clear_gpu()
59 |         else:
60 |             raise ValueError("dtype must be one of np.float32, np.float64, or np.int32")
61 |     # Calls MemoryBankWrapper<T>::clear_cpu() for the T matching dtype (float32, float64 or int32); any other dtype raises ValueError.
62 |     def clear_cpu(self, dtype=np.float32):
63 |         if dtype == np.float32:
64 |             MemoryBankWrapper["float"].clear_cpu()
65 |         elif dtype == np.float64:
66 |             MemoryBankWrapper["double"].clear_cpu()
67 |         elif dtype == np.int32:
68 |             MemoryBankWrapper["int"].clear_cpu()
69 |         else:
70 |             raise ValueError("dtype must be one of np.float32, np.float64, or np.int32")
71 | 
72 | 
73 | config = Config()
74 | 
75 | __all__ = [ 'config' ]
76 | 


--------------------------------------------------------------------------------
/cython/dali/core/utils/core_utils.pyx:
--------------------------------------------------------------------------------
  1 | from libcpp11.unordered_map cimport unordered_map
  2 | 
  3 | # source : https://github.com/cython/cython/blob/master/Cython/Includes/libcpp/unordered_map.pxd
  4 | 
  5 | cdef extern from "core/utils/cpp_utils.h" nogil:
  6 |     void print_str(string)
  7 | 
  8 | cdef extern from "dali/utils/random.h" namespace "utils::random" nogil:
  9 |     void reseed()
 10 |     void set_seed(int)
 11 | 
 12 | cdef extern from "dali/utils/random.h" namespace "utils" nogil:
 13 |     double randdouble(double, double)
 14 |     int randint(int,int)
 15 | 
 16 | cdef extern from "dali/utils/core_utils.h" namespace "utils" nogil:
 17 |     string cpp_trim "utils::trim" (string)
 18 |     string cpp_ltrim "utils::ltrim" (string)
 19 |     string cpp_rtrim "utils::rtrim" (string)
 20 | 
 21 |     const char* c_end_symbol "utils::end_symbol"
 22 | 
 23 |     cdef cppclass CVocab "utils::Vocab":
 24 |         unordered_map[string, unsigned int] word2index
 25 |         vector[string] index2word
 26 |         size_t size() const
 27 |         unsigned int unknown_word
 28 |         CVocab()
 29 |         CVocab(vector[string]&)
 30 |         CVocab(vector[string]&, bint unknown_word)
 31 | # Namespace class bundling the string-trimming and random-number helpers implemented in C++.
 32 | class utils:
 33 |     end_symbol = c_end_symbol.decode("utf-8")
 34 | 
 35 |     @staticmethod
 36 |     def trim(s):
 37 |         """Trim a string, remove whitespace on either side"""
 38 |         cdef string s_norm = normalize_s(s)
 39 |         return cpp_trim(s_norm)
 40 |     # Returns the int produced by the C++ utils::randint(low, high); the call runs with the GIL released.
 41 |     @staticmethod
 42 |     def randint(int low=0, int high=1):
 43 |         cdef int out
 44 |         with nogil:
 45 |             out = randint(low,high)
 46 |         return out
 47 |     # Returns the double produced by the C++ utils::randdouble(low, high). The bounds are declared as doubles, matching the C++ signature, so they are not rounded to single precision on the way in.
 48 |     @staticmethod
 49 |     def randdouble(double low=0.0, double high=1.0):
 50 |         cdef double out
 51 |         with nogil:
 52 |             out = randdouble(low,high)
 53 |         return out
 54 |     # Calls the C++ utils::random::reseed() with the GIL released.
 55 |     @staticmethod
 56 |     def reseed():
 57 |         with nogil:
 58 |             reseed()
 59 |     # Passes newseed to the C++ utils::random::set_seed() with the GIL released.
 60 |     @staticmethod
 61 |     def set_seed(int newseed):
 62 |         with nogil:
 63 |             set_seed(newseed)
 64 | 
 65 |     @staticmethod
 66 |     def rtrim(s):
 67 |         """Trim right-side of a string."""
 68 |         cdef string s_norm = normalize_s(s)
 69 |         return cpp_rtrim(s_norm)
 70 | 
 71 |     @staticmethod
 72 |     def ltrim(s):
 73 |         """Trim left-side of a string."""
 74 |         cdef string s_norm = normalize_s(s)
 75 |         return cpp_ltrim(s_norm)
 76 | # Encodes every word of a Python list as UTF-8 and collects the results in a C++ vector of strings.
 77 | cdef vector[string] list_string_to_vector(list words):
 78 |     cdef vector[string] out
 79 |     for word in words:
 80 |         out.push_back(word.encode("utf-8"))
 81 |     return out
 82 | # Inverse of the above: decodes every C++ string as UTF-8 into a new Python list.
 83 | cdef list vector_string_to_list(vector[string]& words):
 84 |     out = []
 85 |     for word in words:
 86 |         out.append(word.decode("utf-8"))
 87 |     return out
 88 | # Copies a C++ word -> index map into a Python dict, decoding the keys from UTF-8.
 89 | cdef dict unordered_map_string_to_dict(unordered_map[string, unsigned int]& word2index):
 90 |     word2index_dict = {}
 91 |     for pair in word2index:
 92 |         word2index_dict[pair.first.decode("utf-8")] = pair.second
 93 |     return word2index_dict
 94 | # Copies a Python word -> index dict into a C++ unordered_map, encoding the keys as UTF-8.
 95 | cdef unordered_map[string, unsigned int] dict_string_to_unordered_map(dict word2index):
 96 |     cdef unordered_map[string, unsigned int] word2index_map
 97 |     for key, value in word2index.items():
 98 |         word2index_map[key.encode("utf-8")] = value
 99 |     return word2index_map
100 | 
101 | cdef class Vocab:
102 |     """
103 |     Vocab
104 |     -----
105 | 
106 |     Holds a mapping between words and indices.
107 |     Wraps the C++ utils::Vocab: int keys address index2word, str keys address word2index.
108 |     """
109 |     cdef CVocab vocabinternal
110 |     def __cinit__(self, list words = [], bint unknown_word = True):
111 |         self.vocabinternal = CVocab(list_string_to_vector(words), unknown_word)
112 |     # Length is whatever the C++ Vocab::size() reports.
113 |     def __len__(self):
114 |         return self.vocabinternal.size()
115 |     # vocab[int] returns the word at that index (decoded from UTF-8); vocab[str] returns the index stored for that word; other key types raise TypeError. NOTE(review): both lookups use .at(); how an out-of-range lookup surfaces depends on the pxd declarations -- confirm.
116 |     def __getitem__(self, index):
117 |         if type(index) == int:
118 |             word = self.vocabinternal.index2word.at(index)
119 |             return word.decode("utf-8")
120 |         elif type(index) == str:
121 |             return self.vocabinternal.word2index.at(index.encode("utf-8"))
122 |         else:
123 |             raise TypeError("Vocab only get items using int or str as keys.")
124 |     # vocab[int] = word overwrites index2word[int] (IndexError outside 0..len-1); vocab[str] = index writes word2index[str]. Each branch updates only its own table.
125 |     def __setitem__(self, index, value):
126 |         if type(index) == int:
127 |             if index < 0:
128 |                 raise IndexError("list index must be positive")
129 |             if index >= self.vocabinternal.index2word.size():
130 |                 raise IndexError("list index out of range")
131 |             self.vocabinternal.index2word[index] = value.encode("utf-8")
132 |         elif type(index) == str:
133 |             self.vocabinternal.word2index[index.encode("utf-8")] = value
134 |         else:
135 |             raise TypeError("Vocab only sets items using int or str as keys.")
136 |     # Integer stored in the C++ Vocab's unknown_word field.
137 |     property unknown_word:
138 |         def __get__(self):
139 |             return self.vocabinternal.unknown_word
140 | 
141 |         def __set__(self, int value):
142 |             self.vocabinternal.unknown_word = value
143 |     # Reading returns a new list copied from the C++ index2word vector; assigning replaces the whole vector.
144 |     property index2word:
145 |         def __get__(self):
146 |             return vector_string_to_list(self.vocabinternal.index2word)
147 | 
148 |         def __set__(self, list words):
149 |             self.vocabinternal.index2word = list_string_to_vector(words)
150 |     # Reading returns a new dict copied from the C++ word2index map; assigning replaces the whole map.
151 |     property word2index:
152 |         def __get__(self):
153 |             return unordered_map_string_to_dict(self.vocabinternal.word2index)
154 | 
155 |         def __set__(self, dict words):
156 |             self.vocabinternal.word2index = dict_string_to_unordered_map(words)
157 | 


--------------------------------------------------------------------------------
/cython/dali/core/utils/cpp_utils.cpp:
--------------------------------------------------------------------------------
 1 | #include "cpp_utils.h"
 2 | 
 3 | #include <iostream>
 4 | #include <stdexcept>
 5 | #include <string>
 6 | #include <dali/math/SynchronizedMemory.h>
 7 | 
 8 | // Writes `s` followed by a newline to std::cout (std::endl also flushes).
 9 | void print_str(std::string s )  {
10 |     std::cout << s << std::endl;
11 | }
12 | 
13 | // Forwards to gpu_utils::set_default_gpu when built with DALI_USE_CUDA;
14 | // otherwise throws std::runtime_error.
15 | void set_default_gpu(int gpu_id) {
16 |     #ifdef DALI_USE_CUDA
17 |         gpu_utils::set_default_gpu(gpu_id);
18 |     #else
19 |         throw std::runtime_error("Dali when compiled without cuda cannot set default GPU.");
20 |     #endif
21 | }
22 | 
23 | // Returns gpu_utils::get_gpu_name(device) when built with DALI_USE_CUDA;
24 | // otherwise throws std::runtime_error.
25 | std::string get_gpu_name(int device) {
26 |     #ifdef DALI_USE_CUDA
27 |         return gpu_utils::get_gpu_name(device);
28 |     #else
29 |         throw std::runtime_error("Dali when compiled without cuda cannot get GPU name.");
30 |     #endif
31 | }
32 | 
33 | // Returns gpu_utils::num_gpus() when built with DALI_USE_CUDA;
34 | // otherwise throws std::runtime_error.
35 | int num_gpus() {
36 |     #ifdef DALI_USE_CUDA
37 |         return gpu_utils::num_gpus();
38 |     #else
39 |         throw std::runtime_error("Dali when compiled without cuda cannot get the number of GPUs.");
40 |     #endif
41 | }
42 | 


--------------------------------------------------------------------------------
/cython/dali/core/utils/cpp_utils.h:
--------------------------------------------------------------------------------
 1 | #ifndef UTILS_CPP_UTILS_H
 2 | #define UTILS_CPP_UTILS_H
 3 | 
 4 | #include <string>
 5 | #include <dali/utils/gpu_utils.h>
 6 | 
// Prints `s` followed by a newline on standard output.
void print_str(std::string s);

// GPU helpers. Each forwards to the gpu_utils function of the same name when
// the library is built with DALI_USE_CUDA, and throws std::runtime_error
// otherwise.
void set_default_gpu(int);
std::string get_gpu_name(int device);
int num_gpus();
12 | 
13 | #endif
14 | 
15 | 


--------------------------------------------------------------------------------
/dali/__init__.py:
--------------------------------------------------------------------------------
1 | import dali.utils
2 | import dali.data
3 | 
4 | from .beam_search import *
5 | 


--------------------------------------------------------------------------------
/dali/activation.py:
--------------------------------------------------------------------------------
 1 | """
 2 | The point of this file is to make those
 3 | functions pickle friendly
 4 | """
 5 | from dali.core import MatOps as ops
 6 | 
 7 | class tanh_object(object):
 8 |     def __call__(self, *args, **kwargs):
 9 |         return ops.tanh(*args, **kwargs)
10 | 
class relu_object(object):
    """Callable object that forwards every call to ``ops.relu``."""

    def __call__(self, *positional, **named):
        result = ops.relu(*positional, **named)
        return result
14 | 
class sigmoid_object(object):
    """Callable object that forwards every call to ``ops.sigmoid``."""

    def __call__(self, *positional, **named):
        result = ops.sigmoid(*positional, **named)
        return result
18 | 
class identity_object(object):
    """Callable object that returns its single positional argument unchanged."""

    def __call__(self, *positional, **named):
        # Exactly one positional argument and no keyword arguments are accepted.
        assert len(positional) == 1
        assert len(named) == 0
        only_argument = positional[0]
        return only_argument
24 | 
# Module-level singletons: these instances (rather than bare functions) are
# what callers import, in line with the module docstring's pickling goal.
tanh     = tanh_object()
relu     = relu_object()
sigmoid  = sigmoid_object()
identity = identity_object()

# Only the singleton instances are exported; the *_object classes are not.
__all__ = ["tanh", "relu", "sigmoid", "identity"]
31 | 


--------------------------------------------------------------------------------
/dali/beam_search.py:
--------------------------------------------------------------------------------
 1 | from collections import namedtuple
 2 | from types import FunctionType
 3 | import dali.core as D
 4 | 
# One hypothesis tracked by beam_search:
#   solution - list of the choices made so far
#   score    - accumulated score (beam_search seeds it with D.Mat(1,1) and
#              adds candidate scores to it)
#   state    - the state handed to candidate_scores / make_choice
Beam = namedtuple("Beam", ["solution", "score", "state"])
 6 | 
 7 | def beam_search(initial_state,
 8 |                 candidate_scores,
 9 |                 make_choice,
10 |                 beam_width=5,
11 |                 eos_symbol = None,
12 |                 max_sequence_length=None,
13 |                 blacklist=[]):
14 | 
15 |     if beam_width <= 0:
16 |         raise ValueError("Beam width must be positive, received: " + str(beam_width))
17 | 
18 |     iterations = 0
19 |     results = [
20 |         Beam([], D.Mat(1,1), initial_state)
21 |     ]
22 | 
23 |     def lazy_beam(prev_beam, candidate, new_score):
24 |         def generate():
25 |             choice = make_choice(prev_beam.state, candidate)
26 |             if type(choice) == tuple:
27 |                 choice_repr, new_state  = choice
28 |             else:
29 |                 choice_repr, new_state = candidate, choice
30 |             return Beam(
31 |                 prev_beam.solution + [choice_repr],
32 |                 new_score,
33 |                 new_state,
34 |             )
35 |         return generate
36 | 
37 |     def lazy_identity(beam):
38 |         def generate():
39 |             return beam
40 |         return generate
41 | 
42 |     if eos_symbol is None:
43 |         check_eos = lambda beam: False
44 |     elif type(eos_symbol) != FunctionType:
45 |         check_eos = lambda beam: len(beam.solution) > 0 and beam.solution[-1] == eos_symbol
46 |     else:
47 |         check_eos = eos_symbol
48 | 
49 |     while max_sequence_length is None or iterations < max_sequence_length:
50 |         proposals = []
51 |         for beam in results:
52 |             if check_eos(beam):
53 |                 proposals.append((beam.score, lazy_identity(beam)))
54 |             else:
55 |                 scores = candidate_scores(beam.state)
56 |                 sorted_candidates = D.MatOps.argsort(scores)
57 | 
58 |                 sorted_candidates = sorted_candidates[::-1]
59 |                 candidates_remaining = beam_width
60 |                 for candidate_idx in sorted_candidates:
61 |                     if candidate_idx in blacklist:
62 |                         continue
63 |                     new_score = beam.score + scores.T()[candidate_idx]
64 |                     proposals.append((new_score, lazy_beam(beam, candidate_idx, new_score)))
65 |                     candidates_remaining -= 1
66 |                     if candidates_remaining <= 0:
67 |                         break
68 |         proposals.sort(reverse=True, key=lambda x: x[0].w[0])
69 |         results = [ eval_beam() for _, eval_beam in proposals[:beam_width]]
70 | 
71 |         iterations += 1
72 | 
73 |     return results
74 | 
# Names re-exported by `from .beam_search import *`.
__all__ = ["beam_search", "Beam"]
76 | 


--------------------------------------------------------------------------------
/dali/data/__init__.py:
--------------------------------------------------------------------------------
1 | from .process import *
2 | from . import batch
3 | from . import translation
4 | 


--------------------------------------------------------------------------------
/dali/data/batch.py:
--------------------------------------------------------------------------------
  1 | import numpy as np
  2 | 
  3 | import dali.core as D
  4 | 
  5 | class Batch(object):
  6 |     def __init__(self):
  7 |         self.timesteps = 0
  8 |         self.examples  = 0
  9 |     def inputs(timestep):
 10 |         return None
 11 |     def targets(timestep):
 12 |         return None
 13 |     def __repr__(self):
 14 |         return 'Batch(timesteps=%d, examples=%d)' % (self.timesteps, self.examples)
 15 | 
# Token that create_lines_batch prepends to each line when add_start_token=True.
START_TOKEN = '**START**'
 17 | 
 18 | def create_lines_batch(lines, vocab, add_start_token=False, fill_eos=False, add_eos=False, align_right=False):
 19 |     encoded_lines = []
 20 |     for l in lines:
 21 |         if type(l) == str:
 22 |             l = l.split(" ")
 23 |         if add_start_token:
 24 |             l = [START_TOKEN] + l
 25 |         encoded_lines.append(vocab.encode(l, add_eos=add_eos))
 26 | 
 27 | 
 28 |     seq_length = max(map(len, encoded_lines))
 29 |     # we add one index to account for start of sequence token
 30 |     data = np.empty((seq_length, len(lines)), dtype=np.int32)
 31 |     if fill_eos:
 32 |         data.fill(vocab.eos)
 33 |     else:
 34 |         data.fill(0)
 35 | 
 36 |     for line_idx, encoded_line in enumerate(encoded_lines):
 37 |         if align_right:
 38 |             data[-len(encoded_line):, line_idx] = encoded_line
 39 |         else:
 40 |             data[:len(encoded_line), line_idx] = encoded_line
 41 |     data = D.Mat(data, borrow=True, dtype=np.int32)
 42 |     return data
 43 | 
 44 | class LMBatch(object):
 45 |     @staticmethod
 46 |     def given_vocab(vocab, **kwargs):
 47 |         def wrapper(sentences):
 48 |             return LMBatch(sentences, vocab, **kwargs)
 49 |         return wrapper
 50 | 
 51 |     def __init__(self, sentences, vocab, store_originals=False, fill_eos=True, add_eos=True, add_start_token=True):
 52 |         if store_originals:
 53 |             self.sentences = sentences
 54 |         self.sentence_lengths = [len(s) for s in sentences]
 55 |         self.data = create_lines_batch(
 56 |             sentences,
 57 |             vocab,
 58 |             add_start_token=add_start_token,
 59 |             fill_eos=fill_eos,
 60 |             add_eos=add_eos
 61 |         )
 62 |         self.timesteps = self.data.shape[0] - 1
 63 |         self.examples  = self.data.shape[1]
 64 | 
 65 |     def inputs(self, timestep):
 66 |         return self.data[timestep]
 67 | 
 68 |     def targets(self, timestep):
 69 |          # predictions are offset by 1 to inputs, so
 70 |         return self.data[timestep + 1]
 71 | 
 72 | 
 73 | class TranslationBatch(object):
 74 |     @staticmethod
 75 |     def given_vocabs(vocabs, **kwargs):
 76 |         def wrapper(sentence_pairs):
 77 |             return TranslationBatch(sentence_pairs, vocabs, **kwargs)
 78 |         return wrapper
 79 | 
 80 | 
 81 |     def __init__(self, sentence_pairs, vocabs, store_originals=False, input_add_eos=False, output_add_eos=True, add_start_token=False, reverse_input=True):
 82 |         if store_originals:
 83 |             self.sentence_pairs = sentence_pairs
 84 |         from_sentences = [sentence_pair[0] for sentence_pair in sentence_pairs]
 85 |         to_sentences   = [sentence_pair[1] for sentence_pair in sentence_pairs]
 86 | 
 87 |         if reverse_input:
 88 |             from_sentences = [list(reversed(s)) for s in from_sentences]
 89 | 
 90 | 
 91 |         from_vocab, to_vocab = vocabs
 92 | 
 93 |         from_eos_correction = (1 if input_add_eos else 0)
 94 |         to_eos_correction   = (1 if output_add_eos else 0)
 95 | 
 96 |         self.from_data = create_lines_batch(
 97 |             from_sentences,
 98 |             from_vocab,
 99 |             add_start_token=add_start_token,
100 |             fill_eos=False,
101 |             add_eos=input_add_eos,
102 |             align_right=True
103 |         )
104 | 
105 |         self.to_data = create_lines_batch(
106 |             to_sentences,
107 |             to_vocab,
108 |             add_start_token=add_start_token,
109 |             fill_eos=True,
110 |             add_eos=output_add_eos
111 |         )
112 |         self.from_tokens  = sum(map(len, from_sentences)) + from_eos_correction * len(from_sentences)
113 |         self.to_tokens    = sum(map(len, to_sentences))   + to_eos_correction  * len(to_sentences)
114 | 
115 |         self.target_mask = D.Mat(*self.to_data.shape)
116 |         for example_idx, sentence in enumerate(to_sentences):
117 |             for ts in range(len(sentence) + to_eos_correction):
118 |                 self.target_mask.w[ts, example_idx] = 1
119 |                 self.target_mask.constant = True
120 | 
121 |         self.from_timesteps = self.from_data.shape[0]
122 |         self.timesteps = self.from_data.shape[0] + self.to_data.shape[0]
123 |         self.examples  = len(sentence_pairs)
124 | 
125 |     def inputs(self, timestep):
126 |         if timestep < self.from_timesteps:
127 |             return self.from_data[timestep]
128 |         else:
129 |             return None
130 | 
131 |     def targets(self, timestep):
132 |         if timestep >= self.from_timesteps:
133 |             return self.to_data[timestep - self.from_timesteps]
134 |         else:
135 |             return None
136 | 
137 |     def masks(self, timestep):
138 |         if timestep >= self.from_timesteps:
139 |             return self.target_mask[timestep - self.from_timesteps]
140 |         else:
141 |             return None
142 | 


--------------------------------------------------------------------------------
/dali/data/process.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import random
  3 | 
  4 | from queue import Queue
  5 | 
  6 | from dali.data.utils import split_punctuation as split_punctuation_f
  7 | 
  8 | class Process(object):
  9 |     def __init__(self, files, mapper, reducer):
 10 |         if files == str:
 11 |             files = (make_me_iterator for make_me_iterator in [files])
 12 |         self.files   = files
 13 |         self.mapper  = mapper
 14 |         self.reducer = reducer
 15 | 
 16 |     def __iter__(self):
 17 |         return self
 18 | 
 19 |     def __next__(self):
 20 |         while True:
 21 |             try:
 22 |                 return next(self.reducer)
 23 |             except StopIteration:
 24 |                 pass
 25 |             # if we got here it means reducer run out of elements
 26 |             # and we need to add more from mapper.
 27 |             try:
 28 |                 self.reducer.add(next(self.mapper))
 29 |                 continue
 30 |             except StopIteration:
 31 |                 pass
 32 |             # if we got here it means that mapper run out of elements and we need to give
 33 |             # if another file
 34 |             next_file = next(self.files)
 35 |             self.mapper.set_file(next_file)
 36 | 
 37 | class DiscoverFiles(object):
 38 |     def __init__(self, root_path, extension=None):
 39 |         self.files = []
 40 |         self.next_file = 0
 41 |         for path, dirs, files in os.walk(root_path):
 42 |             for file in files:
 43 |                 if extension is None or file.endswith(extension):
 44 |                     self.files.append(os.path.join(path, file))
 45 | 
 46 |     def __iter__(self):
 47 |         return self
 48 | 
 49 |     def __next__(self):
 50 |         if self.next_file >= len(self.files):
 51 |             raise StopIteration()
 52 |         else:
 53 |             self.next_file += 1
 54 |             return self.files[self.next_file - 1]
 55 | 
 56 | 
 57 | class FileMapper(object):
 58 |     FILTER      = 1
 59 |     TRANSFORMER = 2
 60 | 
 61 |     def __init__(self):
 62 |         self._transformations = []
 63 |         self.file_name = None
 64 |         self.file_handle = None
 65 | 
 66 |     def set_file(self, file_name):
 67 |         if self.file_handle is not None:
 68 |             self.file_handle.close()
 69 |             self.file_handle = None
 70 |         self.file_name = file_name
 71 |         self.file_handle = None
 72 | 
 73 | 
 74 |     def get_file(self, fargs="rt"):
 75 |         if self.file_handle is None:
 76 |             self.file_handle = open(self.file_name, fargs)
 77 |         return self.file_handle
 78 | 
 79 |     def __del__(self):
 80 |         if self.file_handle is not None:
 81 |             self.file_handle.close()
 82 |             self.file_handle = None
 83 | 
 84 |     def __next__(self):
 85 |         if self.file_name is None:
 86 |             raise StopIteration()
 87 |         while True:
 88 |             item = self.next_item_no_filter()
 89 |             if item is not None:
 90 |                 return item
 91 | 
 92 |     def next_item_no_filter(self):
 93 |         """By default __next__ does not even return an item
 94 |            if it does not pass a filer. This function, returns
 95 |            None even if the filters are not passing. This
 96 |            is useful for example for translation where,
 97 |            we want to ensure that two different file streams
 98 |            are always aligned
 99 |         """
100 |         if self.file_name is None:
101 |             raise StopIteration()
102 | 
103 |         item = self.next_item()
104 |         item = self.transform_item(item)
105 | 
106 |         return item
107 | 
108 |     def transform_item(self, item):
109 |         for transform_f in self._transformations:
110 |             item = transform_f(item)
111 |             if item is None:
112 |                 break
113 |         return item
114 | 
115 |     def next_item(self):
116 |         raise StopIteration()
117 | 
118 | 
119 |     def add_filter(self, filter_f):
120 |         def wrapper(element):
121 |             if filter_f(element):
122 |                 return element
123 |             return None
124 |         self.add_transform(wrapper)
125 |         return self
126 | 
127 |     def add_transform(self, transform_f):
128 |         self._transformations.append(transform_f)
129 |         return self
130 | 
131 |     def __iter__(self):
132 |         return self
133 | 
134 |     def __getstate__(self):
135 |         # Copy the object's state from self.__dict__ which contains
136 |         # all our instance attributes. Always use the dict.copy()
137 |         # method to avoid modifying the original state.
138 |         state = self.__dict__.copy()
139 |         # Remove the unpicklable entries.
140 |         del state['file_handle']
141 |         if self.file_handle is not None:
142 |             state['__file_position'] = self.file_handle.tell()
143 |         return state
144 | 
145 |     def __setstate__(self, state):
146 |         # Restore instance attributes (i.e., filename and lineno).
147 |         self.__dict__.update(state)
148 |         # Restore the previously opened file's state. To do so, we need to
149 |         # reopen it and read from it until the line count is restored.
150 |         self.file_handle = open(self.file_name)
151 |         if '__file_position' in state:
152 |             self.file_handle.seek(state['__file_position'])
153 | 
154 | 
class Lines(FileMapper):
    """FileMapper that yields the lines of the current file without the trailing newline."""

    def next_item(self):
        res = self.get_file().readline()
        # readline returns an empty string only at end of file.
        if len(res) == 0:
            raise StopIteration()
        if res[-1] == '\n':
            return res[:-1]
        return res

    def lower(self):
        """Lower-case every item. Returns self."""
        return self.add_transform(lambda x: x.lower())

    def bound_length(self, lower_bound=None, upper_bound=None):
        """Keep only items with ``lower_bound <= len(item) <= upper_bound``.

        A bound of None is not applied. Returns self.
        """
        # Compare against None rather than relying on truthiness: with the
        # old check an upper bound of 0 was silently ignored.
        if lower_bound is not None:
            self.add_filter(lambda x: lower_bound <= len(x))
        if upper_bound is not None:
            self.add_filter(lambda x: len(x) <= upper_bound)
        return self

    def split_spaces(self):
        """Split every item on single spaces. Returns self."""
        return self.add_transform(lambda x: x.split(' '))

    def reverse(self):
        """Replace every item by a reversed list of its elements. Returns self."""
        return self.add_transform(lambda x: list(reversed(x)))

    def split_punctuation(self):
        """Apply split_punctuation_f to every item. Returns self."""
        return self.add_transform(split_punctuation_f)
183 | 
184 | 
class Multiplexer(object):
    """Reads several mappers in lockstep and yields one tuple per aligned row.

    A row is skipped entirely when any mapper reports None for its item.
    """

    def __init__(self, *mappers):
        self.mappers = mappers

    def set_file(self, args):
        """Give each mapper its own file; `args` needs one entry per mapper."""
        assert len(args) == len(self.mappers)

        for file_arg, mapper in zip(args, self.mappers):
            mapper.set_file(file_arg)

    def __iter__(self):
        return self

    def __next__(self):
        while True:
            # Every mapper is advanced on every round, even if an earlier one
            # already returned None; that is what keeps the streams aligned.
            row = []
            for mapper in self.mappers:
                row.append(mapper.next_item_no_filter())
            if any(entry is None for entry in row):
                continue
            return tuple(row)
203 | 
204 | 
205 | 
class BatchBenefactor(object):
    """Reducer that groups collected examples into shuffled minibatches.

    Examples accumulate until `examples_until_minibatches` of them are
    available (defaults to `minibatch_size`). They are then sorted with
    `sorting_key` (defaults to ``len``), cut into consecutive chunks of
    `minibatch_size`, and the chunks are queued in random order. A trailing
    chunk that is not full is discarded.
    """

    def __init__(self, minibatch_size,
                 minibatch_class=None,
                 examples_until_minibatches=None,
                 sorting_key=None):
        self.minibatch_size = minibatch_size
        self.minibatch_class = minibatch_class
        self.examples_until_minibatches = examples_until_minibatches or minibatch_size
        self.sorting_key = sorting_key

        self.collected = []
        self.batches = []
        self.next_batch = 0

    def add(self, element):
        """Collect `element`; rebuild the batch queue once enough examples are available."""
        self.collected.append(element)
        if len(self.collected) < self.examples_until_minibatches:
            return

        self.batches = []
        self.next_batch = 0

        key_function = self.sorting_key or (lambda x: len(x))
        self.collected.sort(key=key_function)

        total = len(self.collected)
        chunk_starts = list(range(0, total, self.minibatch_size))
        random.shuffle(chunk_starts)
        for start in chunk_starts:
            stop = start + self.minibatch_size
            # Only full chunks become batches.
            if stop <= total:
                self.batches.append(self.collected[start:stop])
        self.collected = []

    def __iter__(self):
        return self

    def __next__(self):
        queue_exhausted = (not self.batches) or self.next_batch == len(self.batches)
        if queue_exhausted:
            self.batches = []
            self.next_batch = 0
            raise StopIteration()

        assert self.next_batch < len(self.batches)
        current = self.next_batch
        self.next_batch = current + 1
        wrap = self.minibatch_class or (lambda x:x)
        return wrap(self.batches[current])



    def update_minibatch_size(self, minibatch_size):
        """Change the chunk size used the next time batches are built."""
        self.minibatch_size = minibatch_size
256 | 
257 | 
class IdentityReducer(object):
    """Reducer that hands elements back unchanged, in the order they were added."""

    def __init__(self):
        self.q = Queue()

    def add(self, element):
        """Queue `element` for later retrieval."""
        self.q.put(element)

    def __iter__(self):
        return self

    def __next__(self):
        if not self.q.empty():
            return self.q.get()
        raise StopIteration()
273 | 


--------------------------------------------------------------------------------
/dali/data/translation.py:
--------------------------------------------------------------------------------
 1 | from collections import defaultdict
 2 | 
 3 | from .batch import TranslationBatch
 4 | from .process import Process, Multiplexer, Lines, DiscoverFiles, IdentityReducer, BatchBenefactor
 5 | from dali.utils import Vocab
 6 | 
 7 | 
 8 | class TranslationFiles(object):
 9 |     def __init__(self, root_path, from_lang, to_lang):
10 |         files_from = set(DiscoverFiles(root_path, "." + from_lang))
11 |         files_to   = set(DiscoverFiles(root_path, "." + to_lang))
12 | 
13 |         self.pairs = []
14 |         for file_name in files_from:
15 |             pref = file_name[:-(len(from_lang) + 1)]
16 |             hypothetical_to_file = pref + '.' + to_lang
17 |             if hypothetical_to_file in files_to:
18 |                 self.pairs.append((file_name, hypothetical_to_file))
19 | 
20 |         self.next_pair = 0
21 | 
22 |     def __iter__(self):
23 |         return self
24 | 
25 |     def __next__(self):
26 |         if self.next_pair >= len(self.pairs):
27 |             raise StopIteration()
28 |         else:
29 |             self.next_pair += 1
30 |             return self.pairs[self.next_pair - 1]
31 | 
32 | 
def TranslationMapper(sentence_bounds=(None, None)):
    """Build a Multiplexer over two identically configured Lines mappers.

    Each side splits punctuation, splits on spaces and then filters by
    length using `sentence_bounds` as (lower_bound, upper_bound).
    """
    def make_side():
        side = Lines()
        side = side.split_punctuation()
        side = side.split_spaces()
        side = side.bound_length(*sentence_bounds)
        return side

    first_side = make_side()
    second_side = make_side()
    return Multiplexer(first_side, second_side)
43 | 
44 | 
def build_vocabs(path, from_lang, to_lang, from_max_size=None, to_max_size=None):
    """Count words in all translation files under `path` and build two vocabularies.

    Words are ordered by decreasing frequency; `from_max_size` / `to_max_size`
    cap how many of them are kept (None keeps all). A KeyboardInterrupt
    during counting stops the scan, and the vocabularies are built from what
    was counted so far.

    Returns (from_vocab, to_vocab).
    """
    from_counts = defaultdict(lambda: 0)
    to_counts   = defaultdict(lambda: 0)
    try:
        sentence_pairs = Process(files=TranslationFiles(path, from_lang, to_lang),
                                 mapper=TranslationMapper(sentence_bounds=(None, None)),
                                 reducer=IdentityReducer())
        for from_sentence, to_sentence in sentence_pairs:
            for token in from_sentence:
                from_counts[token] += 1

            for token in to_sentence:
                to_counts[token] += 1
    except KeyboardInterrupt:
        print('Impatient User Detected, file processing halted, proceeding to build vocab.')

    def words_by_frequency(counts):
        # Most frequent first; the sort is stable, so ties keep first-seen order.
        ranked = sorted(counts.items(), key=lambda entry: entry[1], reverse=True)
        return [word for word, _count in ranked]

    from_words = words_by_frequency(from_counts)
    to_words   = words_by_frequency(to_counts)

    from_vocab = Vocab(from_words[:from_max_size])
    to_vocab   = Vocab(to_words[:to_max_size])

    return from_vocab, to_vocab
76 | 
def iterate_examples(root_path, from_lang, to_lang, vocabs, minibatch_size, reverse_input=True, sentences_until_minibatch=None, sentence_length_bounds=(None, None)):
    """Return a Process that yields TranslationBatch minibatches from the files under `root_path`.

    Sentence pairs are buffered until `sentences_until_minibatch` of them are
    available (default: 10000 * minibatch_size), then sorted by source length
    and, within equal source length, by target length, before being cut into
    minibatches.
    """
    if not sentences_until_minibatch:
        sentences_until_minibatch = 10000 * minibatch_size

    def pair_lengths(sentence_pair):
        # Source length first, target length second.
        return (len(sentence_pair[0]), len(sentence_pair[1]))

    batch_factory = TranslationBatch.given_vocabs(vocabs, store_originals=True, reverse_input=reverse_input)
    batcher = BatchBenefactor(minibatch_size,
                              batch_factory,
                              sentences_until_minibatch,
                              sorting_key=pair_lengths)

    file_pairs = TranslationFiles(root_path, from_lang, to_lang)
    line_mapper = TranslationMapper(sentence_bounds=sentence_length_bounds)
    return Process(files=file_pairs, mapper=line_mapper, reducer=batcher)
88 | 


--------------------------------------------------------------------------------
/dali/data/utils.py:
--------------------------------------------------------------------------------
 1 | PUNCTUATION_CHARS = set(list('.,?!-"\'()[]{}:;'))
 2 | 
 3 | def split_punctuation(sentence, punctuation=PUNCTUATION_CHARS):
 4 |     res = []
 5 |     for i, char in enumerate(list(sentence)):
 6 |         if char in punctuation:
 7 |             if i - 1 >= 0 and sentence[i-1] != ' ':
 8 |                 res.append(' ')
 9 |             res.append(char)
10 |             if i + 1 < len(sentence) and sentence[i + 1] != ' ':
11 |                 res.append(' ')
12 |         else:
13 |             res.append(char)
14 |     return ''.join(res)
15 | 


--------------------------------------------------------------------------------
/dali/models/__init__.py:
--------------------------------------------------------------------------------
1 | from .mlp import *
2 | 


--------------------------------------------------------------------------------
/dali/models/mlp.py:
--------------------------------------------------------------------------------
 1 | import dali.core as D
 2 | 
 3 | class MLP(object):
 4 |     def __init__(self, input_sizes, hiddens, nonlinearities):
 5 |         self.input_sizes = input_sizes
 6 |         self.hiddens = hiddens
 7 |         self.input_nonlinearity, self.layer_nonlinearities = nonlinearities[0], nonlinearities[1:]
 8 | 
 9 |         self.input_layer = D.StackedInputLayer(input_sizes, hiddens[0])
10 |         self.layers = [D.Layer(h_from, h_to) for h_from, h_to in zip(hiddens[:-1], hiddens[1:])]
11 | 
12 |     def activate(self, inputs):
13 |         assert len(self.layers) == len(self.layer_nonlinearities)
14 |         hidden = self.input_nonlinearity(self.input_layer.activate(inputs))
15 |         for l, nonlinearity in zip(self.layers, self.layer_nonlinearities):
16 |             hidden = nonlinearity(l.activate(hidden))
17 |         return hidden
18 | 
19 |     def parameters(self):
20 |         ret = self.input_layer.parameters()
21 |         for l in self.layers:
22 |             ret.extend(l.parameters())
23 |         return ret
24 | 
25 |     def name_parameters(self, prefix):
26 |         self.input_layer.name_parameters(prefix + "_input_layer")
27 |         for layer_idx, layer in enumerate(self.layers):
28 |             layer.name_parameters(prefix + '_layer%d' % (layer_idx,))
29 | 


--------------------------------------------------------------------------------
/dali/utils/__init__.py:
--------------------------------------------------------------------------------
1 | from .misc import *
2 | from .throttled import *
3 | from .vocab import *
4 | from .solver import *
5 | from .capture import *
6 | 


--------------------------------------------------------------------------------
/dali/utils/capture.py:
--------------------------------------------------------------------------------
 1 | from collections import defaultdict
 2 | 
 3 | class Capture(object):
 4 |     instances = set()
 5 | 
 6 |     def __init__(self):
 7 |         self.state = defaultdict(lambda: [])
 8 | 
 9 |     @classmethod
10 |     def add(cls, name, value):
11 |         for instance in cls.instances:
12 |             instance.state[name].append(value)
13 | 
14 |     def __enter__(self):
15 |         Capture.instances.add(self)
16 | 
17 |     def __exit__(self, *args, **kwargs):
18 |         Capture.instances.remove(self)
19 | 


--------------------------------------------------------------------------------
/dali/utils/misc.py:
--------------------------------------------------------------------------------
  1 | import dill as pickle
  2 | import inspect
  3 | import numpy as np
  4 | import types
  5 | 
  6 | from os import makedirs, listdir
  7 | from os.path import join, exists
  8 | 
  9 | import dali.core as D
 10 | 
 11 | class RunningAverage(object):
 12 |     def __init__(self, alpha=0.95):
 13 |         self.alpha = alpha
 14 |         self.value = None
 15 | 
 16 |     def update(self, measurement):
 17 |         if self.value is None:
 18 |             self.value = measurement
 19 |         else:
 20 |             self.value = (self.alpha * self.value +
 21 |                          (1.0 - self.alpha) * measurement)
 22 | 
 23 |     def __float__(self):
 24 |         return float(self.value)
 25 | 
 26 | 
 27 | def apply_recursively_on_type(x, f, target_type, list_callback=None):
 28 |     if type(x) == target_type:
 29 |         return f(x)
 30 |     elif type(x) == list or isinstance(x, types.GeneratorType):
 31 |         ret = [ apply_recursively_on_type(el, f, target_type, list_callback) for el in x]
 32 |         if list_callback and all(type(el) == target_type for el in x):
 33 |             ret = list_callback(ret)
 34 |         return ret
 35 |     elif type(x) == dict:
 36 |         res = {}
 37 |         for k,v in x.items():
 38 |             res[k] = apply_recursively_on_type(v, f, target_type, list_callback)
 39 |         return res
 40 |     else:
 41 |         return x
 42 | 
 43 | def integer_ceil(a, b):
 44 |     return (a + b - 1) // b
 45 | 
 46 | def subsample(seq, maximum_length):
 47 |     if seq == []:
 48 |         return seq
 49 |     return seq[::integer_ceil(len(seq), maximum_length)]
 50 | 
 51 | def median_smoothing(signal, window=10):
 52 |     res = []
 53 |     for i in range(window, len(signal)):
 54 |         actual_window = signal[i-window:i]
 55 |         res.append(np.median(actual_window))
 56 |     return res
 57 | 
 58 | def pickle_from_scope(directory, variables, caller_globals=None, caller_locals=None):
 59 |     if not exists(directory):
 60 |         makedirs(directory)
 61 | 
 62 |     if caller_globals is None or caller_locals is None:
 63 |         stack = inspect.stack()
 64 |         if caller_globals is None:
 65 |             caller_globals = stack[1][0].f_globals
 66 |         if caller_locals is None:
 67 |             caller_locals  = stack[1][0].f_locals
 68 |         del stack
 69 | 
 70 |     for var in variables:
 71 |         with open(join(directory, var + ".pkz"), "wb") as f:
 72 |             value = caller_locals.get(var) or caller_globals.get(var)
 73 |             assert value is not None
 74 |             pickle.dump(value, f)
 75 | 
 76 | def unpickle_as_dict(directory, whitelist=None, extension='.pkz'):
 77 |     assert exists(directory)
 78 | 
 79 |     res = {}
 80 | 
 81 |     for file_name in listdir(directory):
 82 |         if file_name.endswith(extension):
 83 |             var_name = file_name[:-len(extension)]
 84 |             if whitelist is None or var_name in whitelist:
 85 |                 with open(join(directory, file_name), "rb") as f:
 86 |                     res[var_name] = pickle.load(f)
 87 | 
 88 |     return res
 89 | 
 90 | def add_device_args(parser):
 91 |     parser.add_argument("--device",    type=str, default='gpu', choices=['gpu','cpu'], help="Whether model should run on GPU or CPU.")
 92 |     parser.add_argument("--gpu_id",    type=int, default=0, help="Which GPU to use (zero-indexed just like in CUDA APIs)")
 93 | 
 94 | def set_device_from_args(args, verbose=False):
 95 |     D.config.default_device = args.device
 96 |     if args.device == 'gpu':
 97 |         D.config.default_gpu = args.gpu_id
 98 |         if verbose:
 99 |             print("Using %s" % (D.config.gpu_id_to_name(args.gpu_id)))
100 | 
101 | __all__ = [
102 |     "apply_recursively_on_type",
103 |     "integer_ceil",
104 |     "subsample",
105 |     "median_smoothing",
106 |     "pickle_from_scope",
107 |     "unpickle_as_dict",
108 |     "RunningAverage",
109 |     "add_device_args",
110 |     "set_device_from_args"
111 | ]
112 | 


--------------------------------------------------------------------------------
/dali/utils/scoring.py:
--------------------------------------------------------------------------------
  1 | import numpy as np
  2 | import os
  3 | import subprocess
  4 | import stat
  5 | import tempfile
  6 | 
  7 | from os.path import join, exists
  8 | from urllib.request import urlretrieve
  9 | 
 10 | from dali.core import Mat
 11 | from .misc import subsample, median_smoothing
 12 | 
 13 | MULTIBLEU_SCRIPT = 'multi-bleu.perl'
 14 | MULTIBLEU_URL = "https://raw.githubusercontent.com/moses-smt/mosesdecoder/master/scripts/generic/multi-bleu.perl"
 15 | 
 16 | class ErrorTracker(object):
 17 |     def __init__(self):
 18 |         self.epoch_error = []
 19 |         self.error_evolution = []
 20 | 
 21 |     def append(self, error):
 22 |         if type(error) == Mat:
 23 |             self.epoch_error.append(error.w[0,0])
 24 |         elif type(error) == np.ndarray:
 25 |             self.epoch_error.append(error[0,0])
 26 |         else:
 27 |             self.epoch_error.append(error)
 28 | 
 29 |     def finalize_epoch(self):
 30 |         if len(self.epoch_error) > 0:
 31 |             self.epoch_error = subsample(self.epoch_error, maximum_length=1000)
 32 |             self.error_evolution.append(self.epoch_error)
 33 |             self.epoch_error = []
 34 | 
 35 |     def raw(self):
 36 |         x = []
 37 |         y = []
 38 |         for epoch_no, error_epoch in enumerate(self.error_evolution):
 39 |             x.extend(float(epoch_no) + float(t) / len(error_epoch) for t in range(len(error_epoch)))
 40 |             y.extend(error_epoch)
 41 | 
 42 |         if len(y) > 100:
 43 |             y = median_smoothing(y, 30)
 44 |             x = x[:len(y)]
 45 |         return x,y
 46 | 
 47 |     def num_epochs(self):
 48 |         return len(self.error_evolution)
 49 | 
 50 |     def recent(self, tsteps=1):
 51 |         if len(self.epoch_error) == 0:
 52 |             return np.nan
 53 |         else:
 54 |             recent = self.epoch_error[-tsteps:]
 55 |             return sum(recent)/len(recent)
 56 | 
 57 | def bleu(reference, hypotheses, script_location=None):
 58 |     if script_location is None:
 59 |         script_location = join(tempfile.gettempdir(), MULTIBLEU_SCRIPT)
 60 |         if not exists(script_location):
 61 |             urlretrieve(MULTIBLEU_URL, script_location)
 62 |     else:
 63 |         assert(exists(script_location))
 64 | 
 65 | 
 66 |     def process_input(val):
 67 |         if type(val) == str:
 68 |             assert exists(val)
 69 |             return open(val)
 70 |         elif type(val) == list:
 71 |             ret = tempfile.NamedTemporaryFile("wt")
 72 |             for example in val:
 73 |                 if len(example) > 0 and example[-1] == '\n':
 74 |                     ret.write(example)
 75 |                 else:
 76 |                     ret.write(example + '\n')
 77 |             ret.seek(0)
 78 |             return ret
 79 | 
 80 |     try:
 81 |         reference  = process_input(reference)
 82 |         hypotheses = process_input(hypotheses)
 83 |         prefix = "BLEU = "
 84 | 
 85 |         try:
 86 |             res_str = subprocess.check_output([script_location, reference.name], stdin=hypotheses, universal_newlines=True)
 87 |         except PermissionError:
 88 |             current_permissions = os.stat(script_location).st_mode
 89 |             os.chmod(script_location, current_permissions | stat.S_IEXEC)
 90 |             res_str = subprocess.check_output([script_location, reference.name], stdin=hypotheses, universal_newlines=True)
 91 | 
 92 |         assert(res_str.startswith(prefix))
 93 |         res_str = res_str[len(prefix):]
 94 |         res_str = res_str.split(',')[0]
 95 |         return float(res_str)
 96 |     finally:
 97 |         if hasattr(reference, 'close'):
 98 |             reference.close()
 99 |         if hasattr(hypotheses, 'close'):
100 |             hypotheses.close()
101 | 
102 | __all__ = [
103 |     "ErrorTracker",
104 |     "bleu"
105 | ]
106 | 
107 | 
108 | 
109 | 
110 | 


--------------------------------------------------------------------------------
/dali/utils/solver.py:
--------------------------------------------------------------------------------
  1 | import copy
  2 | from dali.core import Mat, MatOps
  3 | from dali.utils.throttled import Throttled
  4 | 
  5 | class SolverBase(object):
  6 |     t = Throttled(1)
  7 |     known_solvers = [
  8 |         'sgd',
  9 |         'adagrad',
 10 |         'rmsprop',
 11 |         'rmsprop_momentum',
 12 |         'adadelta',
 13 |         'adam',
 14 |     ]
 15 |     known_params = [
 16 |         'learning_rate',
 17 |         'clipval',
 18 |         'regc',
 19 |         'smooth_eps',
 20 |         'rho',
 21 |         'b1',
 22 |         'b2',
 23 |         'decay_rate',
 24 |         'gradient_normalization',
 25 |         'debug',
 26 |     ]
 27 | 
 28 |     def __init__(self, solver_type, **kwargs):
 29 |         self.solver_type = solver_type
 30 |         if solver_type not in SolverBase.known_solvers:
 31 |             raise AttributeError("Unknown solver " + str(solver_type))
 32 |         self.kwargs = kwargs
 33 |         for key in kwargs:
 34 |             if key not in SolverBase.known_params:
 35 |                 raise AttributeError("Unknown keyword argument " + key)
 36 | 
 37 |     def get_arg(self, override, name, default_val):
 38 |         if name in override:
 39 |             return override[name]
 40 |         if name in self.kwargs:
 41 |             return self.kwargs[name]
 42 |         return default_val
 43 | 
 44 |     def param_to_cache(self, param):
 45 |         if 'solver_cache' not in param.extra_state:
 46 |             param.extra_state['solver_cache'] = {}
 47 |         return param.extra_state['solver_cache']
 48 | 
 49 |     def step(self, params, param_caches=None, **kwargs_override):
 50 |         if type(params) != list:
 51 |             params = [params]
 52 |             if param_caches is not None:
 53 |                 param_caches = [param_caches]
 54 | 
 55 |         if param_caches is None:
 56 |             param_caches = [None for _ in range(params)]
 57 |         assert len(params) == len(param_caches)
 58 | 
 59 |         for key in kwargs_override:
 60 |             if not key in SolverBase.known_params:
 61 |                 raise AttributeError("Unknown keyword argument " + key)
 62 | 
 63 |         debug = self.get_arg(kwargs_override, 'debug', ['nans'])
 64 |         clip_val = self.get_arg(kwargs_override, 'clipval', 5.0)
 65 |         regc     = self.get_arg(kwargs_override, 'regc',     0.0)
 66 | 
 67 |         ########## GRADIENT NORMALIZATION ###########
 68 | 
 69 |         gradient_normalization = self.get_arg(kwargs_override, 'gradient_normalization', 'norm')
 70 |         if gradient_normalization == 'norm':
 71 |             for param in params:
 72 |                 MatOps.clip_and_regularize(param, 0.0, clip_val, regc)
 73 |         elif gradient_normalization == 'clipping':
 74 |             for param in params:
 75 |                 MatOps.clip_and_regularize(param, clip_val, 0.0, regc)
 76 |         elif gradient_normalization == 'discard':
 77 |             params_exceeding = []
 78 |             for param in params:
 79 |                 if MatOps.grad_norm(param).w[0,0] > clip_val:
 80 |                     params_exceeding.append(param.name if param.name != '' else '(unnamed parameter)')
 81 |             if len(params_exceeding) > 0:
 82 |                 if 'discards' in debug:
 83 |                     print('Discarding gradient update due to exceeded norm for the following parameters: %s' % (params_exceeding,))
 84 |                 for param in params:
 85 |                     param.clear_grad()
 86 |                 return
 87 |         elif gradient_normalization == 'none':
 88 |             if regc > 0.0:
 89 |                 MatOps.regularize(param, regc)
 90 |         else:
 91 |             raise AttributeError("Unknown gradient_normalization mode : " + gradient_normalization)
 92 | 
 93 | 
 94 |         ########## SOLVING ###########
 95 | 
 96 |         for param, param_cache in zip(params, param_caches):
 97 |             if param_cache is None:
 98 |                 param_cache = self.param_to_cache(param)
 99 | 
100 |             learning_rate = self.get_arg(kwargs_override, "learning_rate", 0.01)
101 | 
102 |             lr_multiplier = param.extra_state.get('lr_multiplier', 1.0)
103 |             learning_rate *= lr_multiplier
104 |             if MatOps.is_grad_nan(param):
105 |                 if SolverBase.t.should_i_run() and 'nans' in debug:
106 |                     name_str = ' (unnamed parameter)'
107 |                     if param.name is not None:
108 |                         name_str = ' (name: %s)' % (param.name,)
109 |                     print("Warning ignoring grad update due to NaNs%s." % (name_str,))
110 |             else:
111 |                 if self.solver_type == 'sgd':
112 |                     MatOps.sgd_update(param, learning_rate)
113 |                 elif self.solver_type == 'adagrad':
114 |                     smooth_eps = self.get_arg(kwargs_override, "smooth_eps", 1e-6)
115 |                     cache = self.get_cache(param, param_cache, 'adagrad_cache')
116 |                     MatOps.adagrad_update(param, cache, learning_rate, smooth_eps)
117 |                 elif self.solver_type == 'rmsprop':
118 |                     smooth_eps = self.get_arg(kwargs_override, "smooth_eps", 1e-6)
119 |                     decay_rate = self.get_arg(kwargs_override, "decay_rate", 0.95)
120 |                     cache = self.get_cache(param, param_cache, 'rmsprop_cache')
121 |                     MatOps.rmsprop_update(param, cache, decay_rate, learning_rate, smooth_eps)
122 |                 elif self.solver_type == 'rmsprop_momentum':
123 |                     decay_rate = self.get_arg(kwargs_override,    "decay_rate", 0.95)
124 |                     momentum = self.get_arg(kwargs_override,      "momentum",   0.9)
125 |                     smooth_eps = self.get_arg(kwargs_override,    "smooth_eps", 1e-4)
126 |                     n_cache = self.get_cache(param, param_cache, 'rmsprop_momentum_n_cache')
127 |                     g_cache = self.get_cache(param, param_cache, 'rmsprop_momentum_g_cache')
128 |                     momentum_cache = self.get_cache(param, param_cache, 'rmsprop_momentum_momentum_cache')
129 |                     MatOps.rmsprop_momentum_update(param, n_cache, g_cache, momentum_cache, decay_rate, momentum, learning_rate, smooth_eps)
130 |                 elif self.solver_type == 'adadelta':
131 |                     smooth_eps = self.get_arg(kwargs_override, "smooth_eps", 1e-4)
132 |                     rho        = self.get_arg(kwargs_override, "rho",        0.95)
133 |                     gsum = self.get_cache(param, param_cache, 'adadelta_gsum')
134 |                     xsum = self.get_cache(param, param_cache, 'adadelta_xsum')
135 |                     MatOps.adadelta_update(param, gsum, xsum, rho, smooth_eps)
136 |                 elif self.solver_type == 'adam':
137 |                     smooth_eps = self.get_arg(kwargs_override, "smooth_eps", 1e-4)
138 |                     b1         = self.get_arg(kwargs_override, "b1",        0.5)
139 |                     b2         = self.get_arg(kwargs_override, "b2",        1e-6)
140 |                     m  = self.get_cache(param, param_cache, 'adam_m')
141 |                     v  = self.get_cache(param, param_cache, 'adam_v')
142 |                     epoch = param.extra_state.get('adam_epoch', 1)
143 | 
144 |                     MatOps.adam_update(param, m, v, b1, b2, smooth_eps, learning_rate, epoch)
145 | 
146 |                     param_cache['adam_epoch'] = epoch + 1
147 |                 else:
148 |                     assert False
149 |             param.clear_grad()
150 | 
151 |     def set_lr_multiplier(self, param, lr_multiplier):
152 |         param.extra_state["lr_multiplier"] = lr_multiplier
153 | 
154 |     def get_cache(self, param, cache_state, cache_name):
155 |         if cache_name not in cache_state:
156 |             cache_state[cache_name] = Mat.zeros(param.shape, dtype=param.dtype)
157 |         ret = cache_state[cache_name]
158 |         assert ret.shape == param.shape, \
159 |                 "Wrong parameter passed to solver (cache shape does not match parameter's shape)"
160 |         return ret
161 | 
162 |     def reset_caches(self, param, param_caches=None):
163 |         if type(param) == list:
164 |             if param_caches is not None:
165 |                 assert len(param) == len(param_caches)
166 |                 for p,c  in zip(param, param_caches):
167 |                     self.reset_caches(p, c)
168 |             else:
169 |                 for p in param:
170 |                     self.reset_caches(p)
171 |         elif type(param) == Mat:
172 |             # get caches
173 |             if param_caches is None:
174 |                 param_caches = self.param_to_cache(param)
175 |             # reset
176 |             if self.solver_type == 'adagrad':
177 |                 self.get_cache(param, param_caches, 'adagrad_cache').clear()
178 |             elif self.solver_type == 'rmsprop':
179 |                 self.get_cache(param, param_caches, 'rmsprop_cache').clear()
180 |             elif self.solver_type == 'adadelta':
181 |                 self.get_cache(param, param_caches, 'adadelta_gsum').clear()
182 |                 self.get_cache(param, param_caches, 'adadelta_xsum').clear()
183 |             elif self.solver_type == 'adam':
184 |                 self.get_cache(param, param_caches, 'adam_m').clear()
185 |                 self.get_cache(param, param_caches, 'adam_v').clear()
186 |                 if 'adam_epoch' in param:
187 |                     del param_caches["adam_epoch"]
188 |             else:
189 |                 assert False
190 | 
class Solver(object):
    """Binds a SolverBase to a fixed list of parameters and their caches."""

    def __init__(self, parameters, *args, **kwargs):
        """Solver

        It is pickleable. Remaining arguments are forwarded to SolverBase.
        """
        self.base = SolverBase(*args, **kwargs)

        self._parameters = parameters if type(parameters) == list else [parameters]
        count = len(self._parameters)
        # One cache dict and one optional learning-rate multiplier per parameter.
        self.caches = [{} for _ in range(count)]
        self.lr_multipliers = [None] * count

    @property
    def parameters(self):
        return self._parameters

    @parameters.setter
    def parameters(self, val):
        if self._parameters is not None:
            assert len(self._parameters) == len(val), \
                    "Number of parameters must remain unchanged"
        self._parameters = val
        # Re-attach the remembered multipliers to the new parameter objects.
        for multiplier, target in zip(self.lr_multipliers, self._parameters):
            if multiplier is None:
                continue
            self.base.set_lr_multiplier(target, multiplier)

    def set_lr_multiplier(self, where, val):
        """Set the learning-rate multiplier by parameter name (str) or index (int)."""
        if type(where) == str:
            indices = [i for i, param in enumerate(self.parameters)
                       if param.name == where]
            assert len(indices) > 0, \
                    "Could not find parameters %s" % (where,)
        elif type(where) == int:
            indices = [where]
        else:
            raise ValueError("where must be int or str")
        for idx in indices:
            self.lr_multipliers[idx] = val
            self.base.set_lr_multiplier(self.parameters[idx], val)

    def step(self):
        """Run one solver step over all bound parameters."""
        assert self.parameters is not None, \
                "Remeber to use set parameters after unpickling."
        self.base.step(self.parameters, self.caches)

    def reset_caches(self):
        """Reset the solver state of all bound parameters."""
        assert self.parameters is not None, \
                "Remeber to use set parameters after unpickling."
        self.base.reset_caches(self.parameters, self.caches)

    @property
    def solver_type(self):
        return self.base.solver_type

    def __setstate__(self, state):
        # Parameters are not pickled; they must be assigned again afterwards.
        self._parameters = None
        self.base = state['solver']
        self.caches = state['caches']
        self.lr_multipliers = state['lr_multipliers']

    def __getstate__(self):
        return dict((
            ('solver', self.base),
            ('caches', self.caches),
            ('lr_multipliers', self.lr_multipliers),
        ))
263 | 
class CombinedSolver(object):
    """Fans `step` and `reset_caches` out to several solvers, in order."""

    def __init__(self, solvers):
        self.solvers = solvers

    def step(self):
        """Call `step()` on every wrapped solver."""
        for member in self.solvers:
            member.step()

    def reset_caches(self):
        """Call `reset_caches()` on every wrapped solver."""
        for member in self.solvers:
            member.reset_caches()
275 | 
276 | __all__ = [
277 |     "CombinedSolver",
278 |     "SolverBase",
279 |     "Solver",
280 | ]
281 | 


--------------------------------------------------------------------------------
/dali/utils/throttled.py:
--------------------------------------------------------------------------------
 1 | import time
 2 | 
 3 | 
 4 | 
 5 | 
 6 | class Throttled(object):
 7 |     def __init__(self, min_time_since_last_run_s=5):
 8 |         """Used for simple throttled execution.
 9 | 
10 |         Here's a simple example:
11 | 
12 |             @Throttled(1)
13 |             def lol(i):
14 |                 print('epoch %d' % (i,), flush=True)
15 | 
16 |             for i in range(100000000):
17 |                 lol(i)
18 | 
19 |         Above code will report the epoch every second.
20 | 
21 |         Here's another way:
22 | 
23 |             throttled = Throttled(1)
24 | 
25 | 
26 |             for i in range(100000000000):
27 |                 if throttled.should_i_run():
28 |                     print('epoch %d' % (i,), flush=True)
29 |         """
30 |         self.last_time = None
31 |         self.min_time_since_last_run_s = min_time_since_last_run_s
32 | 
33 | 
34 |     def should_i_run(self, min_time_since_last_run_s=None):
35 |         min_time_since_last_run_s = min_time_since_last_run_s or self.min_time_since_last_run_s
36 |         now = time.time()
37 |         if self.last_time is None or (now - self.last_time) > min_time_since_last_run_s:
38 |             self.last_time = now
39 |             return True
40 |         else:
41 |             return False
42 | 
43 |     def maybe_run(self, f, min_time_since_last_run_s=None):
44 |         if self.should_i_run(min_time_since_last_run_s):
45 |             return f()
46 |         else:
47 |             return None
48 | 
49 |     def __call__(self, f):
50 |         def wrapper(*args, **kwargs):
51 |             return self.maybe_run(lambda: f(*args, **kwargs))
52 |         return wrapper
53 | 


--------------------------------------------------------------------------------
/dali/utils/vocab.py:
--------------------------------------------------------------------------------
 1 | from dali.utils import apply_recursively_on_type
 2 | 
 3 | class VocabEncoded(int):
 4 |     pass
 5 | 
 6 | class Vocab(object):
 7 |     UNK = '**UNK**'
 8 |     EOS = '**EOS**'
 9 | 
10 |     def __init__(self, words=None, add_eos=True, add_unk=True):
11 |         self.index2word = []
12 |         self.word2index = {}
13 |         self.eos = None
14 |         self.unk = None
15 |         if add_unk:
16 |             self.add(Vocab.UNK)
17 |         if add_eos:
18 |             self.add(Vocab.EOS)
19 | 
20 |         if words:
21 |             self.add(words)
22 | 
23 | 
24 |     def __contains__(self, key):
25 |         if isinstance(key, int):
26 |             return key in range(len(self.index2word))
27 |         elif isinstance(key, str):
28 |             return key in self.word2index
29 |         else:
30 |             raise ValueError("expected(index or string)")
31 | 
32 |     def add(self, obj):
33 |         def add_f(word):
34 |             idx = self.word2index.get(word)
35 |             if idx is None:
36 |                 idx = len(self.index2word)
37 |                 self.index2word.append(word)
38 |                 self.word2index[word] = idx
39 |                 if word is Vocab.UNK:
40 |                     self.unk = idx
41 |                 if word is Vocab.EOS:
42 |                     self.eos = idx
43 |             return word
44 |         apply_recursively_on_type(obj, add_f, str)
45 | 
46 |     def words(self):
47 |         return self.word2index.keys()
48 | 
49 |     def __len__(self):
50 |         return len(self.index2word)
51 | 
52 |     def __getitem__(self, index):
53 |         if isinstance(index, int):
54 |             return self.index2word[index]
55 |         elif isinstance(index, str):
56 |             if self.unk is not None:
57 |                 return VocabEncoded(self.word2index.get(index) or self.unk)
58 |             else:
59 |                 return VocabEncoded(self.word2index[index])
60 |         else:
61 |             raise ValueError("expected(index or string)")
62 | 
63 |     def decode(self, obj, strip_eos=False, decode_type=int):
64 |         def decode_f(word_idx):
65 |             return self.index2word[word_idx]
66 |         def decode_list_f(lst):
67 |             if strip_eos:
68 |                 assert self.eos is not None
69 |                 return [el for el in lst if el != Vocab.EOS]
70 |             else:
71 |                 return lst
72 |         return apply_recursively_on_type(obj, decode_f, decode_type, list_callback=decode_list_f)
73 | 
74 |     def encode(self, obj, add_eos=False, encode_type=int):
75 |         def encode_f(word):
76 |             if self.unk is not None:
77 |                 return encode_type(self.word2index.get(word) or self.unk)
78 |             else:
79 |                 return encode_type(self.word2index[word])
80 |         def encode_list_f(lst):
81 |             lst = [encode_f(word) for word in lst]
82 |             if add_eos:
83 |                 assert self.eos is not None
84 |                 lst.append(VocabEncoded(self.eos))
85 |             return lst
86 |         return apply_recursively_on_type(obj, lambda x:x, str, list_callback=encode_list_f)
87 | 
88 | __all__ = [
89 |     "VocabEncoded","Vocab"
90 | ]
91 | 


--------------------------------------------------------------------------------
/examples/mlbasics_learn_to_add.py:
--------------------------------------------------------------------------------
 1 | from test_dali import Mat, random, MatOps, Graph
 2 | 
# Toy regression: fit a weight column W so that X.dot(W) matches X.dot(ones).

# Problem size and plain gradient-descent settings.
num_examples = 100
example_size = 3
iterations   = 150
lr           = 0.01

# Random inputs, bounded by 0.0 and 1.0 / example_size.
X = random.uniform(
    0.0,
    1.0 / example_size,
    size=(num_examples, example_size)
)
# Targets: X multiplied by a column of ones
# (presumably the per-row sum of X -- confirm `dot` is a matrix product).
ones = Mat.ones((X.shape[1], 1))
Y = X.dot(ones)

# NOTE(review): presumably stops gradients from flowing into the data -- confirm.
X = MatOps.consider_constant(X)
Y = MatOps.consider_constant(Y)

# Randomly initialised weights, printed before and after training.
W = random.uniform(-1.0, 1.0, (example_size, 1))
print(repr(W))
for i in range(iterations):
    predY = X.dot(W)
    # summed squared error between prediction and target
    error = ((predY - Y) ** 2).sum()
    print(repr(error))
    # line below can be replaced by simply error.grad()
    error.dw += 1
    Graph.backward()
    # there are much nicer solvers in Dali,
    # but here we write out gradient descent
    # explicitly
    W.w -= W.dw * lr
    # reset the gradient before the next iteration
    W.dw = 0
print(repr(W))
34 | 


--------------------------------------------------------------------------------
/examples/mlbasics_rnn_binary_addition.py:
--------------------------------------------------------------------------------
 1 | import sys
 2 | from os.path import dirname, realpath
 3 | sys.path.append(dirname(dirname(realpath(__file__))))
 4 | 
 5 | import random
 6 | from test_dali import Mat, MatOps, Graph, SGD, RNN, Layer
 7 | 
 8 | def as_bytes(num, final_size):
 9 |     res = []
10 |     for _ in range(final_size):
11 |         res.append(num % 2)
12 |         num //= 2
13 |     return res
14 | 
def generate_example(num_bits):
    """Draw two random addends and return `(a, b, a + b)` as `num_bits`-digit bit lists.

    Both addends are drawn from `[0, 2**(num_bits - 1) - 1]`.
    """
    upper = 2**(num_bits - 1) - 1
    a = random.randint(0, upper)
    b = random.randint(0, upper)
    total = a + b
    return tuple(as_bytes(value, num_bits) for value in (a, b, total))
22 | 
# Training configuration.
ITERATIONS_PER_EPOCH = 30
NUM_BITS             = 30
INPUT_SIZE           = 2
OUTPUT_SIZE          = 1
MEMORY_SIZE          = 5
MAX_EPOCHS           = 5000

# Model: a recurrent layer, a classifier on its hidden state, and the
# initial hidden state (which is trained too -- see `params` below).
rnn                  = RNN(INPUT_SIZE, MEMORY_SIZE)
classifier           = Layer(MEMORY_SIZE, OUTPUT_SIZE)
rnn_initial          = Mat(1, MEMORY_SIZE)

solver               = SGD()
solver.step_size     = 0.001
params               = rnn.parameters() + classifier.parameters() + [rnn_initial]

for epoch in range(MAX_EPOCHS):
    for _ in range(ITERATIONS_PER_EPOCH):
        a, b, res = generate_example(NUM_BITS)
        error = Mat.zeros((1,1))
        prev_hidden = rnn_initial
        # Feed the two addends one bit position at a time, least significant
        # bit first (the order produced by as_bytes), and accumulate the
        # cross-entropy against the corresponding bit of the sum.
        for bit_idx in range(NUM_BITS):
            input_i = Mat([a[bit_idx], b[bit_idx]], dtype=rnn.dtype)
            prev_hidden = rnn.activate(input_i, prev_hidden).tanh()
            #prev_hidden = (rnn.Wx.dot(input_i) + rnn.Wh.dot(prev_hidden) + rnn.b).tanh()
            output_i    = classifier.activate(prev_hidden).sigmoid()
            # print(repr(output_i))
            error = error + MatOps.binary_cross_entropy(output_i, res[bit_idx])
        error.grad()
        Graph.backward()
    # `error` here is the value from the last example of the epoch only.
    if epoch % 20 == 0:
        print("epoch %d, error = %.3f" % (epoch, error.w[0,0]))
    # One solver step per epoch, after all of the epoch's backward passes
    # (presumably gradients accumulate across them -- TODO confirm).
    solver.step(params)
55 | 


--------------------------------------------------------------------------------
/examples/translation/predict.py:
--------------------------------------------------------------------------------
 1 | import argparse
 2 | import random
 3 | import math
 4 | 
 5 | from dali.utils import (
 6 |     set_device_from_args,
 7 |     add_device_args,
 8 |     unpickle_as_dict,
 9 | )
10 | from dali.data.utils import split_punctuation
11 | 
12 | from translation import TranslationModel
13 | 
def parse_args():
    """Parse the command-line options of the prediction script.

    Returns:
        The argparse namespace with the device options plus `path`,
        `beam_width`, `max_output_length` and `show_beams`.
    """
    parser = argparse.ArgumentParser()
    add_device_args(parser)
    # `required` takes a boolean; the string 'True' only worked because any
    # non-empty string is truthy.
    parser.add_argument("--path",              type=str,  required=True,    help="Path to saved model")
    parser.add_argument("--beam_width",        type=int,  default=5,        help="Beam width used when prediction")
    parser.add_argument("--max_output_length", type=int,  default=40,       help="Maximum number of words in the translation")
    parser.add_argument("--show_beams",        action='store_true', default=False,
                                               help="If true shows all the beams and probabilities")

    return parser.parse_args()
24 | 
def show_reconstructions(model, example_pair, vocabs, max_sentence_length):
    """Print a sentence pair after an encode/decode round trip through its vocab.

    `model` and `max_sentence_length` are accepted but not used here.
    """
    from_words, to_words = example_pair
    from_vocab, to_vocab = vocabs

    def round_trip(vocab, words):
        # encode then decode, so out-of-vocabulary words show up as decoded
        return ' '.join(vocab.decode(vocab.encode(words)))

    from_with_unk = round_trip(from_vocab, from_words)
    to_with_unk = round_trip(to_vocab, to_words)
    for line in ('TRANSLATING: %s' % from_with_unk,
                 'REFERENCE:   %s' % to_with_unk,
                 ''):
        print(line)
33 | 
34 | 
def main(args):
    """Interactive translation loop: read sentences from stdin, print translations.

    Loads the pickled "model" and "vocabs" from `args.path`, then translates
    one input line at a time until stdin is exhausted.
    """
    set_device_from_args(args)

    RELEVANT_VARIABLES = ["model", "vocabs"]
    loaded = unpickle_as_dict(args.path, RELEVANT_VARIABLES)
    model = loaded["model"]
    from_vocab, to_vocab = loaded["vocabs"]

    while True:
        try:
            line = input()
        except EOFError:
            # stdin closed (Ctrl-D or end of piped input): finish cleanly
            # instead of dying with a traceback.
            break
        from_sentence = split_punctuation(line).split(' ')
        # The source sentence is fed to the model reversed.
        encoded       = from_vocab.encode(list(reversed(from_sentence)), add_eos=False)

        beams = model.predict(encoded,
                              eos_symbol=to_vocab.eos,
                              max_sequence_length=args.max_output_length + 1,
                              beam_width=args.beam_width)

        if args.show_beams:
            for solution, score, _ in beams:
                score = math.exp(score.w[0])
                # reveal the unks
                solution = ' '.join(to_vocab.decode(solution, strip_eos=True))
                # NOTE(review): `solution` is already a decoded string here, so
                # this second decode looks redundant -- confirm and simplify.
                print('%f => %s' % (score, to_vocab.decode(solution, True)))
        else:
            print(' '.join(to_vocab.decode(beams[0].solution, strip_eos=True)))
60 | 
61 | 
62 | 
63 | if __name__ == '__main__':
64 |     main(parse_args())
65 | 


--------------------------------------------------------------------------------
/examples/translation/train.py:
--------------------------------------------------------------------------------
  1 | import argparse
  2 | import dali.core as D
  3 | from dali.data import Lines, Process, DiscoverFiles, BatchBenefactor, IdentityReducer
  4 | from dali.data.batch import TranslationBatch
  5 | from dali.data.translation import TranslationFiles, TranslationMapper, build_vocabs, iterate_examples
  6 | from dali.utils.scoring import bleu, ErrorTracker
  7 | from dali.utils import (
  8 |     Vocab,
  9 |     Solver,
 10 |     median_smoothing,
 11 |     subsample,
 12 |     Throttled,
 13 |     pickle_from_scope,
 14 |     unpickle_as_dict,
 15 |     set_device_from_args,
 16 |     add_device_args,
 17 | )
 18 | import math
 19 | import os
 20 | import sys
 21 | import time
 22 | import random
 23 | 
 24 | 
 25 | from translation import TranslationModel
 26 | 
 27 | def parse_args():
 28 |     parser = argparse.ArgumentParser()
 29 |     # device
 30 |     add_device_args(parser)
 31 | 
 32 |     # paths and data
 33 |     parser.add_argument("--train",     type=str, required=True)
 34 |     parser.add_argument("--validate",  type=str, required=True)
 35 |     parser.add_argument("--save",      type=str, default=None)
 36 |     parser.add_argument("--from_lang", type=str, required=True)
 37 |     parser.add_argument("--to_lang",   type=str, required=True)
 38 |     parser.add_argument("--max_from_vocab", type=int, default=20000)
 39 |     parser.add_argument("--max_to_vocab",   type=int, default=20000)
 40 | 
 41 |     # training
 42 |     parser.add_argument("--minibatch",           type=int, default=64)
 43 |     parser.add_argument("--max_sentence_length", type=int, default=40)
 44 | 
 45 |     # model
 46 |     parser.add_argument("--input_size",   type=int, default=512)
 47 |     parser.add_argument("--hidden_sizes", type=int, nargs='+', default=[512,512,512,512])
 48 | 
 49 |     # solver
 50 |     parser.add_argument("--solver_type",   type=str,   default="sgd")
 51 |     parser.add_argument("--learning_rate", type=float, default=0.003)
 52 | 
 53 |     return parser.parse_args()
 54 | 
 55 | def load_raw_validation(path, from_lang, to_lang, max_sentence_length):
 56 |     """List of validation sentences as strings.
 57 | 
 58 |     Used for reconstructions and BLEU.
 59 |     """
 60 |     p = Process(files=TranslationFiles(path, from_lang, to_lang),
 61 |             mapper=TranslationMapper(sentence_bounds=(0, max_sentence_length)),
 62 |             reducer=IdentityReducer())
 63 |     return list(p)
 64 | 
 65 | def show_reconstructions(model, example_pair, vocabs, max_sentence_length):
 66 |     from_words, to_words = example_pair
 67 |     from_vocab, to_vocab = vocabs
 68 |     from_with_unk = ' '.join(from_vocab.decode(from_vocab.encode(from_words)))
 69 |     to_with_unk   = ' '.join(to_vocab.decode(to_vocab.encode(to_words)))
 70 |     print('TRANSLATING: %s' % from_with_unk)
 71 |     print('REFERENCE:   %s' % to_with_unk)
 72 |     print('')
 73 |     for solution, score, _ in model.predict(from_vocab.encode(list(reversed(from_words)), add_eos=False),
 74 |                                            eos_symbol=to_vocab.eos,
 75 |                                            max_sequence_length=max_sentence_length + 1):
 76 |         score = math.exp(score.w[0])
 77 |         # reveal the unks
 78 |         solution = ' '.join(to_vocab.decode(solution, False))
 79 |         print('    %f => %s' % (score, to_vocab.decode(solution, True)))
 80 | 
 81 | def main(args):
 82 |     set_device_from_args(args, verbose=True)
 83 | 
 84 |     ############### MODEL/DATA LOADING ####################
 85 | 
 86 |     RELEVANT_VARIABLES = ["model", "vocabs", "solver", "data", "train_error", "validate_error"]
 87 | 
 88 |     if args.save is not None and os.path.exists(args.save):
 89 |         print("Resuming saved experiment at %s." % (args.save,))
 90 |         loaded = unpickle_as_dict(args.save)
 91 |         model, vocabs, solver, data, train_error, validate_error = [loaded[x] for x in RELEVANT_VARIABLES]
 92 |         solver.parameters = model.parameters()
 93 |     else:
 94 |         print("Loading vocabs - for monstrous datasets hit ctrl+C after you feel like probably enough words have been sampled.")
 95 |         vocabs = build_vocabs(args.train, args.from_lang, args.to_lang,
 96 |                               from_max_size=args.max_from_vocab,
 97 |                               to_max_size=args.max_to_vocab)
 98 |         print("Creating model")
 99 |         model  = TranslationModel(args.input_size,
100 |                                   args.hidden_sizes,
101 |                                   len(vocabs[0]),
102 |                                   len(vocabs[1]))
103 |         model.name_parameters("model")
104 |         solver = Solver(model.parameters(), args.solver_type, learning_rate=args.learning_rate)
105 | 
106 |         solver.set_lr_multiplier("model.encoder_embedding", 2)
107 |         solver.set_lr_multiplier("model.decoder_embedding", 2)
108 | 
109 |         data             = []
110 |         train_error      = ErrorTracker()
111 |         validate_error   = ErrorTracker()
112 | 
113 |     from_vocab, to_vocab = vocabs
114 | 
115 |     print("Input size:   ",        args.input_size)
116 |     print("Hidden sizes: ",        args.hidden_sizes)
117 |     print("max sentence length: ", args.max_sentence_length)
118 | 
119 |     print (args.from_lang + " vocabulary containts", len(from_vocab), "words")
120 |     print (args.to_lang   + " vocabulary containts", len(to_vocab),   "words")
121 | 
122 | 
123 |     def create_dataset_iterator(dataset, sentences_until_minibatch):
124 |         return iterate_examples(dataset, args.from_lang, args.to_lang, vocabs,
125 |                                 minibatch_size=args.minibatch,
126 |                                 sentence_length_bounds=(0, args.max_sentence_length),
127 |                                 sentences_until_minibatch=sentences_until_minibatch)
128 | 
129 | 
130 |     validation_pairs_text = load_raw_validation(args.validate, args.from_lang, args.to_lang, args.max_sentence_length)
131 |     validation_batches    = list(create_dataset_iterator(args.validate, args.minibatch))
132 | 
133 | 
134 |     t = Throttled(10)
135 | 
136 |     while True:
137 |         total_time  = 0.0
138 |         num_words, num_batches = 0, 0
139 | 
140 |         if solver.solver_type == 'adagrad':
141 |             solver.reset_caches(params)
142 | 
143 |         for batch in data:
144 |             batch_start_time = time.time()
145 |             error = model.error(batch)
146 |             (error / batch.examples).grad()
147 |             D.Graph.backward()
148 | 
149 |             solver.step()
150 |             batch_end_time = time.time()
151 | 
152 |             train_error.append(error / batch.to_tokens)
153 | 
154 |             total_time += batch_end_time - batch_start_time
155 |             num_words   += batch.from_tokens + batch.to_tokens
156 |             num_batches += 1
157 | 
158 |             if num_batches % 10 == 0:
159 |                 val_batch = random.choice(validation_batches)
160 |                 with D.NoBackprop():
161 |                     validate_error.append(model.error(val_batch) / val_batch.to_tokens)
162 | 
163 |             if t.should_i_run() and num_batches > 0 and abs(total_time) > 1e-6:
164 |                 print('Epochs completed:  ', train_error.num_epochs())
165 |                 print('Error:             ', train_error.recent(10))
166 |                 print('Time per batch:    ', total_time  / num_batches)
167 |                 print('Words per second:  ', num_words   / total_time )
168 |                 print('Batches processed: ', num_batches)
169 |                 if hasattr(solver, 'step_size'):
170 |                     print('Solver step size:  ', solver.step_size)
171 |                 show_reconstructions(model, random.choice(validation_pairs_text), vocabs, args.max_sentence_length)
172 |                 sys.stdout.flush()
173 | 
174 |             # free memory as soon as possible
175 |             del batch
176 | 
177 |         train_error.finalize_epoch()
178 |         validate_error.finalize_epoch()
179 |         if train_error.num_epochs() > 0 and args.save is not None:
180 |             print("Saving model to %s." % (args.save,))
181 |             pickle_from_scope(args.save, RELEVANT_VARIABLES)
182 | 
183 |         data = create_dataset_iterator(args.train, 1000 * args.minibatch)
184 | 
if __name__ == '__main__':
    # Script entry point: read the command-line flags, then start training.
    cli_args = parse_args()
    main(cli_args)
187 | 


--------------------------------------------------------------------------------
/examples/translation/translation.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | 
 3 | import dali.core as D
 4 | import dali
 5 | 
 6 | from dali import beam_search
 7 | 
 8 | class TranslationModel(object):
 9 |     def __init__(self, input_size, hiddens,
10 |                        encoder_vocab_size, decoder_vocab_size,
11 |                        softmax_input_size=None, dtype=np.float32):
12 |         self.input_size = input_size
13 |         self.hiddens    = hiddens
14 |         self.encoder_vocab_size = encoder_vocab_size
15 |         self.decoder_vocab_size = decoder_vocab_size
16 |         self.softmax_input_size = softmax_input_size
17 |         self.dtype = dtype
18 | 
19 |         self.encoder_embedding = D.random.uniform(-0.05, 0.05, (encoder_vocab_size, input_size), dtype=dtype)
20 |         self.decoder_embedding = D.random.uniform(-0.05, 0.05, (decoder_vocab_size, input_size), dtype=dtype)
21 | 
22 |         self.encoder_lstm    = D.StackedLSTM(input_size, hiddens, memory_feeds_gates=True, dtype=dtype)
23 |         self.decoder_lstm    = D.StackedLSTM(input_size, hiddens, memory_feeds_gates=True, dtype=dtype)
24 | 
25 |         if self.softmax_input_size is not None:
26 |             self.predecoder = D.StackedInputLayer(self.hiddens, self.softmax_input_size)
27 |             self.decoder = D.Layer(self.softmax_input_size, decoder_vocab_size, dtype=dtype)
28 |         else:
29 |             self.decoder = D.Layer(hiddens[-1], decoder_vocab_size, dtype=dtype)
30 | 
31 |     def decode_state(self, state):
32 |         if self.softmax_input_size is not None:
33 |             decoder_input = self.predecoder.activate([s.hidden for s in state])
34 |         else:
35 |             decoder_input = state[-1].hidden
36 |         return self.decoder.activate(decoder_input)
37 | 
38 |     def error(self, batch):
39 |         error = D.Mat(1,1)
40 |         state = self.encoder_lstm.initial_states()
41 |         for ts in range(batch.timesteps):
42 |             inputs  = batch.inputs(ts)
43 |             targets = batch.targets(ts)
44 |             if ts < batch.from_timesteps:
45 |                 assert targets is None
46 |                 encoded = self.encoder_embedding[inputs]
47 |                 state = self.encoder_lstm.activate(encoded, state)
48 |             else:
49 |                 assert inputs is None
50 |                 decoded = self.decode_state(state)
51 |                 # mask the error - only for the relevant sentences
52 |                 tstep_error = batch.masks(ts).T() * D.MatOps.softmax_cross_entropy(decoded, targets)
53 |                 #tstep_error = D.MatOps.softmax_cross_entropy(decoded, targets)
54 |                 error = error + tstep_error.sum()
55 |                 # feedback the predictions
56 |                 if ts + 1 != batch.timesteps:
57 |                     # for the last timestep encoding is not necessary
58 |                     encoded = self.decoder_embedding[targets]
59 |                     state = self.decoder_lstm.activate(encoded, state)
60 | 
61 |         return error
62 | 
63 |     def predict(self, input_sentence, **kwargs):
64 |         with D.NoBackprop():
65 |             state = self.encoder_lstm.initial_states()
66 |             for word_idx in input_sentence:
67 |                 encoded = self.encoder_embedding[word_idx]
68 |                 state = self.encoder_lstm.activate(encoded, state)
69 |             def candidate_scores(state):
70 |                 decoded = self.decode_state(state)
71 |                 return D.MatOps.softmax(decoded).log()
72 |             def make_choice(state, candidate_idx):
73 |                 encoded = self.decoder_embedding[candidate_idx]
74 |                 return self.decoder_lstm.activate(encoded, state)
75 | 
76 |             return beam_search(state,
77 |                                candidate_scores,
78 |                                make_choice,
79 |                                **kwargs)
80 | 
81 |     def parameters(self):
82 |         ret = ([self.encoder_embedding,
83 |                self.decoder_embedding]
84 |             + self.encoder_lstm.parameters()
85 |             + self.decoder_lstm.parameters()
86 |             + self.decoder.parameters())
87 |         if self.softmax_input_size is not None:
88 |             ret.extend(self.predecoder.parameters())
89 |         return ret
90 | 
91 |     def name_parameters(self, prefix):
92 |         self.encoder_embedding.name = prefix + ".encoder_embedding"
93 |         self.decoder_embedding.name = prefix + ".decoder_embedding"
94 |         self.encoder_lstm.name_parameters(prefix + ".encoder_lstm")
95 |         self.decoder_lstm.name_parameters(prefix + ".decoder_lstm")
96 |         self.decoder.name_parameters(prefix + ".decoder")
97 |         if self.softmax_input_size is not None:
98 |             self.predecoder.name_parameters(prefix + ".predecoder")
99 | 


--------------------------------------------------------------------------------
/libcpp11/__init__.pxd:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/dali-ml/dali-cython/e258469aeb1d4cb3e4cdf5c07e8948f461a038f1/libcpp11/__init__.pxd


--------------------------------------------------------------------------------
/libcpp11/memory.pxd:
--------------------------------------------------------------------------------
 1 | from libcpp cimport bool
 2 | 
# Cython declarations for the smart pointer templates of the C++ <memory>
# header: unique_ptr, shared_ptr and weak_ptr. Everything is declared nogil.
cdef extern from "<memory>" namespace "std" nogil:
    ctypedef void* nullptr_t; # Should be decltype(nullptr)

    # std::unique_ptr<T>
    cdef cppclass unique_ptr[T]:
        # Constructors: empty, from nullptr, from a raw pointer, and from
        # another unique_ptr.
        unique_ptr()
        unique_ptr(nullptr_t)
        unique_ptr(T*)
        unique_ptr(unique_ptr[T]&)

        # Modifiers
        T* release()
        void reset()
        void reset(nullptr_t)
        void reset(T*)
        void swap(unique_ptr&)

        # Observers
        T* get()
        T& operator*()
        #T* operator->() # Not Supported
        #bool operator bool() # Not Supported

        # Comparisons against another unique_ptr
        bool operator==(const unique_ptr&)
        bool operator!=(const unique_ptr&)
        bool operator<(const unique_ptr&)
        bool operator>(const unique_ptr&)
        bool operator<=(const unique_ptr&)
        bool operator>=(const unique_ptr&)

        # Comparisons against nullptr
        bool operator==(nullptr_t)
        bool operator!=(nullptr_t)


    # Forward Declaration not working ("Compiler crash in AnalyseDeclarationsTransform")
    #cdef cppclass weak_ptr[T]

    # std::shared_ptr<T>; because weak_ptr cannot be forward declared (see
    # above), the members that would take a weak_ptr are commented out.
    cdef cppclass shared_ptr[T]:
        # Constructors: empty, from nullptr, from a raw pointer, from another
        # shared_ptr (with or without a separate raw pointer), and from a
        # unique_ptr.
        shared_ptr()
        shared_ptr(nullptr_t)
        shared_ptr(T*)
        shared_ptr(shared_ptr[T]&)
        shared_ptr(shared_ptr[T]&, T*)
        shared_ptr(unique_ptr[T]&)
        #shared_ptr(weak_ptr[T]&) # Not Supported

        # Modifiers
        void reset()
        void reset(T*)
        void swap(shared_ptr&)

        # Observers
        T* get()
        T& operator*()
        #T* operator->() # Not Supported
        long use_count()
        bool unique()
        #bool operator bool() # Not Supported
        #bool owner_before[Y](const weak_ptr[Y]&) # Not Supported
        bool owner_before[Y](const shared_ptr[Y]&)

        # Comparisons against another shared_ptr
        bool operator==(const shared_ptr&)
        bool operator!=(const shared_ptr&)
        bool operator<(const shared_ptr&)
        bool operator>(const shared_ptr&)
        bool operator<=(const shared_ptr&)
        bool operator>=(const shared_ptr&)

        # Comparisons against nullptr
        bool operator==(nullptr_t)
        bool operator!=(nullptr_t)


    # std::weak_ptr<T>; declared after shared_ptr because lock() returns one.
    cdef cppclass weak_ptr[T]:
        # Constructors: empty, from another weak_ptr, and from a shared_ptr.
        weak_ptr()
        weak_ptr(weak_ptr[T]&)
        weak_ptr(shared_ptr[T]&)

        # Modifiers
        void reset()
        void swap(weak_ptr&)

        # Observers
        long use_count()
        bool expired()
        shared_ptr[T] lock()
        bool owner_before[Y](const weak_ptr[Y]&)
        bool owner_before[Y](const shared_ptr[Y]&)
89 | 
90 | 


--------------------------------------------------------------------------------
/libcpp11/stringstream.pxd:
--------------------------------------------------------------------------------
 1 | from libcpp.string cimport string
 2 | 
# Cython declaration of std::stringstream from the C++ <sstream> header.
cdef extern from "<sstream>" namespace "std" nogil:
    cdef cppclass stringstream:
        # Every `push` overload below is bound to the C++ name "operator<<";
        # there is one overload per listed argument type, and each returns
        # a stringstream reference.
        stringstream& push "operator<<" (bint val);
        stringstream& push "operator<<" (short val);
        stringstream& push "operator<<" (unsigned short val);
        stringstream& push "operator<<" (int val);
        stringstream& push "operator<<" (unsigned int val);
        stringstream& push "operator<<" (long val);
        stringstream& push "operator<<" (unsigned long val);
        stringstream& push "operator<<" (float val);
        stringstream& push "operator<<" (double val);
        stringstream& push "operator<<" (long double val);
        stringstream& push "operator<<" (void* val);
        # default constructor
        stringstream()
        # `to_string` is bound to the C++ member "str" and returns a string
        string to_string "str" () const
18 | 


--------------------------------------------------------------------------------
/libcpp11/unordered_map.pxd:
--------------------------------------------------------------------------------
 1 | from libcpp.utility cimport pair
 2 | 
# Cython declaration of std::unordered_map<T, U> from <unordered_map>.
# T is the key type and U the mapped type (see operator[] and at()).
#
# NOTE(review): several members below (reverse iterators with rbegin/rend,
# lower_bound/upper_bound, and the <, >, <=, >= operators) look inherited
# from an ordered-map declaration -- confirm against the C++ reference that
# std::unordered_map really provides them before relying on any of them.
cdef extern from "<unordered_map>" namespace "std" nogil:
    cdef cppclass unordered_map[T, U]:
        # Iterator whose dereference is a (key, value) pair.
        cppclass iterator:
            pair[T, U]& operator*()
            iterator operator++()
            iterator operator--()
            bint operator==(iterator)
            bint operator!=(iterator)
        # NOTE(review): ++ and -- are declared as returning `iterator`, not
        # `reverse_iterator` -- verify.
        cppclass reverse_iterator:
            pair[T, U]& operator*()
            iterator operator++()
            iterator operator--()
            bint operator==(reverse_iterator)
            bint operator!=(reverse_iterator)
        # The const iterator types are declared as plain subclasses of the
        # mutable ones, with no members of their own.
        cppclass const_iterator(iterator):
            pass
        cppclass const_reverse_iterator(reverse_iterator):
            pass
        # Constructors; `except +` turns a C++ exception into a Python one.
        unordered_map() except +
        unordered_map(unordered_map&) except +
        #unordered_map(key_compare&)
        # Element access by key.
        U& operator[](T&)
        #unordered_map& operator=(unordered_map&)
        # Whole-container comparisons.
        bint operator==(unordered_map&, unordered_map&)
        bint operator!=(unordered_map&, unordered_map&)
        bint operator<(unordered_map&, unordered_map&)
        bint operator>(unordered_map&, unordered_map&)
        bint operator<=(unordered_map&, unordered_map&)
        bint operator>=(unordered_map&, unordered_map&)
        # Element access by key; declared `except +`, unlike operator[].
        U& at(T&) except +
        # The const_* names are Cython-side aliases bound to the same C++
        # member name given in quotes.
        iterator begin()
        const_iterator const_begin "begin"()
        void clear()
        size_t count(T&)
        bint empty()
        iterator end()
        const_iterator const_end "end"()
        pair[iterator, iterator] equal_range(T&)
        #pair[const_iterator, const_iterator] equal_range(key_type&)
        # Removal by position, by iterator range, or by key.
        void erase(iterator)
        void erase(iterator, iterator)
        size_t erase(T&)
        iterator find(T&)
        const_iterator const_find "find"(T&)
        # Insertion takes the pair by value here (see the XXX markers).
        pair[iterator, bint] insert(pair[T, U]) # XXX pair[T,U]&
        iterator insert(iterator, pair[T, U]) # XXX pair[T,U]&
        #void insert(input_iterator, input_iterator)
        #key_compare key_comp()
        iterator lower_bound(T&)
        const_iterator const_lower_bound "lower_bound"(T&)
        size_t max_size()
        reverse_iterator rbegin()
        const_reverse_iterator const_rbegin "rbegin"()
        reverse_iterator rend()
        const_reverse_iterator const_rend "rend"()
        size_t size()
        void swap(unordered_map&)
        iterator upper_bound(T&)
        const_iterator const_upper_bound "upper_bound"(T&)
        #value_compare value_comp()
        # Setter and getter overloads of max_load_factor.
        void max_load_factor(float)
        float max_load_factor()
65 | 


--------------------------------------------------------------------------------
/libcpp11/vector.pxd:
--------------------------------------------------------------------------------
 1 | cdef extern from "<vector>" namespace "std" nogil:
 2 |     cdef cppclass vector[T]:
 3 |         cppclass iterator:
 4 |             T& operator*()
 5 |             iterator operator++()
 6 |             iterator operator--()
 7 |             iterator operator+(size_t)
 8 |             iterator operator-(size_t)
 9 |             bint operator==(iterator)
10 |             bint operator!=(iterator)
11 |             bint operator<(iterator)
12 |             bint operator>(iterator)
13 |             bint operator<=(iterator)
14 |             bint operator>=(iterator)
15 |         cppclass reverse_iterator:
16 |             T& operator*()
17 |             iterator operator++()
18 |             iterator operator--()
19 |             iterator operator+(size_t)
20 |             iterator operator-(size_t)
21 |             bint operator==(reverse_iterator)
22 |             bint operator!=(reverse_iterator)
23 |             bint operator<(reverse_iterator)
24 |             bint operator>(reverse_iterator)
25 |             bint operator<=(reverse_iterator)
26 |             bint operator>=(reverse_iterator)
27 |         cppclass const_iterator(iterator):
28 |             pass
29 |         cppclass const_reverse_iterator(reverse_iterator):
30 |             pass
31 |         vector() except +
32 |         vector(vector&) except +
33 |         vector(size_t) except +
34 |         vector(size_t, T&) except +
35 |         #vector[input_iterator](input_iterator, input_iterator)
36 |         T& operator[](size_t)
37 |         #vector& operator=(vector&)
38 |         bint operator==(vector&, vector&)
39 |         bint operator!=(vector&, vector&)
40 |         bint operator<(vector&, vector&)
41 |         bint operator>(vector&, vector&)
42 |         bint operator<=(vector&, vector&)
43 |         bint operator>=(vector&, vector&)
44 |         void assign(size_t, const T&)
45 |         void assign[input_iterator](input_iterator, input_iterator) except +
46 |         T& at(size_t) except +
47 |         T& back()
48 |         iterator begin()
49 |         const_iterator const_begin "begin"()
50 |         size_t capacity()
51 |         void clear()
52 |         bint empty()
53 |         iterator end()
54 |         const_iterator const_end "end"()
55 |         iterator erase(iterator)
56 |         iterator erase(iterator, iterator)
57 |         T& front()
58 |         iterator insert(iterator, const T&) except +
59 |         void insert(iterator, size_t, const T&) except +
60 |         void insert[Iter](iterator, Iter, Iter) except +
61 |         size_t max_size()
62 |         void pop_back()
63 |         void push_back(T&) except +
64 |         reverse_iterator rbegin()
65 |         const_reverse_iterator const_rbegin "rbegin"()
66 |         reverse_iterator rend()
67 |         const_reverse_iterator const_rend "rend"()
68 |         void reserve(size_t)
69 |         void resize(size_t) except +
70 |         void resize(size_t, T&) except +
71 |         size_t size()
72 |         void swap(vector&)
73 | 
74 |         # C++11 methods
75 |         T* data()
76 |         void shrink_to_fit()
77 | 


--------------------------------------------------------------------------------
/notebooks/LSTM.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "code",
  5 |    "execution_count": 1,
  6 |    "metadata": {
  7 |     "collapsed": false
  8 |    },
  9 |    "outputs": [],
 10 |    "source": [
 11 |     "import sys\n",
 12 |     "sys.path.append('..')"
 13 |    ]
 14 |   },
 15 |   {
 16 |    "cell_type": "code",
 17 |    "execution_count": 2,
 18 |    "metadata": {
 19 |     "collapsed": false
 20 |    },
 21 |    "outputs": [],
 22 |    "source": [
 23 |     "from dali.core import LSTM, Mat, LSTMState, StackedLSTM\n",
 24 |     "\n",
 25 |     "import pickle\n",
 26 |     "import random\n",
 27 |     "import matplotlib.pyplot as plt\n",
 28 |     "%matplotlib inline"
 29 |    ]
 30 |   },
 31 |   {
 32 |    "cell_type": "code",
 33 |    "execution_count": 3,
 34 |    "metadata": {
 35 |     "collapsed": false
 36 |    },
 37 |    "outputs": [
 38 |     {
 39 |      "name": "stdout",
 40 |      "output_type": "stream",
 41 |      "text": [
 42 |       "float32\n",
 43 |       "[[ 1.  2.  3.]]\n",
 44 |       "[[ 4.  2.  1.]]\n"
 45 |      ]
 46 |     }
 47 |    ],
 48 |    "source": [
 49 |     "s = LSTMState(Mat([1,2,3]), Mat([4,2,1]))\n",
 50 |     "print(s.dtype)\n",
 51 |     "print(s.memory.w)\n",
 52 |     "print(s.hidden.w)"
 53 |    ]
 54 |   },
 55 |   {
 56 |    "cell_type": "code",
 57 |    "execution_count": 4,
 58 |    "metadata": {
 59 |     "collapsed": false
 60 |    },
 61 |    "outputs": [],
 62 |    "source": [
 63 |     "l = LSTM(2, 5)"
 64 |    ]
 65 |   },
 66 |   {
 67 |    "cell_type": "code",
 68 |    "execution_count": 5,
 69 |    "metadata": {
 70 |     "collapsed": false,
 71 |     "scrolled": true
 72 |    },
 73 |    "outputs": [
 74 |     {
 75 |      "name": "stdout",
 76 |      "output_type": "stream",
 77 |      "text": [
 78 |       "[\n",
 79 |       "    [  1.000   2.000]\n",
 80 |       "]\n",
 81 |       "\n",
 82 |       "[\n",
 83 |       "    [  0.000   0.000   0.000   0.000   0.000]\n",
 84 |       "]\n",
 85 |       "\n",
 86 |       "[\n",
 87 |       "    [  0.000   0.000   0.000   0.000   0.000]\n",
 88 |       "]\n",
 89 |       "\n",
 90 |       "[\n",
 91 |       "    [  0.150   0.075   0.142  -0.004  -0.001]\n",
 92 |       "]\n",
 93 |       "\n",
 94 |       "[\n",
 95 |       "    [  0.212   0.312   0.254  -0.008  -0.002]\n",
 96 |       "]\n",
 97 |       "\n"
 98 |      ]
 99 |     }
100 |    ],
101 |    "source": [
102 |     "i = Mat([[1, 2]])\n",
103 |     "h = l.initial_states()\n",
104 |     "print(i.__repr__())\n",
105 |     "print(h.hidden.__repr__())\n",
106 |     "print(h.memory.__repr__())\n",
107 |     "h = l.activate(i, h)\n",
108 |     "print(h.hidden.__repr__())\n",
109 |     "print(h.memory.__repr__())"
110 |    ]
111 |   },
112 |   {
113 |    "cell_type": "code",
114 |    "execution_count": 8,
115 |    "metadata": {
116 |     "collapsed": false
117 |    },
118 |    "outputs": [
119 |     {
120 |      "name": "stdout",
121 |      "output_type": "stream",
122 |      "text": [
123 |       "Activate sequence for 3 different inputs states and one hidden states\n",
124 |       "[[ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]\n",
125 |       " [ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]\n",
126 |       " [ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]]\n",
127 |       "Activate sequence for 3 different hidden states and three different inputs\n",
128 |       "[[ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]\n",
129 |       " [ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]\n",
130 |       " [ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]]\n",
131 |       "Activate sequence for 3 different hidden states and one input (!)\n",
132 |       "[[ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]\n",
133 |       " [ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]\n",
134 |       " [ 0.31556997 -0.05376546 -0.0430177  -0.00521236 -0.29317772]]\n"
135 |      ]
136 |     }
137 |    ],
138 |    "source": [
139 |     "print(\"Activate sequence for 3 different inputs states and one hidden states\")\n",
140 |     "r1 = l.activate_sequence([Mat(3, 2) for i in range(10)], l.initial_states()).memory\n",
141 |     "print(r1.w)\n",
142 |     "print(\"Activate sequence for 3 different hidden states and three different inputs\")\n",
143 |     "r2 = l.activate_sequence([Mat(3, 2) for i in range(10)], LSTMState(Mat(3,5), Mat(3,5))).memory\n",
144 |     "print(r2.w)\n",
145 |     "print(\"Activate sequence for 3 different hidden states and one input (!)\")\n",
146 |     "r3 = l.activate_sequence([Mat(1, 2) for i in range(10)], LSTMState(Mat(3,5), Mat(3,5))).memory\n",
147 |     "print(r3.w)"
148 |    ]
149 |   },
150 |   {
151 |    "cell_type": "code",
152 |    "execution_count": 9,
153 |    "metadata": {
154 |     "collapsed": false
155 |    },
156 |    "outputs": [],
157 |    "source": [
158 |     "INPUTS = [2,3]\n",
159 |     "HIDDEN_SIZE = 5\n",
160 |     "NUM_CHILDREN = 3"
161 |    ]
162 |   },
163 |   {
164 |    "cell_type": "code",
165 |    "execution_count": 10,
166 |    "metadata": {
167 |     "collapsed": true
168 |    },
169 |    "outputs": [],
170 |    "source": [
171 |     "l = LSTM(INPUTS, HIDDEN_SIZE, NUM_CHILDREN, memory_feeds_gates=True)"
172 |    ]
173 |   },
174 |   {
175 |    "cell_type": "code",
176 |    "execution_count": 11,
177 |    "metadata": {
178 |     "collapsed": false
179 |    },
180 |    "outputs": [
181 |     {
182 |      "name": "stdout",
183 |      "output_type": "stream",
184 |      "text": [
185 |       "<StackedInputLayer in=[2, 3, 5, 5, 5], out=5>\n",
186 |       "[<StackedInputLayer in=[2, 3, 5, 5, 5], out=5>, <StackedInputLayer in=[2, 3, 5, 5, 5], out=5>, <StackedInputLayer in=[2, 3, 5, 5, 5], out=5>]\n",
187 |       "5\n",
188 |       "[2, 3]\n",
189 |       "<StackedInputLayer in=[2, 3, 5, 5, 5], out=5>\n",
190 |       "3\n",
191 |       "True\n",
192 |       "[[ 0.36870342 -0.03744119 -0.00326931  0.09401595 -0.29351875]]\n"
193 |      ]
194 |     }
195 |    ],
196 |    "source": [
197 |     "idx = random.randint(0, len(l.parameters()) - 1)\n",
198 |     "print(l.cell_layer)\n",
199 |     "print(l.forget_layers)\n",
200 |     "print(l.hidden_size)\n",
201 |     "print(l.input_sizes)\n",
202 |     "print(l.input_layer)\n",
203 |     "print(l.num_children)\n",
204 |     "print(l.memory_feeds_gates)\n",
205 |     "print(l.parameters()[3].w)\n",
206 |     "with open(\"/tmp/lstm_test_dali.dali\", \"wb\") as f:\n",
207 |     "    pickle.dump(l,f)"
208 |    ]
209 |   },
210 |   {
211 |    "cell_type": "code",
212 |    "execution_count": 4,
213 |    "metadata": {
214 |     "collapsed": false
215 |    },
216 |    "outputs": [
217 |     {
218 |      "ename": "ImportError",
219 |      "evalue": "No module named 'test_dali'",
220 |      "output_type": "error",
221 |      "traceback": [
222 |       "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
223 |       "\u001b[1;31mImportError\u001b[0m                               Traceback (most recent call last)",
224 |       "\u001b[1;32m<ipython-input-4-780854079d07>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mpickle\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[1;32mfrom\u001b[0m \u001b[0mtest_dali\u001b[0m \u001b[1;32mimport\u001b[0m \u001b[0mLSTM\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mMat\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m      3\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      4\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      5\u001b[0m \u001b[1;32mwith\u001b[0m \u001b[0mopen\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m\"/tmp/lstm_test_dali.dali\"\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;34m\"rb\"\u001b[0m\u001b[1;33m)\u001b[0m \u001b[1;32mas\u001b[0m \u001b[0mf\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
225 |       "\u001b[1;31mImportError\u001b[0m: No module named 'test_dali'"
226 |      ]
227 |     }
228 |    ],
229 |    "source": [
230 |     "import pickle\n",
231 |     "from test_dali import LSTM, Mat\n",
232 |     "\n",
233 |     "\n",
234 |     "with open(\"/tmp/lstm_test_dali.dali\", \"rb\") as f:\n",
235 |     "    l_pickled = pickle.load(f)\n",
236 |     "print(\"==== PICKLED ====\")\n",
237 |     "print(l_pickled.cell_layer)\n",
238 |     "print(l_pickled.forget_layers)\n",
239 |     "print(l_pickled.hidden_size)\n",
240 |     "print(l_pickled.input_sizes)\n",
241 |     "print(l_pickled.input_layer)\n",
242 |     "print(l_pickled.num_children)\n",
243 |     "print(l_pickled.memory_feeds_gates)\n",
244 |     "print(l_pickled.parameters()[3].w)"
245 |    ]
246 |   },
247 |   {
248 |    "cell_type": "code",
249 |    "execution_count": 13,
250 |    "metadata": {
251 |     "collapsed": false
252 |    },
253 |    "outputs": [
254 |     {
255 |      "name": "stdout",
256 |      "output_type": "stream",
257 |      "text": [
258 |       "[\n",
259 |       "    [  0.028  -0.025  -0.020  -0.008  -0.049]\n",
260 |       "]\n",
261 |       "\n",
262 |       "[\n",
263 |       "    [  0.060  -0.047  -0.039  -0.014  -0.102]\n",
264 |       "]\n",
265 |       "\n"
266 |      ]
267 |     }
268 |    ],
269 |    "source": [
270 |     "hs = [l_pickled.initial_states() for _ in range(l_pickled.num_children)]\n",
271 |     "i = [Mat(1, ipt) for ipt in l_pickled.input_sizes]\n",
272 |     "\n",
273 |     "h_combined = l_pickled.activate(i, hs)\n",
274 |     "print(h_combined.hidden.__repr__())\n",
275 |     "print(h_combined.memory.__repr__())"
276 |    ]
277 |   },
278 |   {
279 |    "cell_type": "code",
280 |    "execution_count": 7,
281 |    "metadata": {
282 |     "collapsed": false
283 |    },
284 |    "outputs": [
285 |     {
286 |      "ename": "NameError",
287 |      "evalue": "name 'l' is not defined",
288 |      "output_type": "error",
289 |      "traceback": [
290 |       "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
291 |       "\u001b[1;31mNameError\u001b[0m                                 Traceback (most recent call last)",
292 |       "\u001b[1;32m<ipython-input-7-90842db0b0b3>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0ml\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mWcells_to_forgets\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
293 |       "\u001b[1;31mNameError\u001b[0m: name 'l' is not defined"
294 |      ]
295 |     }
296 |    ],
297 |    "source": [
298 |     "l.Wcells_to_forgets[0]"
299 |    ]
300 |   },
301 |   {
302 |    "cell_type": "code",
303 |    "execution_count": 8,
304 |    "metadata": {
305 |     "collapsed": false
306 |    },
307 |    "outputs": [],
308 |    "source": [
309 |     "l = StackedLSTM([1,2], [5,4], shortcut=True)"
310 |    ]
311 |   },
312 |   {
313 |    "cell_type": "code",
314 |    "execution_count": 9,
315 |    "metadata": {
316 |     "collapsed": false
317 |    },
318 |    "outputs": [
319 |     {
320 |      "data": {
321 |       "text/plain": [
322 |        "[<dali.core.LSTMState at 0x7f564c946f80>,\n",
323 |        " <dali.core.LSTMState at 0x7f564c946da0>]"
324 |       ]
325 |      },
326 |      "execution_count": 9,
327 |      "metadata": {},
328 |      "output_type": "execute_result"
329 |     }
330 |    ],
331 |    "source": [
332 |     "l.activate(\n",
333 |     "    [\n",
334 |     "        Mat(5,1),\n",
335 |     "        Mat(5,2),\n",
336 |     "    ], l.initial_states()\n",
337 |     ")"
338 |    ]
339 |   },
340 |   {
341 |    "cell_type": "code",
342 |    "execution_count": 10,
343 |    "metadata": {
344 |     "collapsed": false
345 |    },
346 |    "outputs": [
347 |     {
348 |      "name": "stdout",
349 |      "output_type": "stream",
350 |      "text": [
351 |       "<StackedInputLayer in=[1, 2, 5], out=5>\n",
352 |       "[<StackedInputLayer in=[1, 2, 5], out=5>]\n",
353 |       "5\n",
354 |       "[1, 2]\n",
355 |       "<StackedInputLayer in=[1, 2, 5], out=5>\n",
356 |       "1\n",
357 |       "False\n",
358 |       "[[-0.16443005  0.22159122  0.24860647  0.32551721  0.01914411]\n",
359 |       " [ 0.19727443  0.26258233  0.17914623 -0.17491819  0.1341583 ]]\n",
360 |       "True\n"
361 |      ]
362 |     }
363 |    ],
364 |    "source": [
365 |     "print(l.cells[0].cell_layer)\n",
366 |     "print(l.cells[0].forget_layers)\n",
367 |     "print(l.cells[0].hidden_size)\n",
368 |     "print(l.cells[0].input_sizes)\n",
369 |     "print(l.cells[0].input_layer)\n",
370 |     "print(l.cells[0].num_children)\n",
371 |     "print(l.cells[0].memory_feeds_gates)\n",
372 |     "print(l.cells[0].parameters()[5].w)\n",
373 |     "print(l.shortcut)\n",
374 |     "with open(\"/tmp/stacked_lstm_test_lol.dali\", \"wb\") as f:\n",
375 |     "    pickle.dump(l,f)"
376 |    ]
377 |   },
378 |   {
379 |    "cell_type": "code",
380 |    "execution_count": 12,
381 |    "metadata": {
382 |     "collapsed": false
383 |    },
384 |    "outputs": [
385 |     {
386 |      "name": "stdout",
387 |      "output_type": "stream",
388 |      "text": [
389 |       "==== PICKLED ====\n",
390 |       "<StackedInputLayer in=[1, 2, 5], out=5>\n",
391 |       "[<StackedInputLayer in=[1, 2, 5], out=5>]\n",
392 |       "5\n",
393 |       "[1, 2]\n",
394 |       "<StackedInputLayer in=[1, 2, 5], out=5>\n",
395 |       "1\n",
396 |       "False\n",
397 |       "[[-0.16443005  0.22159122  0.24860647  0.32551721  0.01914411]\n",
398 |       " [ 0.19727443  0.26258233  0.17914623 -0.17491819  0.1341583 ]]\n",
399 |       "True\n"
400 |      ]
401 |     }
402 |    ],
403 |    "source": [
404 |     "import pickle\n",
405 |     "from dali.core import StackedLSTM, Mat\n",
406 |     "\n",
407 |     "with open(\"/tmp/stacked_lstm_test_lol.dali\", \"rb\") as f:\n",
408 |     "    l_pickled = pickle.load(f)\n",
409 |     "print(\"==== PICKLED ====\")\n",
410 |     "\n",
411 |     "print(l_pickled.cells[0].cell_layer)\n",
412 |     "print(l_pickled.cells[0].forget_layers)\n",
413 |     "print(l_pickled.cells[0].hidden_size)\n",
414 |     "print(l_pickled.cells[0].input_sizes)\n",
415 |     "print(l_pickled.cells[0].input_layer)\n",
416 |     "print(l_pickled.cells[0].num_children)\n",
417 |     "print(l_pickled.cells[0].memory_feeds_gates)\n",
418 |     "print(l_pickled.cells[0].parameters()[5].w)\n",
419 |     "print(l.shortcut)"
420 |    ]
421 |   },
422 |   {
423 |    "cell_type": "code",
424 |    "execution_count": 10,
425 |    "metadata": {
426 |     "collapsed": false
427 |    },
428 |    "outputs": [
429 |     {
430 |      "ename": "NameError",
431 |      "evalue": "name 'l_pickled' is not defined",
432 |      "output_type": "error",
433 |      "traceback": [
434 |       "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
435 |       "\u001b[1;31mNameError\u001b[0m                                 Traceback (most recent call last)",
436 |       "\u001b[1;32m<ipython-input-10-f70ba0ce9ad1>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0ml_pickled\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0minitial_states\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
437 |       "\u001b[1;31mNameError\u001b[0m: name 'l_pickled' is not defined"
438 |      ]
439 |     }
440 |    ],
441 |    "source": [
442 |     "l_pickled.initial_states()"
443 |    ]
444 |   },
445 |   {
446 |    "cell_type": "code",
447 |    "execution_count": 21,
448 |    "metadata": {
449 |     "collapsed": false
450 |    },
451 |    "outputs": [
452 |     {
453 |      "data": {
454 |       "text/plain": [
455 |        "[<LSTM inputs=[1, 2], hidden_size=5>, <LSTM inputs=[5], hidden_size=4>]"
456 |       ]
457 |      },
458 |      "execution_count": 21,
459 |      "metadata": {},
460 |      "output_type": "execute_result"
461 |     }
462 |    ],
463 |    "source": [
464 |     "l_pickled.cells"
465 |    ]
466 |   },
467 |   {
468 |    "cell_type": "code",
469 |    "execution_count": 5,
470 |    "metadata": {
471 |     "collapsed": false
472 |    },
473 |    "outputs": [
474 |     {
475 |      "data": {
476 |       "text/plain": [
477 |        "[<test_dali.LSTMState at 0x7f72e743a968>,\n",
478 |        " <test_dali.LSTMState at 0x7f72e743ad00>]"
479 |       ]
480 |      },
481 |      "execution_count": 5,
482 |      "metadata": {},
483 |      "output_type": "execute_result"
484 |     }
485 |    ],
486 |    "source": [
487 |     "l_pickled.activate([\n",
488 |     "    Mat([[1]]),\n",
489 |     "    Mat([[1, 2]])\n",
490 |     "], l_pickled.initial_states())"
491 |    ]
492 |   },
493 |   {
494 |    "cell_type": "code",
495 |    "execution_count": 4,
496 |    "metadata": {
497 |     "collapsed": false
498 |    },
499 |    "outputs": [
500 |     {
501 |      "ename": "RuntimeError",
502 |      "evalue": "Activating LSTM stack of size 2 with different number of states 0",
503 |      "output_type": "error",
504 |      "traceback": [
505 |       "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
506 |       "\u001b[1;31mRuntimeError\u001b[0m                              Traceback (most recent call last)",
507 |       "\u001b[1;32m<ipython-input-4-e0b9f00b5030>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[0;32m      2\u001b[0m     \u001b[0mMat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m1\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      3\u001b[0m     \u001b[0mMat\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m1\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;36m2\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 4\u001b[1;33m ], [])\n\u001b[0m",
508 |       "\u001b[1;32m/home/sidor/projects/less_important/dali-cython-stub/dali/layers/LSTM.pyx\u001b[0m in \u001b[0;36mtest_dali.StackedLSTM.activate (test_dali.cpp:68105)\u001b[1;34m()\u001b[0m\n\u001b[0;32m    808\u001b[0m                 \u001b[0minputs_vector_float\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mmats_to_vec_float\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0minputs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    809\u001b[0m                 return WrapLSTMStates_float(\n\u001b[1;32m--> 810\u001b[1;33m                     \u001b[1;33m(\u001b[0m\u001b[1;33m<\u001b[0m\u001b[0mCStackedLSTM\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m*\u001b[0m\u001b[1;33m>\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m<\u001b[0m\u001b[0mStackedLSTM\u001b[0m\u001b[1;33m>\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mlayerinternal\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mactivate\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mhiddens_vector_float\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0minputs_vector_float\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;33m<\u001b[0m\u001b[0mfloat\u001b[0m\u001b[1;33m>\u001b[0m \u001b[0mdrop_prob\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    811\u001b[0m                 )\n\u001b[0;32m    812\u001b[0m             \u001b[1;32melif\u001b[0m \u001b[0mtype\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0minputs\u001b[0m\u001b[1;33m)\u001b[0m \u001b[1;33m==\u001b[0m \u001b[0mMat\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
509 |       "\u001b[1;31mRuntimeError\u001b[0m: Activating LSTM stack of size 2 with different number of states 0"
510 |      ]
511 |     }
512 |    ],
513 |    "source": [
514 |     "l_pickled.activate([\n",
515 |     "    Mat([[1]]),\n",
516 |     "    Mat([[1, 2]])\n",
517 |     "], [])"
518 |    ]
519 |   },
520 |   {
521 |    "cell_type": "code",
522 |    "execution_count": 23,
523 |    "metadata": {
524 |     "collapsed": false
525 |    },
526 |    "outputs": [],
527 |    "source": [
528 |     "h1 = l_pickled.cells[0].activate(\n",
529 |     "    [Mat([[1]]),\n",
530 |     "    Mat([[1, 2]])],\n",
531 |     "    l_pickled.cells[0].initial_states()\n",
532 |     ")\n",
533 |     "h2 = l_pickled.cells[1].activate(\n",
534 |     "    h1.hidden,\n",
535 |     "    l_pickled.cells[1].initial_states()\n",
536 |     ")"
537 |    ]
538 |   },
539 |   {
540 |    "cell_type": "code",
541 |    "execution_count": 24,
542 |    "metadata": {
543 |     "collapsed": false
544 |    },
545 |    "outputs": [
546 |     {
547 |      "data": {
548 |       "text/plain": [
549 |        "[\n",
550 |        "    [ -0.007  -0.068  -0.095   0.145  -0.057]\n",
551 |        "]"
552 |       ]
553 |      },
554 |      "execution_count": 24,
555 |      "metadata": {},
556 |      "output_type": "execute_result"
557 |     }
558 |    ],
559 |    "source": [
560 |     "h1.hidden"
561 |    ]
562 |   },
563 |   {
564 |    "cell_type": "code",
565 |    "execution_count": null,
566 |    "metadata": {
567 |     "collapsed": false
568 |    },
569 |    "outputs": [],
570 |    "source": [
571 |     "new_state = l_pickled.activate([\n",
572 |     "    Mat([[1]]),\n",
573 |     "    Mat([[1, 2]])\n",
574 |     "],\n",
575 |     "l_pickled.initial_states(),\n",
576 |     "0.5\n",
577 |     ")\n",
578 |     "new_state[0].memory"
579 |    ]
580 |   },
581 |   {
582 |    "cell_type": "code",
583 |    "execution_count": 13,
584 |    "metadata": {
585 |     "collapsed": false
586 |    },
587 |    "outputs": [
588 |     {
589 |      "data": {
590 |       "text/plain": [
591 |        "<matplotlib.image.AxesImage at 0x7f4b6440f748>"
592 |       ]
593 |      },
594 |      "execution_count": 13,
595 |      "metadata": {},
596 |      "output_type": "execute_result"
597 |     },
598 |     {
599 |      "data": {
600 |       "image/png": "iVBORw0KGgoAAAANSUhEUgAAA5QAAADOCAYAAABBy01EAAAABHNCSVQICAgIfAhkiAAAAAlwSFlz\nAAALEgAACxIB0t1+/AAACA5JREFUeJzt3U9opHcBxvEn2d2iUlRsD2K7mEvB+gcUZA9t1g16aUWs\n4KF49C4KBVk82VuVHnrxqB5EaQWFooh4Mrq7YkFs0f5Z2RUj/YMVrQgiyGri4Y1lq12n+8ykv0zm\n84GQmSQMzyGEfOd9550EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAgP9yV5KLSS4lOTt4C7S+nuTF\nJL8ePQTmcDLJj5M8leTJJJ8dOwdqb0jyWJInkjyd5IGxc2Aux5I8nuT7o4fAYXQsyeUkG0lOZPrD\nf/vIQVA6neQDEZQst7cnef/+7RuT/Cb+JrO83rT/+XiSnyfZHLgF5nFfkm8l+d7oIatqffQA/q9T\nmYJyJ8mVJI8kuWfkICidS/KX0SNgTn/I9MRekvwtyTNJ3jFuDszl7/ufb8j0BPZLA7dA69YkH03y\n1SRrg7esLEF5uN2S5Nmr7j+3/zUAxtrIdNT9scE7oLWe6QmSFzOdyv302DlQeSjJ55Psjh6yygTl\n4bY3egAA/+PGJN9J8rlMRyphGe1mOoX71iQfSrI1dA1cv48l+WOm1086OjmQoDzcns90EYj/OJnp\nKCUAY5xI8t0k30zy6OAtsAh/TfKDJB8cPQSu0x1JPp7kd0keTvLhJN8YuggOoeNJfpvp1Kob4qI8\nLLeNuCgPy20t0z8rD40eAnO6Oclb92+/MclPk3xk3ByY25m4yitc092ZriR4OckXBm+B1sNJXkjy\nj0yvC/702DlQ2cx0muATmU6xejzTWzvBsnlfkl9m+l3+VabXoMEyOxNXeQUAAAAAAAAAAAAAAAAA\nAAAAAEab+01A35ns/X4RSwAAADh87rgz+dmFV23HuYMyyd4XF/AgXNt2kq3BG466jdEDVsSjST4x\nesQR9+a9u0dPWAnfvv9S7r3/ttEzjrRPrp0aPWEFbMd/GAfvxJ/uGz3hyPvXlx/IsbPeXe8gXbn5\nLck12nH99Z0CAADAUSEoAQAAqAjKJbAxegAsyLtGD4AFec/W20ZPgAXYGD0AFmLtzs3RE1aaoFwC\nG6MHwIIISo6K927dNHoCLMDG6AGwEOubp0dPWGmCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACA\niqAEAACgIigBAACoCEoAAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIoAQAA\nqAhKAAAAKoISAACAiqAEAACgIigBAACoCEoAAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAA\ngIqgBAAAoCIoAQAAqAhKAAAAKoISAACAiqAEAACgIigBAACoCEoAAAAqghIAAICKoAQAAKAiKAEA\nAKgISgAAACqCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACAiqAEAACgIigBAACoCEoAAAAqghIA\nAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACAiqAEAACgIigB\nAACoCEoAAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoIS\nAACAiqAEAACgIigBAACoCEoAAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIo\nAQAAqAhKAAAAKoISAACAiqAEAACgIigBAACovJagvCvJxSSXkpw92DkAAAAsi1lBeSzJVzJF5buT\nfCrJ7Qc9CgAAgMNvVlCeSnI5yU6SK0keSXLPAW8CAABgCcwKyluSPHvV/ef2vwYAAMCKmxWUe6/L\nCgAAAJbO8Rnffz7Jyavun8x0
lPIVtq+6vbH/AQAAwPLZPX8uexfOv6afnRWUv0hyW6ZGfCHJvZku\nzPMKW9c1DwAAgMNqffN0snn65fu7D37pmj87Kyj/meQzSX6U6YqvX0vyzPwTAQAAWHazgjJJfrj/\nAQAAAC+bdVEeAAAAeFWCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACAiqAEAACgIigBAACoCEoA\nAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACAiqAE\nAACgIigBAACoCEoAAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIoAQAAqAhK\nAAAAKoISAACAiqAEAACgIigBAACoCEoAAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqg\nBAAAoCIoAQAAqAhKAAAAKoISAACAiqAEAACgIigBAACoCEoAAAAqghIAAICKoAQAAKAiKAEAAKgI\nSgAAACqCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACAiqAEAACgIigBAACoCEoAAAAqghIAAICK\noAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACAiqAEAACgIigBAACo\nCEoAAAAqghIAAICKoAQAAKAiKAEAAKgISgAAACqCEgAAgIqgBAAAoCIoAQAAqAhKAAAAKoISAACA\niqAEAACgIigBAACoCEoAAAAqgnIJ7IweAAtycfQAWJAnt/88egIswM7oAbAQu+fPjZ6w0gTlEtgZ\nPQAWRFByVDy1/dLoCbAAO6MHwELsXTg/esJKE5QAAABUBCUAAACVtQU8xnaSMwt4HAAAAA6fnyTZ\nGj0CAAAAAAAAAAAAAAAAAAAAAAAAAADg6Pk33YaSzE4NNTEAAAAASUVORK5CYII=\n",
601 |       "text/plain": [
602 |        "<matplotlib.figure.Figure at 0x7f4b6651c1d0>"
603 |       ]
604 |      },
605 |      "metadata": {},
606 |      "output_type": "display_data"
607 |     }
608 |    ],
609 |    "source": [
610 |     "plt.matshow(l_pickled.cells[0].forget_layers[0].matrices[0].w)"
611 |    ]
612 |   },
613 |   {
614 |    "cell_type": "code",
615 |    "execution_count": 33,
616 |    "metadata": {
617 |     "collapsed": true
618 |    },
619 |    "outputs": [],
620 |    "source": [
621 |     "?l.activate_sequence"
622 |    ]
623 |   },
624 |   {
625 |    "cell_type": "code",
626 |    "execution_count": null,
627 |    "metadata": {
628 |     "collapsed": true
629 |    },
630 |    "outputs": [],
631 |    "source": []
632 |   }
633 |  ],
634 |  "metadata": {
635 |   "kernelspec": {
636 |    "display_name": "Python 3",
637 |    "language": "python",
638 |    "name": "python3"
639 |   },
640 |   "language_info": {
641 |    "codemirror_mode": {
642 |     "name": "ipython",
643 |     "version": 3
644 |    },
645 |    "file_extension": ".py",
646 |    "mimetype": "text/x-python",
647 |    "name": "python",
648 |    "nbconvert_exporter": "python",
649 |    "pygments_lexer": "ipython3",
650 |    "version": "3.4.1"
651 |   }
652 |  },
653 |  "nbformat": 4,
654 |  "nbformat_minor": 0
655 | }
656 | 


--------------------------------------------------------------------------------
/preprocessor_utils.py:
--------------------------------------------------------------------------------
  1 | import re
  2 | 
  3 | class TypeReplacer(object):
  4 |     def __init__(self, macro_name, templated_type, base_class, internal_property, deref):
  5 |         self.pattern = re.compile(macro_name + r"\((?P<var>.+?)\)")
  6 |         self.templated_type = templated_type
  7 |         self.deref = deref
  8 |         self.base_class = base_class
  9 |         self.internal_property = internal_property
 10 | 
 11 |     def rephrase(self, type_name):
 12 |         def wrapped(match):
 13 |             var = match.group("var")
 14 |             if self.deref:
 15 |                 return "(<%s[%s]*>((<%s>(%s)).%s))[0]" % (self.templated_type, type_name, self.base_class, var, self.internal_property)
 16 |             else:
 17 |                 return "(<%s[%s]*>((<%s>(%s)).%s))" % (self.templated_type, type_name, self.base_class, var, self.internal_property)
 18 |         return wrapped
 19 | 
 20 |     def __call__(self, *args, **kwargs):
 21 |         return self.replace(*args, **kwargs)
 22 | 
 23 |     def replace(self, type_name, text):
 24 |         return self.pattern.sub(self.rephrase(type_name), text)
 25 | 
 26 | class WrapperReplacer(object):
 27 |     def __init__(self, pattern, wrapper_function):
 28 |         self.pattern = pattern
 29 |         self.wrapper_function = wrapper_function
 30 | 
 31 |     def __call__(self, *args, **kwargs):
 32 |         return self.replace(*args, **kwargs)
 33 | 
 34 |     def replace(self, type_name, text):
 35 |         return text.replace(self.pattern, self.wrapper_function % (type_name,))
 36 | 
 37 | class LambdaReplacer(object):
 38 |     def __init__(self, macro_name, lambdaf):
 39 |         self.pattern = re.compile(macro_name + r"\((?P<var>.+?)\)")
 40 |         self.lambdaf = lambdaf
 41 | 
 42 |     def __call__(self, *args, **kwargs):
 43 |         return self.replace(*args, **kwargs)
 44 | 
 45 |     def replace(self, type_name, text):
 46 |         return self.pattern.sub(self.lambdaf(type_name), text)
 47 | 
 48 | class TypedName(LambdaReplacer):
 49 |     def __init__(self):
 50 |         def replacer(type_name):
 51 |             def wrapped(match):
 52 |                 var = match.group("var")
 53 |                 return '%s_%s' % (var, type_name)
 54 |             return wrapped
 55 | 
 56 |         super(TypedName, self).__init__('TYPED', replacer)
 57 | 
 58 | 
 59 | REPLACERS = [
 60 |     TypeReplacer("DEREF_MAT", "CMat", "Mat", "matinternal", deref=True),
 61 |     TypeReplacer("PTR_MAT", "CMat",  "Mat", "matinternal", deref=False),
 62 |     WrapperReplacer("WRAP_MAT", 'WrapMat_%s'),
 63 | 
 64 |     TypeReplacer("DEREF_LAYER", "CLayer", "Layer", "layerinternal", deref=True),
 65 |     TypeReplacer("PTR_LAYER", "CLayer",  "Layer", "layerinternal", deref=False),
 66 |     WrapperReplacer("WRAP_LAYER", 'WrapLayer_%s'),
 67 | 
 68 |     TypeReplacer("DEREF_RNN", "CRNN", "RNN", "layerinternal", deref=True),
 69 |     TypeReplacer("PTR_RNN", "CRNN",  "RNN", "layerinternal", deref=False),
 70 |     WrapperReplacer("WRAP_RNN", 'WrapRNN_%s'),
 71 | 
 72 |     TypeReplacer("DEREF_GRU", "CGRU", "GRU", "layerinternal", deref=True),
 73 |     TypeReplacer("PTR_GRU", "CGRU",  "GRU", "layerinternal", deref=False),
 74 |     WrapperReplacer("WRAP_GRU", 'WrapGRU_%s'),
 75 | 
 76 |     TypeReplacer("DEREF_STACKEDLAYER", "CStackedInputLayer", "StackedInputLayer", "layerinternal", deref=True),
 77 |     TypeReplacer("PTR_STACKEDLAYER", "CStackedInputLayer", "StackedInputLayer", "layerinternal", deref=False),
 78 |     WrapperReplacer("WRAP_STACKEDLAYER", 'WrapStackedLayer_%s'),
 79 | 
 80 |     TypeReplacer("DEREF_LSTMSTATE", "CLSTMState", "LSTMState", "lstmstateinternal", deref=True),
 81 |     TypeReplacer("PTR_LSTMSTATE", "CLSTMState", "LSTMState", "lstmstateinternal", deref=False),
 82 |     WrapperReplacer("WRAP_LSTMSTATE", 'WrapLSTMState_%s'),
 83 | 
 84 |     TypeReplacer("DEREF_LSTM", "CLSTM", "LSTM", "layerinternal", deref=True),
 85 |     TypeReplacer("PTR_LSTM", "CLSTM", "LSTM", "layerinternal", deref=False),
 86 |     WrapperReplacer("WRAP_LSTM", 'WrapLSTM_%s'),
 87 | 
 88 |     TypeReplacer("DEREF_STACKEDLSTM", "CStackedLSTM", "StackedLSTM", "layerinternal", deref=True),
 89 |     TypeReplacer("PTR_STACKEDLSTM", "CStackedLSTM", "StackedLSTM", "layerinternal", deref=False),
 90 |     WrapperReplacer("WRAP_STACKEDLSTM", 'WrapStackedLSTM_%s'),
 91 | 
 92 |     TypedName()
 93 | ]
 94 | 
 95 | for solver in ["SGD", "AdaGrad", "RMSProp", "AdaDelta", "Adam"]:
 96 |     REPLACERS.append(
 97 |         TypeReplacer("DEREF_" + solver.upper(), "C" + solver, solver, "solverinternal", deref=True)
 98 |     )
 99 |     REPLACERS.append(
100 |         TypeReplacer("PTR_" + solver.upper(), "C" + solver, solver, "solverinternal", deref=False)
101 |     )
102 | 
# Source text of the numpy type-number constant that generated code compares
# `dtypeinternal` against, keyed by scalar type name.
TYPE_NPYINTERNAL_DICT = dict(
    int='np.NPY_INT32',
    float='np.NPY_FLOAT32',
    double='np.NPY_FLOAT64',
)

# Human-readable numpy dtype names used in generated error messages, keyed by
# scalar type name.
TYPE_NUMPY_PRETTY = dict(
    int='np.int32',
    float='np.float32',
    double='np.float64',
)
114 | 
def modify_snippet(pyp, code, type_name):
    """Specialise `code` for `type_name` and emit it through `pyp.indent`.

    The TYPE_NAME, TYPE_NPYINTERNAL and TYPE_NPYPRETTY placeholders are
    substituted first, then every entry of REPLACERS is applied in list order.
    """
    expanded = (
        code.replace('TYPE_NAME',       type_name)
            .replace('TYPE_NPYINTERNAL', TYPE_NPYINTERNAL_DICT.get(type_name))
            .replace('TYPE_NPYPRETTY', TYPE_NUMPY_PRETTY.get(type_name))
    )

    for expand_macro in REPLACERS:
        expanded = expand_macro(type_name, expanded)

    pyp.indent(expanded)
125 | 
126 | 
127 | 
def type_repeat_with_types(pyp, types, code):
    """Emit one specialised copy of `code` per entry of `types`, in order."""
    for type_name in types:
        modify_snippet(pyp, code, type_name)
131 | 
def type_repeat(pyp, code):
    """Emit `code` specialised for int, float and double, in that order."""
    every_type = ["int", "float", "double"]
    type_repeat_with_types(pyp, every_type, code)
134 | 
def type_frepeat(pyp, code):
    """Emit `code` specialised for the floating-point types float and double."""
    floating_types = ["float", "double"]
    type_repeat_with_types(pyp, floating_types, code)
137 | 
def typed_expression_args_with_types(pyp, types, args, code):
    """Emit an if/elif/else chain dispatching `code` on the dtype of `args[0]`.

    Parameters:
        pyp:   emitter object; every generated line goes through `pyp.indent`.
        types: scalar type names (keys of TYPE_NPYINTERNAL_DICT) to generate
               a branch for, in order.
        args:  non-empty sequence (list or tuple) of source-text expressions.
               When more than one is given, a guard is emitted first that
               raises ValueError if adjacent arguments differ in
               `dtypeinternal`.
        code:  snippet specialised once per type via `modify_snippet`.

    Raises:
        AssertionError: if `args` is empty.
    """
    # Tuples are accepted as well as lists; normalise so the slicing and
    # indexing below behave the same for both.
    args = list(args)
    assert len(args) > 0
    if len(args) > 1:
        # Comparing each argument with its neighbour is enough to establish
        # that all of them share one dtype.
        mismatches = [
            '(%s).dtypeinternal != (%s).dtypeinternal' % (arg1, arg2)
            for arg1, arg2 in zip(args[:-1], args[1:])
        ]
        pyp.indent('if ' + ' or '.join(mismatches) + ':')
        pyp.indent('   raise ValueError("All arguments must be of the same type")')

    for position, typ in enumerate(types):
        if_str = 'if' if position == 0 else 'elif'
        pyp.indent(if_str + ' (%s).dtypeinternal == %s:' % (args[0], TYPE_NPYINTERNAL_DICT[typ]))
        modify_snippet(pyp, code, typ)
    pyp.indent('else:')
    types_str = ', '.join([TYPE_NUMPY_PRETTY[typ] for typ in types])
    pyp.indent('    raise ValueError("Invalid dtype:" + str(' + args[0] + '.dtype) + " (should be one of ' + types_str+ ')")')
159 | 
def typed_expression_args(pyp, args, code):
    """Dispatch `code` on the dtype of `args`, covering int, float and double."""
    every_type = ["int", "float", "double"]
    typed_expression_args_with_types(pyp, every_type, args, code)
162 | 
def typed_fexpression_args(pyp, args, code):
    """Dispatch `code` on the dtype of `args`, covering float and double only."""
    floating_types = ["float", "double"]
    typed_expression_args_with_types(pyp, floating_types, args, code)
165 | 
def typed_expressions_with_types(pyp, lst, cast_to, types, code):
    """Emit dtype dispatch for a runtime list whose elements must share a dtype.

    `lst` is the source text naming the list and `cast_to` the type each
    element is cast to before reading `dtypeinternal`. The generated code
    rejects an empty list and mixed dtypes with ValueError, then runs `code`
    specialised for whichever of `types` matches the common dtype.
    """
    assert len(lst) > 0

    # Generated prologue: validate the list and compute `common_dtype`
    # (set to -1 as soon as one element disagrees with the first).
    prologue = (
        'if len(%s) == 0:' % (lst,),
        "    raise ValueError('list cannot be empty')",
        'common_dtype = (<%s>(%s[0])).dtypeinternal' % (cast_to, lst,),
        'for el in %s:' % (lst,),
        '    if (<%s>el).dtypeinternal != common_dtype:' % (cast_to,),
        '        common_dtype = -1',
        '        break',
        'if common_dtype == -1:',
        '    raise ValueError("All the arguments must be of the same type")',
    )
    for generated_line in prologue:
        pyp.indent(generated_line)

    for position, typ in enumerate(types):
        keyword = 'elif' if position else 'if'
        pyp.indent(keyword + ' common_dtype == %s:' % (TYPE_NPYINTERNAL_DICT[typ],))
        modify_snippet(pyp, code, typ)

    pyp.indent('else:')
    allowed = ', '.join([TYPE_NUMPY_PRETTY[typ] for typ in types])
    pyp.indent('    raise ValueError("Invalid dtype:" + str(' + lst + '[0].dtype) + " (should be one of ' + allowed+ ')")')
187 | 
188 | 
def typed_expression_list(pyp, lst, cast_to, code):
    """List-based dtype dispatch covering int, float and double."""
    every_type = ["int", "float", "double"]
    typed_expressions_with_types(pyp, lst, cast_to, every_type, code)
191 | 
def typed_fexpression_list(pyp, lst, cast_to, code):
    """List-based dtype dispatch covering float and double only."""
    floating_types = ["float", "double"]
    typed_expressions_with_types(pyp, lst, cast_to, floating_types, code)
194 | 
def typed_expression(pyp, code):
    """Dispatch `code` on the dtype of `self` (int, float and double)."""
    receiver = ["self"]
    return typed_expression_args(pyp, receiver, code)
197 | 
def typed_fexpression(pyp, code):
    """Dispatch `code` on the dtype of `self` (float and double only)."""
    receiver = ["self"]
    return typed_fexpression_args(pyp, receiver, code)
200 | 
def rich_typed_expression(pyp, replacable_type, code):
    """Emit dtype dispatch on `self` using TEMPLATED_TYPE / TEMPLATED_CAST.

    For each of int, float and double a branch is generated in which
    TYPE_NAME becomes the type name, TEMPLATED_TYPE becomes
    ``replacable_type[T]`` and TEMPLATED_CAST becomes ``<replacable_type[T]>``.
    The REPLACERS macros are not applied here.
    """
    def emit_specialised(type_name):
        specialised = (
            code.replace('TYPE_NAME', type_name)
                .replace('TEMPLATED_TYPE', '%s[%s]' % (replacable_type, type_name))
                .replace('TEMPLATED_CAST', '<%s[%s]>' % (replacable_type, type_name))
        )
        pyp.indent(specialised)

    branches = (
        ('if',   'np.NPY_INT32',   'int'),
        ('elif', 'np.NPY_FLOAT32', 'float'),
        ('elif', 'np.NPY_FLOAT64', 'double'),
    )
    for keyword, dtype_constant, type_name in branches:
        pyp.indent('%s self.dtypeinternal == %s:' % (keyword, dtype_constant))
        emit_specialised(type_name)

    pyp.indent('else:')
    pyp.indent('    raise ValueError("Invalid dtype:" + str(self.dtype) + " (should be one of int32, float32, float64)")')
217 | 
# Floating-point scalar type names only (the same list type_frepeat uses);
# presumably passed as `types` to the *_with_types helpers by templates that
# have no integer variant -- confirm against the .pyx.pre callers.
WITHOUT_INT = ["float", "double"]
219 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
 1 | preprocessor>=1.1.0
 2 | numpy>=1.9.2
 3 | epub-conversion>=1.0.7
 4 | pytreebank>=0.1.4
 5 | xml-cleaner>=1.0.18
 6 | requests>=2.6.0
 7 | dill>=0.2.4
 8 | Cython>=0.23.2
 9 | 
10 | 


--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
  1 | import distutils.ccompiler
  2 | import distutils.sysconfig
  3 | import numpy as np
  4 | import preprocessor
  5 | import subprocess
  6 | 
  7 | from Cython.Distutils.extension import Extension
  8 | from Cython.Distutils           import build_ext
  9 | from distutils.core             import setup
 10 | from distutils.command          import build as build_module, clean as clean_module
 11 | from distutils.spawn            import find_executable
 12 | from os.path                    import join, dirname, realpath, exists, getmtime, relpath
 13 | from os                         import environ, walk, makedirs
 14 | from sys                        import platform, exit
 15 | 
 16 | 
 17 | from tempfile import TemporaryDirectory
 18 | 
# Absolute, symlink-resolved directory containing this setup script.
SCRIPT_DIR = dirname(realpath(__file__))
# Directory <SCRIPT_DIR>/cython/dali/core.
DALI_CORE_DIR    = join(SCRIPT_DIR, "cython", "dali", "core")
# Dotted module name; presumably the name the compiled extension is
# registered under -- confirm against the Extension definition.
DALI_CORE_MODULE = "dali.core"
 22 | 
 23 | ################################################################################
 24 | ##                               TOOLS                                        ##
 25 | ################################################################################
 26 | 
 27 | def find_extension_files(path, extension):
 28 |     """Recursively find files with specific extension in a directory"""
 29 |     for relative_path, dirs, files in walk(path):
 30 |         for fname in files:
 31 |             if fname.endswith(extension):
 32 |                 yield join(path, relative_path, fname)
 33 | 
 34 | def execute_bash(command, *args, **kwargs):
 35 |     """Executes bash command, prints output and throws an exception on failure."""
 36 |     #print(subprocess.check_output(command.split(' '), shell=True))
 37 |     process = subprocess.Popen(command,
 38 |                                stdout=subprocess.PIPE,
 39 |                                stderr=subprocess.STDOUT,
 40 |                                universal_newlines=True,
 41 |                                *args, **kwargs)
 42 |     process.wait()
 43 |     return str(process.stdout.read()), process.returncode
 44 | 
 45 | ################################################################################
 46 | ##                 STEALING LINKING ARGS FROM CMAKE                           ##
 47 | ################################################################################
 48 | 
 49 | def cmake_robbery(varnames, fake_executable="dummy"):
 50 |     """Capture Cmake environment variables by running `find_package(dali)`"""
 51 |     varstealers = []
 52 |     magic_command = "CYTHON_DALI_BEGIN_VARIABLE_STEALING"
 53 |     varstealers.append("message(STATUS \"%s\")" % (magic_command,))
 54 |     for varname in varnames:
 55 |         varstealers.append("message(STATUS  \"CYTHON_DALI_%s: ${%s}\")" % (varname, varname,))
 56 |     varstealers = "\n".join(varstealers) + "\n"
 57 | 
 58 |     with TemporaryDirectory() as temp_dir:
 59 |         with open(join(temp_dir, "source.cpp"), "wt") as source_cpp:
 60 |             source_cpp.write("int main() {};\n")
 61 |         with open(join(temp_dir, "CMakeLists.txt"), "wt") as cmake_conf:
 62 |             cmake_conf.write("""
 63 |                 cmake_minimum_required(VERSION 2.8 FATAL_ERROR)
 64 |                 project("dali-cython")
 65 |                 find_package(Dali REQUIRED) # find Dali.
 66 |                 add_executable(%s source.cpp)
 67 |                 target_link_libraries(%s ${DALI_AND_DEPS_LIBRARIES})
 68 |             """ % (fake_executable, fake_executable,) + varstealers)
 69 | 
 70 |         cmake_subdirectory = fake_executable + ".dir"
 71 |         cmake_stdout, cmake_status = execute_bash(["cmake", "."], cwd=temp_dir)
 72 |         if cmake_status != 0:
 73 |             print("HORRIBLE CMAKE ERROR.")
 74 |             print('*' * 79)
 75 |             print(cmake_stdout)
 76 |             print('*' * 79)
 77 |             exit(1)
 78 |         # capture the link arguments
 79 |         with open(join(temp_dir, "CMakeFiles", cmake_subdirectory, "link.txt"), "rt") as f:
 80 |             linking_command = f.read()
 81 | 
 82 |     linking_command = linking_command.replace("-o %s" % (fake_executable,), " ")
 83 |     linking_args = linking_command.split(" ", 1)[1].strip().split()
 84 |     linking_args = [arg for arg in linking_args if cmake_subdirectory not in arg]
 85 |     outvars = {}
 86 |     outvars["LINK_ARGS"] = linking_args
 87 | 
 88 |     # slice output after the magic command and retrieve these variables
 89 |     # from the CMake environment
 90 |     idx = cmake_stdout.find(magic_command) + len(magic_command) + 1
 91 |     lines = cmake_stdout[idx:].split("\n")[:len(varnames)]
 92 | 
 93 |     for varname, line in zip(varnames, lines):
 94 |         assert(varname in line)
 95 |         _, value = line.split(":", 1)
 96 |         outvars[varname] = value.strip().split(";")
 97 |     return outvars
 98 | 
# cmake environment variables
# `robbed` is the dict returned by cmake_robbery: "LINK_ARGS" holds the linker
# arguments captured from the throwaway CMake project, and each requested
# variable name maps to its value split on ";".
robbed = cmake_robbery(["DALI_AND_DEPS_INCLUDE_DIRS"])
101 | 
102 | ################################################################################
103 | ##                 AUTODETECTING COMPILER VERSION                             ##
104 | ################################################################################
105 | 
class Version(tuple):
    """Tuple of integers standing for a dotted version number, e.g. ``(4, 9)``.

    Because it is a plain tuple, two versions compare component by component
    with the ordinary comparison operators.
    """

    @staticmethod
    def from_string(version_str):
        """Build a Version from a dot-separated string such as ``"4.9.2"``."""
        components = version_str.split('.')
        return Version(map(int, components))

    def __str__(self):
        """Render the version back into its dot-separated form."""
        return '.'.join(map(str, self))
113 | 
def detect_compiler(possible_commands, version_extractor, min_version):
    """Return the first acceptable compiler among `possible_commands`.

    Each command is resolved with `find_executable`. Commands that cannot be
    resolved, or for which `version_extractor` returns None, are skipped.
    The first executable whose version is at least `min_version` wins.

    Returns:
        An ``(executable, version)`` pair, or ``(None, None)`` when no
        candidate qualifies.
    """
    for candidate in possible_commands:
        path = find_executable(candidate)
        if path is None:
            continue
        found_version = version_extractor(path)
        if found_version is not None and found_version >= min_version:
            return path, found_version
    return None, None
127 | 
def obtain_gxx_version(gcc_executable):
    """Return the version printed by ``<gcc_executable> -dumpversion``.

    Returns:
        A `Version`, or ``None`` when the command cannot be run, exits with a
        non-zero status, or prints something that does not parse as a
        dot-separated list of integers.
    """
    try:
        gcc_version, status = execute_bash([gcc_executable, '-dumpversion'])
        # Explicit check instead of `assert`: assertions are removed when
        # Python runs with -O, which would let a failed invocation through.
        if status != 0:
            return None
        return Version.from_string(gcc_version)
    except Exception:
        # Best effort: any failure simply means "version unknown".
        return None
135 | 
# Message printed when no suitable gcc/g++ could be autodetected; the single
# %s placeholder receives the minimum required version.
GXX_VERSION_ERROR = \
"""Minimum required version of gcc/g++ is %s.

We strive to cover all the cases for automatic compiler detection,
however if we failed to detect yours please kindly report it on github.

You can explicitly specify the executables by running:

    CC=/path/to/my/gcc CXX=/path/to/my/g++ python3 setup.py ...

"""
147 | 
# Pick the C and C++ compilers, never overriding a CC/CXX that is already
# present in the environment.
if platform != 'linux':
    # Everywhere except Linux the default is clang.
    for env_var, fallback in (("CC", "clang"), ("CXX", "clang++")):
        if env_var not in environ:
            environ[env_var] = fallback
else:
    # On Linux, probe the known gcc/g++ command names for a recent enough version.
    for env_var, possible_commands, min_version in [
                ('CC',  ['gcc', 'gcc4.9', 'gcc-4.9'], Version((4, 9))),
                ('CXX', ['g++', 'g++4.9', 'g++-4.9'], Version((4, 9))),
            ]:
        if env_var in environ:
            # Explicitly specified by the user: leave it alone.
            continue
        gxx_executable, gxx_version = detect_compiler(possible_commands, obtain_gxx_version, min_version)
        if gxx_executable is None:
            print(GXX_VERSION_ERROR % (str(min_version),))
            exit(2)
        print('Autodetected %s executable %s, version: %s' % (env_var, gxx_executable, str(gxx_version)))
        environ[env_var] = gxx_executable
167 | 
168 | ################################################################################
169 | ##                      TAKING OUT THE TRASH                                  ##
170 | ################################################################################
171 | 
172 | 
173 | # Make a `cleanall` rule to get rid of intermediate and library files
class clean(clean_module.clean):
    """`clean` command that deletes build outputs and Cython-generated files."""

    def run(self):
        """Remove the build directory, generated sources, shared objects and MANIFEST.in.

        Every path is interpreted relative to SCRIPT_DIR.
        """
        print("Cleaning up cython files...")
        # Just in case the build directory was created by accident,
        # note that shell=True should be OK here because the command is constant.
        # The shell is also what expands the "dali/*.so" glob.
        for place in ["build", "cython/dali/core.c", "cython/dali/core.cpp", "dali/*.so", "MANIFEST.in"]:
            # call() blocks until rm has finished; a bare Popen would return
            # immediately and leave the child processes unwaited.
            subprocess.call("rm -rf %s" % (place,), shell=True, executable="/bin/bash", cwd=SCRIPT_DIR)
181 | 
# Default distutils compiler, customised with the platform's sysconfig settings,
# and installed as the compiler used by build_ext.
compiler = distutils.ccompiler.new_compiler()
distutils.sysconfig.customize_compiler(compiler)
build_ext.compiler = compiler

# Compiler arguments that are filtered out before the extensions are built.
BLACKLISTED_COMPILER_SO = ['-Wp,-D_FORTIFY_SOURCE=2']

# The core extension: the Cython entry point plus every C++ file in DALI_CORE_DIR.
core_sources = [join(SCRIPT_DIR, "cython", "dali", "core.pyx")]
core_sources.extend(find_extension_files(DALI_CORE_DIR, ".cpp"))

# numpy's headers plus the include directories reported by CMake.
core_include_dirs = [np.get_include()]
core_include_dirs.extend(robbed["DALI_AND_DEPS_INCLUDE_DIRS"])

dali_core_extension = Extension(
    name=DALI_CORE_MODULE,
    sources=core_sources,
    library_dirs=[],
    language='c++',
    extra_compile_args=['-std=c++11'],
    extra_link_args=robbed["LINK_ARGS"],
    libraries=[],
    extra_objects=[],
    include_dirs=core_include_dirs,
)
ext_modules = [dali_core_extension]
198 | 
199 | 
200 | ################################################################################
201 | ##       PREPROCESSOR - HOW TO SHRINK DALI CYTHON CODE THREEFOLD              ##
202 | ################################################################################
203 | 
204 | 
def run_preprocessor():
    """
    Generate python files using a file preprocessor (essentially macros
    that generate multiple versions of the code for each dtype supported
    by a Dali operation).

    Every file yielded by ``find_extension_files(SCRIPT_DIR, ".pre")`` is
    expanded into a sibling file with the ``.pre`` suffix removed. A file is
    regenerated only when its output is missing, or is older than either the
    ``.pre`` source or ``preprocessor_utils.py``.
    """
    EXTENSION = ".pre"
    utils_path = join(SCRIPT_DIR, "preprocessor_utils.py")
    for py_processor_file in find_extension_files(SCRIPT_DIR, EXTENSION):
        output_file = py_processor_file[:-len(EXTENSION)]

        if not exists(output_file) or \
                getmtime(py_processor_file) > getmtime(output_file) or \
                getmtime(utils_path) > getmtime(output_file):
            print('Preprocessing %s' % (py_processor_file,))
            # Expand first, write second. Opening the output before processing
            # would truncate it, so a preprocessing error would leave an empty
            # file whose fresh mtime makes it look up to date on the next run.
            processed = preprocessor.process_file(py_processor_file, prefix='pyp', suffix='ypy')
            with open(output_file, "wt") as f:
                f.write(processed)
221 | 
222 | 
223 | 
224 | ################################################################################
225 | ##                 POSSIBLY NO LONGER NEEDED                                  ##
226 | ################################################################################
227 | 
228 | 
229 | # We need to remove some compiler flags, to make sure
230 | # the code can compile on Fedora (to be honest it seems
231 | # to be a bug in Fedora's distribution of Clang).
232 | # Nevertheless this little madness below is to change
233 | # default compiler flags used by Cython.
234 | # If you know a better way call me immediately day
235 | # or night at 4getszymo4. Thank you!
class nonbroken_build_ext(build_ext):
    """build_ext variant that runs the preprocessor and drops blacklisted compiler flags."""

    def build_extensions(self, *args, **kwargs):
        """Preprocess the sources, filter the compiler arguments, then build as usual."""
        run_preprocessor()
        # Keep every compiler argument except those in BLACKLISTED_COMPILER_SO.
        self.compiler.compiler_so = [
            flag for flag in self.compiler.compiler_so
            if flag not in BLACKLISTED_COMPILER_SO
        ]
        super(nonbroken_build_ext, self).build_extensions(*args, **kwargs)
245 | 
246 | 
247 | ################################################################################
248 | ##                 FIND ALL THE FILES AND CONFIGURE SETUP                     ##
249 | ################################################################################
250 | 
# generate manifest.in
pre_files = list(find_extension_files(SCRIPT_DIR, ".pre"))
# keep only hand-written .pyx files, i.e. those with no matching .pre template
pyx_files = [
    fname
    for fname in find_extension_files(SCRIPT_DIR, ".pyx")
    if fname + ".pre" not in pre_files
]
cpp_files = list(find_extension_files(DALI_CORE_DIR, ".cpp"))
header_files = list(find_extension_files(DALI_CORE_DIR, ".h"))
pxd_files = []
for pxd_package in ("libcpp11", "modern_numpy"):
    pxd_files.extend(find_extension_files(join(SCRIPT_DIR, pxd_package), ".pxd"))

# one "include" line per shipped file, written relative to SCRIPT_DIR
manifest_entries = pre_files + pyx_files + cpp_files + header_files + pxd_files
manifest_entries.append(join(SCRIPT_DIR, "preprocessor_utils.py"))
with open(join(SCRIPT_DIR, "MANIFEST.in"), "wt") as manifest_in:
    manifest_in.writelines(
        "include %s\n" % (relpath(fname, SCRIPT_DIR),) for fname in manifest_entries
    )
266 | 
# Pieces of the distribution configuration, named for readability.
COMMAND_CLASSES = {"build_ext": nonbroken_build_ext, 'clean': clean}
REQUIRED_PACKAGES = ['preprocessor', 'numpy', 'dill']
PYTHON_PACKAGES = ["dali", "dali.utils", "dali.data", "dali.models"]

setup(
    name="dali",
    version='1.0.9',
    cmdclass=COMMAND_CLASSES,
    ext_modules=ext_modules,
    description="Buttery smooth automatic differentiation using Dali.",
    author="Jonathan Raiman, Szymon Sidor",
    author_email="jonathanraiman at gmail dot com",
    install_requires=REQUIRED_PACKAGES,
    packages=PYTHON_PACKAGES,
)
287 | 


--------------------------------------------------------------------------------
/tests/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/dali-ml/dali-cython/e258469aeb1d4cb3e4cdf5c07e8948f461a038f1/tests/__init__.py


--------------------------------------------------------------------------------
/tests/test.txt:
--------------------------------------------------------------------------------
1 | Ala ma kota
2 | kota zadziergal ale na smierc
3 | Gdzie jest ala ?
4 | 


--------------------------------------------------------------------------------
/tests/tests_beam_search.py:
--------------------------------------------------------------------------------
 1 | import math
 2 | import unittest
 3 | 
 4 | import numpy as np
 5 | import dali.core as D
 6 | 
 7 | from dali import beam_search, Beam
 8 | 
 9 | class BeamSearchTests(unittest.TestCase):
10 |     def test_letters(self):
11 |         MAX_LENGTH = 2
12 |         choices = {
13 |             #initial_choices
14 |             "a": 0.6,
15 |             "b": 0.4,
16 |             #after chosing a
17 |             "aa": 0.55,  # (total worth 0.33)
18 |             "ab": 0.45,  # (total worth 0.18)
19 |             #after choosing b
20 |             "ba": 0.99,  # (total worth 0.495)
21 |             "bb": 0.11,  # (total worth 0.044)
22 |         };
23 | 
24 |         # Above example is designed to demonstrate greedy solution,
25 |         # as well as better optimal solution:
26 |         # GREEDY:    (beam_width == 1) => "aa" worth 0.33
27 |         # OPTIMAL:   (beam_width == 2) => "ba" worth 0.495
28 |         res_aa = Beam([0,0], D.Mat([math.log(0.6 * 0.55)]), "aa")
29 |         res_ab = Beam([0,1], D.Mat([math.log(0.6 * 0.45)]), "ab")
30 |         res_ba = Beam([1,0], D.Mat([math.log(0.4 * 0.99)]), "ba")
31 |         res_bb = Beam([1,1], D.Mat([math.log(0.4 * 0.11)]), "bb")
32 | 
33 |         initial_state = "";
34 |         def candidate_scores(state):
35 |             ret = D.Mat(1,2)
36 |             ret.w[0,0] = math.log(choices[state + "a"])
37 |             ret.w[0,1] = math.log(choices[state + "b"])
38 |             return ret
39 |         def make_choice(prev_state, choice):
40 |             return prev_state + ("a" if choice == 0 else "b")
41 | 
42 |         def my_beam_search(beam_width):
43 |             return beam_search(initial_state=initial_state,
44 |                                candidate_scores=candidate_scores,
45 |                                make_choice=make_choice,
46 |                                beam_width=beam_width,
47 |                                max_sequence_length = MAX_LENGTH)
48 | 
49 |         def beams_equal(b1, b2):
50 |             return (b1.solution == b2.solution and
51 |                     np.allclose(b1.score.w, b2.score.w) and
52 |                     b1.state == b2.state)
53 | 
54 |         def results_equal(a,b):
55 |             return len(a) == len(b) and all(beams_equal(b1,b2) for b1,b2 in zip(a,b))
56 | 
57 |         with self.assertRaises(ValueError):
58 |             my_beam_search(0)
59 | 
60 |         self.assertTrue(results_equal(my_beam_search(1), [res_aa]))
61 |         self.assertTrue(results_equal(my_beam_search(2), [res_ba, res_aa]))
62 |         self.assertTrue(results_equal(my_beam_search(4), [res_ba, res_aa, res_ab, res_bb]))
63 |         self.assertTrue(results_equal(my_beam_search(10),[res_ba, res_aa, res_ab, res_bb]))
64 | 
65 | if __name__ == '__main__':
66 |     unittest.main()
67 | 


--------------------------------------------------------------------------------
/tests/tests_data.py:
--------------------------------------------------------------------------------
  1 | import dill as pickle
  2 | import mock
  3 | import unittest
  4 | 
  5 | from dali.data import DiscoverFiles, Lines, BatchBenefactor
  6 | 
  7 | from os.path import join, dirname, realpath
  8 | SCRIPT_DIR = dirname(realpath(__file__))
  9 | 
 10 | class DataTests(unittest.TestCase):
 11 |     @mock.patch('os.walk')
 12 |     def test_discover_files(self, patched_os_walk):
 13 |         patched_os_walk.return_value = [
 14 |             ('test_dir', ['hi'], ['lol.py', 'lol2.py']),
 15 |             ('test_dir/hi', [], ['hello.py', 'yikes.txt']),
 16 |         ]
 17 | 
 18 |         x = DiscoverFiles('/what/ever', '.py')
 19 | 
 20 |         self.assertEqual(next(x), "test_dir/lol.py")
 21 |         x_pickle = pickle.loads(pickle.dumps(x))
 22 | 
 23 |         self.assertEqual(next(x), "test_dir/lol2.py")
 24 |         self.assertEqual(next(x_pickle), "test_dir/lol2.py")
 25 | 
 26 |         self.assertEqual(next(x), "test_dir/hi/hello.py")
 27 |         self.assertEqual(next(x_pickle), "test_dir/hi/hello.py")
 28 | 
 29 |         with self.assertRaises(StopIteration):
 30 |             next(x)
 31 |         with self.assertRaises(StopIteration):
 32 |             next(x_pickle)
 33 | 
 34 |     def test_lines(self):
 35 |         r = Lines() \
 36 |             .lower()                                 \
 37 |             .split_spaces()                          \
 38 |             .bound_length(2,4)
 39 | 
 40 |         r.set_file(join(SCRIPT_DIR, "test.txt"))
 41 | 
 42 |         self.assertEqual(next(r), ["ala", "ma", "kota"])
 43 | 
 44 |         r2 = pickle.loads(pickle.dumps(r))
 45 | 
 46 |         self.assertEqual(next(r), ["gdzie", "jest","ala", "?"])
 47 |         self.assertEqual(next(r2), ["gdzie", "jest","ala", "?"])
 48 | 
 49 |         with self.assertRaises(StopIteration):
 50 |             next(r)
 51 |         with self.assertRaises(StopIteration):
 52 |             next(r2)
 53 | 
 54 | 
 55 |     @mock.patch('random.shuffle')
 56 |     def test_batch_benefactor(self, patched_random_shuffle):
 57 |         # random shuffle no longer shuffles ;-)
 58 | 
 59 |         d = BatchBenefactor(2, lambda x: ' '.join(x), 4)
 60 |         d.add("where")
 61 |         with self.assertRaises(StopIteration):
 62 |             next(d)
 63 |         d.add("is")
 64 |         with self.assertRaises(StopIteration):
 65 |             next(d)
 66 |         d.add("the")
 67 |         with self.assertRaises(StopIteration):
 68 |             next(d)
 69 |         d.add("love")
 70 |         self.assertEqual(list(d), ["is the", "love where"])
 71 | 
 72 |         d = pickle.loads(pickle.dumps(d))
 73 |         d.add("where")
 74 |         with self.assertRaises(StopIteration):
 75 |             next(d)
 76 |         d.add("is")
 77 |         with self.assertRaises(StopIteration):
 78 |             next(d)
 79 |         d.add("the")
 80 |         with self.assertRaises(StopIteration):
 81 |             next(d)
 82 |         d.add("love")
 83 |         self.assertEqual(list(d), ["is the", "love where"])
 84 | 
 85 |         d = pickle.loads(pickle.dumps(d))
 86 |         d.update_minibatch_size(4)
 87 |         d.add("siema")
 88 |         with self.assertRaises(StopIteration):
 89 |             next(d)
 90 |         d.add("is")
 91 |         with self.assertRaises(StopIteration):
 92 |             next(d)
 93 |         d.add("polish")
 94 |         with self.assertRaises(StopIteration):
 95 |             next(d)
 96 |         d.add("greeting")
 97 |         self.assertEqual(list(d), ["is siema polish greeting"])
 98 |         with self.assertRaises(StopIteration):
 99 |             next(d)
100 | 


--------------------------------------------------------------------------------
/tests/tests_vocab.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | 
 3 | from dali.utils import Vocab, VocabEncoded
 4 | 
 5 | class VocabTests(unittest.TestCase):
 6 |     @classmethod
 7 |     def setUp(self):
 8 |         self.vocab = Vocab()
 9 |         self.vocab.add([[{
10 |             'interesting_words': ['awesome', 'cat', 'lol'],
11 |             'daniel' : 'daniel',
12 |             'wtf':[[[[[[[[[[[['there']]]]]]]]]]]]
13 |         }]])
14 | 
15 |         self.example =  {1:{1:{1:[[[[[ 'awesome', 'but','staph', 'daniel' ]]]]]}}}
16 |         self.example_unks = {1: {1: {1: [[[[['awesome', '**UNK**', '**UNK**', 'daniel']]]]]}}}
17 | 
18 | 
19 |     def test_addition(self):
20 |         self.assertEqual(set(self.vocab.words()),
21 |                          set(['awesome',
22 |                               'there',
23 |                               'daniel',
24 |                               '**UNK**',
25 |                               'cat',
26 |                               '**EOS**',
27 |                               'lol']))
28 | 
29 | 
30 |     def test_encode(self):
31 |         encoded  = self.vocab.encode(self.example, encode_type=VocabEncoded)
32 |         decoded  = self.vocab.decode(encoded, decode_type=VocabEncoded)
33 |         self.assertEqual(self.example_unks, decoded)
34 | 
35 |     def test_encode_eos(self):
36 |         encoded  = self.vocab.encode(self.example, add_eos=True, encode_type=VocabEncoded)
37 |         decoded  = self.vocab.decode(encoded, strip_eos=True, decode_type=VocabEncoded)
38 |         assert self.example_unks == decoded
39 | 


--------------------------------------------------------------------------------