├── .gitignore
├── LICENSE
├── README.md
├── docs
├── ai-cover.jpg
├── cnn-convolution.gif
├── cnn-convolution.png
├── cnn-layers.png
├── cnn-maxpooling.png
├── cnn-pooling.png
├── conv-with-padding.png
├── fe-ai.md
├── img-grayscale.jpeg
├── img-regression.jpg
├── picture-55.jpg
├── picture-rgb.png
├── regression-result.jpg
└── tensorflow-playground.png
├── index.html
└── net
├── car.js
└── convnet.js
/.gitignore:
--------------------------------------------------------------------------------
1 | # MAC
2 | .DS_Store
--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
1 | MIT License
2 |
3 | Copyright (c) 2018 Ranjay
4 |
5 | Permission is hereby granted, free of charge, to any person obtaining a copy
6 | of this software and associated documentation files (the "Software"), to deal
7 | in the Software without restriction, including without limitation the rights
8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 |
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 |
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 |
--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | ## 项目说明
2 |
3 | 前端CNN图像识别项目:
4 |
5 | * 打开页面,调出开发者工具控制台并切换到console面板
6 | * 等待console输出“模型训练好了”字样
7 | * 点击识别按钮即可输出识别结果
8 |
9 | 
10 |
11 | ## 目录结构
12 |
13 | ```
14 | ├── net 依赖库及资源文件
15 | ├── docs 项目文档
16 | ├── index.html 项目主文件
17 | └── .gitignore
18 | ```
19 |
20 | ## 项目文档
21 |
22 | [《前端AI实战——告诉世界前端也能做AI》](docs/fe-ai.md)
23 |
24 | ## 其他
25 |
26 | 项目具体知识点详见文件`index.html`内代码注释
27 |
--------------------------------------------------------------------------------
/docs/ai-cover.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/ai-cover.jpg
--------------------------------------------------------------------------------
/docs/cnn-convolution.gif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/cnn-convolution.gif
--------------------------------------------------------------------------------
/docs/cnn-convolution.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/cnn-convolution.png
--------------------------------------------------------------------------------
/docs/cnn-layers.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/cnn-layers.png
--------------------------------------------------------------------------------
/docs/cnn-maxpooling.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/cnn-maxpooling.png
--------------------------------------------------------------------------------
/docs/cnn-pooling.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/cnn-pooling.png
--------------------------------------------------------------------------------
/docs/conv-with-padding.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/conv-with-padding.png
--------------------------------------------------------------------------------
/docs/fe-ai.md:
--------------------------------------------------------------------------------
1 | # 前端AI实战——告诉世界前端也能做AI
2 |
3 | 我想大多数人和我一样,第一次听见“人工智能”这个词的时候都会觉得是一个很高大上、遥不可及的概念,特别像我这样一个平凡的前端,和大部分人一样,都觉得人工智能其实离我们很遥远,我们对它的印象总是停留在各种各样神奇而又复杂的算法,这些仿佛都是那些技术专家或者海归博士才有能力去做的工作。我也曾一度以为自己和这个行业没有太多缘分,但自从Tensorflow发布了JS版本之后,这一领域又引起了我的注意。在python垄断的时代,发布JS工具库不就是意味着我们前端工程师也可以参与其中?
4 |
5 | 当我决定开始投身这片领域做一些自己感兴趣的事情的时候,却发现身边的人投来的都是鄙夷的目光,他们对前端的印象,还总是停留在上个年代那些只会写写页面脚本的切图仔,只有身处这片领域的我们才知道大前端时代早已发生了翻天覆地的变革。
6 |
7 | 今天,我就带领大家从原理开始,尽可能用最通俗易懂的方式,让JS的爱好者们快速上手人工智能。
8 |
9 | 具体项目可参照:https://github.com/jerryOnlyZRJ/image-regression 。
10 |
11 | 本文就单拿人工智能下的一块小领域——“图像识别”作一些简单介绍和实战指引,当然这些都只是这片大领域下的冰山一角,还有很多很多知识等着你去发掘。
12 |
13 | ## 1.CNN卷积神经网络原理剖析
14 |
15 | 如果我不讲解这部分内容,而是直接教你们怎么使用一个现成的库,那这篇文章就没什么价值了,看完之后给你们留下的也一定都会是“开局一张图,过程全靠编”的错觉。因此,要真正了解人工智能,就应该进入这个黑盒,里面的思想才是精华。
16 |
17 | ### 1.1.图像灰度级与灰度图
18 |
19 | #### 1.1.1.基本概念
20 |
21 | 要做图像识别,我们肯定要先从图像下手,大家先理解一个概念——图像灰度级。
22 |
23 | 众所周知,我们的图片都是由许多像素点组成的,就好像一张100*100像素的图片,就表示它是由10000个像素点呈现的。但你可曾想过,这些像素点可以由一系列的数字表示嘛?
24 |
25 | 就先不拿彩色的图片吧,彩色太复杂了,我们就先拿一张黑白的图片为例,假设我们以黑色像素的深浅为基准,将白色到黑色的渐变过程分为不同的等级,这样,图片上每一个像素点都能用一个最为临近的等级数字表示出来:
26 |
27 | 
28 |
29 | 如果我们用1表示白色,用0表示黑色,将图像二值化,最后以矢量(数字)的形式呈现出来,结果大概就是这样:(下图是一张5*5的二值化图像,没有具体表示含义,只作示例)
30 |
31 | 
32 |
33 | 同理,如果是彩色的图像,那我们是不是可以把R、G、B三个维度的像素单独提取出来分别处理呢?这样,每一个维度不就可以单独视为一张灰度图。
34 |
35 | 
36 |
37 | #### 1.1.2.平滑图像与特征点
38 |
39 | 如果一张图像没有什么像素突变,比如一张全白的图片,如果以数字表示,自然都是0,那我们可以称这张图片的像素点是平滑的。再比如这张全白的图片上有一个黑点,自然,灰度图上就会有一个突兀的数值,我们就把它称作特征点,通常来说,图像的特征点有可能是噪声、边缘或者图片的实际特征。
40 |
41 | ### 1.2.神经网络与模型训练
42 |
43 | tensorflow在发布了JS版本的工具库后,也同时制作了一个[Tensorflow游乐场](http://playground.tensorflow.org/),打开之后,映入眼帘的网页中央这个东西便是神经网络:
44 |
45 | 
46 |
47 | 从图中,我们可以看到神经网络有很多不同的层级,就是图中的Layers,每一层都是前一层经过滤波器计算后的结果,越多的层级以及越多的“神经元”经过一次计算过程计算出来的结果误差越小,同时,计算的时间也会增加。神经网络正是模仿了我们人类脑袋里的神经元经过了一系列计算然后学习事物的过程。这里推荐阮一峰的[《神经网络入门》](http://www.ruanyifeng.com/blog/2017/07/neural-network.html)这篇文章,能够帮助大家更加浅显地了解神经网络是什么。
48 |
49 | 在我们的卷积神经网络中,这些层级都有不同的名字:输入层、卷积层、池化层以及输出层。
50 |
51 | * 输入层:我们输入的矢量化之后的图像
52 | * 卷积层:经过滤波器卷积计算之后的图像
53 | * 池化层:经过池化滤波器卷积计算之后的图像
54 | * 输出层:输出数据
55 |
56 | Features就是我们的算子,也称为滤波器,但是每种不同的滤波器对最后的输出结果都会有不同的影响,经过训练之后,机器会通过我们赋予的算法(比如激活函数等等)计算出哪些滤波器会对输出结果造成较大的误差,哪些滤波器对输出结果压根没有影响(原理很简单,第一次计算使用所有滤波器,第二次计算拿掉某一个滤波器,然后观察误差值(Training loss)就可以知道这个被拿掉的滤波器所起到的作用了),机器会为比较重要的滤波器赋予较高的权重,我们将这样一个过程称为“训练”。最终,我们将得到的整个带有权重的神经网络称为我们通过机器训练出的“模型”,我们可以拿着这个模型去让机器学习事物。
57 |
58 | 这就是机器学习中“训练模型”的过程,Tensorflow.js就是为我们提供的训练模型的工具库,当你真正掌握了模型训练的奥义之后,Tensorflow对你而言就像jQuery用起来一般简单。
59 |
60 | 大家看完这些介绍之后肯定还是一脸茫然,什么是滤波器?什么又是卷积计算?不着急,下一个版块的内容将会为大家揭开所有谜题。
61 |
62 | ### 1.3.卷积算法揭秘
63 |
64 | #### 1.3.1.卷积算法
65 |
66 | 还记得我们在1.1.1里说到一张图片可以用矢量的形式表示每个像素点嘛?卷积计算就是在这基础上,使用某些算子对这些像素点进行处理,而这些算子,就是我们刚刚提到的滤波器(比如左边,就是一张经过二值化处理的5\*5的图片,中间的就是我们的滤波器):
67 |
68 | 
69 |
70 | 那计算的过程又是怎样的呢?卷积这东西听起来感觉很复杂,但实际上就是把我们的滤波器套到图像上,乘积求和,然后将图像上位于滤波器中心的值用计算结果替换,大概的效果就是下面这张动图这样:
71 |
72 | 
73 |
74 | 对,所谓高大上的卷积就是这样一个过程,我们的滤波器每次计算之后就向右移动一个像素,所以我们可以称滤波器的步长为1,以此类推。不过我们发现,经过滤波器处理后的图像,好像“变小了”!原来是5\*5的图片这下变成了3\*3,这是卷积运算带来的必然副作用,如果不想让图片变小,我们可以为原图像加上一定像素且值均为0的边界(padding)去抵消副作用,就像下面这样:
75 |
76 | 
77 |
78 | #### 1.3.2.池化算法
79 |
80 | 其实在平时训练模型的过程中,我们输入的图像肯定不只有5\*5像素这么小,我们最经常见到的图片许多都是100\*100像素以上的,这样使用我们的机器去计算起来肯定是比较复杂的,因此,我们常常会使用池化算法进行特征提取或者图像平滑处理,池化的过程其实就是按照某种规律将图片等比缩小,过程就像下面这样:
81 |
82 | 
83 |
84 | 而池化算法最常用的有两大类:取均值算法和取最大值算法,顾名思义,取均值算法就是取滤波器中的平均值作为结果,取最大值算法就是取滤波器中的最大值作为输出结果:
85 |
86 | 
87 |
88 | 上图就是取最大值算法的处理过程,大家也能很直观的看出,在池化层中,滤波器的步长大都是等于滤波器自身大小的(比较方便控制缩放比例)。并且,取最大值算法肯定是很容易取到滤波器中的特征点(还记得特征点嘛?忘记的话快回去1.1.2看看哦~),所以我们可以将取最大值算法的池化处理称为特征提取;同理,取均值算法因为把所有的像素点的灰度级都平均了,所以我们可以称之为平滑处理。
89 |
90 | 关于卷积神经网络的知识,可以具体参照这篇文章:[《卷积神经网络(1)卷积层和池化层学习》](https://www.cnblogs.com/zf-blog/p/6075286.html)。了解了这些知识之后,就可以开始我们的实战啦~
91 |
92 | ## 2.图像识别实战
93 |
94 | 说了那么多理论,也不比实操来得有感觉。在大家了解了卷积神经网络的基本原理之后,就可以使用我们的工具库来帮助我们完成相关工作,这里我推荐[ConvNetJS](https://github.com/karpathy/convnetjs)。这款工具库的本质就是我们在1.2中提到的别人训练好的模型,我们只需要拿来“学习”即可。
95 |
96 | ### 2.1.使用ConvNetJS
97 |
98 | 我们可以看到在ConvNetJS的README里有这样一段官方demo,具体的含义我已经用注释在代码里标注:
99 |
100 | ```js
101 | // 定义一个神经网络
102 | var layer_defs = [];
103 | // 输入层:即是32*32*3的图像
104 | layer_defs.push({type:'input', out_sx:32, out_sy:32, out_depth:3});
105 | // 卷积层
106 | // filter:用16个5*5的滤波器去卷积
107 | // stride:卷积步长为1
108 | // padding:填充宽度为2(为保证输出的图像大小不会发生变化)
109 | // activation:激活函数为relu(还有Tanh、Sigmoid等等函数,功能不同)
110 | layer_defs.push({type:'conv', sx:5, filters:16, stride:1, pad:2, activation:'relu'});
111 | // 池化层
112 | // 池化滤波器的大小为2*2
113 | // stride:步长为2
114 | // 在这里我们无法看出这个框架池化是使用的Avy Pooling还是Max Pooling算法,先视为后者
115 | layer_defs.push({type:'pool', sx:2, stride:2});
116 | // 反复卷积和池化减小模型误差
117 | layer_defs.push({type:'conv', sx:5, filters:20, stride:1, pad:2, activation:'relu'});
118 | layer_defs.push({type:'pool', sx:2, stride:2});
119 | layer_defs.push({type:'conv', sx:5, filters:20, stride:1, pad:2, activation:'relu'});
120 | layer_defs.push({type:'pool', sx:2, stride:2});
121 | // 输出层
122 | // 分类器:输出10种不同的类别
123 | layer_defs.push({type:'softmax', num_classes:10});
124 |
125 | // 实例化一个神经网络
126 | net = new convnetjs.Net();
127 | net.makeLayers(layer_defs);
128 |
129 | // 模型训练
130 | const trainer = new convnetjs.SGDTrainer(net, { learning_rate: 0.01, momentum: 0.9, batch_size: 5, l2_decay: 0.0 });
131 | trainer.train(imgVol, classIndex);
132 |
133 | // 使用训练好的模型进行图像识别
134 | var x = convnetjs.img_to_vol(document.getElementById('some_image'))
135 | var output_probabilities_vol = net.forward(x)
136 | ```
137 |
138 | 如果想要更形象点,上述过程可以用这样一幅图表示:
139 |
140 | 
141 |
142 | 中间的“卷积-池化-卷积-池化……”就是我们定义并训练的神经网络,我们输入矢量化处理后的图像后,先进行卷积运算,不同的滤波器得到了不同的结果,官方demo里是使用了16个不同的滤波器(PS:这里给大家留一个思考的问题,一个3\*3的二值化滤波器,能写出多少种可能?),自然能卷积出16种不同的结果,再拿着这些结果池化处理,不断重复这个过程,最终得出图像识别结果:
143 |
144 | 
145 |
146 | ### 2.2.实战项目解析
147 |
148 | 来,我们一起详细梳理一下使用ConvNetJS这个工具库完成整个图像识别的具体流程,
149 |
150 | (PS:项目代码具体参照:https://github.com/jerryOnlyZRJ/image-regression )
151 |
152 | 首先,我们必须先有数据供我们的模型去学习,至少你该让这个模型知道啥是啥对吧,在项目里的 `net` 文件夹里的 `car.js` 文件,存放的就是我们的学习数据,如果你们感兴趣可以打开看看,里面的数据就是告诉机器什么样的车标对应的是车的什么品牌。
153 |
154 | 在我们的项目里,是通过这样一段代码完成机器学习的:
155 |
156 | ```js
157 | const trainer = new convnetjs.SGDTrainer(net, { learning_rate: 0.01, momentum: 0.9, batch_size: 5, l2_decay: 0.0 });
158 | let imageList = [];
159 | const loadData = i => {
160 | return function () {
161 | return new Promise(function (resolve, reject) {
162 | let image = new Image();
163 | image.crossOrigin = "anonymous";
164 | image.src = carList[i].url;
165 | image.onload = function () {
166 | let vol = convnetjs.img_to_vol(image);
167 | // 逐张训练图片
168 | trainer.train(vol, i);
169 | resolve();
170 | };
171 | image.onerror = reject;
172 | })
173 | }
174 | }
175 | // 遍历图片资源
176 | for (let j = 0; j < carList.length; j++) {
177 | imageList.push(loadData(j));
178 | }
179 | var testBtn = document.getElementById("test")
180 | function training(){
181 | testBtn.disabled = true
182 | return new Promise((resolve, reject) => {
183 | Promise.all(imageList.map(imageContainer => imageContainer())).then(() => {
184 | console.log("模型训练好了!!!👌")
185 | testBtn.disabled = false
186 | resolve()
187 | })
188 | })
189 | }
190 | ```
191 |
192 | 我们试着去打印一下图像识别的输出结果,得到的是这样一个东西:
193 |
194 | 
195 |
196 | 从识别结果中我们可以看到,我们得到的是一个数组,这就是经过分类器分类的10个不同类别,对应的自然是我们的车的品牌,值就是每个类别对应的概率。所以,我们只要拿到概率的最大值,就是预测得出的最倾向的结果。
197 |
198 | ## 3.结语
199 |
200 | 随着JS引擎的计算能力不断增强,人工智能领域的不断发展,可以预见的是,在不久的将来,肯定能有一些简单的算法可以被移植到用户前端执行,这样既能减少请求,又能分担后端压力。这一切并不是无稽之谈,为什么tensorflow.js会应运而生,正是因为JS的社区在不断壮大,JS这款便捷的语言也在得到更为普遍的使用。所以,请对你所从事的这份前端事业,有足够的信心!
201 |
202 | 还是那句老话:
203 |
204 | **技术从来不会受限于语言,受限你的,永远只是思想。**
205 |
206 | 我并不是什么算法工程师,我也不是CS专业出来的科班生,我只是一枚普普通通的前端,和绝大多数人一样,没有多深厚的基础,但我愿意去学,我享受克服困难的过程,而那份对人工智能的执着,只是来源于那份不满足于现状的倔性和对这片领域一成不变的初心。
207 |
208 | 如果您觉得这篇文章对您有帮助,还请麻烦您为文章提供的示例demo项目点个star;如果您对我的其他项目感兴趣,也欢迎follow哦~
209 |
210 | ## 4.鸣谢
211 |
212 | 本文项目资源大部分来自[京程一灯](https://yd.ke.qq.com),感谢[京程一灯](https://yd.ke.qq.com/)袁志佳老师对本文以及我个人提供的支持和帮助,如果你也在前端前进路上感到迷茫,[京程一灯](https://yd.ke.qq.com/)也许是你不错的选择。
--------------------------------------------------------------------------------
/docs/img-grayscale.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/img-grayscale.jpeg
--------------------------------------------------------------------------------
/docs/img-regression.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/img-regression.jpg
--------------------------------------------------------------------------------
/docs/picture-55.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/picture-55.jpg
--------------------------------------------------------------------------------
/docs/picture-rgb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/picture-rgb.png
--------------------------------------------------------------------------------
/docs/regression-result.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/regression-result.jpg
--------------------------------------------------------------------------------
/docs/tensorflow-playground.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/jerryOnlyZRJ/image-regression/4d076078bcd7e0aab461cadbe71d84e49aa477af/docs/tensorflow-playground.png
--------------------------------------------------------------------------------
/index.html:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
6 |
7 |
8 | 利用卷积神经网络算法识别车logo
9 |
10 |
11 |
12 |
13 |
14 |
15 |
16 |
88 |
89 |
90 |
--------------------------------------------------------------------------------
/net/car.js:
--------------------------------------------------------------------------------
1 | var carList = [
2 | {
3 | "name": "奥迪",
4 | "url": "http://p.pstatp.com/avatar/100x100/1dd5000048d6334c26b4.png",
5 | "index": 0
6 | },
7 | {
8 | "name": "奔驰",
9 | "url": "http://p.pstatp.com/avatar/100x100/1dd50000190229abeec8.png",
10 | "index": 1
11 | },
12 | {
13 | "name": "宝马",
14 | "url": "http://p.pstatp.com/avatar/100x100/1dd5000018fab5bd782b.png",
15 | "index": 2
16 | },
17 | {
18 | "name": "本田",
19 | "url": "http://p.pstatp.com/avatar/100x100/1dd5000018fc7c108922.png",
20 | "index": 3
21 | },
22 | {
23 | "name": "别克",
24 | "url": "http://p.pstatp.com/avatar/100x100/1dd5000018fefd5c26b7.png",
25 | "index": 4
26 | },
27 | {
28 | "name": "比亚迪",
29 | "url": "http://p.pstatp.com/avatar/100x100/1dd5000018f0e7000aa7.png",
30 | "index": 5
31 | },
32 | {
33 | "name": "保时捷",
34 | "url": "http://p.pstatp.com/avatar/100x100/1dd50000190122c26c84.png",
35 | "index": 6
36 | },
37 | {
38 | "name": "大众",
39 | "url": "http://p.pstatp.com/avatar/100x100/1dd500001906761eb47e.png",
40 | "index": 7
41 | },
42 | {
43 | "name": "哈弗",
44 | "url": "http://p.pstatp.com/avatar/100x100/1dd50000193811739d87.png",
45 | "index": 8
46 | },
47 | {
48 | "name": "兰博基尼",
49 | "url": "http://p.pstatp.com/avatar/100x100/1dd50000191738275961.png",
50 | "index": 9
51 | },
52 | {
53 | "name": "雪佛兰",
54 | "url": "http://p.pstatp.com/avatar/100x100/1dd50000196a38ee3f43.png",
55 | "index": 10
56 | },
57 | {
58 | "name": "现代",
59 | "url": "http://p.pstatp.com/avatar/100x100/1dd50000196d2f0b9a05.png",
60 | "index": 11
61 | }
62 | ]
--------------------------------------------------------------------------------
/net/convnet.js:
--------------------------------------------------------------------------------
1 | var convnetjs = convnetjs || { REVISION: 'ALPHA' };
2 | (function(global) {
3 | "use strict";
4 |
5 | // Random number utilities
6 | var return_v = false;
7 | var v_val = 0.0;
8 | var gaussRandom = function() {
9 | if(return_v) {
10 | return_v = false;
11 | return v_val;
12 | }
13 | var u = 2*Math.random()-1;
14 | var v = 2*Math.random()-1;
15 | var r = u*u + v*v;
16 | if(r == 0 || r > 1) return gaussRandom();
17 | var c = Math.sqrt(-2*Math.log(r)/r);
18 | v_val = v*c; // cache this
19 | return_v = true;
20 | return u*c;
21 | }
22 | var randf = function(a, b) { return Math.random()*(b-a)+a; }
23 | var randi = function(a, b) { return Math.floor(Math.random()*(b-a)+a); }
24 | var randn = function(mu, std){ return mu+gaussRandom()*std; }
25 |
26 | // Array utilities
27 | var zeros = function(n) {
28 | if(typeof(n)==='undefined' || isNaN(n)) { return []; }
29 | if(typeof ArrayBuffer === 'undefined') {
30 | // lacking browser support
31 | var arr = new Array(n);
32 | for(var i=0;i maxv) { maxv = w[i]; maxi = i; }
66 | if(w[i] < minv) { minv = w[i]; mini = i; }
67 | }
68 | return {maxi: maxi, maxv: maxv, mini: mini, minv: minv, dv:maxv-minv};
69 | }
70 |
71 | // create random permutation of numbers, in range [0...n-1]
72 | var randperm = function(n) {
73 | var i = n,
74 | j = 0,
75 | temp;
76 | var array = [];
77 | for(var q=0;qright
259 | var augment = function(V, crop, dx, dy, fliplr) {
260 | // note assumes square outputs of size crop x crop
261 | if(typeof(fliplr)==='undefined') var fliplr = false;
262 | if(typeof(dx)==='undefined') var dx = global.randi(0, V.sx - crop);
263 | if(typeof(dy)==='undefined') var dy = global.randi(0, V.sy - crop);
264 |
265 | // randomly sample a crop in the input volume
266 | var W;
267 | if(crop !== V.sx || dx!==0 || dy!==0) {
268 | W = new Vol(crop, crop, V.depth, 0.0);
269 | for(var x=0;x=V.sx || y+dy<0 || y+dy>=V.sy) continue; // oob
272 | for(var d=0;d=0 && oy=0 && ox=0 && oy=0 && ox=0 && oy=0 && ox a) { a = v; winx=ox; winy=oy;}
689 | }
690 | }
691 | }
692 | this.switchx[n] = winx;
693 | this.switchy[n] = winy;
694 | n++;
695 | A.set(ax, ay, d, a);
696 | }
697 | }
698 | }
699 | this.out_act = A;
700 | return this.out_act;
701 | },
702 | backward: function() {
703 | // pooling layers have no parameters, so simply compute
704 | // gradient wrt data here
705 | var V = this.in_act;
706 | V.dw = global.zeros(V.w.length); // zero out gradient wrt data
707 | var A = this.out_act; // computed in forward pass
708 |
709 | var n = 0;
710 | for(var d=0;d amax) amax = as[i];
841 | }
842 |
843 | // compute exponentials (carefully to not blow up)
844 | var es = global.zeros(this.out_depth);
845 | var esum = 0.0;
846 | for(var i=0;i 0) {
1004 | // violating dimension, apply loss
1005 | x.dw[i] += 1;
1006 | x.dw[y] -= 1;
1007 | loss += ydiff;
1008 | }
1009 | }
1010 |
1011 | return loss;
1012 | },
1013 | getParamsAndGrads: function() {
1014 | return [];
1015 | },
1016 | toJSON: function() {
1017 | var json = {};
1018 | json.out_depth = this.out_depth;
1019 | json.out_sx = this.out_sx;
1020 | json.out_sy = this.out_sy;
1021 | json.layer_type = this.layer_type;
1022 | json.num_inputs = this.num_inputs;
1023 | return json;
1024 | },
1025 | fromJSON: function(json) {
1026 | this.out_depth = json.out_depth;
1027 | this.out_sx = json.out_sx;
1028 | this.out_sy = json.out_sy;
1029 | this.layer_type = json.layer_type;
1030 | this.num_inputs = json.num_inputs;
1031 | }
1032 | }
1033 |
1034 | global.RegressionLayer = RegressionLayer;
1035 | global.SoftmaxLayer = SoftmaxLayer;
1036 | global.SVMLayer = SVMLayer;
1037 |
1038 | })(convnetjs);
1039 |
1040 | (function(global) {
1041 | "use strict";
1042 | var Vol = global.Vol; // convenience
1043 |
1044 | // Implements ReLU nonlinearity elementwise
1045 | // x -> max(0, x)
1046 | // the output is in [0, inf)
1047 | var ReluLayer = function(opt) {
1048 | var opt = opt || {};
1049 |
1050 | // computed
1051 | this.out_sx = opt.in_sx;
1052 | this.out_sy = opt.in_sy;
1053 | this.out_depth = opt.in_depth;
1054 | this.layer_type = 'relu';
1055 | }
1056 | ReluLayer.prototype = {
1057 | forward: function(V, is_training) {
1058 | this.in_act = V;
1059 | var V2 = V.clone();
1060 | var N = V.w.length;
1061 | var V2w = V2.w;
1062 | for(var i=0;i 1/(1+e^(-x))
1099 | // so the output is between 0 and 1.
1100 | var SigmoidLayer = function(opt) {
1101 | var opt = opt || {};
1102 |
1103 | // computed
1104 | this.out_sx = opt.in_sx;
1105 | this.out_sy = opt.in_sy;
1106 | this.out_depth = opt.in_depth;
1107 | this.layer_type = 'sigmoid';
1108 | }
1109 | SigmoidLayer.prototype = {
1110 | forward: function(V, is_training) {
1111 | this.in_act = V;
1112 | var V2 = V.cloneAndZero();
1113 | var N = V.w.length;
1114 | var V2w = V2.w;
1115 | var Vw = V.w;
1116 | for(var i=0;i max(x)
1153 | // where x is a vector of size group_size. Ideally of course,
1154 | // the input size should be exactly divisible by group_size
1155 | var MaxoutLayer = function(opt) {
1156 | var opt = opt || {};
1157 |
1158 | // required
1159 | this.group_size = typeof opt.group_size !== 'undefined' ? opt.group_size : 2;
1160 |
1161 | // computed
1162 | this.out_sx = opt.in_sx;
1163 | this.out_sy = opt.in_sy;
1164 | this.out_depth = Math.floor(opt.in_depth / this.group_size);
1165 | this.layer_type = 'maxout';
1166 |
1167 | this.switches = global.zeros(this.out_sx*this.out_sy*this.out_depth); // useful for backprop
1168 | }
1169 | MaxoutLayer.prototype = {
1170 | forward: function(V, is_training) {
1171 | this.in_act = V;
1172 | var N = this.out_depth;
1173 | var V2 = new Vol(this.out_sx, this.out_sy, this.out_depth, 0.0);
1174 |
1175 | // optimization branch. If we're operating on 1D arrays we dont have
1176 | // to worry about keeping track of x,y,d coordinates inside
1177 | // input volumes. In convnets we do :(
1178 | if(this.out_sx === 1 && this.out_sy === 1) {
1179 | for(var i=0;i a) {
1186 | a = a2;
1187 | ai = j;
1188 | }
1189 | }
1190 | V2.w[i] = a;
1191 | this.switches[i] = ix + ai;
1192 | }
1193 | } else {
1194 | var n=0; // counter for switches
1195 | for(var x=0;x a) {
1204 | a = a2;
1205 | ai = j;
1206 | }
1207 | }
1208 | V2.set(x,y,i,a);
1209 | this.switches[n] = ix + ai;
1210 | n++;
1211 | }
1212 | }
1213 | }
1214 |
1215 | }
1216 | this.out_act = V2;
1217 | return this.out_act;
1218 | },
1219 | backward: function() {
1220 | var V = this.in_act; // we need to set dw of this
1221 | var V2 = this.out_act;
1222 | var N = this.out_depth;
1223 | V.dw = global.zeros(V.w.length); // zero out gradient wrt data
1224 |
1225 | // pass the gradient through the appropriate switch
1226 | if(this.out_sx === 1 && this.out_sy === 1) {
1227 | for(var i=0;i tanh(x)
1274 | // so the output is between -1 and 1.
1275 | var TanhLayer = function(opt) {
1276 | var opt = opt || {};
1277 |
1278 | // computed
1279 | this.out_sx = opt.in_sx;
1280 | this.out_sy = opt.in_sy;
1281 | this.out_depth = opt.in_depth;
1282 | this.layer_type = 'tanh';
1283 | }
1284 | TanhLayer.prototype = {
1285 | forward: function(V, is_training) {
1286 | this.in_act = V;
1287 | var V2 = V.cloneAndZero();
1288 | var N = V.w.length;
1289 | for(var i=0;i= 2, 'Error! At least one input layer and one loss layer are required.');
1538 | assert(defs[0].type === 'input', 'Error! First layer must be the input layer, to declare size of inputs');
1539 |
1540 | // desugar layer_defs for adding activation, dropout layers etc
1541 | var desugar = function() {
1542 | var new_defs = [];
1543 | for(var i=0;i0) {
1595 | var prev = this.layers[i-1];
1596 | def.in_sx = prev.out_sx;
1597 | def.in_sy = prev.out_sy;
1598 | def.in_depth = prev.out_depth;
1599 | }
1600 |
1601 | switch(def.type) {
1602 | case 'fc': this.layers.push(new global.FullyConnLayer(def)); break;
1603 | case 'lrn': this.layers.push(new global.LocalResponseNormalizationLayer(def)); break;
1604 | case 'dropout': this.layers.push(new global.DropoutLayer(def)); break;
1605 | case 'input': this.layers.push(new global.InputLayer(def)); break;
1606 | case 'softmax': this.layers.push(new global.SoftmaxLayer(def)); break;
1607 | case 'regression': this.layers.push(new global.RegressionLayer(def)); break;
1608 | case 'conv': this.layers.push(new global.ConvLayer(def)); break;
1609 | case 'pool': this.layers.push(new global.PoolLayer(def)); break;
1610 | case 'relu': this.layers.push(new global.ReluLayer(def)); break;
1611 | case 'sigmoid': this.layers.push(new global.SigmoidLayer(def)); break;
1612 | case 'tanh': this.layers.push(new global.TanhLayer(def)); break;
1613 | case 'maxout': this.layers.push(new global.MaxoutLayer(def)); break;
1614 | case 'svm': this.layers.push(new global.SVMLayer(def)); break;
1615 | default: console.log('ERROR: UNRECOGNIZED LAYER TYPE: ' + def.type);
1616 | }
1617 | }
1618 | },
1619 |
1620 | // forward prop the network.
1621 | // The trainer class passes is_training = true, but when this function is
1622 | // called from outside (not from the trainer), it defaults to prediction mode
1623 | forward: function(V, is_training) {
1624 | if(typeof(is_training) === 'undefined') is_training = false;
1625 | var act = this.layers[0].forward(V, is_training);
1626 | for(var i=1;i=0;i--) { // first layer assumed input
1644 | this.layers[i].backward();
1645 | }
1646 | return loss;
1647 | },
1648 | getParamsAndGrads: function() {
1649 | // accumulate parameters and gradients for the entire network
1650 | var response = [];
1651 | for(var i=0;i maxv) { maxv = p[i]; maxi = i;}
1670 | }
1671 | return maxi; // return index of the class with highest class probability
1672 | },
1673 | toJSON: function() {
1674 | var json = {};
1675 | json.layers = [];
1676 | for(var i=0;i 0.0)) {
1754 | // only vanilla sgd doesnt need either lists
1755 | // momentum needs gsum
1756 | // adagrad needs gsum
1757 | // adadelta needs gsum and xsum
1758 | for(var i=0;i 0 ? 1 : -1);
1785 | var l2grad = l2_decay * (p[j]);
1786 |
1787 | var gij = (l2grad + l1grad + g[j]) / this.batch_size; // raw batch gradient
1788 |
1789 | var gsumi = this.gsum[i];
1790 | var xsumi = this.xsum[i];
1791 | if(this.method === 'adagrad') {
1792 | // adagrad update
1793 | gsumi[j] = gsumi[j] + gij * gij;
1794 | var dx = - this.learning_rate / Math.sqrt(gsumi[j] + this.eps) * gij;
1795 | p[j] += dx;
1796 | } else if(this.method === 'windowgrad') {
1797 | // this is adagrad but with a moving window weighted average
1798 | // so the gradient is not accumulated over the entire history of the run.
1799 | // it's also referred to as Idea #1 in Zeiler paper on Adadelta. Seems reasonable to me!
1800 | gsumi[j] = this.ro * gsumi[j] + (1-this.ro) * gij * gij;
1801 | var dx = - this.learning_rate / Math.sqrt(gsumi[j] + this.eps) * gij; // eps added for better conditioning
1802 | p[j] += dx;
1803 | } else if(this.method === 'adadelta') {
1804 | // assume adadelta if not sgd or adagrad
1805 | gsumi[j] = this.ro * gsumi[j] + (1-this.ro) * gij * gij;
1806 | var dx = - Math.sqrt((xsumi[j] + this.eps)/(gsumi[j] + this.eps)) * gij;
1807 | xsumi[j] = this.ro * xsumi[j] + (1-this.ro) * dx * dx; // yes, xsum lags behind gsum by 1.
1808 | p[j] += dx;
1809 | } else if(this.method === 'nesterov') {
1810 | var dx = gsumi[j];
1811 | gsumi[j] = gsumi[j] * this.momentum + this.learning_rate * gij;
1812 | dx = this.momentum * dx - (1.0 + this.momentum) * gsumi[j];
1813 | p[j] += dx;
1814 | } else {
1815 | // assume SGD
1816 | if(this.momentum > 0.0) {
1817 | // momentum update
1818 | var dx = this.momentum * gsumi[j] - this.learning_rate * gij; // step
1819 | gsumi[j] = dx; // back this up for next iteration of momentum
1820 | p[j] += dx; // apply corrected gradient
1821 | } else {
1822 | // vanilla sgd
1823 | p[j] += - this.learning_rate * gij;
1824 | }
1825 | }
1826 | g[j] = 0.0; // zero out gradient so that we can begin accumulating anew
1827 | }
1828 | }
1829 | }
1830 |
1831 | // appending softmax_loss for backwards compatibility, but from now on we will always use cost_loss
1832 | // in future, TODO: have to completely redo the way loss is done around the network as currently
1833 | // loss is a bit of a hack. Ideally, user should specify arbitrary number of loss functions on any layer
1834 | // and it should all be computed correctly and automatically.
1835 | return {fwd_time: fwd_time, bwd_time: bwd_time,
1836 | l2_decay_loss: l2_decay_loss, l1_decay_loss: l1_decay_loss,
1837 | cost_loss: cost_loss, softmax_loss: cost_loss,
1838 | loss: cost_loss + l1_decay_loss + l2_decay_loss}
1839 | }
1840 | }
1841 |
1842 | global.Trainer = Trainer;
1843 | global.SGDTrainer = Trainer; // backwards compatibility
1844 | })(convnetjs);
1845 |
1846 | (function(global) {
1847 | "use strict";
1848 |
1849 | // used utilities, make explicit local references
1850 | var randf = global.randf;
1851 | var randi = global.randi;
1852 | var Net = global.Net;
1853 | var Trainer = global.Trainer;
1854 | var maxmin = global.maxmin;
1855 | var randperm = global.randperm;
1856 | var weightedSample = global.weightedSample;
1857 | var getopt = global.getopt;
1858 | var arrUnique = global.arrUnique;
1859 |
1860 | /*
1861 | A MagicNet takes data: a list of convnetjs.Vol(), and labels
1862 | which for now are assumed to be class indeces 0..K. MagicNet then:
1863 | - creates data folds for cross-validation
1864 | - samples candidate networks
1865 | - evaluates candidate networks on all data folds
1866 | - produces predictions by model-averaging the best networks
1867 | */
1868 | var MagicNet = function(data, labels, opt) {
1869 | var opt = opt || {};
1870 | if(typeof data === 'undefined') { data = []; }
1871 | if(typeof labels === 'undefined') { labels = []; }
1872 |
1873 | // required inputs
1874 | this.data = data; // store these pointers to data
1875 | this.labels = labels;
1876 |
1877 | // optional inputs
1878 | this.train_ratio = getopt(opt, 'train_ratio', 0.7);
1879 | this.num_folds = getopt(opt, 'num_folds', 10);
1880 | this.num_candidates = getopt(opt, 'num_candidates', 50); // we evaluate several in parallel
1881 | // how many epochs of data to train every network? for every fold?
1882 | // higher values mean higher accuracy in final results, but more expensive
1883 | this.num_epochs = getopt(opt, 'num_epochs', 50);
1884 | // number of best models to average during prediction. Usually higher = better
1885 | this.ensemble_size = getopt(opt, 'ensemble_size', 10);
1886 |
1887 | // candidate parameters
1888 | this.batch_size_min = getopt(opt, 'batch_size_min', 10);
1889 | this.batch_size_max = getopt(opt, 'batch_size_max', 300);
1890 | this.l2_decay_min = getopt(opt, 'l2_decay_min', -4);
1891 | this.l2_decay_max = getopt(opt, 'l2_decay_max', 2);
1892 | this.learning_rate_min = getopt(opt, 'learning_rate_min', -4);
1893 | this.learning_rate_max = getopt(opt, 'learning_rate_max', 0);
1894 | this.momentum_min = getopt(opt, 'momentum_min', 0.9);
1895 | this.momentum_max = getopt(opt, 'momentum_max', 0.9);
1896 | this.neurons_min = getopt(opt, 'neurons_min', 5);
1897 | this.neurons_max = getopt(opt, 'neurons_max', 30);
1898 |
1899 | // computed
1900 | this.folds = []; // data fold indices, gets filled by sampleFolds()
1901 | this.candidates = []; // candidate networks that are being currently evaluated
1902 | this.evaluated_candidates = []; // history of all candidates that were fully evaluated on all folds
1903 | this.unique_labels = arrUnique(labels);
1904 | this.iter = 0; // iteration counter, goes from 0 -> num_epochs * num_training_data
1905 | this.foldix = 0; // index of active fold
1906 |
1907 | // callbacks
1908 | this.finish_fold_callback = null;
1909 | this.finish_batch_callback = null;
1910 |
1911 | // initializations
1912 | if(this.data.length > 0) {
1913 | this.sampleFolds();
1914 | this.sampleCandidates();
1915 | }
1916 | };
1917 |
1918 | MagicNet.prototype = {
1919 |
1920 | // sets this.folds to a sampling of this.num_folds folds
1921 | sampleFolds: function() {
1922 | var N = this.data.length;
1923 | var num_train = Math.floor(this.train_ratio * N);
1924 | this.folds = []; // flush folds, if any
1925 | for(var i=0;i= lastiter) {
2007 | // finished evaluation of this fold. Get final validation
2008 | // accuracies, record them, and go on to next fold.
2009 | var val_acc = this.evalValErrors();
2010 | for(var k=0;k= this.folds.length) {
2023 | // we finished all folds as well! Record these candidates
2024 | // and sample new ones to evaluate.
2025 | for(var k=0;k (b.accv / b.acc.length)
2032 | ? -1 : 1;
2033 | });
2034 | // and clip only to the top few ones (lets place limit at 3*ensemble_size)
2035 | // otherwise there are concerns with keeping these all in memory
2036 | // if MagicNet is being evaluated for a very long time
2037 | if(this.evaluated_candidates.length > 3 * this.ensemble_size) {
2038 | this.evaluated_candidates = this.evaluated_candidates.slice(0, 3 * this.ensemble_size);
2039 | }
2040 | if(this.finish_batch_callback !== null) {
2041 | this.finish_batch_callback();
2042 | }
2043 | this.sampleCandidates(); // begin with new candidates
2044 | this.foldix = 0; // reset this
2045 | } else {
2046 | // we will go on to another fold. reset all candidates nets
2047 | for(var k=0;k