├── README.md
├── kervolutionMnist.ipynb
└── layer.py

/README.md:
--------------------------------------------------------------------------------
## Kervolutional Neural Networks
A PyTorch implementation of the kervolutional (kernel convolutional) layer from Kervolutional Neural Networks [[paper](https://arxiv.org/pdf/1904.03955.pdf)].
It is similar in spirit to Network in Network, but adds the non-linearity through kernel functions instead of extra layers.

## Dependencies
```
pip install torch torchvision numpy matplotlib pandas
```

To use this layer:
```
from layer import KernelConv2d, GaussianKernel, PolynomialKernel
```
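The kernel is passed to `KernelConv2d` as a callable, and its hyper-parameters are bound with `functools.partial`, as done in `kervolutionMnist.ipynb`. A minimal usage sketch (the `KernelConv2d(in_channels, out_channels, kernel_size, kernel_fn)` argument order mirrors the notebook; the default stride and padding are assumed to behave like `nn.Conv2d`, so check `layer.py` for the exact defaults):
```
import torch
from functools import partial
from layer import KernelConv2d, GaussianKernel, PolynomialKernel

# Gaussian kernel with gamma=0.05, matching the notebook's first layer
kerv1 = KernelConv2d(1, 10, 5, partial(GaussianKernel, 0.05))

# Polynomial kernel with the parameters suggested in the notebook;
# omitting the kernel argument (e.g. KernelConv2d(10, 20, 5)) uses the default kernel
kerv2 = KernelConv2d(10, 20, 5, partial(PolynomialKernel, 2, 3))

# The layer is used like nn.Conv2d in a forward pass
x = torch.randn(8, 1, 28, 28)   # a batch of MNIST-sized images
y = kerv1(x)
print(y.shape)                  # expected: [8, 10, 24, 24] with stride 1 and no padding
```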
--------------------------------------------------------------------------------
/kervolutionMnist.ipynb:
--------------------------------------------------------------------------------
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "from torchvision import datasets,transforms\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import os\n",
    "import pandas as pd\n",
    "from layer import KernelConv2d, GaussianKernel, PolynomialKernel\n",
    "from functools import partial  # binds kernel hyper-parameters when constructing KernelConv2d, e.g. partial(GaussianKernel, 0.05) or partial(PolynomialKernel, 2, 3)\n",
    "%matplotlib inline\n",
    "def mkdirs(path):\n",
    "    if not os.path.exists(path):\n",
    "        os.makedirs(path)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Kervolution LeNet"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "class KNNet(nn.Module):\n",
    "    def __init__(self):\n",
    "        super(KNNet,self).__init__()\n",
    "        self.conv1=KernelConv2d(1,10,5,partial(GaussianKernel, 0.05))  # self.conv1=KernelConv2d(1,10,5) uses the default polynomial kernel with default parameters\n",
    "        print(self.conv1)\n",
    "        self.bn1=nn.BatchNorm2d(10)\n",
    "        self.conv2=KernelConv2d(10,20,5)\n",
    "        self.bn2=nn.BatchNorm2d(20)\n",
    "        self.conv2_drop=nn.Dropout2d()\n",
    "        self.fc1=nn.Linear(320,50)\n",
    "        self.fc2=nn.Linear(50,10)\n",
    "    def forward(self,x):\n",
    "        x=F.relu(F.max_pool2d(self.conv1(x),2))\n",
    "        x=self.bn1(x)\n",
    "        x=F.relu(F.max_pool2d(self.conv2_drop(self.conv2(x)),2))\n",
    "        x=self.bn2(x)\n",
    "        x=x.view(-1,320)\n",
    "        x=F.relu(self.fc1(x))\n",
    "        x=F.dropout(x,training=self.training)\n",
    "        x=self.fc2(x)  # output logits go straight to log_softmax (no ReLU on the final layer)\n",
    "        return F.log_softmax(x,dim=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "train_loader=torch.utils.data.DataLoader(\n",
    "    datasets.MNIST(\"data\",train=True,download=True,transform=transforms.Compose([\n",
    "        transforms.ToTensor(),\n",
    "    ])),batch_size=128,shuffle=True)\n",
    "test_loader=torch.utils.data.DataLoader(\n",
    "    datasets.MNIST(\"data\",train=False,download=True,transform=transforms.Compose([\n",
    "        transforms.ToTensor(),\n",
    "    ])),batch_size=128,shuffle=False\n",
    ")\n",
    "attack_test_loader=torch.utils.data.DataLoader(\n",
    "    datasets.MNIST(\"data\",train=False,download=True,transform=transforms.Compose([\n",
    "        transforms.ToTensor(),\n",
    "    ])),batch_size=1,shuffle=False\n",
    ")\n",
    "print(len(train_loader))\n",
    "print(len(test_loader))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "device=torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
    "\n",
    "knn=KNNet().to(device)\n",
    "knn.train(mode=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "criterion=torch.nn.NLLLoss()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def compute_accuray(pred,true):\n",
    "    pred_idx=pred.argmax(dim=1).detach().cpu().numpy()\n",
    "    tmp=pred_idx==true.cpu().numpy()\n",
    "    return sum(tmp)/len(pred_idx)\n",
    "def train(m,out_dir):\n",
    "    iter_loss=[]\n",
    "    train_losses=[]\n",
    "    test_losses=[]\n",
    "    iter_loss_path=os.path.join(out_dir,\"iter_loss.csv\")\n",
    "    epoch_loss_path=os.path.join(out_dir,\"epoch_loss.csv\")\n",
    "    nb_epochs=20\n",
    "    last_loss=99999\n",
    "    mkdirs(os.path.join(out_dir,\"models\"))\n",
    "    optimizer=optim.SGD(m.parameters(),lr=0.003,momentum=0.9)\n",
    "    for epoch in range(nb_epochs):\n",
    "        train_loss=0.\n",
    "        train_acc=0.\n",
    "        m.train(mode=True)\n",
    "        for data,target in train_loader:\n",
    "            data,target=data.to(device),target.to(device)\n",
    "            optimizer.zero_grad()\n",
    "            output=m(data)\n",
    "            loss=criterion(output,target)\n",
    "            loss_value=loss.item()\n",
    "            iter_loss.append(loss_value)\n",
    "            train_loss+=loss_value\n",
    "            loss.backward()\n",
    "            optimizer.step()\n",
    "            acc=compute_accuray(output,target)\n",
    "            train_acc+=acc\n",
    "        train_losses.append(train_loss/len(train_loader))\n",
    "\n",
    "        test_loss=0.\n",
    "        test_acc=0.\n",
    "        m.train(mode=False)\n",
    "        for data,target in test_loader:\n",
    "            data,target=data.to(device),target.to(device)\n",
    "            output=m(data)\n",
    "            loss=criterion(output,target)\n",
    "            loss_value=loss.item()\n",
    "            iter_loss.append(loss_value)\n",
    "            test_loss+=loss_value\n",
    "            acc=compute_accuray(output,target)\n",
    "            test_acc+=acc\n",
    "        test_losses.append(test_loss/len(test_loader))\n",
    "        print(\"Epoch {}: train loss is {}, train accuracy is {}; test loss is {}, test accuracy is {}\".\n",
    "              format(epoch,round(train_loss/len(train_loader),2),\n",
    "                     round(train_acc/len(train_loader),2),\n",
    "                     round(test_loss/len(test_loader),2),\n",
    "                     round(test_acc/len(test_loader),2)))\n",
    "        if test_loss/len(test_loader)