├── .gitignore
├── README.md
├── ch01_回归问题
    ├── __pycache__
    │   └── utils.cpython-35.pyc
    ├── data.csv
    ├── mnist_train.py
    ├── regression.py
    └── utils.py
├── ch02_PyTorch基础教程
    ├── .ipynb_checkpoints
    │   └── Ch02_PyTorch基础教程-checkpoint.ipynb
    └── Ch02_PyTorch基础教程.ipynb
├── ch03_PyTorch进阶教程
    ├── .ipynb_checkpoints
    │   └── ch03_PyTorch进阶教程-checkpoint.ipynb
    └── ch03_PyTorch进阶教程.ipynb
├── ch04_随机梯度下降
    ├── .ipynb_checkpoints
    │   └── ch04_随机梯度下降-checkpoint.ipynb
    └── ch04_随机梯度下降.ipynb
├── ch05_ 神经网络与全连接层
    ├── .idea
    │   ├── ch05_ 神经网络与全联接层.iml
    │   ├── misc.xml
    │   ├── modules.xml
    │   └── workspace.xml
    ├── .ipynb_checkpoints
    │   └── ch05_神经网络与全连接层-checkpoint.ipynb
    ├── ch05_神经网络与全连接层.ipynb
    └── mnist.py
├── ch06_过拟合与欠拟合_交叉验证_正则化
    ├── .ipynb_checkpoints
    │   ├── ch06_ 正则化_动量与学习率衰减_早停_dropout-checkpoint.ipynb
    │   └── ch06_过拟合与欠拟合-checkpoint.ipynb
    ├── ch06_ 正则化_动量与学习率衰减_早停_dropout.ipynb
    └── ch06_过拟合与欠拟合.ipynb
├── ch07_卷积神经网络CNN
    ├── .ipynb_checkpoints
    │   ├── ch07_卷积神经网络基础-checkpoint.ipynb
    │   └── ch07_经典卷积网络-checkpoint.ipynb
    ├── ch07_卷积神经网络基础.ipynb
    └── ch07_经典卷积网络.ipynb
├── ch08_CIFAR10_ResNet
    ├── .idea
    │   ├── ch08_CIFAR10_ResNet.iml
    │   ├── copyright
    │   │   └── profiles_settings.xml
    │   ├── dictionaries
    │   │   └── mac.xml
    │   ├── inspectionProfiles
    │   │   └── Project_Default.xml
    │   ├── misc.xml
    │   ├── modules.xml
    │   ├── vcs.xml
    │   └── workspace.xml
    ├── LeNet5.py
    ├── ResNet.py
    ├── __pycache__
    │   ├── LeNet5.cpython-35.pyc
    │   ├── LeNet5.cpython-37.pyc
    │   ├── ResNet.cpython-35.pyc
    │   └── ResNet.cpython-37.pyc
    └── main.py
├── ch09_循环神经网络RNN&LSTM
    ├── .ipynb_checkpoints
    │   └── ch09_RNN-checkpoint.ipynb
    └── ch09_RNN.ipynb
├── ch10_迁移学习-实战宝可梦精灵
    ├── .idea
    │   ├── ch10_迁移学习-实战宝可梦精灵.iml
    │   ├── dictionaries
    │   │   └── szz.xml
    │   ├── inspectionProfiles
    │   │   └── Project_Default.xml
    │   ├── misc.xml
    │   ├── modules.xml
    │   ├── vcs.xml
    │   └── workspace.xml
    ├── .ipynb_checkpoints
    │   └── ch10_迁移学习-实战宝可梦精灵-checkpoint.ipynb
    ├── __pycache__
    │   ├── pokemon.cpython-35.pyc
    │   ├── pokemon.cpython-37.pyc
    │   ├── resnet.cpython-35.pyc
    │   ├── resnet.cpython-37.pyc
    │   └── utils.cpython-37.pyc
    ├── best.mdl
    ├── best_for_scratch.mdl
    ├── best_for_transfer.mdl
    ├── ch10_迁移学习-实战宝可梦精灵.ipynb
    ├── pokemon.py
    ├── pokemon_useAPI.py
    ├── resnet.py
    ├── train_scratch.py
    ├── train_transfer.py
    └── utils.py
└── ch11_自编码器 Auto-Encoders
    ├── .idea
        └── ch11_自编码器 Auto-Encoders.iml
    ├── .ipynb_checkpoints
        └── 11 - Auto-Encoders-checkpoint.ipynb
    ├── 11 - Auto-Encoders.ipynb
    ├── ae.py
    ├── ae_train.py
    ├── vae.py
    └── vae_train.py


/.gitignore:
--------------------------------------------------------------------------------
1 | .DS_Store
2 | data/
3 | .idea
4 | picture


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # PyTorch-Course-Note
 2 | 
 3 | 数据集过大,上传到了百度云 链接: https://pan.baidu.com/s/1YGJ-SR1XMp-TLB-mZryqzA  密码: t2i0 解压后放到目录下即可
 4 | 
 5 | #### win10运行问题解决办法:
 6 | 找到 tornado/platform/asyncio.py 文件修改，添加代码如下：
 7 | 
 8 | ```python
 9 | if sys.platform == 'win32':
10 |  asyncio.set_event_loop_policy(asyncio.WindowsSelectorEventLoopPolicy())
11 | 
12 | 
13 | ```
14 | 
15 | 
16 | 
17 | ###  visdom安装
18 | 
19 | - git clone git@github.com:facebookresearch/visdom.git
20 | - cd visdom/
21 | - pip install -e .


--------------------------------------------------------------------------------
/ch01_回归问题/__pycache__/utils.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch01_回归问题/__pycache__/utils.cpython-35.pyc


--------------------------------------------------------------------------------
/ch01_回归问题/data.csv:
--------------------------------------------------------------------------------
  1 | 1.441420763439877906e-01,3.008888522256620845e-01
  2 | 7.561157580978923320e-01,1.200490164403901661e+00
  3 | 7.580154722681392565e-01,1.203282744234164703e+00
  4 | 5.627146030856732262e-01,9.161904665359396072e-01
  5 | 1.726740286659089740e-01,3.428308221388861599e-01
  6 | 5.950836133900827551e-02,1.764772911683421541e-01
  7 | 8.277337446696210188e-01,1.305768604664342858e+00
  8 | 7.109868071758078667e-01,1.134150606548437468e+00
  9 | 3.048718874921082511e-01,5.371616746133991427e-01
 10 | 7.388525634014426746e-01,1.175113268200120631e+00
 11 | 9.590565411252628403e-01,1.498813115454136424e+00
 12 | 8.015464815428295919e-01,1.267273327867959543e+00
 13 | 9.607216520486532296e-01,1.501260828511520096e+00
 14 | 8.445593908547965878e-01,1.330502304556550941e+00
 15 | 4.506229754402359955e-01,7.514157738971468659e-01
 16 | 5.868013230637029176e-01,9.515979449036432447e-01
 17 | 8.007795198203720988e-01,1.266145894135946914e+00
 18 | 5.035736175865878073e-01,8.292532178522840081e-01
 19 | 3.114433926995394675e-01,5.468217872683229785e-01
 20 | 7.317475377906073053e-01,1.164668880552192753e+00
 21 | 6.139734681610302669e-01,9.915409981967144848e-01
 22 | 9.945943755290296284e-01,1.551053732027673604e+00
 23 | 7.055574630060129637e-01,1.126169470618838986e+00
 24 | 4.476654249698448496e-01,7.470681747056718836e-01
 25 | 3.567608208560109073e-01,6.134384066583360440e-01
 26 | 6.127574022587565228e-01,9.897533813203720499e-01
 27 | 4.935134303804317168e-01,8.144647426592346307e-01
 28 | 5.063936386469451989e-01,8.333986488110094459e-01
 29 | 9.955887026058044542e-01,1.552515392830532415e+00
 30 | 9.632136367376882280e-01,1.504924046004401550e+00
 31 | 6.496371483048046791e-02,1.844966608008062892e-01
 32 | 4.475809770427596757e-02,1.547944036252856814e-01
 33 | 6.465951788450118309e-01,1.039494912902167334e+00
 34 | 7.316031926765320659e-02,1.965456693234501895e-01
 35 | 7.349758904863741282e-01,1.169414559014969823e+00
 36 | 5.473148503498541650e-01,8.935528300142855374e-01
 37 | 9.047874438231638949e-01,1.419037542420050979e+00
 38 | 8.826579421734687125e-01,1.386507174994998870e+00
 39 | 7.796753704162312504e-01,1.235122794511859912e+00
 40 | 2.011678690952142246e-01,3.847167675699648681e-01
 41 | 7.932643186640753186e-01,1.255098548436190731e+00
 42 | 5.118798669658771727e-01,8.414634044398393575e-01
 43 | 6.566237722921854925e-01,1.054236945269512615e+00
 44 | 6.285757760027370633e-01,1.013006390724023431e+00
 45 | 7.378221359980340344e-01,1.173598539917110051e+00
 46 | 3.792372434380724133e-01,6.464787478539664178e-01
 47 | 3.034149812555956283e-01,5.350200224457255516e-01
 48 | 8.569840082393150871e-01,1.348766492111793225e+00
 49 | 8.075549610214690643e-01,1.276105792701559549e+00
 50 | 5.418174404078206496e-01,8.854716373994963030e-01
 51 | 4.181387641509373143e-01,7.036639833018778489e-01
 52 | 1.187503349960870036e-01,2.635629924442478567e-01
 53 | 4.866363992436300023e-01,8.043555068881360626e-01
 54 | 6.740491840830054038e-02,1.880852300602017801e-01
 55 | 4.835415882449580760e-01,7.998061347200883242e-01
 56 | 7.849257718903341896e-01,1.242840884678791280e+00
 57 | 2.025011429949694630e-01,3.866766802026051497e-01
 58 | 1.911139930912145735e-01,3.699375698440854343e-01
 59 | 6.063343956409872337e-02,1.781311561592251180e-01
 60 | 3.982912368283442195e-01,6.744881181376659596e-01
 61 | 8.872173439482450297e-01,1.393209495603920045e+00
 62 | 6.681647796307321752e-02,1.872202226057176344e-01
 63 | 2.110109857307218562e-01,3.991861490241611632e-01
 64 | 9.907919996833827181e-01,1.545464239534572570e+00
 65 | 2.122751536898482838e-01,4.010444759240769930e-01
 66 | 9.028160514122285374e-01,1.416139595575975907e+00
 67 | 2.073147375222623712e-01,3.937526641577256958e-01
 68 | 9.471496306862211556e-01,1.481309957108745134e+00
 69 | 8.771565861607195647e-01,1.378420181656257792e+00
 70 | 8.415160805050864168e-01,1.326028638342477084e+00
 71 | 6.329076436268699091e-02,1.820374236131498680e-01
 72 | 3.679429819099352406e-01,6.298761834076047617e-01
 73 | 2.943252270555074546e-02,1.322658083771595938e-01
 74 | 5.313441724475661543e-01,8.700759334979222270e-01
 75 | 7.987263239825815875e-01,1.263127696254394916e+00
 76 | 6.253441188173707310e-01,1.008255854661535000e+00
 77 | 9.085903342154009188e-01,1.424627791296639190e+00
 78 | 6.042450641984775661e-01,9.772402443717619347e-01
 79 | 6.900507380291087678e-02,1.904374584902789880e-01
 80 | 5.092845860973660432e-02,1.638648341563128108e-01
 81 | 4.754453572983440290e-01,7.879046752285656652e-01
 82 | 2.972494436682412422e-01,5.259566821923146174e-01
 83 | 4.139305962028716479e-02,1.498477976418221280e-01
 84 | 7.354242451491166399e-01,1.170073640369201362e+00
 85 | 7.905121638074625867e-01,1.251052880796969857e+00
 86 | 7.819970069136303881e-01,1.238535600163036543e+00
 87 | 8.901316864032422504e-01,1.397493579012766052e+00
 88 | 4.178082113223988703e-01,7.031780706439263451e-01
 89 | 5.668677629854733668e-01,9.222956115886458139e-01
 90 | 7.630679646999156684e-01,1.210709908108875910e+00
 91 | 7.246042988740617474e-01,1.154168319344870630e+00
 92 | 6.951329247627034968e-01,1.110845399401173994e+00
 93 | 2.644843144593916895e-01,4.777919422553057460e-01
 94 | 8.176013249640490255e-01,1.290873947697152024e+00
 95 | 4.364077411936698736e-01,7.305193795546947033e-01
 96 | 5.108615819094332045e-01,8.399665254068667819e-01
 97 | 5.438108309427717169e-01,8.884019214858743796e-01
 98 | 2.078786821515706817e-01,3.945816627628089268e-01
 99 | 2.571302167923578130e-01,4.669814186847659476e-01
100 | 7.091536129762591179e-01,1.131455811075100959e+00
101 | 


--------------------------------------------------------------------------------
/ch01_回归问题/mnist_train.py:
--------------------------------------------------------------------------------
  1 | import torch
  2 | from torch import nn
  3 | from torch.nn import functional as F
  4 | from torch import optim
  5 | 
  6 | import torchvision
  7 | import matplotlib.pyplot as plt
  8 | from utils import plot_image, plot_curve, ont_hot
  9 | 
 10 | # step1. load dataset
 11 | 
 12 | batch_size = 64
 13 | train_load = torch.utils.data.DataLoader(torchvision.datasets.MNIST(
 14 |     'mnist data',
 15 |     train=True,
 16 |     download=True,
 17 |     transform=torchvision.transforms.Compose([
 18 |         torchvision.transforms.ToTensor(),
 19 |         torchvision.transforms.Normalize((0.1307, ), (0.3081, ))
 20 |     ])),
 21 |                                          batch_size=batch_size,
 22 |                                          shuffle=True)
 23 | 
 24 | test_load = torch.utils.data.DataLoader(torchvision.datasets.MNIST(
 25 |     'mnist data/',
 26 |     train=False,
 27 |     download=True,
 28 |     transform=torchvision.transforms.Compose([
 29 |         torchvision.transforms.ToTensor(),
 30 |         torchvision.transforms.Normalize((0.1307, ), (0.3081, ))
 31 |     ])),
 32 |                                         batch_size=batch_size,
 33 |                                         shuffle=False)
 34 | 
 35 | x, y = next(iter(train_load))
 36 | print(x.shape, y.shape)
 37 | print(x.min(), x.max())
 38 | plot_image(x, y, 'image_sample')
 39 | 
 40 | 
 41 | class Net(nn.Module):
 42 |     def __init__(self):
 43 |         super(Net, self).__init__()
 44 | 
 45 |         # xw+b
 46 |         self.fc1 = nn.Linear(28 * 28, 256)
 47 |         self.fc2 = nn.Linear(256, 64)
 48 |         self.fc3 = nn.Linear(64, 10)
 49 | 
 50 |     def forward(self, x):
 51 |         # x: [b,1,28,28]
 52 |         x = F.relu(self.fc1(x))
 53 |         x = F.relu(self.fc2(x))
 54 |         # x = F.softmax(self.fc3(x))
 55 |         x = self.fc3(x)  # h3 = h2w3 + b3
 56 |         return x
 57 | 
 58 | 
 59 | net = Net()
 60 | # net.parameters: [w1,b1,w2,b2,w3,b3]
 61 | optimizer = optim.SGD(net.parameters(), lr=0.01, momentum=0.9)
 62 | 
 63 | train_loss = []
 64 | 
 65 | for epoch in range(3):
 66 |     for batch_idx, (x, y) in enumerate(train_load):
 67 |         # x:[b,1,28,28] , y:[64]
 68 |         # net只接收[b,feature] 需要 [b,1,28,28] -> [b,feature]
 69 |         x = x.view(x.size(0), -1)
 70 |         out = net(x)  # -> [b,10]
 71 |         # [b,10]
 72 |         y_onehot = ont_hot(y)
 73 |         # loss = mse(out,y_onehot)
 74 |         loss = F.mse_loss(out, y_onehot)
 75 | 
 76 |         optimizer.zero_grad()
 77 |         loss.backward()
 78 |         optimizer.step()  # w' = w - lr * grad
 79 |         train_loss.append(loss.item())
 80 |         if batch_idx % 10 == 0:
 81 |             print(epoch, batch_idx, loss.item())
 82 | 
 83 | plot_curve(train_loss)
 84 | # we get optimal [w1,b1,w2,b2,w3,b3]
 85 | 
 86 | total_correct = 0
 87 | for x, y in test_load:
 88 |     x = x.view(x.size(0), -1)
 89 |     out = net(x)
 90 |     # out:[b,10] -> predict_value:[b]
 91 |     predict_value = out.argmax(dim=1)
 92 |     correct = predict_value.eq(
 93 |         y).sum().float().item()  # 正确个数,转为float类型,转为python数值类型
 94 |     total_correct += correct
 95 | 
 96 | total_num = len(test_load.dataset)
 97 | acc = total_correct / total_num
 98 | print('test acc:', acc)
 99 | 
100 | x, y = next(iter(test_load))
101 | out = net(x.view(x.size(0), -1))
102 | pred = out.argmax(dim=1)
103 | plot_image(x, pred, 'test')
104 | 


--------------------------------------------------------------------------------
/ch01_回归问题/regression.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | 
 3 | 
 4 | def compute_error_for_line_given_points(b, w, points):
 5 |     totalError = 0
 6 |     for i in range(0, len(points)):
 7 |         x = points[i, 0]
 8 |         y = points[i, 1]
 9 |         totalError += (y - (w * x + b))**2
10 |     return totalError / float(len(points))
11 | 
12 | 
def step_gradient(b_current, w_current, points, learningRate):
    """Perform one gradient-descent step on the mean squared error.

    The loss is ``mean((w * x + b - y) ** 2)``; its gradients are
    ``(2 / N) * sum(w * x + b - y)`` with respect to ``b`` and
    ``(2 / N) * sum(x * (w * x + b - y))`` with respect to ``w``.

    Args:
        b_current: Current intercept.
        w_current: Current slope.
        points: Array-like of shape (n, 2); column 0 holds x and column 1
            holds y. Nested lists are accepted as well as NumPy arrays.
        learningRate: Step size applied to both gradients.

    Returns:
        Tuple ``(new_b, new_w)``. With no points both gradients are zero,
        so the inputs are returned unchanged.
    """
    pts = np.asarray(points, dtype=float)
    n = len(pts)
    if n == 0:
        return b_current, w_current

    x = pts[:, 0]
    y = pts[:, 1]
    # Signed prediction error for every point, computed in one shot.
    residuals = (w_current * x + b_current) - y

    scale = 2 / float(n)
    b_gradient = scale * np.sum(residuals)
    w_gradient = scale * np.sum(x * residuals)

    new_b = b_current - (learningRate * b_gradient)
    new_w = w_current - (learningRate * w_gradient)
    return new_b, new_w
26 | 
27 | 
def gradient_descent_runner(points, starting_b, starting_w, learning_rate,
                            num_iterations):
    """Run ``num_iterations`` gradient-descent steps and return ``[b, w]``.

    Args:
        points: Data points passed to ``step_gradient`` as a NumPy array.
        starting_b: Initial intercept.
        starting_w: Initial slope.
        learning_rate: Step size forwarded to every ``step_gradient`` call.
        num_iterations: Number of update steps; with 0 the starting values
            are returned unchanged.

    Returns:
        A two-element list ``[b, w]`` holding the final parameters.
    """
    # Convert once: the data does not change between iterations, so copying
    # it into a fresh array on every step is wasted work.
    data = np.array(points)
    b, w = starting_b, starting_w
    for _ in range(num_iterations):
        b, w = step_gradient(b, w, data, learning_rate)
    return [b, w]
35 | 
36 | 
def generate_data_csv(path='eat_pyTorch/ch01_回归问题/data.csv'):
    """Write 100 noiseless points on ``y = 1.47 * x + 0.089`` to a CSV file.

    The x values come from ``np.random.rand`` and each row of the file is
    ``x,y``.

    Args:
        path: Destination file. Defaults to the location this script has
            always written to, which is relative to the current working
            directory; pass another path to write elsewhere.
    """
    data_x = np.random.rand(100)
    data_y = 1.47 * data_x + 0.089
    points = np.stack((data_x, data_y), axis=1)
    np.savetxt(path, points, delimiter=',')
42 | 
43 | 
def run():
    """Regenerate the sample CSV, fit a line to it and print the results.

    The data file is rewritten, read back, and fitted with 10000
    gradient-descent steps at a learning rate of 0.005, starting from
    ``b = 0`` and ``w = 0``. The error is printed before and after the fit.
    """
    generate_data_csv()
    points = np.genfromtxt("eat_pyTorch/ch01_回归问题/data.csv", delimiter=',')

    # Hyper-parameters and starting point of the search.
    learning_rate = 0.005
    num_iterations = 10000
    initial_b = 0
    initial_w = 0

    start_error = compute_error_for_line_given_points(initial_b, initial_w,
                                                      points)
    start_report = "Starting gradient descent at b = {0} , w = {1} , error = {2} "
    print(start_report.format(initial_b, initial_w, start_error))

    print("Running ...")
    b, w = gradient_descent_runner(points, initial_b, initial_w,
                                   learning_rate, num_iterations)

    final_error = compute_error_for_line_given_points(b, w, points)
    final_report = "After {0} iterations b = {1}, w = {2}, error = {3}"
    print(final_report.format(num_iterations, b, w, final_error))

    print('b:{}，w:{}'.format(b, w))


if __name__ == '__main__':
    run()


--------------------------------------------------------------------------------
/ch01_回归问题/utils.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from matplotlib import pyplot as plt
 3 | 
 4 | 
 5 | def plot_curve(data):
 6 |     fig = plt.figure()
 7 |     plt.plot(range(len(data)), data, color='blue')
 8 |     plt.legend(['value'], loc='upper right')
 9 |     plt.xlabel('step')
10 |     plt.ylabel('value')
11 |     plt.show()
12 | 
13 | 
def plot_image(img, label, name):
    """Show up to six images from a batch in a 2x3 grid with titles.

    Args:
        img: Indexable batch where ``img[i][0]`` is the 2-D image to draw.
            Each image is mapped through ``* 0.3081 + 0.1307`` before
            display (presumably undoing the loader's normalisation;
            confirm against the caller).
        label: Indexable batch where ``label[i].item()`` is the value shown
            in the title of image ``i``.
        name: Prefix used in every subplot title.

    Batches with fewer than six entries are plotted as far as they go
    instead of raising ``IndexError``.
    """
    plt.figure()
    count = min(6, len(img), len(label))
    for i in range(count):
        plt.subplot(2, 3, i + 1)
        plt.imshow(img[i][0] * 0.3081 + 0.1307,
                   cmap='gray',
                   interpolation='none')
        plt.title("{} : {}".format(name, label[i].item()))
        plt.xticks([])
        plt.yticks([])
    # Lay out once, after every subplot and title exists, rather than
    # recomputing the layout on each loop iteration.
    plt.tight_layout()
    plt.show()
26 | 
27 | 
def ont_hot(label, depth=10):
    """Return the one-hot encoding of a 1-D tensor of class indices.

    Args:
        label: Integer tensor of shape [b] holding class indices in
            ``[0, depth)``. Any integer dtype is accepted.
        depth: Number of classes, i.e. the width of the encoding.

    Returns:
        Float tensor of shape [b, depth], allocated on ``label``'s device,
        with a 1 at ``[i, label[i]]`` and 0 everywhere else.
    """
    out = torch.zeros(label.size(0), depth, device=label.device)
    # scatter_ needs an int64 index. ``.long()`` converts any integer dtype
    # on any device, whereas the legacy ``torch.LongTensor(label)``
    # constructor only accepts tensors that are already int64 on the CPU.
    idx = label.long().reshape(-1, 1)
    out.scatter_(dim=1, index=idx, value=1)
    return out


--------------------------------------------------------------------------------
/ch02_PyTorch基础教程/.ipynb_checkpoints/Ch02_PyTorch基础教程-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# Ch02 PyTorch基础教程"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "## 2.1 张量数据类型"
 15 |    ]
 16 |   },
 17 |   {
 18 |    "cell_type": "code",
 19 |    "execution_count": 16,
 20 |    "metadata": {},
 21 |    "outputs": [],
 22 |    "source": [
 23 |     "import torch\n",
 24 |     "import numpy as np"
 25 |    ]
 26 |   },
 27 |   {
 28 |    "cell_type": "code",
 29 |    "execution_count": 8,
 30 |    "metadata": {},
 31 |    "outputs": [
 32 |     {
 33 |      "name": "stdout",
 34 |      "output_type": "stream",
 35 |      "text": [
 36 |       "torch.FloatTensor\n",
 37 |       "<class 'torch.Tensor'>\n"
 38 |      ]
 39 |     },
 40 |     {
 41 |      "data": {
 42 |       "text/plain": [
 43 |        "True"
 44 |       ]
 45 |      },
 46 |      "execution_count": 8,
 47 |      "metadata": {},
 48 |      "output_type": "execute_result"
 49 |     }
 50 |    ],
 51 |    "source": [
 52 |     "a = torch.randn(2,3)\n",
 53 |     "print(a.type())\n",
 54 |     "print(type(a))\n",
 55 |     "isinstance(a,torch.FloatTensor)"
 56 |    ]
 57 |   },
 58 |   {
 59 |    "cell_type": "markdown",
 60 |    "metadata": {},
 61 |    "source": [
 62 |     "### Note1: 类型推断\n",
 63 |     "- tensor_name.type()\n",
 64 |     "- isinstance(tensor_name,type_name)"
 65 |    ]
 66 |   },
 67 |   {
 68 |    "cell_type": "code",
 69 |    "execution_count": 12,
 70 |    "metadata": {},
 71 |    "outputs": [
 72 |     {
 73 |      "name": "stdout",
 74 |      "output_type": "stream",
 75 |      "text": [
 76 |       "tensor(1.) torch.Size([]) 0 0\n"
 77 |      ]
 78 |     }
 79 |    ],
 80 |    "source": [
 81 |     "# 标量 ,dim=0\n",
 82 |     "a = torch.tensor(1.)\n",
 83 |     "print(a,a.shape,len(a.shape),a.dim())"
 84 |    ]
 85 |   },
 86 |   {
 87 |    "cell_type": "markdown",
 88 |    "metadata": {},
 89 |    "source": [
 90 |     "### Note2: dim=0 标量\n",
 91 |     "- a.shape 成员\n",
 92 |     "- a.size() 成员函数\n",
 93 |     "- a.dim() 维度"
 94 |    ]
 95 |   },
 96 |   {
 97 |    "cell_type": "code",
 98 |    "execution_count": 18,
 99 |    "metadata": {},
100 |    "outputs": [
101 |     {
102 |      "name": "stdout",
103 |      "output_type": "stream",
104 |      "text": [
105 |       "tensor([1.1000, 2.2000]) torch.Size([2]) torch.FloatTensor\n",
106 |       "tensor([8.4078e-45, 0.0000e+00]) torch.Size([2]) torch.FloatTensor\n",
107 |       "tensor([1., 1.], dtype=torch.float64) torch.Size([2]) torch.DoubleTensor\n"
108 |      ]
109 |     }
110 |    ],
111 |    "source": [
112 |     "# 向量,dim=1\n",
113 |     "a = torch.tensor([1.1,2.2])\n",
114 |     "print(a,a.shape,a.type())\n",
115 |     "\n",
116 |     "b = torch.FloatTensor(2)\n",
117 |     "print(b,b.shape,b.type())\n",
118 |     "\n",
119 |     "data = np.ones(2)\n",
120 |     "c = torch.from_numpy(data)\n",
121 |     "print(c,c.shape,c.type())"
122 |    ]
123 |   },
124 |   {
125 |    "cell_type": "markdown",
126 |    "metadata": {},
127 |    "source": [
128 |     "### Note3: dim=1 向量\n",
129 |     "- .tensor接受的是数据的内容\n",
130 |     "- .FloatTensor接受的是数据的shape,返回未初始化的张量(内容是内存中的任意值,并非随机初始化)\n",
131 |     "- .from_numpy()  numpy -> torch.tensor\n",
132 |     "- dim=0 -> 0.1\n",
133 |     "- dim=1 -> [0.1]\n"
134 |    ]
135 |   },
136 |   {
137 |    "cell_type": "code",
138 |    "execution_count": 26,
139 |    "metadata": {},
140 |    "outputs": [
141 |     {
142 |      "name": "stdout",
143 |      "output_type": "stream",
144 |      "text": [
145 |       "tensor([[-0.6025, -0.0328, -1.7973],\n",
146 |       "        [ 0.5828,  0.6371, -0.0266]])\n",
147 |       "torch.Size([2, 3])   2   3\n",
148 |       "用shape索引:  2   3\n"
149 |      ]
150 |     }
151 |    ],
152 |    "source": [
153 |     "a = torch.randn(2,3) # normal distribution 正态分布\n",
154 |     "# a = torch.FloatTensor(2,3)\n",
155 |     "print(a)\n",
156 |     "print(a.shape,' ',a.size(0),' ',a.size(1))\n",
157 |     "print('用shape索引: ',a.shape[0],' ',a.shape[1])"
158 |    ]
159 |   },
160 |   {
161 |    "cell_type": "code",
162 |    "execution_count": 33,
163 |    "metadata": {},
164 |    "outputs": [
165 |     {
166 |      "data": {
167 |       "text/plain": [
168 |        "tensor([[[0.9681, 0.9093, 0.3873],\n",
169 |        "         [0.2986, 0.7554, 0.5381]]])"
170 |       ]
171 |      },
172 |      "metadata": {},
173 |      "output_type": "display_data"
174 |     },
175 |     {
176 |      "name": "stdout",
177 |      "output_type": "stream",
178 |      "text": [
179 |       "torch.Size([1, 2, 3])   torch.Size([1, 2, 3])\n",
180 |       "a的内存大小为:1x2x3 =  6\n",
181 |       "3 3\n"
182 |      ]
183 |     }
184 |    ],
185 |    "source": [
186 |     "a = torch.rand(1,2,3)   #  均匀分布[0,1] uniform distribution\n",
187 |     "display(a)\n",
188 |     "print(a.shape,' ',a.size())\n",
189 |     "list(a.shape)\n",
190 |     "print('a的内存大小为:1x2x3 = ',a.numel())\n",
191 |     "print(len(a.shape),a.dim())"
192 |    ]
193 |   },
194 |   {
195 |    "cell_type": "markdown",
196 |    "metadata": {},
197 |    "source": [
198 |     "### Note4: dim=3的张量\n",
199 |     "- rand 均匀分布[0,1]\n",
200 |     "- randn 标准正态分布N(0,1)\n",
201 |     "- 为了和python交互,使用list将shape转换为list类型\n",
202 |     "- 用.numel()方法得到tensor的大小\n",
203 |     "- 用len(a.shape)和a.dim()都可得到tensor的维度\n",
204 |     "- 三维张量在RNN经常使用,四维张量在CNN中经常使用,用来表示图片"
205 |    ]
206 |   },
207 |   {
208 |    "cell_type": "markdown",
209 |    "metadata": {},
210 |    "source": [
211 |     "## 2.2 创建Tensor"
212 |    ]
213 |   },
214 |   {
215 |    "cell_type": "code",
216 |    "execution_count": 35,
217 |    "metadata": {},
218 |    "outputs": [
219 |     {
220 |      "data": {
221 |       "text/plain": [
222 |        "tensor([2.0000, 3.3000], dtype=torch.float64)"
223 |       ]
224 |      },
225 |      "execution_count": 35,
226 |      "metadata": {},
227 |      "output_type": "execute_result"
228 |     }
229 |    ],
230 |    "source": [
231 |     "a_np = np.array([2,3.3])\n",
232 |     "a_pt = torch.from_numpy(a_np)\n",
233 |     "a_pt"
234 |    ]
235 |   },
236 |   {
237 |    "cell_type": "code",
238 |    "execution_count": 36,
239 |    "metadata": {},
240 |    "outputs": [
241 |     {
242 |      "data": {
243 |       "text/plain": [
244 |        "tensor([2.0000, 3.2000])"
245 |       ]
246 |      },
247 |      "execution_count": 36,
248 |      "metadata": {},
249 |      "output_type": "execute_result"
250 |     }
251 |    ],
252 |    "source": [
253 |     "torch.tensor([2.,3.2]) # 小写给具体数据"
254 |    ]
255 |   },
256 |   {
257 |    "cell_type": "code",
258 |    "execution_count": 38,
259 |    "metadata": {},
260 |    "outputs": [
261 |     {
262 |      "data": {
263 |       "text/plain": [
264 |        "tensor([[9.8863e+36, 4.5790e-41, 9.8866e+36],\n",
265 |        "        [4.5790e-41, 2.7604e+20, 1.7744e+28]])"
266 |       ]
267 |      },
268 |      "execution_count": 38,
269 |      "metadata": {},
270 |      "output_type": "execute_result"
271 |     }
272 |    ],
273 |    "source": [
274 |     "torch.FloatTensor(2,3) # 大写给shape\n",
275 |     "# torch.FloatTensor([2.,3.2]) 少使用,易混淆"
276 |    ]
277 |   },
278 |   {
279 |    "cell_type": "code",
280 |    "execution_count": 46,
281 |    "metadata": {},
282 |    "outputs": [
283 |     {
284 |      "name": "stdout",
285 |      "output_type": "stream",
286 |      "text": [
287 |       "torch.FloatTensor\n",
288 |       "torch.DoubleTensor\n"
289 |      ]
290 |     }
291 |    ],
292 |    "source": [
293 |     "# set default type\n",
294 |     "print(torch.tensor([1.2,3]).type())\n",
295 |     "torch.set_default_tensor_type(torch.DoubleTensor)\n",
296 |     "print(torch.tensor([1.2,3]).type())"
297 |    ]
298 |   },
299 |   {
300 |    "cell_type": "markdown",
301 |    "metadata": {},
302 |    "source": [
303 |     "### Note5: tensor和FloatTensor\n",
304 |     "- 小写给具体数据,大写给shape\n",
305 |     "- 大写形式(如FloatTensor(2,3))生成的张量未初始化,不能直接使用,里面可能存在极大或极小的值,后面必须用别的数据写入\n",
306 |     "- .set_default_tensor_type()方法可以设置tensor的默认类型"
307 |    ]
308 |   },
309 |   {
310 |    "cell_type": "code",
311 |    "execution_count": 51,
312 |    "metadata": {},
313 |    "outputs": [
314 |     {
315 |      "name": "stdout",
316 |      "output_type": "stream",
317 |      "text": [
318 |       "tensor([[0.2782, 0.6091, 0.6666],\n",
319 |       "        [0.3973, 0.5082, 0.8371],\n",
320 |       "        [0.4828, 0.8271, 0.6257]])\n",
321 |       "tensor([[0.2782, 0.6091, 0.6666],\n",
322 |       "        [0.3973, 0.5082, 0.8371],\n",
323 |       "        [0.4828, 0.8271, 0.6257]])\n",
324 |       "tensor([[5, 4, 8],\n",
325 |       "        [3, 3, 2],\n",
326 |       "        [6, 8, 2]])\n"
327 |      ]
328 |     }
329 |    ],
330 |    "source": [
331 |     "# rand\n",
332 |     "a = torch.rand(3,3)\n",
333 |     "print(a)\n",
334 |     "b = torch.rand_like(a)\n",
335 |     "print(a)\n",
336 |     "\n",
337 |     "a = torch.randint(1,10,[3,3])\n",
338 |     "print(a)"
339 |    ]
340 |   },
341 |   {
342 |    "cell_type": "markdown",
343 |    "metadata": {},
344 |    "source": [
345 |     "### Note6: rand/rand_like , randint\n",
346 |     "- rand会均匀随机产生[0,1)之间的数据\n",
347 |     "- *_like方法接收的参数是tensor\n",
348 |     "- .randint(1,10,[3,3])产生[1,10)之间的均匀分布随机数,shape为[3,3]"
349 |    ]
350 |   },
351 |   {
352 |    "cell_type": "code",
353 |    "execution_count": 60,
354 |    "metadata": {},
355 |    "outputs": [
356 |     {
357 |      "name": "stdout",
358 |      "output_type": "stream",
359 |      "text": [
360 |       "tensor([[0.7122, 0.9045, 0.0039],\n",
361 |       "        [0.8279, 0.5099, 0.2207],\n",
362 |       "        [0.0466, 0.6949, 0.9866]])\n",
363 |       "tensor([ 1.8412,  0.0322,  0.7769,  0.7791,  0.2126,  0.1222, -0.2154,  0.2899,\n",
364 |       "         0.3680,  0.1192])\n",
365 |       "\n",
366 |       "\n",
367 |       "\n",
368 |       "想把tensor全部赋值为一个元素用full: \n",
369 |       " tensor([[7., 7., 7.],\n",
370 |       "        [7., 7., 7.]])\n",
371 |       "生成一个标量:\n",
372 |       " tensor(7.)\n",
373 |       "生成一个vec:\n",
374 |       " tensor([7., 7.])\n",
375 |       "\n",
376 |       "\n",
377 |       "\n"
378 |      ]
379 |     }
380 |    ],
381 |    "source": [
382 |     "# randn正太分布   N(0,1)\n",
383 |     "a = torch.rand(3,3)\n",
384 |     "print(a)\n",
385 |     "\n",
386 |     "# N(u,std)\n",
387 |     "print(torch.normal(mean=torch.full([10],0),std=torch.arange(1,0,-0.1)))\n",
388 |     "\n",
389 |     "print('\\n\\n')\n",
390 |     "\n",
391 |     "# full\n",
392 |     "print('想把tensor全部赋值为一个元素用full: \\n',torch.full([2,3],7))\n",
393 |     "print('生成一个标量:\\n',torch.full([],7))\n",
394 |     "print('生成一个vec:\\n',torch.full([2],7))\n",
395 |     "\n",
396 |     "print('\\n\\n')\n"
397 |    ]
398 |   },
399 |   {
400 |    "cell_type": "markdown",
401 |    "metadata": {},
402 |    "source": [
403 |     "### Note7: randn , full\n",
404 |     "- randn正态分布\n",
405 |     "- full将tensor全部赋值为一个元素"
406 |    ]
407 |   },
408 |   {
409 |    "cell_type": "code",
410 |    "execution_count": 64,
411 |    "metadata": {},
412 |    "outputs": [
413 |     {
414 |      "name": "stdout",
415 |      "output_type": "stream",
416 |      "text": [
417 |       "arange生成[0,10)内的等差为2的数列: \n",
418 |       " tensor([0, 2, 4, 6, 8])\n",
419 |       "\n",
420 |       "\n"
421 |      ]
422 |     }
423 |    ],
424 |    "source": [
425 |     "# arrange/range\n",
426 |     "print('arange生成[0,10)内的等差为2的数列: \\n',torch.arange(0,10,2))\n",
427 |     "print('\\n')"
428 |    ]
429 |   },
430 |   {
431 |    "cell_type": "code",
432 |    "execution_count": 69,
433 |    "metadata": {},
434 |    "outputs": [
435 |     {
436 |      "name": "stdout",
437 |      "output_type": "stream",
438 |      "text": [
439 |       "linespace在[0,10]中生成4个间隔相同的数字: \n",
440 |       " tensor([ 0.0000,  3.3333,  6.6667, 10.0000])\n",
441 |       "logspace在[-1,0]中切割10份,设每个数为xi,生成10^xi: \n",
442 |       " tensor([1.0000, 0.7743, 0.5995, 0.4642, 0.3594, 0.2783, 0.2154, 0.1668, 0.1292,\n",
443 |       "        0.1000])\n"
444 |      ]
445 |     }
446 |    ],
447 |    "source": [
448 |     "# linespace/logspace\n",
449 |     "print('linespace在[0,10]中生成4个间隔相同的数字: \\n',torch.linspace(0,10,steps=4))\n",
450 |     "print('logspace在[-1,0]中切割10份,设每个数为xi,生成10^xi: \\n',torch.logspace(0,-1,steps=10,base=10))"
451 |    ]
452 |   },
453 |   {
454 |    "cell_type": "markdown",
455 |    "metadata": {},
456 |    "source": [
457 |     "### Note8: arange/range  linspace/logspace\n",
458 |     "- pytorch不建议使用range\n",
459 |     "- arange的第三个参数是步长(公差)\n",
460 |     "- linspace的第三个参数steps是生成的点的数量\n",
461 |     "- logspace的base参数可以设置为2,10,e等底数"
462 |    ]
463 |   },
464 |   {
465 |    "cell_type": "code",
466 |    "execution_count": null,
467 |    "metadata": {},
468 |    "outputs": [],
469 |    "source": []
470 |   }
471 |  ],
472 |  "metadata": {
473 |   "kernelspec": {
474 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
475 |    "language": "python",
476 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
477 |   },
478 |   "language_info": {
479 |    "codemirror_mode": {
480 |     "name": "ipython",
481 |     "version": 3
482 |    },
483 |    "file_extension": ".py",
484 |    "mimetype": "text/x-python",
485 |    "name": "python",
486 |    "nbconvert_exporter": "python",
487 |    "pygments_lexer": "ipython3",
488 |    "version": "3.5.6"
489 |   },
490 |   "varInspector": {
491 |    "cols": {
492 |     "lenName": 16,
493 |     "lenType": 16,
494 |     "lenVar": 40
495 |    },
496 |    "kernels_config": {
497 |     "python": {
498 |      "delete_cmd_postfix": "",
499 |      "delete_cmd_prefix": "del ",
500 |      "library": "var_list.py",
501 |      "varRefreshCmd": "print(var_dic_list())"
502 |     },
503 |     "r": {
504 |      "delete_cmd_postfix": ") ",
505 |      "delete_cmd_prefix": "rm(",
506 |      "library": "var_list.r",
507 |      "varRefreshCmd": "cat(var_dic_list()) "
508 |     }
509 |    },
510 |    "types_to_exclude": [
511 |     "module",
512 |     "function",
513 |     "builtin_function_or_method",
514 |     "instance",
515 |     "_Feature"
516 |    ],
517 |    "window_display": false
518 |   }
519 |  },
520 |  "nbformat": 4,
521 |  "nbformat_minor": 2
522 | }
523 | 


--------------------------------------------------------------------------------
/ch05_ 神经网络与全连接层/.idea/ch05_ 神经网络与全联接层.iml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <module type="PYTHON_MODULE" version="4">
 3 |   <component name="NewModuleRootManager">
 4 |     <content url="file://$MODULE_DIR$" />
 5 |     <orderEntry type="jdk" jdkName="Python 3.5 (ch05_ 神经网络与全联接层)" jdkType="Python SDK" />
 6 |     <orderEntry type="sourceFolder" forTests="false" />
 7 |   </component>
 8 |   <component name="TestRunnerService">
 9 |     <option name="PROJECT_TEST_RUNNER" value="Unittests" />
10 |   </component>
11 | </module>


--------------------------------------------------------------------------------
/ch05_ 神经网络与全连接层/.idea/misc.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="JavaScriptSettings">
4 |     <option name="languageLevel" value="ES6" />
5 |   </component>
6 |   <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.5 (ch05_ 神经网络与全联接层)" project-jdk-type="Python SDK" />
7 | </project>


--------------------------------------------------------------------------------
/ch05_ 神经网络与全连接层/.idea/modules.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="ProjectModuleManager">
4 |     <modules>
5 |       <module fileurl="file://$PROJECT_DIR$/.idea/ch05_ 神经网络与全联接层.iml" filepath="$PROJECT_DIR$/.idea/ch05_ 神经网络与全联接层.iml" />
6 |     </modules>
7 |   </component>
8 | </project>


--------------------------------------------------------------------------------
/ch05_ 神经网络与全连接层/.idea/workspace.xml:
--------------------------------------------------------------------------------
  1 | <?xml version="1.0" encoding="UTF-8"?>
  2 | <project version="4">
  3 |   <component name="ChangeListManager">
  4 |     <list default="true" id="e21c3365-74d4-4a4e-bb21-1c3cb477b779" name="Default Changelist" comment="" />
  5 |     <option name="EXCLUDED_CONVERTED_TO_IGNORED" value="true" />
  6 |     <option name="SHOW_DIALOG" value="false" />
  7 |     <option name="HIGHLIGHT_CONFLICTS" value="true" />
  8 |     <option name="HIGHLIGHT_NON_ACTIVE_CHANGELIST" value="false" />
  9 |     <option name="LAST_RESOLUTION" value="IGNORE" />
 10 |   </component>
 11 |   <component name="FileEditorManager">
 12 |     <leaf>
 13 |       <file pinned="false" current-in-tab="true">
 14 |         <entry file="file://$PROJECT_DIR$/mnist.py">
 15 |           <provider selected="true" editor-type-id="text-editor">
 16 |             <state relative-caret-position="126">
 17 |               <caret line="6" column="15" lean-forward="true" selection-start-line="6" selection-start-column="15" selection-end-line="6" selection-end-column="15" />
 18 |               <folding>
 19 |                 <element signature="e#0#12#0" expanded="true" />
 20 |               </folding>
 21 |             </state>
 22 |           </provider>
 23 |         </entry>
 24 |       </file>
 25 |     </leaf>
 26 |   </component>
 27 |   <component name="ProjectFrameBounds" extendedState="6">
 28 |     <option name="y" value="33" />
 29 |     <option name="width" value="1403" />
 30 |     <option name="height" value="878" />
 31 |   </component>
 32 |   <component name="ProjectView">
 33 |     <navigator proportions="" version="1">
 34 |       <foldersAlwaysOnTop value="true" />
 35 |     </navigator>
 36 |     <panes>
 37 |       <pane id="Scope" />
 38 |       <pane id="ProjectPane">
 39 |         <subPane>
 40 |           <expand>
 41 |             <path>
 42 |               <item name="ch05_ 神经网络与全联接层" type="b2602c69:ProjectViewProjectNode" />
 43 |               <item name="ch05_ 神经网络与全联接层" type="462c0819:PsiDirectoryNode" />
 44 |             </path>
 45 |           </expand>
 46 |           <select />
 47 |         </subPane>
 48 |       </pane>
 49 |     </panes>
 50 |   </component>
 51 |   <component name="PropertiesComponent">
 52 |     <property name="WebServerToolWindowFactoryState" value="false" />
 53 |     <property name="last_opened_file_path" value="$PROJECT_DIR$" />
 54 |     <property name="nodejs_interpreter_path.stuck_in_default_project" value="undefined stuck path" />
 55 |     <property name="nodejs_npm_path_reset_for_default_project" value="true" />
 56 |     <property name="settings.editor.selected.configurable" value="preferences.lookFeel" />
 57 |   </component>
 58 |   <component name="RunDashboard">
 59 |     <option name="ruleStates">
 60 |       <list>
 61 |         <RuleState>
 62 |           <option name="name" value="ConfigurationTypeDashboardGroupingRule" />
 63 |         </RuleState>
 64 |         <RuleState>
 65 |           <option name="name" value="StatusDashboardGroupingRule" />
 66 |         </RuleState>
 67 |       </list>
 68 |     </option>
 69 |   </component>
 70 |   <component name="RunManager">
 71 |     <configuration name="mnist" type="PythonConfigurationType" factoryName="Python" temporary="true">
 72 |       <module name="ch05_ 神经网络与全联接层" />
 73 |       <option name="INTERPRETER_OPTIONS" value="" />
 74 |       <option name="PARENT_ENVS" value="true" />
 75 |       <envs>
 76 |         <env name="PYTHONUNBUFFERED" value="1" />
 77 |       </envs>
 78 |       <option name="SDK_HOME" value="" />
 79 |       <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
 80 |       <option name="IS_MODULE_SDK" value="true" />
 81 |       <option name="ADD_CONTENT_ROOTS" value="true" />
 82 |       <option name="ADD_SOURCE_ROOTS" value="true" />
 83 |       <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
 84 |       <option name="SCRIPT_NAME" value="$PROJECT_DIR$/mnist.py" />
 85 |       <option name="PARAMETERS" value="" />
 86 |       <option name="SHOW_COMMAND_LINE" value="false" />
 87 |       <option name="EMULATE_TERMINAL" value="false" />
 88 |       <option name="MODULE_MODE" value="false" />
 89 |       <option name="REDIRECT_INPUT" value="false" />
 90 |       <option name="INPUT_FILE" value="" />
 91 |       <method v="2" />
 92 |     </configuration>
 93 |     <recent_temporary>
 94 |       <list>
 95 |         <item itemvalue="Python.mnist" />
 96 |       </list>
 97 |     </recent_temporary>
 98 |   </component>
 99 |   <component name="SvnConfiguration">
100 |     <configuration />
101 |   </component>
102 |   <component name="TaskManager">
103 |     <task active="true" id="Default" summary="Default task">
104 |       <changelist id="e21c3365-74d4-4a4e-bb21-1c3cb477b779" name="Default Changelist" comment="" />
105 |       <created>1595484643533</created>
106 |       <option name="number" value="Default" />
107 |       <option name="presentableId" value="Default" />
108 |       <updated>1595484643533</updated>
109 |       <workItem from="1595484654720" duration="1699000" />
110 |     </task>
111 |     <servers />
112 |   </component>
113 |   <component name="TimeTrackingManager">
114 |     <option name="totallyTimeSpent" value="1699000" />
115 |   </component>
116 |   <component name="ToolWindowManager">
117 |     <frame x="0" y="23" width="1403" height="877" extended-state="6" />
118 |     <editor active="true" />
119 |     <layout>
120 |       <window_info id="Favorites" side_tool="true" />
121 |       <window_info content_ui="combo" id="Project" order="0" visible="true" weight="0.24908155" />
122 |       <window_info id="Structure" order="1" side_tool="true" weight="0.25" />
123 |       <window_info anchor="bottom" id="Docker" show_stripe_button="false" />
124 |       <window_info anchor="bottom" id="Database Changes" />
125 |       <window_info anchor="bottom" id="Version Control" />
126 |       <window_info anchor="bottom" id="Python Console" weight="0.32899868" />
127 |       <window_info anchor="bottom" id="Terminal" sideWeight="0.49963263" weight="0.32769832" />
128 |       <window_info anchor="bottom" id="Event Log" sideWeight="0.5003674" side_tool="true" weight="0.32769832" />
129 |       <window_info anchor="bottom" id="Message" order="0" />
130 |       <window_info anchor="bottom" id="Find" order="1" />
131 |       <window_info anchor="bottom" id="Run" order="2" weight="0.32899868" />
132 |       <window_info anchor="bottom" id="Debug" order="3" weight="0.4" />
133 |       <window_info anchor="bottom" id="Cvs" order="4" weight="0.25" />
134 |       <window_info anchor="bottom" id="Inspection" order="5" weight="0.4" />
135 |       <window_info anchor="bottom" id="TODO" order="6" />
136 |       <window_info anchor="right" id="SciView" />
137 |       <window_info anchor="right" id="Database" />
138 |       <window_info anchor="right" id="Commander" internal_type="SLIDING" order="0" type="SLIDING" weight="0.4" />
139 |       <window_info anchor="right" id="Ant Build" order="1" weight="0.25" />
140 |       <window_info anchor="right" content_ui="combo" id="Hierarchy" order="2" weight="0.25" />
141 |     </layout>
142 |   </component>
143 |   <component name="TypeScriptGeneratedFilesManager">
144 |     <option name="version" value="1" />
145 |   </component>
146 |   <component name="com.intellij.coverage.CoverageDataManagerImpl">
147 |     <SUITE FILE_PATH="coverage/ch05__$mnist.coverage" NAME="mnist Coverage Results" MODIFIED="1595485762018" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
148 |   </component>
149 |   <component name="editorHistoryManager">
150 |     <entry file="file://$PROJECT_DIR$/mnist.py">
151 |       <provider selected="true" editor-type-id="text-editor">
152 |         <state relative-caret-position="126">
153 |           <caret line="6" column="15" lean-forward="true" selection-start-line="6" selection-start-column="15" selection-end-line="6" selection-end-column="15" />
154 |           <folding>
155 |             <element signature="e#0#12#0" expanded="true" />
156 |           </folding>
157 |         </state>
158 |       </provider>
159 |     </entry>
160 |   </component>
161 |   <component name="masterDetails">
162 |     <states>
163 |       <state key="ScopeChooserConfigurable.UI">
164 |         <settings>
165 |           <splitter-proportions>
166 |             <option name="proportions">
167 |               <list>
168 |                 <option value="0.2" />
169 |               </list>
170 |             </option>
171 |           </splitter-proportions>
172 |         </settings>
173 |       </state>
174 |     </states>
175 |   </component>
176 | </project>


--------------------------------------------------------------------------------
/ch05_ 神经网络与全连接层/ch05_神经网络与全连接层.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# ch05_神经网络与全连接层"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "## 5.1 Logistic ( sigmoid ) Regression \n",
 15 |     "\n",
 16 |     "- for continuous (由于是continuous,所以才叫做regression):\n",
 17 |     "$$ y = x w + b$$\n",
 18 |     "- for probability output :  \n",
 19 |     "$$ y = \\sigma ( x w + b )$$\n",
 20 |     " - $\\sigma$: sigmoid or logistic\n",
 21 |     "\n",
 22 |     "### Binary Classification :\n",
 23 |     "- interpret the network as $ f : x \\to p( y \\mid x ; \\theta) $\n",
 24 |     "- output $ \\in [ 0 , 1 ]$\n",
 25 |     "- which is exactly where the logistic function comes in\n",
 26 |     "\n",
 27 |     "### For Regression:\n",
 28 |     "- Goal : $ pred = y $\n",
 29 |     "- Approach : minimize $ dist(pred,y) $\n",
 30 |     "\n",
 31 |     "### For classification:\n",
 32 |     "- Goal : maximize benchmark , e.g. accuracy\n",
 33 |     "- Approach 1:  minimize $ dist ( p_\\theta ( y \\mid x ) , p_r ( y \\mid x )) $\n",
 34 |     "- Approach 2:  minimize $ divergence ( p_\\theta ( y \\mid x ) , p_r (y \\mid x )) $\n",
 35 |     "\n",
 36 |     "### Why is it called logistic regression?\n",
 37 |     "- use sigmoid\n",
 38 |     "- Controversial:\n",
 39 |     " - MSE $\\to$ regression\n",
 40 |     " - Cross Entropy $\\to$ classification"
 41 |    ]
 42 |   },
 43 |   {
 44 |    "cell_type": "markdown",
 45 |    "metadata": {},
 46 |    "source": [
 47 |     "## 5.2 Cross Entropy Loss ( 交叉熵 )\n",
 48 |     "\n",
 49 |     "### Loss for classification:\n",
 50 |     "- MSE\n",
 51 |     "- Hinge Loss (SVM)\n",
 52 |     "$$ \\sum_i \\max (0 , 1-y_i * h_\\theta(x_i)) $$\n",
 53 |     "- Cross Entropy Loss\n",
 54 |     "\n",
 55 |     "### What does entropy mean?\n",
 56 |     "- Uncertainty ( 不确定性 )\n",
 57 |     " - measure of surprise ( 惊喜度 )\n",
 58 |     "- higher entropy = less info.\n",
 59 |     "$$ Entropy = - \\sum_i P(i)\\space \\log P(i) $$\n",
 60 |     "\n",
 61 |     "### Binary Classification\n",
 62 |     "$$ H(P,Q) = -P(cat)\\log Q(cat) - (1-P(cat))\\log (1-Q(cat))$$\n",
 63 |     "$$由于是二分类,所以 P(dog) = (1-P(cat))$$\n",
 64 |     "$$\n",
 65 |     "H(P,Q) = - \\sum_{i=(cat,dog)}P(i)\\log Q(i) \\\\\n",
 66 |     "= -P(cat)\\log Q(cat) - P(dog)\\log Q(dog)  \\\\\n",
 67 |     "= -(y\\log (p) + (1-y)\\log (1-p))\n",
 68 |     "$$\n",
 69 |     "\n",
 70 |     "### Why not use MSE on classification\n",
 71 |     "- sigmoid + MSE $\\to$ gradient vanish\n",
 72 |     "- converge slower\n",
 73 |     "- But sometimes MSE is still a reasonable choice\n",
 74 |     " - e.g. meta-learning"
 75 |    ]
 76 |   },
 77 |   {
 78 |    "cell_type": "code",
 79 |    "execution_count": 1,
 80 |    "metadata": {},
 81 |    "outputs": [],
 82 |    "source": [
 83 |     "import torch\n",
 84 |     "import numpy as np\n",
 85 |     "from torch.nn import functional as F\n",
 86 |     "from torch import optim\n",
 87 |     "from torch import nn\n",
 88 |     "import torchvision"
 89 |    ]
 90 |   },
 91 |   {
 92 |    "cell_type": "code",
 93 |    "execution_count": 2,
 94 |    "metadata": {},
 95 |    "outputs": [
 96 |     {
 97 |      "name": "stdout",
 98 |      "output_type": "stream",
 99 |      "text": [
100 |       "x.shape:  torch.Size([1, 784]) \n",
101 |       "w.shape:  torch.Size([10, 784]) \n",
102 |       "logits = x@w.t(),logits.shape:  torch.Size([1, 10])\n",
103 |       "pred = softmax(logits,dim=1) :\n",
104 |       " tensor([[2.8702e-04, 4.0199e-01, 1.3270e-05, 9.6294e-04, 1.8527e-02, 2.3045e-01,\n",
105 |       "         7.3673e-03, 4.2058e-04, 3.3930e-01, 6.7891e-04]])\n",
106 |       "log(pred): tensor([[ -8.1559,  -0.9113, -11.2300,  -6.9455,  -3.9885,  -1.4677,  -4.9107,\n",
107 |       "          -7.7739,  -1.0809,  -7.2950]])\n",
108 |       "方法一:使用F.cross_entropy(logits,torch.tensor([3])直接计算: tensor(6.9455)\n",
109 |       "方法二:使用softmax计算出的pred_log计算: tensor(6.9455)\n",
110 |       "方法一只需要一步,而方法二的CE = softmax -> logits -> nll_loss\n"
111 |      ]
112 |     }
113 |    ],
114 |    "source": [
115 |     "# Numerical Stability\n",
116 |     "x = torch.rand(1,784)\n",
117 |     "w = torch.rand(10,784)\n",
118 |     "logits = x@w.t()\n",
119 |     "print('x.shape: ',x.shape,'\\nw.shape: ',w.shape,\n",
120 |     "      '\\nlogits = x@w.t(),logits.shape: ',logits.shape)\n",
121 |     "\n",
122 |     "pred = torch.softmax(logits,dim=1)\n",
123 |     "print('pred = softmax(logits,dim=1) :\\n',pred)\n",
124 |     "pred_log = torch.log(pred)\n",
125 |     "print('log(pred):',pred_log)\n",
126 |     "\n",
127 |     "loss = F.cross_entropy(logits,torch.tensor([3]))\n",
128 |     "print('方法一:使用F.cross_entropy(logits,torch.tensor([3])直接计算:',loss)\n",
129 |     "my_loss = F.nll_loss(pred_log,torch.tensor([3]))\n",
130 |     "print('方法二:使用softmax计算出的pred_log计算:',my_loss)\n",
131 |     "print('方法一只需要一步,而方法二的CE = softmax -> logits -> nll_loss')\n",
132 |     "      "
133 |    ]
134 |   },
135 |   {
136 |    "cell_type": "markdown",
137 |    "metadata": {},
138 |    "source": [
139 |     "## 5.3 多分类问题实战"
140 |    ]
141 |   },
142 |   {
143 |    "cell_type": "code",
144 |    "execution_count": null,
145 |    "metadata": {},
146 |    "outputs": [
147 |     {
148 |      "name": "stderr",
149 |      "output_type": "stream",
150 |      "text": [
151 |       "Setting up a new session...\n"
152 |      ]
153 |     },
154 |     {
155 |      "name": "stdout",
156 |      "output_type": "stream",
157 |      "text": [
158 |       "Train Epoch: 0 [0/60000 (0%)]\tLoss: 3.083690\n",
159 |       "Train Epoch: 0 [6400/60000 (11%)]\tLoss: 0.528396\n",
160 |       "Train Epoch: 0 [12800/60000 (21%)]\tLoss: 0.577129\n",
161 |       "Train Epoch: 0 [19200/60000 (32%)]\tLoss: 0.460878\n",
162 |       "Train Epoch: 0 [25600/60000 (43%)]\tLoss: 0.586255\n",
163 |       "Train Epoch: 0 [32000/60000 (53%)]\tLoss: 0.624034\n",
164 |       "Train Epoch: 0 [38400/60000 (64%)]\tLoss: 0.334806\n",
165 |       "Train Epoch: 0 [44800/60000 (75%)]\tLoss: 0.431546\n",
166 |       "Train Epoch: 0 [51200/60000 (85%)]\tLoss: 0.629640\n",
167 |       "Train Epoch: 0 [57600/60000 (96%)]\tLoss: 0.407158\n"
168 |      ]
169 |     },
170 |     {
171 |      "name": "stderr",
172 |      "output_type": "stream",
173 |      "text": [
174 |       "/Users/distiller/project/conda/conda-bld/pytorch_1591914879026/work/aten/src/ATen/native/BinaryOps.cpp:81: UserWarning: Integer division of tensors using div or / is deprecated, and in a future release div will perform true division as in Python 3. Use true_divide or floor_divide (// in Python) instead.\n"
175 |      ]
176 |     },
177 |     {
178 |      "name": "stdout",
179 |      "output_type": "stream",
180 |      "text": [
181 |       "\n",
182 |       "Test set: Average loss: 0.0071, Accuracy: 8427/10000 (84%)\n",
183 |       "\n",
184 |       "Train Epoch: 1 [0/60000 (0%)]\tLoss: 0.619346\n",
185 |       "Train Epoch: 1 [6400/60000 (11%)]\tLoss: 0.550431\n",
186 |       "Train Epoch: 1 [12800/60000 (21%)]\tLoss: 0.452561\n",
187 |       "Train Epoch: 1 [19200/60000 (32%)]\tLoss: 0.439310\n",
188 |       "Train Epoch: 1 [25600/60000 (43%)]\tLoss: 0.529607\n",
189 |       "Train Epoch: 1 [32000/60000 (53%)]\tLoss: 0.257746\n",
190 |       "Train Epoch: 1 [38400/60000 (64%)]\tLoss: 0.293476\n",
191 |       "Train Epoch: 1 [44800/60000 (75%)]\tLoss: 0.316650\n",
192 |       "Train Epoch: 1 [51200/60000 (85%)]\tLoss: 0.297505\n",
193 |       "Train Epoch: 1 [57600/60000 (96%)]\tLoss: 0.440608\n",
194 |       "\n",
195 |       "Test set: Average loss: 0.0064, Accuracy: 8538/10000 (85%)\n",
196 |       "\n",
197 |       "Train Epoch: 2 [0/60000 (0%)]\tLoss: 0.480287\n",
198 |       "Train Epoch: 2 [6400/60000 (11%)]\tLoss: 0.530437\n",
199 |       "Train Epoch: 2 [12800/60000 (21%)]\tLoss: 0.350130\n",
200 |       "Train Epoch: 2 [19200/60000 (32%)]\tLoss: 0.409370\n",
201 |       "Train Epoch: 2 [25600/60000 (43%)]\tLoss: 0.333595\n",
202 |       "Train Epoch: 2 [32000/60000 (53%)]\tLoss: 0.396966\n",
203 |       "Train Epoch: 2 [38400/60000 (64%)]\tLoss: 0.434597\n",
204 |       "Train Epoch: 2 [44800/60000 (75%)]\tLoss: 0.492732\n",
205 |       "Train Epoch: 2 [51200/60000 (85%)]\tLoss: 0.391622\n",
206 |       "Train Epoch: 2 [57600/60000 (96%)]\tLoss: 0.388209\n",
207 |       "\n",
208 |       "Test set: Average loss: 0.0060, Accuracy: 8597/10000 (86%)\n",
209 |       "\n",
210 |       "Train Epoch: 3 [0/60000 (0%)]\tLoss: 0.437538\n",
211 |       "Train Epoch: 3 [6400/60000 (11%)]\tLoss: 0.258717\n",
212 |       "Train Epoch: 3 [12800/60000 (21%)]\tLoss: 0.403510\n",
213 |       "Train Epoch: 3 [19200/60000 (32%)]\tLoss: 0.407749\n",
214 |       "Train Epoch: 3 [25600/60000 (43%)]\tLoss: 0.234885\n",
215 |       "Train Epoch: 3 [32000/60000 (53%)]\tLoss: 0.279934\n",
216 |       "Train Epoch: 3 [38400/60000 (64%)]\tLoss: 0.370400\n",
217 |       "Train Epoch: 3 [44800/60000 (75%)]\tLoss: 0.444407\n",
218 |       "Train Epoch: 3 [51200/60000 (85%)]\tLoss: 0.498015\n",
219 |       "Train Epoch: 3 [57600/60000 (96%)]\tLoss: 0.557527\n",
220 |       "\n",
221 |       "Test set: Average loss: 0.0056, Accuracy: 8659/10000 (87%)\n",
222 |       "\n",
223 |       "Train Epoch: 4 [0/60000 (0%)]\tLoss: 0.316698\n",
224 |       "Train Epoch: 4 [6400/60000 (11%)]\tLoss: 0.409586\n",
225 |       "Train Epoch: 4 [12800/60000 (21%)]\tLoss: 0.511134\n",
226 |       "Train Epoch: 4 [19200/60000 (32%)]\tLoss: 0.567208\n",
227 |       "Train Epoch: 4 [25600/60000 (43%)]\tLoss: 0.456032\n",
228 |       "Train Epoch: 4 [32000/60000 (53%)]\tLoss: 0.232997\n",
229 |       "Train Epoch: 4 [38400/60000 (64%)]\tLoss: 0.335775\n",
230 |       "Train Epoch: 4 [44800/60000 (75%)]\tLoss: 0.349151\n",
231 |       "Train Epoch: 4 [51200/60000 (85%)]\tLoss: 0.449998\n",
232 |       "Train Epoch: 4 [57600/60000 (96%)]\tLoss: 0.337424\n",
233 |       "\n",
234 |       "Test set: Average loss: 0.0054, Accuracy: 8708/10000 (87%)\n",
235 |       "\n",
236 |       "Train Epoch: 5 [0/60000 (0%)]\tLoss: 0.262621\n",
237 |       "Train Epoch: 5 [6400/60000 (11%)]\tLoss: 0.442502\n",
238 |       "Train Epoch: 5 [12800/60000 (21%)]\tLoss: 0.381229\n",
239 |       "Train Epoch: 5 [19200/60000 (32%)]\tLoss: 0.424382\n",
240 |       "Train Epoch: 5 [25600/60000 (43%)]\tLoss: 0.339480\n",
241 |       "Train Epoch: 5 [32000/60000 (53%)]\tLoss: 0.156607\n",
242 |       "Train Epoch: 5 [38400/60000 (64%)]\tLoss: 0.543846\n",
243 |       "Train Epoch: 5 [44800/60000 (75%)]\tLoss: 0.370581\n",
244 |       "Train Epoch: 5 [51200/60000 (85%)]\tLoss: 0.180045\n",
245 |       "Train Epoch: 5 [57600/60000 (96%)]\tLoss: 0.728054\n",
246 |       "\n",
247 |       "Test set: Average loss: 0.0053, Accuracy: 8725/10000 (87%)\n",
248 |       "\n",
249 |       "Train Epoch: 6 [0/60000 (0%)]\tLoss: 0.278354\n",
250 |       "Train Epoch: 6 [6400/60000 (11%)]\tLoss: 0.254100\n",
251 |       "Train Epoch: 6 [12800/60000 (21%)]\tLoss: 0.430109\n",
252 |       "Train Epoch: 6 [19200/60000 (32%)]\tLoss: 0.319065\n",
253 |       "Train Epoch: 6 [25600/60000 (43%)]\tLoss: 0.408925\n",
254 |       "Train Epoch: 6 [32000/60000 (53%)]\tLoss: 0.181885\n",
255 |       "Train Epoch: 6 [38400/60000 (64%)]\tLoss: 0.255681\n",
256 |       "Train Epoch: 6 [44800/60000 (75%)]\tLoss: 0.395882\n",
257 |       "Train Epoch: 6 [51200/60000 (85%)]\tLoss: 0.179406\n",
258 |       "Train Epoch: 6 [57600/60000 (96%)]\tLoss: 0.424512\n",
259 |       "\n",
260 |       "Test set: Average loss: 0.0052, Accuracy: 8755/10000 (88%)\n",
261 |       "\n",
262 |       "Train Epoch: 7 [0/60000 (0%)]\tLoss: 0.178965\n",
263 |       "Train Epoch: 7 [6400/60000 (11%)]\tLoss: 0.530159\n",
264 |       "Train Epoch: 7 [12800/60000 (21%)]\tLoss: 0.092848\n",
265 |       "Train Epoch: 7 [19200/60000 (32%)]\tLoss: 0.296255\n",
266 |       "Train Epoch: 7 [25600/60000 (43%)]\tLoss: 0.399122\n",
267 |       "Train Epoch: 7 [32000/60000 (53%)]\tLoss: 0.278785\n",
268 |       "Train Epoch: 7 [38400/60000 (64%)]\tLoss: 0.234787\n",
269 |       "Train Epoch: 7 [44800/60000 (75%)]\tLoss: 0.338992\n",
270 |       "Train Epoch: 7 [51200/60000 (85%)]\tLoss: 0.452053\n",
271 |       "Train Epoch: 7 [57600/60000 (96%)]\tLoss: 0.372501\n",
272 |       "\n",
273 |       "Test set: Average loss: 0.0051, Accuracy: 8770/10000 (88%)\n",
274 |       "\n",
275 |       "Train Epoch: 8 [0/60000 (0%)]\tLoss: 0.293521\n",
276 |       "Train Epoch: 8 [6400/60000 (11%)]\tLoss: 0.329178\n",
277 |       "Train Epoch: 8 [12800/60000 (21%)]\tLoss: 0.304065\n",
278 |       "Train Epoch: 8 [19200/60000 (32%)]\tLoss: 0.279119\n",
279 |       "Train Epoch: 8 [25600/60000 (43%)]\tLoss: 0.398582\n",
280 |       "Train Epoch: 8 [32000/60000 (53%)]\tLoss: 0.370215\n",
281 |       "Train Epoch: 8 [38400/60000 (64%)]\tLoss: 0.211270\n",
282 |       "Train Epoch: 8 [44800/60000 (75%)]\tLoss: 0.380234\n",
283 |       "Train Epoch: 8 [51200/60000 (85%)]\tLoss: 0.280856\n"
284 |      ]
285 |     }
286 |    ],
287 |    "source": [
288 |     "from visdom import Visdom\n",
289 |     "\n",
290 |     "learning_rate = 1e-2\n",
291 |     "epochs = 10\n",
292 |     "batch_size = 64\n",
293 |     "\n",
294 |     "train_load = torch.utils.data.DataLoader(torchvision.datasets.MNIST(\n",
295 |     "    '../data/',\n",
296 |     "    train=True,\n",
297 |     "    download=True,\n",
298 |     "    transform=torchvision.transforms.Compose([\n",
299 |     "        torchvision.transforms.ToTensor(),\n",
300 |     "        torchvision.transforms.Normalize((0.1307, ), (0.3081, ))\n",
301 |     "    ])),\n",
302 |     "    batch_size=batch_size,\n",
303 |     "    shuffle=True)\n",
304 |     "\n",
305 |     "test_load = torch.utils.data.DataLoader(torchvision.datasets.MNIST(\n",
306 |     "    '../data/',\n",
307 |     "    train=False,\n",
308 |     "    transform=torchvision.transforms.Compose([\n",
309 |     "        torchvision.transforms.ToTensor(),\n",
310 |     "        torchvision.transforms.Normalize((0.1307),(0.3081,))])),\n",
311 |     "            batch_size=batch_size,\n",
312 |     "            shuffle=True)\n",
313 |     "\n",
314 |     "\n",
315 |     "w1,b1 = torch.randn(200,784,requires_grad=True),\\\n",
316 |     "        torch.zeros(200,requires_grad=True)\n",
317 |     "w2,b2 = torch.randn(200,200,requires_grad=True),\\\n",
318 |     "        torch.zeros(200,requires_grad=True)\n",
319 |     "w3,b3 = torch.randn(10,200,requires_grad=True),\\\n",
320 |     "        torch.zeros(10,requires_grad=True)\n",
321 |     "\n",
322 |     "nn.init.kaiming_normal_(w1)\n",
323 |     "nn.init.kaiming_normal_(w2)\n",
324 |     "nn.init.kaiming_normal_(w3)\n",
325 |     "\n",
326 |     "def forward(x):\n",
327 |     "    x = x@w1.t() + b1\n",
328 |     "    x = F.relu(x)\n",
329 |     "    x = x@w2.t() + b2\n",
330 |     "    x = F.relu(x)\n",
331 |     "    x = x@w3.t() + b3\n",
332 |     "    x = F.relu(x)\n",
333 |     "    return x\n",
334 |     "\n",
335 |     "\n",
336 |     "optimizer = optim.SGD([w1,b1,w2,b2,w3,b3],lr=learning_rate)\n",
337 |     "criteon = nn.CrossEntropyLoss()\n",
338 |     "global_step = 0\n",
339 |     "global_test_step = 0\n",
340 |     "# criteon = F.cross_entropy()\n",
341 |     "\n",
342 |     "global_step = 0\n",
343 |     "vis = Visdom()\n",
344 |     "vis.line([0.],[0.],win='train_loss',opts=dict(title='train_loss'))\n",
345 |     "vis.line([[0.0,0.0]],[0.],win='test',opts=dict(title='test loss&acc.',legend=['loss','acc.']))\n",
346 |     "\n",
347 |     "for epoch in range(epochs):\n",
348 |     "    for batch_idx, (data,target) in enumerate(train_load):\n",
349 |     "        data = data.view(-1,28*28)\n",
350 |     "        logits = forward(data)\n",
351 |     "        loss = criteon(logits,target)\n",
352 |     "        \n",
353 |     "        optimizer.zero_grad()\n",
354 |     "        loss.backward()\n",
355 |     "        optimizer.step()\n",
356 |     "        \n",
357 |     "        if batch_idx%100 == 0:\n",
358 |     "            print('Train Epoch: {} [{}/{} ({:.0f}%)]\\tLoss: {:.6f}'.\n",
359 |     "                 format(epoch,batch_idx*len(data),len(train_load.dataset),\n",
360 |     "                       100. *batch_idx/len(train_load),loss.item()))\n",
361 |     "        global_step += 1\n",
362 |     "        vis.line([loss.item()],[global_step],win='train_loss',update='append')\n",
363 |     "            \n",
364 |     "    test_loss = 0\n",
365 |     "    correct = 0\n",
366 |     "    for data,target in test_load:\n",
367 |     "        \n",
368 |     "        vis.images(data.view(-1,1,28,28),win='x')\n",
369 |     "        \n",
370 |     "        data = data.view(-1,28*28)\n",
371 |     "        logits = forward(data)\n",
372 |     "        test_loss += criteon(logits,target).item()\n",
373 |     "        pred = logits.data.max(1)[1]\n",
374 |     "        correct += pred.eq(target.data).sum()\n",
375 |     "        \n",
376 |     "        global_test_step += 1\n",
377 |     "        vis.line([[test_loss,correct/len(test_load.dataset)]],[global_test_step],win='test',update='append')\n",
378 |     "    \n",
379 |     "       \n",
380 |     "        vis.text(str(pred.detach().cpu().numpy()),win='pred',opts=dict(title='pred'))\n",
381 |     "    \n",
382 |     "    test_loss /= len(test_load.dataset)\n",
383 |     "    print('\\nTest set: Average loss: {:.4f}, Accuracy: {}/{} ({:.0f}%)\\n'.\n",
384 |     "         format(test_loss,correct,len(test_load.dataset),100. *correct/len(test_load.dataset)))\n",
385 |     "    "
386 |    ]
387 |   },
388 |   {
389 |    "cell_type": "markdown",
390 |    "metadata": {},
391 |    "source": [
392 |     "## 5.4 全连接层\n",
393 |     "\n",
394 |     "- x = F.relu(x,inplace = True)\n",
395 |     " - inplace = True 代表进行原地操作,可以节省一半空间"
396 |    ]
397 |   },
398 |   {
399 |    "cell_type": "markdown",
400 |    "metadata": {},
401 |    "source": [
402 |     "## 5.5 Visdom 可视化\n",
403 |     "- 安装:\n",
404 |     " - python -m pip install --upgrade pip\n",
405 |     " - python -m pip install visdom\n",
406 |     "- 启动:\n",
407 |     " - python -m visdom.server"
408 |    ]
409 |   },
410 |   {
411 |    "cell_type": "code",
412 |    "execution_count": null,
413 |    "metadata": {},
414 |    "outputs": [],
415 |    "source": [
416 |     "    \n"
417 |    ]
418 |   }
419 |  ],
420 |  "metadata": {
421 |   "kernelspec": {
422 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
423 |    "language": "python",
424 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
425 |   },
426 |   "language_info": {
427 |    "codemirror_mode": {
428 |     "name": "ipython",
429 |     "version": 3
430 |    },
431 |    "file_extension": ".py",
432 |    "mimetype": "text/x-python",
433 |    "name": "python",
434 |    "nbconvert_exporter": "python",
435 |    "pygments_lexer": "ipython3",
436 |    "version": "3.5.6"
437 |   },
438 |   "latex_envs": {
439 |    "LaTeX_envs_menu_present": true,
440 |    "autoclose": false,
441 |    "autocomplete": true,
442 |    "bibliofile": "biblio.bib",
443 |    "cite_by": "apalike",
444 |    "current_citInitial": 1,
445 |    "eqLabelWithNumbers": true,
446 |    "eqNumInitial": 1,
447 |    "hotkeys": {
448 |     "equation": "Ctrl-E",
449 |     "itemize": "Ctrl-I"
450 |    },
451 |    "labels_anchors": false,
452 |    "latex_user_defs": false,
453 |    "report_style_numbering": false,
454 |    "user_envs_cfg": false
455 |   },
456 |   "varInspector": {
457 |    "cols": {
458 |     "lenName": 16,
459 |     "lenType": 16,
460 |     "lenVar": 40
461 |    },
462 |    "kernels_config": {
463 |     "python": {
464 |      "delete_cmd_postfix": "",
465 |      "delete_cmd_prefix": "del ",
466 |      "library": "var_list.py",
467 |      "varRefreshCmd": "print(var_dic_list())"
468 |     },
469 |     "r": {
470 |      "delete_cmd_postfix": ") ",
471 |      "delete_cmd_prefix": "rm(",
472 |      "library": "var_list.r",
473 |      "varRefreshCmd": "cat(var_dic_list()) "
474 |     }
475 |    },
476 |    "types_to_exclude": [
477 |     "module",
478 |     "function",
479 |     "builtin_function_or_method",
480 |     "instance",
481 |     "_Feature"
482 |    ],
483 |    "window_display": false
484 |   }
485 |  },
486 |  "nbformat": 4,
487 |  "nbformat_minor": 2
488 | }
489 | 


--------------------------------------------------------------------------------
/ch05_ 神经网络与全连接层/mnist.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import torch.nn as nn
 3 | import torch.nn.functional as F
 4 | import torch.optim as optim
 5 | from torchvision import datasets, transforms
 6 | 
 7 | batch_size = 64
 8 | learning_rate = 0.01
 9 | epoches = 10
10 | 
11 | train_loader = torch.utils.data.DataLoader(datasets.MNIST(
12 |     '../data/',
13 |     train=True,
14 |     download=False,
15 |     transform=transforms.Compose(
16 |         [transforms.ToTensor(),
17 |          transforms.Normalize((0.1307, ), (0.3081, ))])),
18 |                                            batch_size=batch_size,
19 |                                            shuffle=True)
20 | 
21 | test_loader = torch.utils.data.DataLoader(datasets.MNIST(
22 |     '../data/',
23 |     train=False,
24 |     download=False,
25 |     transform=transforms.Compose(
26 |         [transforms.ToTensor(),
27 |          transforms.Normalize((0.1307, ), (0.3081, ))])),
28 |                                           batch_size=batch_size,
29 |                                           shuffle=True)
30 | 
31 | 
class MLP(nn.Module):
    """Fully connected network with layer widths 784 -> 200 -> 200 -> 10.

    Every linear layer, including the last one, is followed by an in-place
    LeakyReLU. The whole stack is stored in ``self.model``.
    """
    def __init__(self):
        super().__init__()

        widths = (784, 200, 200, 10)
        stages = []
        # Pair consecutive widths: (784, 200), (200, 200), (200, 10).
        for fan_in, fan_out in zip(widths[:-1], widths[1:]):
            stages.append(nn.Linear(fan_in, fan_out))
            stages.append(nn.LeakyReLU(inplace=True))
        self.model = nn.Sequential(*stages)

    def forward(self, x):
        """Pass ``x`` through the layer stack and return its output."""
        return self.model(x)
47 | 
48 | 
# Model, plain SGD optimizer and the classification loss used for both
# training and evaluation.
net = MLP()
optimizer = optim.SGD(net.parameters(), lr=learning_rate)
criterion = nn.CrossEntropyLoss()

for epoch in range(epoches):
    # ---- training pass over the whole training set ----
    net.train()
    for batch_idx, (data, target) in enumerate(train_loader):
        # Flatten every image to a 784-element row for the linear layers.
        data = data.view(-1, 28 * 28)
        logits = net(data)
        loss = criterion(logits, target)

        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # Progress line every 100 batches.
        if batch_idx % 100 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch, batch_idx * len(data), len(train_loader.dataset),
                100. * batch_idx / len(train_loader), loss.item()))

    # ---- evaluation pass over the test set ----
    net.eval()
    test_loss = 0
    correct = 0
    # No gradients are needed here; skipping autograd saves memory and time.
    with torch.no_grad():
        for data, target in test_loader:
            data = data.view(-1, 28 * 28)
            logits = net(data)
            # criterion returns the mean loss of the batch, so weight it by
            # the batch size; dividing the total by the number of samples
            # below then yields a true per-sample average.
            test_loss += criterion(logits, target).item() * data.size(0)
            pred = logits.argmax(dim=1)
            # .item() keeps `correct` a plain Python int, so it prints as a
            # number and the percentage below uses ordinary float division.
            correct += pred.eq(target).sum().item()
    test_loss /= len(test_loader.dataset)
    print('\nTest set:Average loss:{:.4f}, Accuracy:{}/{}({:.0f}%)\n'.format(
        test_loss, correct, len(test_loader.dataset),
        100. * correct / len(test_loader.dataset)))
80 | 


--------------------------------------------------------------------------------
/ch06_过拟合与欠拟合_交叉验证_正则化/.ipynb_checkpoints/ch06_ 正则化_动量与学习率衰减_早停_dropout-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# ch06_ 正则化_动量与学习率衰减_早停_dropout"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "\n",
 15 |     "## Reduce Overfitting\n",
 16 |     "- More Data\n",
 17 |     "- Constrain model complexity\n",
 18 |     " - shallow\n",
 19 |     " - regularization\n",
 20 |     "- Dropout\n",
 21 |     "- Data augmentation\n",
 22 |     "- Early Stopping\n",
 23 |     "\n",
 24 |     "## 6.3 Regularization 正则化 (Weight Decay)\n",
 25 |     "\n",
 26 |     "$$ J(\\theta) = - \\frac{1}{m} \\sum_{i=1}^{m} \\left [y_i \\ln \\hat{y_i} + (1-y_i)\\ln (1-\\hat{y_i}) \\right ] + \\lambda \\sum_{i=1}^n \\left | \\theta_i \\right |$$\n",
 27 |     "\n",
 28 |     "\n",
 29 |     "- **L1-Regularization:**\n",
 30 |     "\n",
 31 |     "$$J(\\theta) = - \\frac{1}{m} \\sum_{i=1}^m \\left [ y_i \\ln \\hat{y_i} + (1-y_i)\\ln (1- \\hat{y_i}) \\right ] + \\lambda \\sum_{i=1}^{n}\\left | \\theta_i \\right |$$\n",
 32 |     "\n",
 33 |     "```Python\n",
 34 |     "regularization_loss = 0\n",
 35 |     "for param in model.parameters():\n",
 36 |     "    regularization_loss += torch.sum(torch.abs(param))\n",
 37 |     "    \n",
 38 |     "classify_loss = criteon(logits,target)\n",
 39 |     "loss = classify_loss + 0.01 * regularization_loss\n",
 40 |     "\n",
 41 |     "optimizer.zero_grad()\n",
 42 |     "loss.backward()\n",
 43 |     "optimizer.step()\n",
 44 |     "\n",
 45 |     "```\n",
 46 |     "\n",
 47 |     "\n",
 48 |     "- **L2-Regularization:**\n",
 49 |     "\n",
 50 |     "$$J(W;X,y) + \\frac {1}{2} \\lambda \\cdot {\\left \\| W \\right \\|}^2$$\n",
 51 |     "\n",
 52 |     "\n",
 53 |     "```Python\n",
 54 |     "optimizer = optim.SGD(net.parameters(),lr=learning_rate,weight_decay=0.01)\n",
 55 |     "```\n",
 56 |     "$\\lambda$ = 0.01\n",
 57 |     "\n"
 58 |    ]
 59 |   },
 60 |   {
 61 |    "cell_type": "markdown",
 62 |    "metadata": {},
 63 |    "source": [
 64 |     "## 6.4 动量与学习率衰减\n",
 65 |     "\n",
 66 |     "#### Momentum :\n",
 67 |     "\n",
 68 |     "$$\n",
 69 |     "w^{k+1} = w^k - \\alpha \\nabla f(w^k) \\\\\n",
 70 |     "        \\Downarrow \\\\\n",
 71 |     "z^{k+1} = \\beta z^k + \\nabla f(w^k) \\\\\n",
 72 |     "w^{k+1} = w^k - \\alpha z^{k+1}\n",
 73 |     "$$\n",
 74 |     "\n",
 75 |     "\n",
 76 |     "```Python\n",
 77 |     "\n",
 78 |     "optimizer = torch.optim.SGD(model.parameters(),args.lr,\n",
 79 |     "                            momentum = args.momentum,\n",
 80 |     "                            weight_decay = args.weight_decay)\n",
 81 |     "scheduler = ReduceLROnPlateau(optimizer,'min')\n",
 82 |     "\n",
 83 |     "for epoch in range(args.start_epoch,args.epoches):\n",
 84 |     "    train(train_loader,model,criterion,optimizer,epoch)\n",
 85 |     "    result_avg,loss_val = validate(val_loader,model,criterion,epoch)\n",
 86 |     "    scheduler.step(loss_val)\n",
 87 |     "    \n",
 88 |     "    \n",
 89 |     "```\n",
 90 |     "\n",
 91 |     "#### learning rate decay :\n",
 92 |     "\n",
 93 |     "```Python\n",
 94 |     "\n",
 95 |     "# Assuming optimizer uses lr = 0.05 for all groups\n",
 96 |     "# lr = 0.05  if epoch < 30\n",
 97 |     "# lr = 0.005 if 30 <= epoch < 60\n",
 98 |     "# lr = 0.0005 if 60 <= epoch < 90\n",
 99 |     "scheduler = StepLR(optimizer,step_size = 30, gamma=0.1)\n",
100 |     "for epoch in range(100):\n",
101 |     "    scheduler.step()\n",
102 |     "    train(...)\n",
103 |     "    validate(...)\n",
104 |     "```\n",
105 |     "\n"
106 |    ]
107 |   },
108 |   {
109 |    "cell_type": "markdown",
110 |    "metadata": {},
111 |    "source": [
112 |     "## 6.5 Early Stopping , Dropout , Stochastic Gradient Descent\n",
113 |     "\n",
114 |     "### Early Stopping : How-To:\n",
115 |     "- Validation set to select parameters\n",
116 |     "- Monitor validation performance\n",
117 |     "- Stop at the highest val performance\n",
118 |     "\n",
119 |     "\n",
120 |     "### Dropout\n",
121 |     "- Learning less to learn better\n",
122 |     "- Each connection is dropped with probability p (0 <= p <= 1)\n",
123 |     "\n",
124 |     "- torch.nn.Dropout(p=dropout_prob) -> p\n",
125 |     "- tf.nn.dropout(keep_prob) -> (1-p)\n",
126 |     "\n",
127 |     "#### 在val set 和 test set 中不使用dropout , net_dropped.eval()\n",
128 |     "```Python\n",
129 |     "for epoch in range(epoches):\n",
130 |     "    net_dropped.train()\n",
131 |     "    for batch_idx, (data,target) in enumerate(train_loader):\n",
132 |     "        ...\n",
133 |     "    net_dropped.eval()\n",
134 |     "    test_loss = 0\n",
135 |     "    correct = 0\n",
136 |     "    for data, target in test_loader:\n",
137 |     "        ...\n",
138 |     "\n",
139 |     "```\n",
140 |     "\n",
141 |     "\n",
142 |     "### Stochastic Gradient Descent (SGD)\n",
143 |     "- Stochastic\n",
144 |     " - not random!\n",
145 |     "- Deterministic\n",
146 |     "- 分批次进行梯度下降,每次进一个batch,显存没那么大,无法一次性装入所有数据\n"
147 |    ]
148 |   },
149 |   {
150 |    "cell_type": "code",
151 |    "execution_count": null,
152 |    "metadata": {},
153 |    "outputs": [],
154 |    "source": []
155 |   }
156 |  ],
157 |  "metadata": {
158 |   "kernelspec": {
159 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
160 |    "language": "python",
161 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
162 |   },
163 |   "language_info": {
164 |    "codemirror_mode": {
165 |     "name": "ipython",
166 |     "version": 3
167 |    },
168 |    "file_extension": ".py",
169 |    "mimetype": "text/x-python",
170 |    "name": "python",
171 |    "nbconvert_exporter": "python",
172 |    "pygments_lexer": "ipython3",
173 |    "version": "3.5.6"
174 |   },
175 |   "latex_envs": {
176 |    "LaTeX_envs_menu_present": true,
177 |    "autoclose": false,
178 |    "autocomplete": true,
179 |    "bibliofile": "biblio.bib",
180 |    "cite_by": "apalike",
181 |    "current_citInitial": 1,
182 |    "eqLabelWithNumbers": true,
183 |    "eqNumInitial": 1,
184 |    "hotkeys": {
185 |     "equation": "Ctrl-E",
186 |     "itemize": "Ctrl-I"
187 |    },
188 |    "labels_anchors": false,
189 |    "latex_user_defs": false,
190 |    "report_style_numbering": false,
191 |    "user_envs_cfg": false
192 |   },
193 |   "varInspector": {
194 |    "cols": {
195 |     "lenName": 16,
196 |     "lenType": 16,
197 |     "lenVar": 40
198 |    },
199 |    "kernels_config": {
200 |     "python": {
201 |      "delete_cmd_postfix": "",
202 |      "delete_cmd_prefix": "del ",
203 |      "library": "var_list.py",
204 |      "varRefreshCmd": "print(var_dic_list())"
205 |     },
206 |     "r": {
207 |      "delete_cmd_postfix": ") ",
208 |      "delete_cmd_prefix": "rm(",
209 |      "library": "var_list.r",
210 |      "varRefreshCmd": "cat(var_dic_list()) "
211 |     }
212 |    },
213 |    "types_to_exclude": [
214 |     "module",
215 |     "function",
216 |     "builtin_function_or_method",
217 |     "instance",
218 |     "_Feature"
219 |    ],
220 |    "window_display": false
221 |   }
222 |  },
223 |  "nbformat": 4,
224 |  "nbformat_minor": 2
225 | }
226 | 


--------------------------------------------------------------------------------
/ch06_过拟合与欠拟合_交叉验证_正则化/.ipynb_checkpoints/ch06_过拟合与欠拟合-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "## 6.1 过拟合与欠拟合\n",
  8 |     "\n",
  9 |     "- **Underfitted 欠拟合**\n",
 10 |     " - train acc. is bad\n",
 11 |     " - test acc. is bad as well\n",
 12 |     " \n",
 13 |     "- **Overfitted 过拟合**\n",
 14 |     " - train loss and acc. is much better\n",
 15 |     " - test acc. is worse\n",
 16 |     " - ->Generalization Performance 泛化能力"
 17 |    ]
 18 |   },
 19 |   {
 20 |    "cell_type": "markdown",
 21 |    "metadata": {},
 22 |    "source": [
 23 |     "## 6.2 交叉验证"
 24 |    ]
 25 |   },
 26 |   {
 27 |    "cell_type": "markdown",
 28 |    "metadata": {},
 29 |    "source": [
 30 |     "### Splitting -> Train Set & Test Set :"
 31 |    ]
 32 |   },
 33 |   {
 34 |    "cell_type": "code",
 35 |    "execution_count": 2,
 36 |    "metadata": {},
 37 |    "outputs": [],
 38 |    "source": [
 39 |     "import torch\n",
 40 |     "from torchvision import transforms , datasets"
 41 |    ]
 42 |   },
 43 |   {
 44 |    "cell_type": "code",
 45 |    "execution_count": 16,
 46 |    "metadata": {},
 47 |    "outputs": [],
 48 |    "source": [
 49 |     "train_loader = torch.utils.data.DataLoader(\n",
 50 |     "    datasets.MNIST('../data/',\n",
 51 |     "                   train=True,\n",
 52 |     "                   download=True,\n",
 53 |     "                   transform=transforms.Compose([\n",
 54 |     "                       transforms.ToTensor(),\n",
 55 |     "                       transforms.Normalize((0.1307, ), (0.3081, ))\n",
 56 |     "                   ])),\n",
 57 |     "                   \n",
 58 |     "                   shuffle=True)\n",
 59 |     "    \n",
 60 |     "test_loader = torch.utils.data.DataLoader(\n",
 61 |     "    datasets.MNIST('../data/',\n",
 62 |     "                   train=False,\n",
 63 |     "                   transform=transforms.Compose([\n",
 64 |     "                       transforms.ToTensor(),\n",
 65 |     "                       transforms.Normalize((0.1307, ), (0.3081, ))])),\n",
 66 |     "                   shuffle=False)"
 67 |    ]
 68 |   },
 69 |   {
 70 |    "cell_type": "markdown",
 71 |    "metadata": {},
 72 |    "source": [
 73 |     "### Splitting -> Train Set & Val Set & Test Set :"
 74 |    ]
 75 |   },
 76 |   {
 77 |    "cell_type": "code",
 78 |    "execution_count": 17,
 79 |    "metadata": {},
 80 |    "outputs": [
 81 |     {
 82 |      "name": "stdout",
 83 |      "output_type": "stream",
 84 |      "text": [
 85 |       "train_:  60000 test:  10000\n",
 86 |       "train: 50000   val: 10000\n",
 87 |       "train: 782   val: 157\n"
 88 |      ]
 89 |     }
 90 |    ],
 91 |    "source": [
 92 |     "print('train_: ',len(train_loader),'test: ',len(test_loader))\n",
 93 |     "train_db,val_db = torch.utils.data.random_split(train_loader,[50000,10000])\n",
 94 |     "print('train:',len(train_db),'  val:',len(val_db))\n",
 95 |     "\n",
 96 |     "train_loader = torch.utils.data.DataLoader(\n",
 97 |     "    train_db,batch_size=64,shuffle=True)\n",
 98 |     "\n",
 99 |     "val_loader = torch.utils.data.DataLoader(\n",
100 |     "    val_db,batch_size=64,shuffle=True)\n",
101 |     "\n",
102 |     "print('train:',len(train_loader),'  val:',len(val_loader))"
103 |    ]
104 |   },
105 |   {
106 |    "cell_type": "markdown",
107 |    "metadata": {},
108 |    "source": [
109 |     "## K-fold cross-validation :\n",
110 |     "\n",
111 |     "- merge train/val sets\n",
112 |     "- randomly sample 1/k as val set\n",
113 |     "\n",
114 |     "\n",
115 |     "如果数据区间为[0,70k],根据上述划分:\n",
116 |     "- [0,50k]为train set,\n",
117 |     "- [50k,60k]为val set,\n",
118 |     "- [60k,70k]为test set\n",
119 |     "\n",
120 |     "上面这个方法,val-set的数据没有参与训练的反向传播,\n",
121 |     "而 K-fold Cross-Validation的划分为:\n",
122 |     "- epoch 1:\n",
123 |     " - [0,50k] -> train set,\n",
124 |     " - [50k,60k] -> val set,\n",
125 |     " - [60k,70k] -> test set\n",
126 |     "\n",
127 |     "- epoch 2:\n",
128 |     " - [0,40k] [50k,60k] -> train set,\n",
129 |     " - [40k,50k] -> val set,\n",
130 |     " - [60k,70k] -> test set\n",
131 |     " \n",
132 |     "- epoch 3:\n",
133 |     " - [0,30k] [40k,60k] -> train set,\n",
134 |     " - [30k,40k] -> val set,\n",
135 |     " - [60k,70k] -> test set\n",
136 |     " \n",
137 |     "- ....\n",
138 |     "\n",
139 |     "具体实践中的划分视情况而定,上面的例子主要是为了表达 K-fold Cross-Validation 的思想\n",
140 |     "\n"
141 |    ]
142 |   },
143 |   {
144 |    "cell_type": "code",
145 |    "execution_count": null,
146 |    "metadata": {},
147 |    "outputs": [],
148 |    "source": []
149 |   }
150 |  ],
151 |  "metadata": {
152 |   "kernelspec": {
153 |    "display_name": "Python [default]",
154 |    "language": "python",
155 |    "name": "python3"
156 |   },
157 |   "language_info": {
158 |    "codemirror_mode": {
159 |     "name": "ipython",
160 |     "version": 3
161 |    },
162 |    "file_extension": ".py",
163 |    "mimetype": "text/x-python",
164 |    "name": "python",
165 |    "nbconvert_exporter": "python",
166 |    "pygments_lexer": "ipython3",
167 |    "version": "3.5.6"
168 |   },
169 |   "latex_envs": {
170 |    "LaTeX_envs_menu_present": true,
171 |    "autoclose": false,
172 |    "autocomplete": true,
173 |    "bibliofile": "biblio.bib",
174 |    "cite_by": "apalike",
175 |    "current_citInitial": 1,
176 |    "eqLabelWithNumbers": true,
177 |    "eqNumInitial": 1,
178 |    "hotkeys": {
179 |     "equation": "Ctrl-E",
180 |     "itemize": "Ctrl-I"
181 |    },
182 |    "labels_anchors": false,
183 |    "latex_user_defs": false,
184 |    "report_style_numbering": false,
185 |    "user_envs_cfg": false
186 |   },
187 |   "varInspector": {
188 |    "cols": {
189 |     "lenName": 16,
190 |     "lenType": 16,
191 |     "lenVar": 40
192 |    },
193 |    "kernels_config": {
194 |     "python": {
195 |      "delete_cmd_postfix": "",
196 |      "delete_cmd_prefix": "del ",
197 |      "library": "var_list.py",
198 |      "varRefreshCmd": "print(var_dic_list())"
199 |     },
200 |     "r": {
201 |      "delete_cmd_postfix": ") ",
202 |      "delete_cmd_prefix": "rm(",
203 |      "library": "var_list.r",
204 |      "varRefreshCmd": "cat(var_dic_list()) "
205 |     }
206 |    },
207 |    "types_to_exclude": [
208 |     "module",
209 |     "function",
210 |     "builtin_function_or_method",
211 |     "instance",
212 |     "_Feature"
213 |    ],
214 |    "window_display": false
215 |   }
216 |  },
217 |  "nbformat": 4,
218 |  "nbformat_minor": 2
219 | }
220 | 


--------------------------------------------------------------------------------
/ch06_过拟合与欠拟合_交叉验证_正则化/ch06_ 正则化_动量与学习率衰减_早停_dropout.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# ch06_ 正则化_动量与学习率衰减_早停_dropout"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "\n",
 15 |     "## Reduce Overfitting\n",
 16 |     "- More Data\n",
 17 |     "- Constrain model complexity\n",
 18 |     " - shallow\n",
 19 |     " - regularization\n",
 20 |     "- Dropout\n",
 21 |     "- Data augmentation\n",
 22 |     "- Early Stopping\n",
 23 |     "\n",
 24 |     "## 6.3 Regularization 正则化 (Weight Decay)\n",
 25 |     "\n",
 26 |     "$$ J(\\theta) = - \\frac{1}{m} \\sum_{i=1}^{m} \\left [y_i \\ln \\hat{y_i} + (1-y_i)\\ln (1-\\hat{y_i}) \\right ] + \\lambda \\sum_{i=1}^n \\left | \\theta_i \\right |$$\n",
 27 |     "\n",
 28 |     "\n",
 29 |     "- **L1-Regularization:**\n",
 30 |     "\n",
 31 |     "$$J(\\theta) = - \\frac{1}{m} \\sum_{i=1}^m \\left [ y_i \\ln \\hat{y_i} + (1-y_i)\\ln (1- \\hat{y_i}) \\right ] + \\lambda \\sum_{i=1}^{n}\\left | \\theta_i \\right |$$\n",
 32 |     "\n",
 33 |     "```Python\n",
 34 |     "regularization_loss = 0\n",
 35 |     "for param in model.parameters():\n",
 36 |     "    regularization_loss += torch.sum(torch.abs(param))\n",
 37 |     "    \n",
 38 |     "classify_loss = criteon(logits,target)\n",
 39 |     "loss = classify_loss + 0.01 * regularization_loss\n",
 40 |     "\n",
 41 |     "optimizer.zero_grad()\n",
 42 |     "loss.backward()\n",
 43 |     "optimizer.step()\n",
 44 |     "\n",
 45 |     "```\n",
 46 |     "\n",
 47 |     "\n",
 48 |     "- **L2-Regularization:**\n",
 49 |     "\n",
 50 |     "$$J(W;X,y) + \\frac {1}{2} \\lambda \\cdot {\\left \\| W \\right \\|}^2$$\n",
 51 |     "\n",
 52 |     "\n",
 53 |     "```Python\n",
 54 |     "optimizer = optim.SGD(net.parameters(),lr=learning_rate,weight_decay=0.01)\n",
 55 |     "```\n",
 56 |     "$\\lambda$ = 0.01\n",
 57 |     "\n"
 58 |    ]
 59 |   },
 60 |   {
 61 |    "cell_type": "markdown",
 62 |    "metadata": {},
 63 |    "source": [
 64 |     "## 6.4 动量与学习率衰减\n",
 65 |     "\n",
 66 |     "#### Momentum :\n",
 67 |     "\n",
 68 |     "$$\n",
 69 |     "w^{k+1} = w^k - \\alpha \\nabla f(w^k) \\\\\n",
 70 |     "        \\Downarrow \\\\\n",
 71 |     "z^{k+1} = \\beta z^k + \\nabla f(w^k) \\\\\n",
 72 |     "w^{k+1} = w^k - \\alpha z^{k+1}\n",
 73 |     "$$\n",
 74 |     "\n",
 75 |     "\n",
 76 |     "```Python\n",
 77 |     "\n",
 78 |     "optimizer = torch.optim.SGD(model.parameters(),args.lr,\n",
 79 |     "                            momentum = args.momentum,\n",
 80 |     "                            weight_decay = args.weight_decay)\n",
 81 |     "scheduler = ReduceLROnPlateau(optimizer,'min')\n",
 82 |     "\n",
 83 |     "for epoch in range(args.start_epoch,args.epoches):\n",
 84 |     "    train(train_loader,model,criterion,optimizer,epoch)\n",
 85 |     "    result_avg,loss_val = validate(val_loader,model,criterion,epoch)\n",
 86 |     "    scheduler.step(loss_val)\n",
 87 |     "    \n",
 88 |     "    \n",
 89 |     "```\n",
 90 |     "\n",
 91 |     "#### learning rate decay :\n",
 92 |     "\n",
 93 |     "```Python\n",
 94 |     "\n",
 95 |     "# Assuming optimizer uses lr = 0.05 for all groups\n",
 96 |     "# lr = 0.05  if epoch < 30\n",
 97 |     "# lr = 0.005 if 30 <= epoch < 60\n",
 98 |     "# lr = 0.0005 if 60 <= epoch < 90\n",
 99 |     "scheduler = StepLR(optimizer,step_size = 30, gamma=0.1)\n",
100 |     "for epoch in range(100):\n",
101 |     "    scheduler.step()\n",
102 |     "    train(...)\n",
103 |     "    validate(...)\n",
104 |     "```\n",
105 |     "\n"
106 |    ]
107 |   },
108 |   {
109 |    "cell_type": "markdown",
110 |    "metadata": {},
111 |    "source": [
112 |     "## 6.5 Early Stopping , Dropout , Stochastic Gradient Descent\n",
113 |     "\n",
114 |     "### Early Stopping : How-To:\n",
115 |     "- Validation set to select parameters\n",
116 |     "- Monitor validation performance\n",
117 |     "- Stop at the highest val performance\n",
118 |     "\n",
119 |     "\n",
120 |     "### Dropout\n",
121 |     "- Learning less to learn better\n",
122 |     "- Each connection is dropped with probability p (0 <= p <= 1)\n",
123 |     "\n",
124 |     "- torch.nn.Dropout(p=dropout_prob) -> p\n",
125 |     "- tf.nn.dropout(keep_prob) -> (1-p)\n",
126 |     "\n",
127 |     "#### 在val set 和 test set 中不使用dropout , net_dropped.eval()\n",
128 |     "```Python\n",
129 |     "for epoch in range(epoches):\n",
130 |     "    net_dropped.train()\n",
131 |     "    for batch_idx, (data,target) in enumerate(train_loader):\n",
132 |     "        ...\n",
133 |     "    net_dropped.eval()\n",
134 |     "    test_loss = 0\n",
135 |     "    correct = 0\n",
136 |     "    for data, target in test_loader:\n",
137 |     "        ...\n",
138 |     "\n",
139 |     "```\n",
140 |     "\n",
141 |     "\n",
142 |     "### Stochastic Gradient Descent (SGD)\n",
143 |     "- Stochastic\n",
144 |     " - not random!\n",
145 |     "- Deterministic\n",
146 |     "- 分批次进行梯度下降,每次进一个batch,显存没那么大,无法一次性装入所有数据\n"
147 |    ]
148 |   },
149 |   {
150 |    "cell_type": "code",
151 |    "execution_count": null,
152 |    "metadata": {},
153 |    "outputs": [],
154 |    "source": []
155 |   }
156 |  ],
157 |  "metadata": {
158 |   "kernelspec": {
159 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
160 |    "language": "python",
161 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
162 |   },
163 |   "language_info": {
164 |    "codemirror_mode": {
165 |     "name": "ipython",
166 |     "version": 3
167 |    },
168 |    "file_extension": ".py",
169 |    "mimetype": "text/x-python",
170 |    "name": "python",
171 |    "nbconvert_exporter": "python",
172 |    "pygments_lexer": "ipython3",
173 |    "version": "3.5.6"
174 |   },
175 |   "latex_envs": {
176 |    "LaTeX_envs_menu_present": true,
177 |    "autoclose": false,
178 |    "autocomplete": true,
179 |    "bibliofile": "biblio.bib",
180 |    "cite_by": "apalike",
181 |    "current_citInitial": 1,
182 |    "eqLabelWithNumbers": true,
183 |    "eqNumInitial": 1,
184 |    "hotkeys": {
185 |     "equation": "Ctrl-E",
186 |     "itemize": "Ctrl-I"
187 |    },
188 |    "labels_anchors": false,
189 |    "latex_user_defs": false,
190 |    "report_style_numbering": false,
191 |    "user_envs_cfg": false
192 |   },
193 |   "varInspector": {
194 |    "cols": {
195 |     "lenName": 16,
196 |     "lenType": 16,
197 |     "lenVar": 40
198 |    },
199 |    "kernels_config": {
200 |     "python": {
201 |      "delete_cmd_postfix": "",
202 |      "delete_cmd_prefix": "del ",
203 |      "library": "var_list.py",
204 |      "varRefreshCmd": "print(var_dic_list())"
205 |     },
206 |     "r": {
207 |      "delete_cmd_postfix": ") ",
208 |      "delete_cmd_prefix": "rm(",
209 |      "library": "var_list.r",
210 |      "varRefreshCmd": "cat(var_dic_list()) "
211 |     }
212 |    },
213 |    "types_to_exclude": [
214 |     "module",
215 |     "function",
216 |     "builtin_function_or_method",
217 |     "instance",
218 |     "_Feature"
219 |    ],
220 |    "window_display": false
221 |   }
222 |  },
223 |  "nbformat": 4,
224 |  "nbformat_minor": 2
225 | }
226 | 


--------------------------------------------------------------------------------
/ch06_过拟合与欠拟合_交叉验证_正则化/ch06_过拟合与欠拟合.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "## 6.1 过拟合与欠拟合\n",
  8 |     "\n",
  9 |     "- **Underfitted 欠拟合**\n",
 10 |     " - train acc. is bad\n",
 11 |     " - test acc. is bad as well\n",
 12 |     " \n",
 13 |     "- **Overfitted 过拟合**\n",
 14 |     " - train loss and acc. is much better\n",
 15 |     " - test acc. is worse\n",
 16 |     " - ->Generalization Performance 泛化能力"
 17 |    ]
 18 |   },
 19 |   {
 20 |    "cell_type": "markdown",
 21 |    "metadata": {},
 22 |    "source": [
 23 |     "## 6.2 交叉验证"
 24 |    ]
 25 |   },
 26 |   {
 27 |    "cell_type": "markdown",
 28 |    "metadata": {},
 29 |    "source": [
 30 |     "### Splitting -> Train Set & Test Set :"
 31 |    ]
 32 |   },
 33 |   {
 34 |    "cell_type": "code",
 35 |    "execution_count": 2,
 36 |    "metadata": {},
 37 |    "outputs": [],
 38 |    "source": [
 39 |     "import torch\n",
 40 |     "from torchvision import transforms , datasets"
 41 |    ]
 42 |   },
 43 |   {
 44 |    "cell_type": "code",
 45 |    "execution_count": 16,
 46 |    "metadata": {},
 47 |    "outputs": [],
 48 |    "source": [
 49 |     "train_loader = torch.utils.data.DataLoader(\n",
 50 |     "    datasets.MNIST('../data/',\n",
 51 |     "                   train=True,\n",
 52 |     "                   download=True,\n",
 53 |     "                   transform=transforms.Compose([\n",
 54 |     "                       transforms.ToTensor(),\n",
 55 |     "                       transforms.Normalize((0.1307, ), (0.3081, ))\n",
 56 |     "                   ])),\n",
 57 |     "                   \n",
 58 |     "                   shuffle=True)\n",
 59 |     "    \n",
 60 |     "test_loader = torch.utils.data.DataLoader(\n",
 61 |     "    datasets.MNIST('../data/',\n",
 62 |     "                   train=False,\n",
 63 |     "                   transform=transforms.Compose([\n",
 64 |     "                       transforms.ToTensor(),\n",
 65 |     "                       transforms.Normalize((0.1307, ), (0.3081, ))])),\n",
 66 |     "                   shuffle=False)"
 67 |    ]
 68 |   },
 69 |   {
 70 |    "cell_type": "markdown",
 71 |    "metadata": {},
 72 |    "source": [
 73 |     "### Splitting -> Train Set & Val Set & Test Set :"
 74 |    ]
 75 |   },
 76 |   {
 77 |    "cell_type": "code",
 78 |    "execution_count": 17,
 79 |    "metadata": {},
 80 |    "outputs": [
 81 |     {
 82 |      "name": "stdout",
 83 |      "output_type": "stream",
 84 |      "text": [
 85 |       "train_:  60000 test:  10000\n",
 86 |       "train: 50000   val: 10000\n",
 87 |       "train: 782   val: 157\n"
 88 |      ]
 89 |     }
 90 |    ],
 91 |    "source": [
 92 |     "print('train_: ',len(train_loader),'test: ',len(test_loader))\n",
 93 |     "train_db,val_db = torch.utils.data.random_split(train_loader,[50000,10000])\n",
 94 |     "print('train:',len(train_db),'  val:',len(val_db))\n",
 95 |     "\n",
 96 |     "train_loader = torch.utils.data.DataLoader(\n",
 97 |     "    train_db,batch_size=64,shuffle=True)\n",
 98 |     "\n",
 99 |     "val_loader = torch.utils.data.DataLoader(\n",
100 |     "    val_db,batch_size=64,shuffle=True)\n",
101 |     "\n",
102 |     "print('train:',len(train_loader),'  val:',len(val_loader))"
103 |    ]
104 |   },
105 |   {
106 |    "cell_type": "markdown",
107 |    "metadata": {},
108 |    "source": [
109 |     "## K-fold cross-validation :\n",
110 |     "\n",
111 |     "- merge train/val sets\n",
112 |     "- randomly sample 1/k as val set\n",
113 |     "\n",
114 |     "\n",
115 |     "如果数据区间为[0,70k],根据上述划分:\n",
116 |     "- [0,50k]为train set,\n",
117 |     "- [50k,60k]为val set,\n",
118 |     "- [60k,70k]为test set\n",
119 |     "\n",
120 |     "上面这个方法,val-set的数据没有参与训练的反向传播,\n",
121 |     "而 K-fold Cross-Validation的划分为:\n",
122 |     "- epoch 1:\n",
123 |     " - [0,50k] -> train set,\n",
124 |     " - [50k,60k] -> val set,\n",
125 |     " - [60k,70k] -> test set\n",
126 |     "\n",
127 |     "- epoch 2:\n",
128 |     " - [0,40k] [50k,60k] -> train set,\n",
129 |     " - [40k,50k] -> val set,\n",
130 |     " - [60k,70k] -> test set\n",
131 |     " \n",
132 |     "- epoch 3:\n",
133 |     " - [0,30k] [40k,60k] -> train set,\n",
134 |     " - [30k,40k] -> val set,\n",
135 |     " - [60k,70k] -> test set\n",
136 |     " \n",
137 |     "- ....\n",
138 |     "\n",
139 |     "具体实践中的划分视情况而定,上面的例子主要是为了表达 K-fold Cross-Validation 的思想"
140 |    ]
141 |   },
142 |   {
143 |    "cell_type": "code",
144 |    "execution_count": null,
145 |    "metadata": {},
146 |    "outputs": [],
147 |    "source": []
148 |   }
149 |  ],
150 |  "metadata": {
151 |   "kernelspec": {
152 |    "display_name": "Python [default]",
153 |    "language": "python",
154 |    "name": "python3"
155 |   },
156 |   "language_info": {
157 |    "codemirror_mode": {
158 |     "name": "ipython",
159 |     "version": 3
160 |    },
161 |    "file_extension": ".py",
162 |    "mimetype": "text/x-python",
163 |    "name": "python",
164 |    "nbconvert_exporter": "python",
165 |    "pygments_lexer": "ipython3",
166 |    "version": "3.5.6"
167 |   },
168 |   "latex_envs": {
169 |    "LaTeX_envs_menu_present": true,
170 |    "autoclose": false,
171 |    "autocomplete": true,
172 |    "bibliofile": "biblio.bib",
173 |    "cite_by": "apalike",
174 |    "current_citInitial": 1,
175 |    "eqLabelWithNumbers": true,
176 |    "eqNumInitial": 1,
177 |    "hotkeys": {
178 |     "equation": "Ctrl-E",
179 |     "itemize": "Ctrl-I"
180 |    },
181 |    "labels_anchors": false,
182 |    "latex_user_defs": false,
183 |    "report_style_numbering": false,
184 |    "user_envs_cfg": false
185 |   },
186 |   "varInspector": {
187 |    "cols": {
188 |     "lenName": 16,
189 |     "lenType": 16,
190 |     "lenVar": 40
191 |    },
192 |    "kernels_config": {
193 |     "python": {
194 |      "delete_cmd_postfix": "",
195 |      "delete_cmd_prefix": "del ",
196 |      "library": "var_list.py",
197 |      "varRefreshCmd": "print(var_dic_list())"
198 |     },
199 |     "r": {
200 |      "delete_cmd_postfix": ") ",
201 |      "delete_cmd_prefix": "rm(",
202 |      "library": "var_list.r",
203 |      "varRefreshCmd": "cat(var_dic_list()) "
204 |     }
205 |    },
206 |    "types_to_exclude": [
207 |     "module",
208 |     "function",
209 |     "builtin_function_or_method",
210 |     "instance",
211 |     "_Feature"
212 |    ],
213 |    "window_display": false
214 |   }
215 |  },
216 |  "nbformat": 4,
217 |  "nbformat_minor": 2
218 | }
219 | 


--------------------------------------------------------------------------------
/ch07_卷积神经网络CNN/.ipynb_checkpoints/ch07_卷积神经网络基础-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# 7.1 卷积神经网络基础"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "### nn.Conv2d"
 15 |    ]
 16 |   },
 17 |   {
 18 |    "cell_type": "code",
 19 |    "execution_count": 1,
 20 |    "metadata": {},
 21 |    "outputs": [],
 22 |    "source": [
 23 |     "import torch\n",
 24 |     "from torch import nn"
 25 |    ]
 26 |   },
 27 |   {
 28 |    "cell_type": "markdown",
 29 |    "metadata": {},
 30 |    "source": [
 31 |     "$$Output\\_size = \\left \\lfloor \\frac{n + 2p - f}{s} + 1\\right \\rfloor \\times \\left \\lfloor \\frac{n + 2p - f}{s} + 1\\right \\rfloor$$\n",
 32 |     "\n"
 33 |    ]
 34 |   },
 35 |   {
 36 |    "cell_type": "code",
 37 |    "execution_count": 15,
 38 |    "metadata": {},
 39 |    "outputs": [
 40 |     {
 41 |      "name": "stdout",
 42 |      "output_type": "stream",
 43 |      "text": [
 44 |       "out1.shape: torch.Size([1, 3, 26, 26])\n",
 45 |       "out2.shape: torch.Size([1, 3, 28, 28])\n",
 46 |       "out3.shape: torch.Size([1, 4, 14, 14])\n"
 47 |      ]
 48 |     }
 49 |    ],
 50 |    "source": [
 51 |     "layer = nn.Conv2d(1,3,kernel_size=3,stride=1,padding=0)\n",
 52 |     "x = torch.rand(1,1,28,28)\n",
 53 |     "\n",
 54 |     "out = layer.forward(x) # 卷积运算\n",
 55 |     "print('out1.shape:',out.shape)\n",
 56 |     "\n",
 57 |     "layer = nn.Conv2d(1,3,kernel_size=3,stride=1,padding=1)\n",
 58 |     "out = layer.forward(x)\n",
 59 |     "print('out2.shape:',out.shape)\n",
 60 |     "\n",
 61 |     "layer = nn.Conv2d(1,4,kernel_size=3,stride=2,padding=1)\n",
 62 |     "out = layer.forward(x)\n",
 63 |     "print('out3.shape:',out.shape)"
 64 |    ]
 65 |   },
 66 |   {
 67 |    "cell_type": "markdown",
 68 |    "metadata": {},
 69 |    "source": [
 70 |     "### Inner weight & bias"
 71 |    ]
 72 |   },
 73 |   {
 74 |    "cell_type": "code",
 75 |    "execution_count": 16,
 76 |    "metadata": {},
 77 |    "outputs": [
 78 |     {
 79 |      "data": {
 80 |       "text/plain": [
 81 |        "Parameter containing:\n",
 82 |        "tensor([[[[-0.1704, -0.0875,  0.0579],\n",
 83 |        "          [ 0.2762,  0.2394, -0.0993],\n",
 84 |        "          [ 0.1446,  0.0253, -0.1044]]],\n",
 85 |        "\n",
 86 |        "\n",
 87 |        "        [[[-0.1198, -0.3039, -0.3194],\n",
 88 |        "          [ 0.2971, -0.2700, -0.0318],\n",
 89 |        "          [ 0.1160,  0.1986, -0.3255]]],\n",
 90 |        "\n",
 91 |        "\n",
 92 |        "        [[[-0.1016,  0.0956, -0.0222],\n",
 93 |        "          [ 0.1155,  0.1237,  0.1385],\n",
 94 |        "          [ 0.2375, -0.2012,  0.3073]]],\n",
 95 |        "\n",
 96 |        "\n",
 97 |        "        [[[-0.3036,  0.2053,  0.2781],\n",
 98 |        "          [-0.0271, -0.0822, -0.0675],\n",
 99 |        "          [ 0.2384, -0.2601,  0.0878]]]], requires_grad=True)"
100 |       ]
101 |      },
102 |      "execution_count": 16,
103 |      "metadata": {},
104 |      "output_type": "execute_result"
105 |     }
106 |    ],
107 |    "source": [
108 |     "layer.weight"
109 |    ]
110 |   },
111 |   {
112 |    "cell_type": "code",
113 |    "execution_count": 17,
114 |    "metadata": {},
115 |    "outputs": [
116 |     {
117 |      "data": {
118 |       "text/plain": [
119 |        "torch.Size([4, 1, 3, 3])"
120 |       ]
121 |      },
122 |      "execution_count": 17,
123 |      "metadata": {},
124 |      "output_type": "execute_result"
125 |     }
126 |    ],
127 |    "source": [
128 |     "layer.weight.shape"
129 |    ]
130 |   },
131 |   {
132 |    "cell_type": "code",
133 |    "execution_count": 18,
134 |    "metadata": {},
135 |    "outputs": [
136 |     {
137 |      "data": {
138 |       "text/plain": [
139 |        "torch.Size([4])"
140 |       ]
141 |      },
142 |      "execution_count": 18,
143 |      "metadata": {},
144 |      "output_type": "execute_result"
145 |     }
146 |    ],
147 |    "source": [
148 |     "layer.bias.shape"
149 |    ]
150 |   },
151 |   {
152 |    "cell_type": "markdown",
153 |    "metadata": {},
154 |    "source": [
155 |     "### F.conv2d"
156 |    ]
157 |   },
158 |   {
159 |    "cell_type": "code",
160 |    "execution_count": 23,
161 |    "metadata": {},
162 |    "outputs": [],
163 |    "source": [
164 |     "from torch.nn import functional as F\n",
165 |     "x = torch.randn(1,3,28,28) # x 和 w 的 channel 值要相同,均为3\n",
166 |     "w = torch.rand(16,3,5,5)\n",
167 |     "b = torch.rand(16)"
168 |    ]
169 |   },
170 |   {
171 |    "cell_type": "code",
172 |    "execution_count": 27,
173 |    "metadata": {},
174 |    "outputs": [
175 |     {
176 |      "name": "stdout",
177 |      "output_type": "stream",
178 |      "text": [
179 |       "x.shape:  torch.Size([1, 3, 28, 28])\n",
180 |       "out.shape:  torch.Size([1, 16, 14, 14])\n"
181 |      ]
182 |     }
183 |    ],
184 |    "source": [
185 |     "out = F.conv2d(x,w,b,stride=2,padding=2)\n",
186 |     "print('x.shape: ',x.shape)\n",
187 |     "print('out.shape: ',out.shape)"
188 |    ]
189 |   },
190 |   {
191 |    "cell_type": "markdown",
192 |    "metadata": {},
193 |    "source": [
194 |     "# 7.2 Down/Up Sample 池化层与采样 ReLU层"
195 |    ]
196 |   },
197 |   {
198 |    "cell_type": "markdown",
199 |    "metadata": {},
200 |    "source": [
201 |     "### Max Pooling\n",
202 |     "\n",
203 |     "### Avg Pooling\n"
204 |    ]
205 |   },
206 |   {
207 |    "cell_type": "code",
208 |    "execution_count": 28,
209 |    "metadata": {},
210 |    "outputs": [
211 |     {
212 |      "name": "stdout",
213 |      "output_type": "stream",
214 |      "text": [
215 |       "x.shape:  torch.Size([1, 16, 14, 14])\n",
216 |       "out1.shape:  torch.Size([1, 16, 7, 7])\n",
217 |       "out2.shape:  torch.Size([1, 16, 7, 7])\n"
218 |      ]
219 |     }
220 |    ],
221 |    "source": [
222 |     "x = out\n",
223 |     "print('x.shape: ',x.shape)\n",
224 |     "\n",
225 |     "layer = nn.MaxPool2d(2,stride=2)\n",
226 |     "\n",
227 |     "out1 = layer(x)\n",
228 |     "print('out1.shape: ',out1.shape)\n",
229 |     "\n",
230 |     "out2 = F.avg_pool2d(x,2,stride=2)\n",
231 |     "print('out2.shape: ',out2.shape)"
232 |    ]
233 |   },
234 |   {
235 |    "cell_type": "markdown",
236 |    "metadata": {},
237 |    "source": [
238 |     "### UpSample \n",
239 |     "\n",
240 |     "#### F.interpolate( )"
241 |    ]
242 |   },
243 |   {
244 |    "cell_type": "code",
245 |    "execution_count": 30,
246 |    "metadata": {},
247 |    "outputs": [
248 |     {
249 |      "name": "stdout",
250 |      "output_type": "stream",
251 |      "text": [
252 |       "x.shape:  torch.Size([1, 16, 14, 14])\n",
253 |       "out.shape:  torch.Size([1, 16, 28, 28])\n"
254 |      ]
255 |     }
256 |    ],
257 |    "source": [
258 |     "x = out\n",
259 |     "print('x.shape: ',x.shape)\n",
260 |     "out = F.interpolate(x,scale_factor=2,mode='nearest')\n",
261 |     "print('out.shape: ',out.shape)"
262 |    ]
263 |   },
264 |   {
265 |    "cell_type": "markdown",
266 |    "metadata": {},
267 |    "source": [
268 |     "### ReLU层"
269 |    ]
270 |   },
271 |   {
272 |    "cell_type": "code",
273 |    "execution_count": 33,
274 |    "metadata": {},
275 |    "outputs": [
276 |     {
277 |      "name": "stdout",
278 |      "output_type": "stream",
279 |      "text": [
280 |       "x.shape:  torch.Size([1, 16, 14, 14])\n",
281 |       "layer = nn.ReLU(inplace=True), inplace=True可以节省内存一半空间\n",
282 |       "out.shape:  torch.Size([1, 16, 14, 14])\n"
283 |      ]
284 |     }
285 |    ],
286 |    "source": [
287 |     "print('x.shape: ',x.shape)\n",
288 |     "\n",
289 |     "layer = nn.ReLU(inplace=True)\n",
290 |     "print('layer = nn.ReLU(inplace=True), inplace=True可以节省内存一半空间')\n",
291 |     "out = layer(x)\n",
292 |     "print('out.shape: ',out.shape)"
293 |    ]
294 |   },
295 |   {
296 |    "cell_type": "code",
297 |    "execution_count": 34,
298 |    "metadata": {},
299 |    "outputs": [
300 |     {
301 |      "name": "stdout",
302 |      "output_type": "stream",
303 |      "text": [
304 |       "out.shape:  torch.Size([1, 16, 14, 14])\n"
305 |      ]
306 |     }
307 |    ],
308 |    "source": [
309 |     "out = F.relu(x)\n",
310 |     "print('out.shape: ',out.shape)"
311 |    ]
312 |   },
313 |   {
314 |    "cell_type": "markdown",
315 |    "metadata": {},
316 |    "source": [
317 |     "# 7.3 Batch Norm\n",
318 |     "\n",
319 |     "### Feature Scaling\n",
320 |     "- Image Normalization:\n",
321 |     "```Python\n",
322 |     "normalize = transforms.Normalize(mean=[0.485,0.456,0.406],\n",
323 |     "                                 std=[0.229,0.224,0.225])\n",
324 |     "# RGB 各通道的均值和标准差\n",
325 |     "```\n",
326 |     "- Batch Normalization:\n",
327 |     "\n",
328 |     "$\\text{Algorithm: Batch Normalizing Transform, applied to activation } x \\text{ over a mini-batch.}$\n",
329 |     "\n",
330 |     "$\\text{Input: Values of } x \\text{ over a mini-batch: } \\mathcal{B} = \\{ x_{1 \\ldots m}\\}; $\n",
331 |     "$\\text{Output: } \\{ y_i = BN_{\\gamma , \\beta}(x_i)\\} $\n",
332 |     "\n",
333 |     "$$\\text{mini-batch mean: } \\mu_{\\mathcal{B}} \\leftarrow \\frac{1}{m}\\sum_{i=1}^m x_i $$\n",
334 |     "\n",
335 |     "$$\\text{mini-batch variance: } \\sigma_{\\mathcal{B}}^2 \\leftarrow \\frac{1}{m} \\sum_{i=1}^m (x_i-\\mu_\\mathcal{B})^2 $$\n",
336 |     "\n",
337 |     "$$\\text{normalize: } \\hat{x_i} \\leftarrow \\frac{x_i - \\mu_{\\mathcal{B}}}{\\sqrt{\\sigma_\\mathcal{B}^2 + \\varepsilon }}$$\n",
338 |     "\n",
339 |     "$$\\text{scale and shift: } y_i \\leftarrow \\gamma \\hat{x_i} + \\beta \\equiv BN_{\\gamma , \\beta}(x_i)$$\n",
340 |     "\n"
341 |    ]
342 |   },
343 |   {
344 |    "cell_type": "markdown",
345 |    "metadata": {},
346 |    "source": [
347 |     "### nn.BatchNorm1d"
348 |    ]
349 |   },
350 |   {
351 |    "cell_type": "code",
352 |    "execution_count": 38,
353 |    "metadata": {},
354 |    "outputs": [
355 |     {
356 |      "name": "stdout",
357 |      "output_type": "stream",
358 |      "text": [
359 |       "x.shape:  torch.Size([100, 16, 784])\n"
360 |      ]
361 |     }
362 |    ],
363 |    "source": [
364 |     "x = torch.randn(100,16,784) # 784 = 28*28\n",
365 |     "print('x.shape: ',x.shape)\n",
366 |     "layer = nn.BatchNorm1d(16)\n",
367 |     "out = layer(x)"
368 |    ]
369 |   },
370 |   {
371 |    "cell_type": "markdown",
372 |    "metadata": {},
373 |    "source": [
374 |     "**nn.BatchNorm1d(16)的参数16为channel通道数,BatchNorm的统计数据是逐通道(per-channel)计算的:对每个channel,在batch维和其余维度上求均值和方差;有多少个channel,就计算多少组均值和方差,16个channel就生成长度为16的统计信息,每个元素对应一个channel的均值或方差**"
375 |    ]
376 |   },
377 |   {
378 |    "cell_type": "code",
379 |    "execution_count": 39,
380 |    "metadata": {},
381 |    "outputs": [
382 |     {
383 |      "name": "stdout",
384 |      "output_type": "stream",
385 |      "text": [
386 |       "layer.running_mean: \n",
387 |       "tensor([-4.5907e-04,  8.6306e-05, -7.4280e-04, -6.2997e-04, -6.4749e-04,\n",
388 |       "         1.4273e-04, -3.9751e-05, -8.0233e-05,  2.4080e-04, -3.0221e-04,\n",
389 |       "         8.5041e-05,  1.8740e-04, -1.6602e-04, -6.1695e-05, -3.7739e-04,\n",
390 |       "         1.0307e-04])\n",
391 |       "layer.running_var: \n",
392 |       "tensor([1.0003, 0.9996, 1.0000, 1.0000, 1.0006, 1.0003, 1.0000, 1.0004, 1.0000,\n",
393 |       "        0.9994, 0.9999, 0.9996, 0.9997, 1.0008, 0.9995, 0.9999])\n"
394 |      ]
395 |     }
396 |    ],
397 |    "source": [
398 |     "print('layer.running_mean: ')\n",
399 |     "print(layer.running_mean)\n",
400 |     "print('layer.running_var: ')\n",
401 |     "print(layer.running_var)"
402 |    ]
403 |   },
404 |   {
405 |    "cell_type": "markdown",
406 |    "metadata": {},
407 |    "source": [
408 |     "### nn.BatchNorm2d\n",
409 |     "\n",
410 |     "layer.weight $ \\rightarrow \\space \\gamma \\ $\n",
411 |     "\n",
412 |     "layer.bias $ \\rightarrow \\space \\beta$"
413 |    ]
414 |   },
415 |   {
416 |    "cell_type": "code",
417 |    "execution_count": 41,
418 |    "metadata": {},
419 |    "outputs": [
420 |     {
421 |      "name": "stdout",
422 |      "output_type": "stream",
423 |      "text": [
424 |       "x.shape:  torch.Size([6, 16, 28, 28])\n",
425 |       "After BatchNorm2d(16), out.shape:  torch.Size([6, 16, 28, 28])\n",
426 |       "layer.weight.shape:  torch.Size([16])\n",
427 |       "layer.bias.shape:  torch.Size([16])\n"
428 |      ]
429 |     }
430 |    ],
431 |    "source": [
432 |     "x = torch.rand(6,16,28,28)\n",
433 |     "print('x.shape: ',x.shape)\n",
434 |     "layer = nn.BatchNorm2d(16)\n",
435 |     "out = layer(x)\n",
436 |     "print('After BatchNorm2d(16), out.shape: ',out.shape)\n",
437 |     "\n",
438 |     "print('layer.weight.shape: ',layer.weight.shape)\n",
439 |     "print('layer.bias.shape: ',layer.bias.shape)"
440 |    ]
441 |   },
442 |   {
443 |    "cell_type": "code",
444 |    "execution_count": 43,
445 |    "metadata": {},
446 |    "outputs": [
447 |     {
448 |      "name": "stdout",
449 |      "output_type": "stream",
450 |      "text": [
451 |       "vars()方法打印所有参数:\n"
452 |      ]
453 |     },
454 |     {
455 |      "data": {
456 |       "text/plain": [
457 |        "{'_backward_hooks': OrderedDict(),\n",
458 |        " '_buffers': OrderedDict([('running_mean',\n",
459 |        "               tensor([0.0501, 0.0498, 0.0502, 0.0494, 0.0505, 0.0503, 0.0507, 0.0497, 0.0508,\n",
460 |        "                       0.0509, 0.0500, 0.0496, 0.0496, 0.0510, 0.0501, 0.0502])),\n",
461 |        "              ('running_var',\n",
462 |        "               tensor([0.9084, 0.9082, 0.9082, 0.9082, 0.9084, 0.9082, 0.9084, 0.9083, 0.9083,\n",
463 |        "                       0.9084, 0.9082, 0.9083, 0.9085, 0.9083, 0.9083, 0.9084])),\n",
464 |        "              ('num_batches_tracked', tensor(1))]),\n",
465 |        " '_forward_hooks': OrderedDict(),\n",
466 |        " '_forward_pre_hooks': OrderedDict(),\n",
467 |        " '_load_state_dict_pre_hooks': OrderedDict(),\n",
468 |        " '_modules': OrderedDict(),\n",
469 |        " '_parameters': OrderedDict([('weight', Parameter containing:\n",
470 |        "               tensor([1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.],\n",
471 |        "                      requires_grad=True)), ('bias', Parameter containing:\n",
472 |        "               tensor([0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
473 |        "                      requires_grad=True))]),\n",
474 |        " '_state_dict_hooks': OrderedDict(),\n",
475 |        " 'affine': True,\n",
476 |        " 'eps': 1e-05,\n",
477 |        " 'momentum': 0.1,\n",
478 |        " 'num_features': 16,\n",
479 |        " 'track_running_stats': True,\n",
480 |        " 'training': True}"
481 |       ]
482 |      },
483 |      "execution_count": 43,
484 |      "metadata": {},
485 |      "output_type": "execute_result"
486 |     }
487 |    ],
488 |    "source": [
489 |     "print('vars()方法打印所有参数:')\n",
490 |     "vars(layer)"
491 |    ]
492 |   },
493 |   {
494 |    "cell_type": "markdown",
495 |    "metadata": {},
496 |    "source": [
497 |     "## Test 时注意事项:\n",
498 |     "test时,均值和方差取的不是当前值,而是全局值(running),$\\gamma$和$\\beta$不需要backward,即不需要更新只需切换test模式,使用 **layer.eval()**\n",
499 |     "\n",
500 |     "```Python\n",
501 |     "layer.eval()\n",
502 |     "BatchNorm1d(16,eps=1e-05,momentum=0.1,affine=True,track_running_stats=True)\n",
503 |     "out = layer(x)\n",
504 |     "```"
505 |    ]
506 |   },
507 |   {
508 |    "cell_type": "code",
509 |    "execution_count": null,
510 |    "metadata": {},
511 |    "outputs": [],
512 |    "source": []
513 |   }
514 |  ],
515 |  "metadata": {
516 |   "kernelspec": {
517 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
518 |    "language": "python",
519 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
520 |   },
521 |   "language_info": {
522 |    "codemirror_mode": {
523 |     "name": "ipython",
524 |     "version": 3
525 |    },
526 |    "file_extension": ".py",
527 |    "mimetype": "text/x-python",
528 |    "name": "python",
529 |    "nbconvert_exporter": "python",
530 |    "pygments_lexer": "ipython3",
531 |    "version": "3.5.6"
532 |   },
533 |   "latex_envs": {
534 |    "LaTeX_envs_menu_present": true,
535 |    "autoclose": false,
536 |    "autocomplete": true,
537 |    "bibliofile": "biblio.bib",
538 |    "cite_by": "apalike",
539 |    "current_citInitial": 1,
540 |    "eqLabelWithNumbers": true,
541 |    "eqNumInitial": 1,
542 |    "hotkeys": {
543 |     "equation": "Ctrl-E",
544 |     "itemize": "Ctrl-I"
545 |    },
546 |    "labels_anchors": false,
547 |    "latex_user_defs": false,
548 |    "report_style_numbering": false,
549 |    "user_envs_cfg": false
550 |   },
551 |   "varInspector": {
552 |    "cols": {
553 |     "lenName": 16,
554 |     "lenType": 16,
555 |     "lenVar": 40
556 |    },
557 |    "kernels_config": {
558 |     "python": {
559 |      "delete_cmd_postfix": "",
560 |      "delete_cmd_prefix": "del ",
561 |      "library": "var_list.py",
562 |      "varRefreshCmd": "print(var_dic_list())"
563 |     },
564 |     "r": {
565 |      "delete_cmd_postfix": ") ",
566 |      "delete_cmd_prefix": "rm(",
567 |      "library": "var_list.r",
568 |      "varRefreshCmd": "cat(var_dic_list()) "
569 |     }
570 |    },
571 |    "types_to_exclude": [
572 |     "module",
573 |     "function",
574 |     "builtin_function_or_method",
575 |     "instance",
576 |     "_Feature"
577 |    ],
578 |    "window_display": false
579 |   }
580 |  },
581 |  "nbformat": 4,
582 |  "nbformat_minor": 2
583 | }
584 | 


--------------------------------------------------------------------------------
/ch07_卷积神经网络CNN/.ipynb_checkpoints/ch07_经典卷积网络-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# 7.4 经典卷积网络"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "## 7.4.1 LeNet-5\n",
 15 |     "- 99.2% acc.\n",
 16 |     "- 5/6 layers"
 17 |    ]
 18 |   },
 19 |   {
 20 |    "cell_type": "markdown",
 21 |    "metadata": {},
 22 |    "source": [
 23 |     "## 7.4.2 AlexNet : ILSVRC 2012 Winner\n",
 24 |     "- GTX 580 ( 3GB x 2 )\n",
 25 |     "- 11x11\n",
 26 |     "- 8 layers\n",
 27 |     "\n",
 28 |     "**[ImageNet Classification with Deep Convolutional Neural Networks. NIPS2012]**\n",
 29 |     "\n",
 30 |     "**A. Krizhevsky, I. Sutskever, and G. Hinton**\n",
 31 |     "\n",
 32 |     "#### Similar framework to LeNet but:\n",
 33 |     "- Max pooling, ReLU nonlinearity\n",
 34 |     "- More data and bigger model(7 hidden layers, 650k units, 60M params)\n",
 35 |     "- GPU implementation(50x speedup over CPU)\n",
 36 |     " - Trained on two GPUs for a week\n",
 37 |     "- Dropout regularization"
 38 |    ]
 39 |   },
 40 |   {
 41 |    "cell_type": "markdown",
 42 |    "metadata": {},
 43 |    "source": [
 44 |     "## 7.4.3 VGGNet: ILSVRC 2014 2nd place\n",
 45 |     "- 3x3 filter or\n",
 46 |     "- 1x1 filter\n",
 47 |     "- 11-19 layers\n",
 48 |     "\n",
 49 |     "**[Very Deep Convolutional Networks for Large-Scale Image Recognition, ICLR 2015]**\n",
 50 |     "\n",
 51 |     "**K. Simonyan and A. Zisserman**"
 52 |    ]
 53 |   },
 54 |   {
 55 |    "cell_type": "markdown",
 56 |    "metadata": {},
 57 |    "source": [
 58 |     "## 7.4.4 GoogLeNet: ILSVRC 2014 1st place\n",
 59 |     "- 22 layers\n",
 60 |     "- **[Going deeper with convolutions. CVPR2015] C.Szegedy et al.**"
 61 |    ]
 62 |   },
 63 |   {
 64 |    "cell_type": "markdown",
 65 |    "metadata": {},
 66 |    "source": [
 67 |     "# 7.5 ResNet 深度残差网络 ILSVRC 2015 Winner\n",
 68 |     "\n",
 69 |     "## ResNet\n",
 70 |     "\n",
 71 |     "- **The residual module**\n",
 72 |     " - Introduce skip or shortcut connections(existing before in various forms in literature)\n",
 73 |     " - Make it easy for network layers to represent the identity mapping\n",
 74 |     " - For some reason, need to skip at least two layers\n",
 75 |     " \n",
 76 |     " **[Deep Residual Learning for Image Recognition, CVPR2016(Best Paper)]**\n",
 77 |     " \n",
 78 |     " **Kaiming He, Xiangyu Zhang, Shaoqing Ren, and Jian Sun**\n",
 79 |     " "
 80 |    ]
 81 |   },
 82 |   {
 83 |    "cell_type": "code",
 84 |    "execution_count": 3,
 85 |    "metadata": {},
 86 |    "outputs": [],
 87 |    "source": [
 88 |     "import torch\n",
 89 |     "from torch import nn"
 90 |    ]
 91 |   },
 92 |   {
 93 |    "cell_type": "code",
 94 |    "execution_count": 4,
 95 |    "metadata": {},
 96 |    "outputs": [],
 97 |    "source": [
 98 |     "class ResBlk(nn.Module):\n",
 99 |     "    def __init__(self,ch_in,ch_out):\n",
100 |     "        super().__init__()\n",
101 |     "        self.conv1 = nn.Conv2d(ch_in,ch_out,kernel_size=3,stride=1,padding=1)\n",
102 |     "        self.bn1 = nn.BatchNorm2d(ch_out)\n",
103 |     "        self.conv2 = nn.Conv2d(ch_out,ch_out,kernel_size=3,stride=1,padding=1)\n",
104 |     "        self.bn2 = nn.BatchNorm2d(ch_out)\n",
105 |     "        self.extra = nn.Sequential()\n",
106 |     "        \n",
107 |     "        if ch_out != ch_in:\n",
108 |     "            self.extra = nn.Sequential(\n",
109 |     "                nn.Conv2d(ch_in,ch_out,kernel_size=1,stride=1),\n",
110 |     "                nn.BatchNorm2d(ch_out)\n",
111 |     "            )\n",
112 |     "            \n",
113 |     "    def forward(self,x):\n",
114 |     "        out = nn.functional.relu(self.bn1(self.conv1(x)))\n",
115 |     "        out = self.bn2(self.conv2(out))\n",
116 |     "        out = self.extra(x)+out\n",
117 |     "        return out"
118 |    ]
119 |   },
120 |   {
121 |    "cell_type": "markdown",
122 |    "metadata": {},
123 |    "source": [
124 |     "# 7.6 nn.Module\n",
125 |     "\n",
126 |     "### Magic :\n",
127 |     "- Every Layer is nn.Module\n",
128 |     " - nn.Linear\n",
129 |     " - nn.BatchNorm2d\n",
130 |     " - nn.Conv2d\n",
131 |     "- nn.Module nested in nn.Module\n",
132 |     "\n",
133 |     "### 1. embed current layers :\n",
134 |     "- Linear\n",
135 |     "- ReLU\n",
136 |     "- Sigmoid\n",
137 |     "- Conv2d\n",
138 |     "- ConvTranspose2d\n",
139 |     "- Dropout\n",
140 |     "- etc.\n",
141 |     "\n",
142 |     "### 2. Container\n",
143 |     "- net(x)\n",
144 |     "\n",
145 |     "### 3. parameters\n",
146 |     "\n",
147 |     "### 4. modules\n",
148 |     "- modules: all nodes\n",
149 |     "- children: direct children\n",
150 |     "\n",
151 |     "### 5. to(device)\n",
152 |     "\n",
153 |     "### 6. save and load\n",
154 |     "\n",
155 |     "### 7. train / test 切换\n",
156 |     "\n",
157 |     "### 8. implement own layer\n",
158 |     "\n",
159 |     "### 9. own linear layer"
160 |    ]
161 |   },
162 |   {
163 |    "cell_type": "markdown",
164 |    "metadata": {},
165 |    "source": [
166 |     "# 7.7 Data Augmentation 数据增强\n",
167 |     "\n",
168 |     "### Limited Data\n",
169 |     "- Small network capacity\n",
170 |     "- Regularization\n",
171 |     "- Data augmentation\n",
172 |     "\n",
173 |     "### Data augmentation\n",
174 |     "- Flip\n",
175 |     "```Python\n",
176 |     "train_loader = torch.utils.data.DataLoader(\n",
177 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
178 |     "                   transform = transforms.Compose([\n",
179 |     "                       transforms.RandomHorizontalFlip(),\n",
180 |     "                       transforms.RandomVerticalFlip(),\n",
181 |     "                       transforms.ToTensor(),\n",
182 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
183 |     "                   ])),\n",
184 |     "    batch_size=batch_size, shuffle=True)\n",
185 |     "```\n",
186 |     "\n",
187 |     "- Rotate\n",
188 |     "```Python\n",
189 |     "train_loader = torch.utils.data.DataLoader(\n",
190 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
191 |     "                   transform = transforms.Compose([\n",
192 |     "                       transforms.RandomRotation(15), # 在[-15°, 15°]范围内随机旋转\n",
193 |     "                       # 随机选择三个角度中的一个进行旋转\n",
194 |     "                       transforms.RandomChoice([transforms.RandomRotation((d,d)) for d in (90,180,270)]),\n",
195 |     "                       transforms.ToTensor(),\n",
196 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
197 |     "                   ])),\n",
198 |     "    batch_size=batch_size, shuffle=True)\n",
199 |     "```\n",
200 |     "\n",
201 |     "- Scale 缩放\n",
202 |     "```Python\n",
203 |     "train_loader = torch.utils.data.DataLoader(\n",
204 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
205 |     "                   transform = transforms.Compose([\n",
206 |     "                       transforms.Resize([32,32]), # Scale\n",
207 |     "                       transforms.ToTensor(),\n",
208 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
209 |     "                   ])),\n",
210 |     "    batch_size=batch_size, shuffle=True)\n",
211 |     "```\n",
212 |     "\n",
213 |     "- Crop Part 裁剪\n",
214 |     "```Python\n",
215 |     "train_loader = torch.utils.data.DataLoader(\n",
216 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
217 |     "                   transform = transforms.Compose([\n",
218 |     "                       transforms.RandomCrop([28,28]), # Crop 裁剪\n",
219 |     "                       transforms.ToTensor(),\n",
220 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
221 |     "                   ])),\n",
222 |     "    batch_size=batch_size, shuffle=True)\n",
223 |     "```\n",
224 |     "\n",
225 |     "- Noise 加入噪声\n",
226 |     "\n",
227 |     "- GAN\n"
228 |    ]
229 |   },
230 |   {
231 |    "cell_type": "code",
232 |    "execution_count": null,
233 |    "metadata": {},
234 |    "outputs": [],
235 |    "source": []
236 |   }
237 |  ],
238 |  "metadata": {
239 |   "kernelspec": {
240 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
241 |    "language": "python",
242 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
243 |   },
244 |   "language_info": {
245 |    "codemirror_mode": {
246 |     "name": "ipython",
247 |     "version": 3
248 |    },
249 |    "file_extension": ".py",
250 |    "mimetype": "text/x-python",
251 |    "name": "python",
252 |    "nbconvert_exporter": "python",
253 |    "pygments_lexer": "ipython3",
254 |    "version": "3.5.6"
255 |   },
256 |   "latex_envs": {
257 |    "LaTeX_envs_menu_present": true,
258 |    "autoclose": false,
259 |    "autocomplete": true,
260 |    "bibliofile": "biblio.bib",
261 |    "cite_by": "apalike",
262 |    "current_citInitial": 1,
263 |    "eqLabelWithNumbers": true,
264 |    "eqNumInitial": 1,
265 |    "hotkeys": {
266 |     "equation": "Ctrl-E",
267 |     "itemize": "Ctrl-I"
268 |    },
269 |    "labels_anchors": false,
270 |    "latex_user_defs": false,
271 |    "report_style_numbering": false,
272 |    "user_envs_cfg": false
273 |   },
274 |   "varInspector": {
275 |    "cols": {
276 |     "lenName": 16,
277 |     "lenType": 16,
278 |     "lenVar": 40
279 |    },
280 |    "kernels_config": {
281 |     "python": {
282 |      "delete_cmd_postfix": "",
283 |      "delete_cmd_prefix": "del ",
284 |      "library": "var_list.py",
285 |      "varRefreshCmd": "print(var_dic_list())"
286 |     },
287 |     "r": {
288 |      "delete_cmd_postfix": ") ",
289 |      "delete_cmd_prefix": "rm(",
290 |      "library": "var_list.r",
291 |      "varRefreshCmd": "cat(var_dic_list()) "
292 |     }
293 |    },
294 |    "types_to_exclude": [
295 |     "module",
296 |     "function",
297 |     "builtin_function_or_method",
298 |     "instance",
299 |     "_Feature"
300 |    ],
301 |    "window_display": false
302 |   }
303 |  },
304 |  "nbformat": 4,
305 |  "nbformat_minor": 2
306 | }
307 | 


--------------------------------------------------------------------------------
/ch07_卷积神经网络CNN/ch07_卷积神经网络基础.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# 7.1 卷积神经网络基础"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "### nn.Conv2d"
 15 |    ]
 16 |   },
 17 |   {
 18 |    "cell_type": "code",
 19 |    "execution_count": 1,
 20 |    "metadata": {},
 21 |    "outputs": [],
 22 |    "source": [
 23 |     "import torch\n",
 24 |     "from torch import nn"
 25 |    ]
 26 |   },
 27 |   {
 28 |    "cell_type": "markdown",
 29 |    "metadata": {},
 30 |    "source": [
 31 |     "$$Output\\_size = \\left \\lfloor \\frac{n + 2p - f}{s} + 1\\right \\rfloor \\times \\left \\lfloor \\frac{n + 2p - f}{s} + 1\\right \\rfloor$$\n",
 32 |     "\n"
 33 |    ]
 34 |   },
 35 |   {
 36 |    "cell_type": "code",
 37 |    "execution_count": 15,
 38 |    "metadata": {},
 39 |    "outputs": [
 40 |     {
 41 |      "name": "stdout",
 42 |      "output_type": "stream",
 43 |      "text": [
 44 |       "out1.shape: torch.Size([1, 3, 26, 26])\n",
 45 |       "out2.shape: torch.Size([1, 3, 28, 28])\n",
 46 |       "out3.shape: torch.Size([1, 4, 14, 14])\n"
 47 |      ]
 48 |     }
 49 |    ],
 50 |    "source": [
 51 |     "layer = nn.Conv2d(1,3,kernel_size=3,stride=1,padding=0)\n",
 52 |     "x = torch.rand(1,1,28,28)\n",
 53 |     "\n",
 54 |     "out = layer.forward(x) # 卷积运算\n",
 55 |     "print('out1.shape:',out.shape)\n",
 56 |     "\n",
 57 |     "layer = nn.Conv2d(1,3,kernel_size=3,stride=1,padding=1)\n",
 58 |     "out = layer.forward(x)\n",
 59 |     "print('out2.shape:',out.shape)\n",
 60 |     "\n",
 61 |     "layer = nn.Conv2d(1,4,kernel_size=3,stride=2,padding=1)\n",
 62 |     "out = layer.forward(x)\n",
 63 |     "print('out3.shape:',out.shape)"
 64 |    ]
 65 |   },
 66 |   {
 67 |    "cell_type": "markdown",
 68 |    "metadata": {},
 69 |    "source": [
 70 |     "### Inner weight & bias"
 71 |    ]
 72 |   },
 73 |   {
 74 |    "cell_type": "code",
 75 |    "execution_count": 16,
 76 |    "metadata": {},
 77 |    "outputs": [
 78 |     {
 79 |      "data": {
 80 |       "text/plain": [
 81 |        "Parameter containing:\n",
 82 |        "tensor([[[[-0.1704, -0.0875,  0.0579],\n",
 83 |        "          [ 0.2762,  0.2394, -0.0993],\n",
 84 |        "          [ 0.1446,  0.0253, -0.1044]]],\n",
 85 |        "\n",
 86 |        "\n",
 87 |        "        [[[-0.1198, -0.3039, -0.3194],\n",
 88 |        "          [ 0.2971, -0.2700, -0.0318],\n",
 89 |        "          [ 0.1160,  0.1986, -0.3255]]],\n",
 90 |        "\n",
 91 |        "\n",
 92 |        "        [[[-0.1016,  0.0956, -0.0222],\n",
 93 |        "          [ 0.1155,  0.1237,  0.1385],\n",
 94 |        "          [ 0.2375, -0.2012,  0.3073]]],\n",
 95 |        "\n",
 96 |        "\n",
 97 |        "        [[[-0.3036,  0.2053,  0.2781],\n",
 98 |        "          [-0.0271, -0.0822, -0.0675],\n",
 99 |        "          [ 0.2384, -0.2601,  0.0878]]]], requires_grad=True)"
100 |       ]
101 |      },
102 |      "execution_count": 16,
103 |      "metadata": {},
104 |      "output_type": "execute_result"
105 |     }
106 |    ],
107 |    "source": [
108 |     "layer.weight"
109 |    ]
110 |   },
111 |   {
112 |    "cell_type": "code",
113 |    "execution_count": 17,
114 |    "metadata": {},
115 |    "outputs": [
116 |     {
117 |      "data": {
118 |       "text/plain": [
119 |        "torch.Size([4, 1, 3, 3])"
120 |       ]
121 |      },
122 |      "execution_count": 17,
123 |      "metadata": {},
124 |      "output_type": "execute_result"
125 |     }
126 |    ],
127 |    "source": [
128 |     "layer.weight.shape"
129 |    ]
130 |   },
131 |   {
132 |    "cell_type": "code",
133 |    "execution_count": 18,
134 |    "metadata": {},
135 |    "outputs": [
136 |     {
137 |      "data": {
138 |       "text/plain": [
139 |        "torch.Size([4])"
140 |       ]
141 |      },
142 |      "execution_count": 18,
143 |      "metadata": {},
144 |      "output_type": "execute_result"
145 |     }
146 |    ],
147 |    "source": [
148 |     "layer.bias.shape"
149 |    ]
150 |   },
151 |   {
152 |    "cell_type": "markdown",
153 |    "metadata": {},
154 |    "source": [
155 |     "### F.conv2d"
156 |    ]
157 |   },
158 |   {
159 |    "cell_type": "code",
160 |    "execution_count": 23,
161 |    "metadata": {},
162 |    "outputs": [],
163 |    "source": [
164 |     "from torch.nn import functional as F\n",
165 |     "x = torch.randn(1,3,28,28) # x 和 w 的 channel 值要相同,均为3\n",
166 |     "w = torch.rand(16,3,5,5)\n",
167 |     "b = torch.rand(16)"
168 |    ]
169 |   },
170 |   {
171 |    "cell_type": "code",
172 |    "execution_count": 27,
173 |    "metadata": {},
174 |    "outputs": [
175 |     {
176 |      "name": "stdout",
177 |      "output_type": "stream",
178 |      "text": [
179 |       "x.shape:  torch.Size([1, 3, 28, 28])\n",
180 |       "out.shape:  torch.Size([1, 16, 14, 14])\n"
181 |      ]
182 |     }
183 |    ],
184 |    "source": [
185 |     "out = F.conv2d(x,w,b,stride=2,padding=2)\n",
186 |     "print('x.shape: ',x.shape)\n",
187 |     "print('out.shape: ',out.shape)"
188 |    ]
189 |   },
190 |   {
191 |    "cell_type": "markdown",
192 |    "metadata": {},
193 |    "source": [
194 |     "# 7.2 Down/Up Sample 池化层与采样 ReLU层"
195 |    ]
196 |   },
197 |   {
198 |    "cell_type": "markdown",
199 |    "metadata": {},
200 |    "source": [
201 |     "### Max Pooling\n",
202 |     "\n",
203 |     "### Avg Pooling\n"
204 |    ]
205 |   },
206 |   {
207 |    "cell_type": "code",
208 |    "execution_count": 28,
209 |    "metadata": {},
210 |    "outputs": [
211 |     {
212 |      "name": "stdout",
213 |      "output_type": "stream",
214 |      "text": [
215 |       "x.shape:  torch.Size([1, 16, 14, 14])\n",
216 |       "out1.shape:  torch.Size([1, 16, 7, 7])\n",
217 |       "out2.shape:  torch.Size([1, 16, 7, 7])\n"
218 |      ]
219 |     }
220 |    ],
221 |    "source": [
222 |     "x = out\n",
223 |     "print('x.shape: ',x.shape)\n",
224 |     "\n",
225 |     "layer = nn.MaxPool2d(2,stride=2)\n",
226 |     "\n",
227 |     "out1 = layer(x)\n",
228 |     "print('out1.shape: ',out1.shape)\n",
229 |     "\n",
230 |     "out2 = F.avg_pool2d(x,2,stride=2)\n",
231 |     "print('out2.shape: ',out2.shape)"
232 |    ]
233 |   },
234 |   {
235 |    "cell_type": "markdown",
236 |    "metadata": {},
237 |    "source": [
238 |     "### UpSample \n",
239 |     "\n",
240 |     "#### F.interpolate( )"
241 |    ]
242 |   },
243 |   {
244 |    "cell_type": "code",
245 |    "execution_count": 30,
246 |    "metadata": {},
247 |    "outputs": [
248 |     {
249 |      "name": "stdout",
250 |      "output_type": "stream",
251 |      "text": [
252 |       "x.shape:  torch.Size([1, 16, 14, 14])\n",
253 |       "out.shape:  torch.Size([1, 16, 28, 28])\n"
254 |      ]
255 |     }
256 |    ],
257 |    "source": [
258 |     "x = out\n",
259 |     "print('x.shape: ',x.shape)\n",
260 |     "out = F.interpolate(x,scale_factor=2,mode='nearest')\n",
261 |     "print('out.shape: ',out.shape)"
262 |    ]
263 |   },
264 |   {
265 |    "cell_type": "markdown",
266 |    "metadata": {},
267 |    "source": [
268 |     "### ReLU层"
269 |    ]
270 |   },
271 |   {
272 |    "cell_type": "code",
273 |    "execution_count": 33,
274 |    "metadata": {},
275 |    "outputs": [
276 |     {
277 |      "name": "stdout",
278 |      "output_type": "stream",
279 |      "text": [
280 |       "x.shape:  torch.Size([1, 16, 14, 14])\n",
281 |       "layer = nn.ReLU(inplace=True), inplace=True可以节省内存一半空间\n",
282 |       "out.shape:  torch.Size([1, 16, 14, 14])\n"
283 |      ]
284 |     }
285 |    ],
286 |    "source": [
287 |     "print('x.shape: ',x.shape)\n",
288 |     "\n",
289 |     "layer = nn.ReLU(inplace=True)\n",
290 |     "print('layer = nn.ReLU(inplace=True), inplace=True可以节省内存一半空间')\n",
291 |     "out = layer(x)\n",
292 |     "print('out.shape: ',out.shape)"
293 |    ]
294 |   },
295 |   {
296 |    "cell_type": "code",
297 |    "execution_count": 34,
298 |    "metadata": {},
299 |    "outputs": [
300 |     {
301 |      "name": "stdout",
302 |      "output_type": "stream",
303 |      "text": [
304 |       "out.shape:  torch.Size([1, 16, 14, 14])\n"
305 |      ]
306 |     }
307 |    ],
308 |    "source": [
309 |     "out = F.relu(x)\n",
310 |     "print('out.shape: ',out.shape)"
311 |    ]
312 |   },
313 |   {
314 |    "cell_type": "markdown",
315 |    "metadata": {},
316 |    "source": [
317 |     "# 7.3 Batch Norm\n",
318 |     "\n",
319 |     "### Feature Scaling\n",
320 |     "- Image Normalization:\n",
321 |     "```Python\n",
322 |     "normalize = transforms.Normalize(mean=[0.485,0.456,0.406],\n",
323 |     "                                 std=[0.229,0.224,0.225])\n",
324 |     "# RGB 各通道的均值和标准差\n",
325 |     "```\n",
326 |     "- Batch Normalization:\n",
327 |     "\n",
328 |     "$ Algorithm : Batch Normalizing Transform, applied to activation x over a mini-batch.$\n",
329 |     "\n",
330 |     "$Input: Values of x over a mini-batch: \\mathcal{B} = \\{ x_{1...m}\\}; $\n",
331 |     "$Output: \\{ y_i = BN_{\\gamma , \\beta}(x_i)\\} $\n",
332 |     "\n",
333 |     "$$mini-batch \\space mean:  \\mu_{\\mathcal{B}} \\leftarrow \\frac{1}{m}\\sum_{i=1}^m x_i $$\n",
334 |     "\n",
335 |     "$$mini-batch \\space variance: \\sigma_{\\mathcal{B}}^2 \\leftarrow \\frac{1}{m} \\sum_{i=1}^m (x_i-\\mu_\\mathcal{B})^2 $$\n",
336 |     "\n",
337 |     "$$normalize: \\hat{x_i} \\leftarrow \\frac{x_i - \\mu_{\\mathcal{B}}}{\\sqrt{\\sigma_\\mathcal{B}^2 + \\varepsilon }}$$\n",
338 |     "\n",
339 |     "$$scale \\space and \\space shift: y_i \\leftarrow \\gamma \\hat{x_i} + \\beta \\equiv BN_{\\gamma , \\beta}(x_i)$$\n",
340 |     "\n"
341 |    ]
342 |   },
343 |   {
344 |    "cell_type": "markdown",
345 |    "metadata": {},
346 |    "source": [
347 |     "### nn.BatchNorm1d"
348 |    ]
349 |   },
350 |   {
351 |    "cell_type": "code",
352 |    "execution_count": 38,
353 |    "metadata": {},
354 |    "outputs": [
355 |     {
356 |      "name": "stdout",
357 |      "output_type": "stream",
358 |      "text": [
359 |       "x.shape:  torch.Size([100, 16, 784])\n"
360 |      ]
361 |     }
362 |    ],
363 |    "source": [
364 |     "x = torch.randn(100,16,784) # 784 = 28*28\n",
365 |     "print('x.shape: ',x.shape)\n",
366 |     "layer = nn.BatchNorm1d(16)\n",
367 |     "out = layer(x)"
368 |    ]
369 |   },
370 |   {
371 |    "cell_type": "markdown",
372 |    "metadata": {},
373 |    "source": [
374 |     "**nn.BatchNorm1d(16)的参数16为channel通道数,BatchNorm的统计数据是逐通道计算的(对每个channel,在batch维和其余维度上求均值和方差),有多少个channel,就计算多少个channel上的均值和方差,16个channel就生成长度为16的统计信息,每个元素对应一个channel的均值或方差**"
375 |    ]
376 |   },
377 |   {
378 |    "cell_type": "code",
379 |    "execution_count": 39,
380 |    "metadata": {},
381 |    "outputs": [
382 |     {
383 |      "name": "stdout",
384 |      "output_type": "stream",
385 |      "text": [
386 |       "layer.running_mean: \n",
387 |       "tensor([-4.5907e-04,  8.6306e-05, -7.4280e-04, -6.2997e-04, -6.4749e-04,\n",
388 |       "         1.4273e-04, -3.9751e-05, -8.0233e-05,  2.4080e-04, -3.0221e-04,\n",
389 |       "         8.5041e-05,  1.8740e-04, -1.6602e-04, -6.1695e-05, -3.7739e-04,\n",
390 |       "         1.0307e-04])\n",
391 |       "layer.running_var: \n",
392 |       "tensor([1.0003, 0.9996, 1.0000, 1.0000, 1.0006, 1.0003, 1.0000, 1.0004, 1.0000,\n",
393 |       "        0.9994, 0.9999, 0.9996, 0.9997, 1.0008, 0.9995, 0.9999])\n"
394 |      ]
395 |     }
396 |    ],
397 |    "source": [
398 |     "print('layer.running_mean: ')\n",
399 |     "print(layer.running_mean)\n",
400 |     "print('layer.running_var: ')\n",
401 |     "print(layer.running_var)"
402 |    ]
403 |   },
404 |   {
405 |    "cell_type": "markdown",
406 |    "metadata": {},
407 |    "source": [
408 |     "### nn.BatchNorm2d\n",
409 |     "\n",
410 |     "layer.weight $ \\rightarrow \\space \\gamma \\ $\n",
411 |     "\n",
412 |     "layer.bias $ \\rightarrow \\space \\beta$"
413 |    ]
414 |   },
415 |   {
416 |    "cell_type": "code",
417 |    "execution_count": 41,
418 |    "metadata": {},
419 |    "outputs": [
420 |     {
421 |      "name": "stdout",
422 |      "output_type": "stream",
423 |      "text": [
424 |       "x.shape:  torch.Size([6, 16, 28, 28])\n",
425 |       "After BatchNorm2d(16), out.shape:  torch.Size([6, 16, 28, 28])\n",
426 |       "layer.weight.shape:  torch.Size([16])\n",
427 |       "layer.bias.shape:  torch.Size([16])\n"
428 |      ]
429 |     }
430 |    ],
431 |    "source": [
432 |     "x = torch.rand(6,16,28,28)\n",
433 |     "print('x.shape: ',x.shape)\n",
434 |     "layer = nn.BatchNorm2d(16)\n",
435 |     "out = layer(x)\n",
436 |     "print('After BatchNorm2d(16), out.shape: ',out.shape)\n",
437 |     "\n",
438 |     "print('layer.weight.shape: ',layer.weight.shape)\n",
439 |     "print('layer.bias.shape: ',layer.bias.shape)"
440 |    ]
441 |   },
442 |   {
443 |    "cell_type": "code",
444 |    "execution_count": 43,
445 |    "metadata": {},
446 |    "outputs": [
447 |     {
448 |      "name": "stdout",
449 |      "output_type": "stream",
450 |      "text": [
451 |       "vars()方法打印所有参数:\n"
452 |      ]
453 |     },
454 |     {
455 |      "data": {
456 |       "text/plain": [
457 |        "{'_backward_hooks': OrderedDict(),\n",
458 |        " '_buffers': OrderedDict([('running_mean',\n",
459 |        "               tensor([0.0501, 0.0498, 0.0502, 0.0494, 0.0505, 0.0503, 0.0507, 0.0497, 0.0508,\n",
460 |        "                       0.0509, 0.0500, 0.0496, 0.0496, 0.0510, 0.0501, 0.0502])),\n",
461 |        "              ('running_var',\n",
462 |        "               tensor([0.9084, 0.9082, 0.9082, 0.9082, 0.9084, 0.9082, 0.9084, 0.9083, 0.9083,\n",
463 |        "                       0.9084, 0.9082, 0.9083, 0.9085, 0.9083, 0.9083, 0.9084])),\n",
464 |        "              ('num_batches_tracked', tensor(1))]),\n",
465 |        " '_forward_hooks': OrderedDict(),\n",
466 |        " '_forward_pre_hooks': OrderedDict(),\n",
467 |        " '_load_state_dict_pre_hooks': OrderedDict(),\n",
468 |        " '_modules': OrderedDict(),\n",
469 |        " '_parameters': OrderedDict([('weight', Parameter containing:\n",
470 |        "               tensor([1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.],\n",
471 |        "                      requires_grad=True)), ('bias', Parameter containing:\n",
472 |        "               tensor([0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
473 |        "                      requires_grad=True))]),\n",
474 |        " '_state_dict_hooks': OrderedDict(),\n",
475 |        " 'affine': True,\n",
476 |        " 'eps': 1e-05,\n",
477 |        " 'momentum': 0.1,\n",
478 |        " 'num_features': 16,\n",
479 |        " 'track_running_stats': True,\n",
480 |        " 'training': True}"
481 |       ]
482 |      },
483 |      "execution_count": 43,
484 |      "metadata": {},
485 |      "output_type": "execute_result"
486 |     }
487 |    ],
488 |    "source": [
489 |     "print('vars()方法打印所有参数:')\n",
490 |     "vars(layer)"
491 |    ]
492 |   },
493 |   {
494 |    "cell_type": "markdown",
495 |    "metadata": {},
496 |    "source": [
497 |     "## Test 时注意事项:\n",
498 |     "test时,均值和方差取的不是当前值,而是全局值(running),$\\gamma$和$\\beta$不需要backward,即不需要更新只需切换test模式,使用 **layer.eval()**\n",
499 |     "\n",
500 |     "```Python\n",
501 |     "layer.eval()\n",
502 |     "BatchNorm1d(16,eps=1e-05,momentum=0.1,affine=True,track_running_stats=True)\n",
503 |     "out = layer(x)\n",
504 |     "```"
505 |    ]
506 |   },
507 |   {
508 |    "cell_type": "code",
509 |    "execution_count": null,
510 |    "metadata": {},
511 |    "outputs": [],
512 |    "source": []
513 |   }
514 |  ],
515 |  "metadata": {
516 |   "kernelspec": {
517 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
518 |    "language": "python",
519 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
520 |   },
521 |   "language_info": {
522 |    "codemirror_mode": {
523 |     "name": "ipython",
524 |     "version": 3
525 |    },
526 |    "file_extension": ".py",
527 |    "mimetype": "text/x-python",
528 |    "name": "python",
529 |    "nbconvert_exporter": "python",
530 |    "pygments_lexer": "ipython3",
531 |    "version": "3.5.6"
532 |   },
533 |   "latex_envs": {
534 |    "LaTeX_envs_menu_present": true,
535 |    "autoclose": false,
536 |    "autocomplete": true,
537 |    "bibliofile": "biblio.bib",
538 |    "cite_by": "apalike",
539 |    "current_citInitial": 1,
540 |    "eqLabelWithNumbers": true,
541 |    "eqNumInitial": 1,
542 |    "hotkeys": {
543 |     "equation": "Ctrl-E",
544 |     "itemize": "Ctrl-I"
545 |    },
546 |    "labels_anchors": false,
547 |    "latex_user_defs": false,
548 |    "report_style_numbering": false,
549 |    "user_envs_cfg": false
550 |   },
551 |   "varInspector": {
552 |    "cols": {
553 |     "lenName": 16,
554 |     "lenType": 16,
555 |     "lenVar": 40
556 |    },
557 |    "kernels_config": {
558 |     "python": {
559 |      "delete_cmd_postfix": "",
560 |      "delete_cmd_prefix": "del ",
561 |      "library": "var_list.py",
562 |      "varRefreshCmd": "print(var_dic_list())"
563 |     },
564 |     "r": {
565 |      "delete_cmd_postfix": ") ",
566 |      "delete_cmd_prefix": "rm(",
567 |      "library": "var_list.r",
568 |      "varRefreshCmd": "cat(var_dic_list()) "
569 |     }
570 |    },
571 |    "types_to_exclude": [
572 |     "module",
573 |     "function",
574 |     "builtin_function_or_method",
575 |     "instance",
576 |     "_Feature"
577 |    ],
578 |    "window_display": false
579 |   }
580 |  },
581 |  "nbformat": 4,
582 |  "nbformat_minor": 2
583 | }
584 | 


--------------------------------------------------------------------------------
/ch07_卷积神经网络CNN/ch07_经典卷积网络.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# 7.4 经典卷积网络"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "## 7.4.1 LeNet-5\n",
 15 |     "- 99.2% acc.\n",
 16 |     "- 5/6 layers"
 17 |    ]
 18 |   },
 19 |   {
 20 |    "cell_type": "markdown",
 21 |    "metadata": {},
 22 |    "source": [
 23 |     "## 7.4.2 AlexNet : ILSVRC 2012 Winner\n",
 24 |     "- GTX 580 ( 3GB x 2 )\n",
 25 |     "- 11x11\n",
 26 |     "- 8 layers\n",
 27 |     "\n",
 28 |     "**[ImageNet Classification with Deep Convolutional Neural Networks. NIPS2012]**\n",
 29 |     "\n",
 30 |     "**A. Krizhevsky, I. Sutskever, and G. Hinton**\n",
 31 |     "\n",
 32 |     "#### Similar framework to LeNet but:\n",
 33 |     "- Max pooling, ReLU nonlinearity\n",
 34 |     "- More data and bigger model(7 hidden layers, 650k units, 60M params)\n",
 35 |     "- GPU implementation(50x speedup over CPU)\n",
 36 |     " - Trained on two GPUs for a week\n",
 37 |     "- Dropout regularization"
 38 |    ]
 39 |   },
 40 |   {
 41 |    "cell_type": "markdown",
 42 |    "metadata": {},
 43 |    "source": [
 44 |     "## 7.4.3 VGGNet: ILSVRC 2014 2nd place\n",
 45 |     "- 3x3 filter or\n",
 46 |     "- 1x1 filter\n",
 47 |     "- 11-19 layers\n",
 48 |     "\n",
 49 |     "**[Very Deep Convolutional Networks for Large-Scale Image Recognition, ICLR 2015]**\n",
 50 |     "\n",
 51 |     "**K. Simonyan and A. Zisserman**"
 52 |    ]
 53 |   },
 54 |   {
 55 |    "cell_type": "markdown",
 56 |    "metadata": {},
 57 |    "source": [
 58 |     "## 7.4.4 GoogLeNet: ILSVRC 2014 1st place\n",
 59 |     "- 22 layers\n",
 60 |     "- **[Going deeper with convolutions. CVPR2015] C.Szegedy et al.**"
 61 |    ]
 62 |   },
 63 |   {
 64 |    "cell_type": "markdown",
 65 |    "metadata": {},
 66 |    "source": [
 67 |     "# 7.5 ResNet 深度残差网络 ILSVRC 2015 Winner\n",
 68 |     "\n",
 69 |     "## ResNet\n",
 70 |     "\n",
 71 |     "- **The residual module**\n",
 72 |     " - Introduce skip or shortcut connections(existing before in various forms in literature)\n",
 73 |     " - Make it easy for network layers to represent the identity mapping\n",
 74 |     " - For some reason, need to skip at least two layers\n",
 75 |     " \n",
 76 |     " **[Deep Residual Learning for Image Recognition, CVPR2016(Best Paper)]**\n",
 77 |     " \n",
 78 |     " **Kaiming He, Xiangyu Zhang, Shaoqing Ren, and Jian Sun**\n",
 79 |     " "
 80 |    ]
 81 |   },
 82 |   {
 83 |    "cell_type": "code",
 84 |    "execution_count": 3,
 85 |    "metadata": {},
 86 |    "outputs": [],
 87 |    "source": [
 88 |     "import torch\n",
 89 |     "from torch import nn"
 90 |    ]
 91 |   },
 92 |   {
 93 |    "cell_type": "code",
 94 |    "execution_count": 4,
 95 |    "metadata": {},
 96 |    "outputs": [],
 97 |    "source": [
 98 |     "class ResBlk(nn.Module):\n",
 99 |     "    def __init__(self,ch_in,ch_out):\n",
100 |     "        super(ResBlk,self).__init__()\n",
101 |     "        self.conv1 = nn.Conv2d(ch_in,ch_out,kernel_size=3,stride=1,padding=1)\n",
102 |     "        self.bn1 = nn.BatchNorm2d(ch_out)\n",
103 |     "        self.conv2 = nn.Conv2d(ch_out,ch_out,kernel_size=3,stride=1,padding=1)\n",
104 |     "        self.bn2 = nn.BatchNorm2d(ch_out)\n",
105 |     "        self.extra = nn.Sequential()\n",
106 |     "        \n",
107 |     "        if ch_out != ch_in:\n",
108 |     "            self.extra = nn.Sequential(\n",
109 |     "                nn.Conv2d(ch_in,ch_out,kernel_size=1,stride=1),\n",
110 |     "                nn.BatchNorm2d(ch_out)\n",
111 |     "            )\n",
112 |     "            \n",
113 |     "    def forward(self,x):\n",
114 |     "        out = torch.relu(self.bn1(self.conv1(x)))\n",
115 |     "        out = self.bn2(self.conv2(out))\n",
116 |     "        out = self.extra(x)+out\n",
117 |     "        return out"
118 |    ]
119 |   },
120 |   {
121 |    "cell_type": "markdown",
122 |    "metadata": {},
123 |    "source": [
124 |     "# 7.6 nn.Module\n",
125 |     "\n",
126 |     "### Magic :\n",
127 |     "- Every Layer is nn.Module\n",
128 |     " - nn.Linear\n",
129 |     " - nn.BatchNorm2d\n",
130 |     " - nn.Conv2d\n",
131 |     "- nn.Module nested in nn.Module\n",
132 |     "\n",
133 |     "### 1. embed current layers :\n",
134 |     "- Linear\n",
135 |     "- ReLU\n",
136 |     "- Sigmoid\n",
137 |     "- Conv2d\n",
138 |     "- ConvTranspose2d\n",
139 |     "- Dropout\n",
140 |     "- etc.\n",
141 |     "\n",
142 |     "### 2. Container\n",
143 |     "- net(x)\n",
144 |     "\n",
145 |     "### 3. parameters\n",
146 |     "\n",
147 |     "### 4. modules\n",
148 |     "- modules: all nodes\n",
149 |     "- children: direct children\n",
150 |     "\n",
151 |     "### 5. to(device)\n",
152 |     "\n",
153 |     "### 6. save and load\n",
154 |     "\n",
155 |     "### 7. train / test 切换\n",
156 |     "\n",
157 |     "### 8. implement own layer\n",
158 |     "\n",
159 |     "### 9. own linear layer"
160 |    ]
161 |   },
162 |   {
163 |    "cell_type": "markdown",
164 |    "metadata": {},
165 |    "source": [
166 |     "# 7.7 Data Augmentation 数据增强\n",
167 |     "\n",
168 |     "### Limited Data\n",
169 |     "- Small network capacity\n",
170 |     "- Regularization\n",
171 |     "- Data augmentation\n",
172 |     "\n",
173 |     "### Data augmentation\n",
174 |     "- Flip\n",
175 |     "```Python\n",
176 |     "train_loader = torch.utils.data.DataLoader(\n",
177 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
178 |     "                   transform = transforms.Compose([\n",
179 |     "                       transforms.RandomHorizontalFlip(),\n",
180 |     "                       transforms.RandomVerticalFlip(),\n",
181 |     "                       transforms.ToTensor(),\n",
182 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
183 |     "                   ])),\n",
184 |     "    batch_size=batch_size, shuffle=True)\n",
185 |     "```\n",
186 |     "\n",
187 |     "- Rotate\n",
188 |     "```Python\n",
189 |     "train_loader = torch.utils.data.DataLoader(\n",
190 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
191 |     "                   transform = transforms.Compose([\n",
192 |     "                       transforms.RandomRotation(15), # 在[-15,15]度范围内随机旋转\n",
193 |     "                       # 随机选择三个角度中的一个进行旋转\n",
194 |     "                       transforms.RandomChoice([transforms.RandomRotation((d,d)) for d in (90,180,270)]),\n",
195 |     "                       transforms.ToTensor(),\n",
196 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
197 |     "                   ])),\n",
198 |     "    batch_size=batch_size, shuffle=True)\n",
199 |     "```\n",
200 |     "\n",
201 |     "- Scale 缩放\n",
202 |     "```Python\n",
203 |     "train_loader = torch.utils.data.DataLoader(\n",
204 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
205 |     "                   transform = transforms.Compose([\n",
206 |     "                       transforms.Resize([32,32]), # Scale\n",
207 |     "                       transforms.ToTensor(),\n",
208 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
209 |     "                   ])),\n",
210 |     "    batch_size=batch_size, shuffle=True)\n",
211 |     "```\n",
212 |     "\n",
213 |     "- Crop Part 裁剪\n",
214 |     "```Python\n",
215 |     "train_loader = torch.utils.data.DataLoader(\n",
216 |     "    datasets.MNIST('../data/', train=True, download=True,\n",
217 |     "                   transform = transforms.Compose([\n",
218 |     "                       transforms.RandomCrop([28,28]), # Crop 裁剪\n",
219 |     "                       transforms.ToTensor(),\n",
220 |     "                       transforms.Normalize((0.1307,),(0.3081,))\n",
221 |     "                   ])),\n",
222 |     "    batch_size=batch_size, shuffle=True)\n",
223 |     "```\n",
224 |     "\n",
225 |     "- Noise 加入噪声\n",
226 |     "\n",
227 |     "- GAN\n"
228 |    ]
229 |   },
230 |   {
231 |    "cell_type": "code",
232 |    "execution_count": null,
233 |    "metadata": {},
234 |    "outputs": [],
235 |    "source": []
236 |   }
237 |  ],
238 |  "metadata": {
239 |   "kernelspec": {
240 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
241 |    "language": "python",
242 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
243 |   },
244 |   "language_info": {
245 |    "codemirror_mode": {
246 |     "name": "ipython",
247 |     "version": 3
248 |    },
249 |    "file_extension": ".py",
250 |    "mimetype": "text/x-python",
251 |    "name": "python",
252 |    "nbconvert_exporter": "python",
253 |    "pygments_lexer": "ipython3",
254 |    "version": "3.5.6"
255 |   },
256 |   "latex_envs": {
257 |    "LaTeX_envs_menu_present": true,
258 |    "autoclose": false,
259 |    "autocomplete": true,
260 |    "bibliofile": "biblio.bib",
261 |    "cite_by": "apalike",
262 |    "current_citInitial": 1,
263 |    "eqLabelWithNumbers": true,
264 |    "eqNumInitial": 1,
265 |    "hotkeys": {
266 |     "equation": "Ctrl-E",
267 |     "itemize": "Ctrl-I"
268 |    },
269 |    "labels_anchors": false,
270 |    "latex_user_defs": false,
271 |    "report_style_numbering": false,
272 |    "user_envs_cfg": false
273 |   },
274 |   "varInspector": {
275 |    "cols": {
276 |     "lenName": 16,
277 |     "lenType": 16,
278 |     "lenVar": 40
279 |    },
280 |    "kernels_config": {
281 |     "python": {
282 |      "delete_cmd_postfix": "",
283 |      "delete_cmd_prefix": "del ",
284 |      "library": "var_list.py",
285 |      "varRefreshCmd": "print(var_dic_list())"
286 |     },
287 |     "r": {
288 |      "delete_cmd_postfix": ") ",
289 |      "delete_cmd_prefix": "rm(",
290 |      "library": "var_list.r",
291 |      "varRefreshCmd": "cat(var_dic_list()) "
292 |     }
293 |    },
294 |    "types_to_exclude": [
295 |     "module",
296 |     "function",
297 |     "builtin_function_or_method",
298 |     "instance",
299 |     "_Feature"
300 |    ],
301 |    "window_display": false
302 |   }
303 |  },
304 |  "nbformat": 4,
305 |  "nbformat_minor": 2
306 | }
307 | 


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/ch08_CIFAR10_ResNet.iml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <module type="PYTHON_MODULE" version="4">
 3 |   <component name="NewModuleRootManager">
 4 |     <content url="file://$MODULE_DIR$" />
 5 |     <orderEntry type="jdk" jdkName="Python 3.7 (ch08_CIFAR10_ResNet)" jdkType="Python SDK" />
 6 |     <orderEntry type="sourceFolder" forTests="false" />
 7 |   </component>
 8 |   <component name="TestRunnerService">
 9 |     <option name="PROJECT_TEST_RUNNER" value="Unittests" />
10 |   </component>
11 | </module>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/copyright/profiles_settings.xml:
--------------------------------------------------------------------------------
1 | <component name="CopyrightManager">
2 |   <settings>
3 |     <LanguageOptions name="Python">
4 |       <option name="block" value="false" />
5 |     </LanguageOptions>
6 |   </settings>
7 | </component>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/dictionaries/mac.xml:
--------------------------------------------------------------------------------
1 | <component name="ProjectDictionaryState">
2 |   <dictionary name="mac" />
3 | </component>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/inspectionProfiles/Project_Default.xml:
--------------------------------------------------------------------------------
 1 | <component name="InspectionProjectProfileManager">
 2 |   <profile version="1.0">
 3 |     <option name="myName" value="Project Default" />
 4 |     <inspection_tool class="SpellCheckingInspection" enabled="false" level="TYPO" enabled_by_default="false">
 5 |       <option name="processCode" value="true" />
 6 |       <option name="processLiterals" value="true" />
 7 |       <option name="processComments" value="true" />
 8 |     </inspection_tool>
 9 |   </profile>
10 | </component>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/misc.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="JavaScriptSettings">
4 |     <option name="languageLevel" value="ES6" />
5 |   </component>
6 |   <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.7 (ch08_CIFAR10_ResNet)" project-jdk-type="Python SDK" />
7 | </project>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/modules.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="ProjectModuleManager">
4 |     <modules>
5 |       <module fileurl="file://$PROJECT_DIR$/.idea/ch08_CIFAR10_ResNet.iml" filepath="$PROJECT_DIR$/.idea/ch08_CIFAR10_ResNet.iml" />
6 |     </modules>
7 |   </component>
8 | </project>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/vcs.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="VcsDirectoryMappings">
4 |     <mapping directory="$PROJECT_DIR$/.." vcs="Git" />
5 |   </component>
6 | </project>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/.idea/workspace.xml:
--------------------------------------------------------------------------------
  1 | <?xml version="1.0" encoding="UTF-8"?>
  2 | <project version="4">
  3 |   <component name="ChangeListManager">
  4 |     <list default="true" id="9e1566f7-b66e-4a35-8f35-9a308eafa47e" name="Default Changelist" comment="">
  5 |       <change afterPath="$PROJECT_DIR$/.idea/vcs.xml" afterDir="false" />
  6 |       <change afterPath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/.idea/vcs.xml" afterDir="false" />
  7 |       <change beforePath="$PROJECT_DIR$/.idea/ch08_CIFAR10_ResNet.iml" beforeDir="false" afterPath="$PROJECT_DIR$/.idea/ch08_CIFAR10_ResNet.iml" afterDir="false" />
  8 |       <change beforePath="$PROJECT_DIR$/.idea/misc.xml" beforeDir="false" afterPath="$PROJECT_DIR$/.idea/misc.xml" afterDir="false" />
  9 |       <change beforePath="$PROJECT_DIR$/.idea/workspace.xml" beforeDir="false" afterPath="$PROJECT_DIR$/.idea/workspace.xml" afterDir="false" />
 10 |       <change beforePath="$PROJECT_DIR$/LeNet5.py" beforeDir="false" afterPath="$PROJECT_DIR$/LeNet5.py" afterDir="false" />
 11 |       <change beforePath="$PROJECT_DIR$/ResNet.py" beforeDir="false" afterPath="$PROJECT_DIR$/ResNet.py" afterDir="false" />
 12 |       <change beforePath="$PROJECT_DIR$/main.py" beforeDir="false" afterPath="$PROJECT_DIR$/main.py" afterDir="false" />
 13 |       <change beforePath="$PROJECT_DIR$/../ch09_循环神经网络RNN&amp;LSTM/ch09_RNN.ipynb" beforeDir="false" afterPath="$PROJECT_DIR$/../ch09_循环神经网络RNN&amp;LSTM/ch09_RNN.ipynb" afterDir="false" />
 14 |       <change beforePath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/.idea/ch10_迁移学习-实战宝可梦精灵.iml" beforeDir="false" afterPath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/.idea/ch10_迁移学习-实战宝可梦精灵.iml" afterDir="false" />
 15 |       <change beforePath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/.idea/misc.xml" beforeDir="false" afterPath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/.idea/misc.xml" afterDir="false" />
 16 |       <change beforePath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/.idea/workspace.xml" beforeDir="false" afterPath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/.idea/workspace.xml" afterDir="false" />
 17 |       <change beforePath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/best.mdl" beforeDir="false" afterPath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/best.mdl" afterDir="false" />
 18 |       <change beforePath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/resnet.py" beforeDir="false" afterPath="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵/resnet.py" afterDir="false" />
 19 |     </list>
 20 |     <option name="EXCLUDED_CONVERTED_TO_IGNORED" value="true" />
 21 |     <option name="SHOW_DIALOG" value="false" />
 22 |     <option name="HIGHLIGHT_CONFLICTS" value="true" />
 23 |     <option name="HIGHLIGHT_NON_ACTIVE_CHANGELIST" value="false" />
 24 |     <option name="LAST_RESOLUTION" value="IGNORE" />
 25 |   </component>
 26 |   <component name="DatabaseView">
 27 |     <option name="SHOW_INTERMEDIATE" value="true" />
 28 |     <option name="GROUP_DATA_SOURCES" value="true" />
 29 |     <option name="GROUP_SCHEMA" value="true" />
 30 |     <option name="GROUP_CONTENTS" value="false" />
 31 |     <option name="SORT_POSITIONED" value="false" />
 32 |     <option name="SHOW_EMPTY_GROUPS" value="false" />
 33 |     <option name="AUTO_SCROLL_FROM_SOURCE" value="false" />
 34 |     <option name="HIDDEN_KINDS">
 35 |       <set />
 36 |     </option>
 37 |     <expand />
 38 |     <select />
 39 |   </component>
 40 |   <component name="FileEditorManager">
 41 |     <leaf SIDE_TABS_SIZE_LIMIT_KEY="450">
 42 |       <file pinned="false" current-in-tab="true">
 43 |         <entry file="file://$PROJECT_DIR$/main.py">
 44 |           <provider selected="true" editor-type-id="text-editor">
 45 |             <state relative-caret-position="472">
 46 |               <caret line="22" column="36" lean-forward="true" selection-start-line="22" selection-start-column="36" selection-end-line="22" selection-end-column="36" />
 47 |               <folding>
 48 |                 <element signature="e#0#12#0" expanded="true" />
 49 |               </folding>
 50 |             </state>
 51 |           </provider>
 52 |         </entry>
 53 |       </file>
 54 |       <file pinned="false" current-in-tab="false">
 55 |         <entry file="file://$PROJECT_DIR$/LeNet5.py">
 56 |           <provider selected="true" editor-type-id="text-editor">
 57 |             <state relative-caret-position="378">
 58 |               <caret line="20" selection-start-line="20" selection-end-line="20" />
 59 |               <folding>
 60 |                 <element signature="e#0#12#0" expanded="true" />
 61 |               </folding>
 62 |             </state>
 63 |           </provider>
 64 |         </entry>
 65 |       </file>
 66 |       <file pinned="false" current-in-tab="false">
 67 |         <entry file="file://$PROJECT_DIR$/ResNet.py">
 68 |           <provider selected="true" editor-type-id="text-editor">
 69 |             <state relative-caret-position="1533">
 70 |               <caret line="75" column="24" selection-start-line="75" selection-start-column="24" selection-end-line="75" selection-end-column="24" />
 71 |               <folding>
 72 |                 <element signature="e#0#12#0" expanded="true" />
 73 |               </folding>
 74 |             </state>
 75 |           </provider>
 76 |         </entry>
 77 |       </file>
 78 |     </leaf>
 79 |   </component>
 80 |   <component name="FileTemplateManagerImpl">
 81 |     <option name="RECENT_TEMPLATES">
 82 |       <list>
 83 |         <option value="Python Script" />
 84 |       </list>
 85 |     </option>
 86 |   </component>
 87 |   <component name="Git.Settings">
 88 |     <option name="RECENT_GIT_ROOT_PATH" value="$PROJECT_DIR$/.." />
 89 |   </component>
 90 |   <component name="IdeDocumentHistory">
 91 |     <option name="CHANGED_PATHS">
 92 |       <list>
 93 |         <option value="$PROJECT_DIR$/LeNet5.py" />
 94 |         <option value="$PROJECT_DIR$/ResNet.py" />
 95 |         <option value="$PROJECT_DIR$/main.py" />
 96 |       </list>
 97 |     </option>
 98 |   </component>
 99 |   <component name="ProjectFrameBounds" extendedState="6">
100 |     <option name="x" value="730" />
101 |     <option name="y" value="60" />
102 |     <option name="width" value="3225" />
103 |     <option name="height" value="1764" />
104 |   </component>
105 |   <component name="ProjectLevelVcsManager" settingsEditedManually="true" />
106 |   <component name="ProjectView">
107 |     <navigator proportions="" version="1">
108 |       <foldersAlwaysOnTop value="true" />
109 |     </navigator>
110 |     <panes>
111 |       <pane id="ProjectPane">
112 |         <subPane>
113 |           <expand>
114 |             <path>
115 |               <item name="ch08_CIFAR10_ResNet" type="b2602c69:ProjectViewProjectNode" />
116 |               <item name="ch08_CIFAR10_ResNet" type="462c0819:PsiDirectoryNode" />
117 |             </path>
118 |           </expand>
119 |           <select />
120 |         </subPane>
121 |       </pane>
122 |       <pane id="Scope" />
123 |     </panes>
124 |   </component>
125 |   <component name="PropertiesComponent">
126 |     <property name="SHARE_PROJECT_CONFIGURATION_FILES" value="true" />
127 |     <property name="WebServerToolWindowFactoryState" value="false" />
128 |     <property name="last_opened_file_path" value="$PROJECT_DIR$/../ch10_迁移学习-实战宝可梦精灵" />
129 |     <property name="nodejs_interpreter_path.stuck_in_default_project" value="undefined stuck path" />
130 |     <property name="nodejs_npm_path_reset_for_default_project" value="true" />
131 |     <property name="settings.editor.selected.configurable" value="editor.preferences.fonts.default" />
132 |   </component>
133 |   <component name="RunDashboard">
134 |     <option name="ruleStates">
135 |       <list>
136 |         <RuleState>
137 |           <option name="name" value="ConfigurationTypeDashboardGroupingRule" />
138 |         </RuleState>
139 |         <RuleState>
140 |           <option name="name" value="StatusDashboardGroupingRule" />
141 |         </RuleState>
142 |       </list>
143 |     </option>
144 |   </component>
145 |   <component name="RunManager" selected="Python.main">
146 |     <configuration name="LeNet5" type="PythonConfigurationType" factoryName="Python" temporary="true">
147 |       <module name="ch08_CIFAR10_ResNet" />
148 |       <option name="INTERPRETER_OPTIONS" value="" />
149 |       <option name="PARENT_ENVS" value="true" />
150 |       <envs>
151 |         <env name="PYTHONUNBUFFERED" value="1" />
152 |       </envs>
153 |       <option name="SDK_HOME" value="" />
154 |       <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
155 |       <option name="IS_MODULE_SDK" value="true" />
156 |       <option name="ADD_CONTENT_ROOTS" value="true" />
157 |       <option name="ADD_SOURCE_ROOTS" value="true" />
158 |       <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
159 |       <option name="SCRIPT_NAME" value="$PROJECT_DIR$/LeNet5.py" />
160 |       <option name="PARAMETERS" value="" />
161 |       <option name="SHOW_COMMAND_LINE" value="false" />
162 |       <option name="EMULATE_TERMINAL" value="false" />
163 |       <option name="MODULE_MODE" value="false" />
164 |       <option name="REDIRECT_INPUT" value="false" />
165 |       <option name="INPUT_FILE" value="" />
166 |       <method v="2" />
167 |     </configuration>
168 |     <configuration name="ResNet" type="PythonConfigurationType" factoryName="Python" temporary="true">
169 |       <module name="ch08_CIFAR10_ResNet" />
170 |       <option name="INTERPRETER_OPTIONS" value="" />
171 |       <option name="PARENT_ENVS" value="true" />
172 |       <envs>
173 |         <env name="PYTHONUNBUFFERED" value="1" />
174 |       </envs>
175 |       <option name="SDK_HOME" value="" />
176 |       <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
177 |       <option name="IS_MODULE_SDK" value="true" />
178 |       <option name="ADD_CONTENT_ROOTS" value="true" />
179 |       <option name="ADD_SOURCE_ROOTS" value="true" />
180 |       <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
181 |       <option name="SCRIPT_NAME" value="$PROJECT_DIR$/ResNet.py" />
182 |       <option name="PARAMETERS" value="" />
183 |       <option name="SHOW_COMMAND_LINE" value="false" />
184 |       <option name="EMULATE_TERMINAL" value="false" />
185 |       <option name="MODULE_MODE" value="false" />
186 |       <option name="REDIRECT_INPUT" value="false" />
187 |       <option name="INPUT_FILE" value="" />
188 |       <method v="2" />
189 |     </configuration>
190 |     <configuration name="main" type="PythonConfigurationType" factoryName="Python" temporary="true">
191 |       <module name="ch08_CIFAR10_ResNet" />
192 |       <option name="INTERPRETER_OPTIONS" value="" />
193 |       <option name="PARENT_ENVS" value="true" />
194 |       <envs>
195 |         <env name="PYTHONUNBUFFERED" value="1" />
196 |       </envs>
197 |       <option name="SDK_HOME" value="" />
198 |       <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
199 |       <option name="IS_MODULE_SDK" value="true" />
200 |       <option name="ADD_CONTENT_ROOTS" value="true" />
201 |       <option name="ADD_SOURCE_ROOTS" value="true" />
202 |       <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
203 |       <option name="SCRIPT_NAME" value="$PROJECT_DIR$/main.py" />
204 |       <option name="PARAMETERS" value="" />
205 |       <option name="SHOW_COMMAND_LINE" value="false" />
206 |       <option name="EMULATE_TERMINAL" value="false" />
207 |       <option name="MODULE_MODE" value="false" />
208 |       <option name="REDIRECT_INPUT" value="false" />
209 |       <option name="INPUT_FILE" value="" />
210 |       <method v="2" />
211 |     </configuration>
212 |     <recent_temporary>
213 |       <list>
214 |         <item itemvalue="Python.main" />
215 |         <item itemvalue="Python.ResNet" />
216 |         <item itemvalue="Python.LeNet5" />
217 |       </list>
218 |     </recent_temporary>
219 |   </component>
220 |   <component name="SvnConfiguration">
221 |     <configuration />
222 |   </component>
223 |   <component name="TaskManager">
224 |     <task active="true" id="Default" summary="Default task">
225 |       <changelist id="9e1566f7-b66e-4a35-8f35-9a308eafa47e" name="Default Changelist" comment="" />
226 |       <created>1595942750103</created>
227 |       <option name="number" value="Default" />
228 |       <option name="presentableId" value="Default" />
229 |       <updated>1595942750103</updated>
230 |       <workItem from="1595942752854" duration="13206000" />
231 |       <workItem from="1599728977086" duration="2782000" />
232 |       <workItem from="1599791083177" duration="229000" />
233 |       <workItem from="1599791323469" duration="118000" />
234 |       <workItem from="1599791466653" duration="261000" />
235 |       <workItem from="1599791742502" duration="1076000" />
236 |       <workItem from="1599802611598" duration="13219000" />
237 |       <workItem from="1599909125495" duration="1047000" />
238 |       <workItem from="1599916328645" duration="164000" />
239 |       <workItem from="1600173365219" duration="366000" />
240 |     </task>
241 |     <servers />
242 |   </component>
243 |   <component name="TimeTrackingManager">
244 |     <option name="totallyTimeSpent" value="32468000" />
245 |   </component>
246 |   <component name="TodoView">
247 |     <todo-panel id="selected-file">
248 |       <is-autoscroll-to-source value="true" />
249 |     </todo-panel>
250 |     <todo-panel id="all">
251 |       <are-packages-shown value="true" />
252 |       <is-autoscroll-to-source value="true" />
253 |     </todo-panel>
254 |   </component>
255 |   <component name="ToolWindowManager">
256 |     <frame x="-7" y="-7" width="2062" height="1126" extended-state="6" />
257 |     <editor active="true" />
258 |     <layout>
259 |       <window_info content_ui="combo" id="Project" order="0" sideWeight="0.49878934" visible="true" weight="0.15675403" />
260 |       <window_info id="Structure" order="1" sideWeight="0.50121063" side_tool="true" weight="0.26299506" />
261 |       <window_info id="Favorites" order="2" side_tool="true" />
262 |       <window_info anchor="bottom" id="Message" order="0" />
263 |       <window_info anchor="bottom" id="Find" order="1" />
264 |       <window_info anchor="bottom" id="Run" order="2" sideWeight="0.844254" weight="0.2952586" />
265 |       <window_info anchor="bottom" id="Debug" order="3" weight="0.4" />
266 |       <window_info anchor="bottom" id="Cvs" order="4" weight="0.25" />
267 |       <window_info anchor="bottom" id="Inspection" order="5" weight="0.4" />
268 |       <window_info anchor="bottom" id="TODO" order="6" sideWeight="0.49949595" weight="0.3297414" />
269 |       <window_info anchor="bottom" id="Docker" order="7" show_stripe_button="false" />
270 |       <window_info anchor="bottom" id="Version Control" order="8" sideWeight="0.6890121" weight="0.3297414" />
271 |       <window_info anchor="bottom" id="Database Changes" order="9" />
272 |       <window_info anchor="bottom" id="Event Log" order="10" sideWeight="0.15574597" side_tool="true" weight="0.19975787" />
273 |       <window_info anchor="bottom" id="Terminal" order="11" />
274 |       <window_info anchor="bottom" id="Python Console" order="12" />
275 |       <window_info anchor="right" id="Commander" internal_type="SLIDING" order="0" type="SLIDING" weight="0.4" />
276 |       <window_info anchor="right" id="Ant Build" order="1" weight="0.25" />
277 |       <window_info anchor="right" content_ui="combo" id="Hierarchy" order="2" weight="0.25" />
278 |       <window_info anchor="right" id="SciView" order="3" />
279 |       <window_info anchor="right" id="Database" order="4" weight="0.32941177" />
280 |     </layout>
281 |   </component>
282 |   <component name="TypeScriptGeneratedFilesManager">
283 |     <option name="version" value="1" />
284 |   </component>
285 |   <component name="Vcs.Log.History.Properties">
286 |     <option name="COLUMN_ORDER">
287 |       <list>
288 |         <option value="0" />
289 |         <option value="2" />
290 |         <option value="3" />
291 |         <option value="1" />
292 |       </list>
293 |     </option>
294 |   </component>
295 |   <component name="com.intellij.coverage.CoverageDataManagerImpl">
296 |     <SUITE FILE_PATH="coverage/ch08_CIFAR10_ResNet$ResNet.coverage" NAME="ResNet Coverage Results" MODIFIED="1599880752135" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
297 |     <SUITE FILE_PATH="coverage/ch08_CIFAR10_ResNet$main.coverage" NAME="main Coverage Results" MODIFIED="1599916442065" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
298 |     <SUITE FILE_PATH="coverage/ch08_CIFAR10_ResNet$LeNet5.coverage" NAME="LeNet5 Coverage Results" MODIFIED="1599802845478" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
299 |   </component>
300 |   <component name="editorHistoryManager">
301 |     <entry file="file://$PROJECT_DIR$/main.py">
302 |       <provider selected="true" editor-type-id="text-editor">
303 |         <state relative-caret-position="472">
304 |           <caret line="22" column="36" lean-forward="true" selection-start-line="22" selection-start-column="36" selection-end-line="22" selection-end-column="36" />
305 |           <folding>
306 |             <element signature="e#0#12#0" expanded="true" />
307 |           </folding>
308 |         </state>
309 |       </provider>
310 |     </entry>
311 |     <entry file="file://$PROJECT_DIR$/LeNet5.py">
312 |       <provider selected="true" editor-type-id="text-editor">
313 |         <state relative-caret-position="378">
314 |           <caret line="20" selection-start-line="20" selection-end-line="20" />
315 |           <folding>
316 |             <element signature="e#0#12#0" expanded="true" />
317 |           </folding>
318 |         </state>
319 |       </provider>
320 |     </entry>
321 |     <entry file="file://$PROJECT_DIR$/ResNet.py">
322 |       <provider selected="true" editor-type-id="text-editor">
323 |         <state relative-caret-position="1533">
324 |           <caret line="75" column="24" selection-start-line="75" selection-start-column="24" selection-end-line="75" selection-end-column="24" />
325 |           <folding>
326 |             <element signature="e#0#12#0" expanded="true" />
327 |           </folding>
328 |         </state>
329 |       </provider>
330 |     </entry>
331 |   </component>
332 |   <component name="masterDetails">
333 |     <states>
334 |       <state key="ScopeChooserConfigurable.UI">
335 |         <settings>
336 |           <splitter-proportions>
337 |             <option name="proportions">
338 |               <list>
339 |                 <option value="0.2" />
340 |               </list>
341 |             </option>
342 |           </splitter-proportions>
343 |         </settings>
344 |       </state>
345 |     </states>
346 |   </component>
347 | </project>


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/LeNet5.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn
 3 | from torch.nn import functional as F
 4 | 
 5 | 
 6 | class LeNet5(nn.Module):
 7 |     """
 8 |     for cifar10 dataset.
 9 |     """
10 | 
11 |     def __init__(self):
12 |         super(LeNet5, self).__init__()
13 | 
14 |         self.conv_unit = nn.Sequential(
15 |             # x: [b,3,32,32] -> [b,6,28,28]
16 |             nn.Conv2d(3, 6, kernel_size=5, stride=1, padding=0),
17 |             nn.AvgPool2d(kernel_size=2, stride=2, padding=0),
18 |             #
19 |             nn.Conv2d(6, 16, kernel_size=5, stride=1, padding=0),
20 |             nn.AvgPool2d(kernel_size=2, stride=2, padding=0),
21 | 
22 |         )
23 | 
24 |         # flatten
25 |         # fc unit
26 |         self.fc_unit = nn.Sequential(
27 |             nn.Linear(16 * 5 * 5, 120),
28 |             nn.ReLU(),
29 |             nn.Linear(120, 84),
30 |             nn.ReLU(),
31 |             nn.Linear(84, 10)
32 |         )
33 | 
34 |     def forward(self, x):
35 |         """
36 |         :param x: [b,3,32,32]
37 |         :return:
38 |         """
39 |         batch_size = x.size(0)  # size(0)返回[b,3,32,32]的b
40 |         # [b,3,32,32] -> [b,16,5,5]
41 |         x = self.conv_unit(x)
42 |         # [b,16,5,5] -> [b,16*6*6] Flatten
43 |         x = x.view(batch_size, 16 * 5 * 5)
44 |         # [b,16*5*5] -> [b,10]
45 |         logits = self.fc_unit(x)
46 | 
47 |         return logits
48 | 
49 | 
def main():
    """Smoke test: push a random [2, 3, 32, 32] batch through LeNet5 and print the output shape."""
    model = LeNet5()
    dummy_batch = torch.randn(2, 3, 32, 32)
    logits = model(dummy_batch)
    print('LeNet5 out: ', logits.shape)


# Run the smoke test only when this file is executed as a script.
if __name__ == '__main__':
    main()
59 | 


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/ResNet.py:
--------------------------------------------------------------------------------
  1 | import torch
  2 | from torch import nn
  3 | from torch.nn import functional as F
  4 | 
  5 | 
  6 | class ResBlock(nn.Module):
  7 |     """
  8 |     resnet block
  9 |     """
 10 | 
 11 |     def __init__(self, channel_in, channel_out, stride=1):
 12 |         """
 13 | 
 14 |         :param channel_in:
 15 |         :param channel_out:
 16 |         """
 17 |         super(ResBlock, self).__init__()
 18 |         self.conv1 = nn.Conv2d(channel_in, channel_out, kernel_size=3, stride=stride, padding=1)
 19 |         self.bn1 = nn.BatchNorm2d(channel_out)
 20 |         self.conv2 = nn.Conv2d(channel_out, channel_out, kernel_size=3, stride=1, padding=1)
 21 |         self.bn2 = nn.BatchNorm2d(channel_out)
 22 | 
 23 |         self.extra = nn.Sequential()
 24 | 
 25 |         if channel_out != channel_in:
 26 |             # [b,ch_in,h,w] -> [b,ch_out,h,w]
 27 |             self.extra = nn.Sequential(
 28 |                 nn.Conv2d(channel_in, channel_out, kernel_size=1, stride=stride),
 29 |                 nn.BatchNorm2d(channel_out)
 30 |             )
 31 | 
 32 |     def forward(self, x):
 33 |         """
 34 |         :param x: [b, ch, h, w]
 35 |         :return:
 36 |         """
 37 |         out = F.relu(self.bn1(self.conv1(x)))
 38 |         out = self.bn2(self.conv2(out))
 39 |         # short cut:
 40 |         # extra module : [b,ch_in,h,w] with [b,ch_out,h,w]
 41 |         # element - wise add
 42 |         out = self.extra(x) + out
 43 |         return out
 44 | 
 45 | 
 46 | class ResNet18(nn.Module):
 47 | 
 48 |     def __init__(self):
 49 |         super(ResNet18, self).__init__()
 50 | 
 51 |         self.conv1 = nn.Sequential(
 52 |             nn.Conv2d(3, 64, kernel_size=3, stride=3, padding=1),
 53 |             nn.BatchNorm2d(64)
 54 |         )
 55 |         # followed 4 blocks
 56 |         # [b,64,h,w] -> [b,128,h,w]
 57 |         self.blk1 = ResBlock(64, 128, stride=2)
 58 |         # [b,128,h,w] -> [b,256,h,w]
 59 |         self.blk2 = ResBlock(128, 256, stride=2)
 60 |         # [b,256,h,w] -> [b,512,h,w]
 61 |         self.blk3 = ResBlock(256, 512, stride=2)
 62 |         # [b,512,h,w] -> [b,1024,h,w]
 63 |         self.blk4 = ResBlock(512, 512, stride=2)
 64 | 
 65 |         self.outlayer = nn.Linear(512, 10)
 66 | 
 67 |     def forward(self, x):
 68 |         """
 69 | 
 70 |         :param x:
 71 |         :return:
 72 |         """
 73 |         x = F.relu(self.conv1(x))
 74 |         # [b,64,h,w] -> [b,1024,h,w]
 75 |         x = self.blk1(x)
 76 |         x = self.blk2(x)
 77 |         x = self.blk3(x)
 78 |         x = self.blk4(x)
 79 | 
 80 |         # print('after conv: ', x.shape)  # [b,512,2,2]
 81 |         # [b,512,h,w] -> [b,512,1,1]
 82 |         x = F.adaptive_avg_pool2d(x, [1, 1])
 83 |         # print('after adaptive_avg_pool2d: ', x.shape)
 84 |         x = x.view(x.size(0), -1)
 85 |         x = self.outlayer(x)
 86 | 
 87 |         return x
 88 | 
 89 | 
 90 | def main():
 91 |     blk = ResBlock(64, 128, stride=4)
 92 |     temp = torch.randn(2, 64, 32, 32)
 93 |     out = blk(temp)
 94 |     print('block: ', out.shape)
 95 | 
 96 |     x = torch.randn(2, 3, 32, 32)
 97 |     model = ResNet18()
 98 |     out = model(x)
 99 |     print('Resnet: ', out.shape)
100 | 
101 | 
102 | if __name__ == '__main__':
103 |     main()
104 | 


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/__pycache__/LeNet5.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch08_CIFAR10_ResNet/__pycache__/LeNet5.cpython-35.pyc


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/__pycache__/LeNet5.cpython-37.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch08_CIFAR10_ResNet/__pycache__/LeNet5.cpython-37.pyc


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/__pycache__/ResNet.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch08_CIFAR10_ResNet/__pycache__/ResNet.cpython-35.pyc


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/__pycache__/ResNet.cpython-37.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch08_CIFAR10_ResNet/__pycache__/ResNet.cpython-37.pyc


--------------------------------------------------------------------------------
/ch08_CIFAR10_ResNet/main.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn, optim
 3 | from torch.utils.data import DataLoader
 4 | from torchvision import datasets
 5 | from torchvision import transforms
 6 | 
 7 | from ResNet import ResNet18
 8 | # from LeNet5 import LeNet5
 9 | 
10 | 
def main():
    """
    Train ResNet18 on CIFAR-10 and print the test accuracy after every epoch.

    Downloads CIFAR-10 into ``../data/`` when it is not already there, trains
    for 100 epochs with Adam (lr=1e-3) and cross-entropy loss, and after each
    epoch prints the loss of the last training batch and the accuracy on the
    test split. Runs on CUDA when available, otherwise on the CPU.
    """
    batch_size = 32

    # Both splits use the same preprocessing, so build the pipeline once.
    transform = transforms.Compose([
        transforms.Resize((32, 32)),
        transforms.ToTensor(),
        transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
    ])

    cifar_train = datasets.CIFAR10('../data/', train=True, transform=transform, download=True)
    cifar_train = DataLoader(cifar_train, batch_size=batch_size, shuffle=True)

    cifar_test = datasets.CIFAR10('../data/', train=False, transform=transform, download=True)
    # Accuracy does not depend on sample order, so the test loader is not shuffled.
    cifar_test = DataLoader(cifar_test, batch_size=batch_size, shuffle=False)

    # Peek at one batch to show the tensor shapes.
    x, label = next(iter(cifar_train))
    print('x: ', x.shape, 'label: ', label.shape)

    # Fall back to the CPU instead of crashing on machines without CUDA.
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

    # model = LeNet5().to(device)
    model = ResNet18().to(device)

    criterion = nn.CrossEntropyLoss().to(device)  # applies softmax internally
    optimizer = optim.Adam(model.parameters(), lr=1e-3)
    print(model)

    for epoch in range(100):
        model.train()
        # The loop variable is deliberately not called batch_size, so the
        # batch-size setting above is not overwritten.
        for _batch_idx, (x, label) in enumerate(cifar_train):
            # x: [b, 3, 32, 32]  label: [b]
            x, label = x.to(device), label.to(device)
            logits = model(x)
            # logits: [b, 10]  label: [b]
            loss = criterion(logits, label)  # 0-dim scalar tensor

            # backprop
            optimizer.zero_grad()
            loss.backward()
            optimizer.step()

        # loss.item() turns the scalar tensor into a plain Python number;
        # this is the loss of the last batch of the epoch.
        print('epoch: ', epoch, '  loss:', loss.item())

        # test
        model.eval()
        with torch.no_grad():

            total_correct = 0
            total_num = 0
            for x, label in cifar_test:
                x, label = x.to(device), label.to(device)

                # logits: [b, 10]
                logits = model(x)
                # pred: [b]
                pred = logits.argmax(dim=1)
                # [b] vs [b] -> number of correct predictions in this batch
                total_correct += torch.eq(pred, label).float().sum().item()
                total_num += x.size(0)

            acc = total_correct / total_num
            print('acc: ', acc)


if __name__ == '__main__':
    main()
81 | 


--------------------------------------------------------------------------------
/ch09_循环神经网络RNN&LSTM/.ipynb_checkpoints/ch09_RNN-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# ch09_RNN"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "code",
 12 |    "execution_count": 3,
 13 |    "metadata": {},
 14 |    "outputs": [],
 15 |    "source": [
 16 |     "import torch\n",
 17 |     "from torch import nn"
 18 |    ]
 19 |   },
 20 |   {
 21 |    "cell_type": "markdown",
 22 |    "metadata": {},
 23 |    "source": [
 24 |     "## 9.1 实践序列表示方法\n",
 25 |     "#### word2vec v.s. GloVe"
 26 |    ]
 27 |   },
 28 |   {
 29 |    "cell_type": "code",
 30 |    "execution_count": 11,
 31 |    "metadata": {},
 32 |    "outputs": [
 33 |     {
 34 |      "name": "stdout",
 35 |      "output_type": "stream",
 36 |      "text": [
 37 |       "word2vec:\n",
 38 |       "tensor([[-0.7960,  0.5041, -0.6968, -0.1504,  0.5828]],\n",
 39 |       "       grad_fn=<EmbeddingBackward>)\n"
 40 |      ]
 41 |     }
 42 |    ],
 43 |    "source": [
 44 |     "word_to_ix = {\"hello\":0, \"world\":1}\n",
 45 |     "lookup_tensor = torch.tensor([word_to_ix[\"hello\"]],dtype=torch.long)\n",
 46 |     "embeds = nn.Embedding(2,5) # 2 words in vocab, 5 dimensional embeddings\n",
 47 |     "hello_embed = embeds(lookup_tensor)\n",
 48 |     "print('word2vec:')\n",
 49 |     "print(hello_embed)"
 50 |    ]
 51 |   },
 52 |   {
 53 |    "cell_type": "code",
 54 |    "execution_count": 12,
 55 |    "metadata": {},
 56 |    "outputs": [
 57 |     {
 58 |      "name": "stdout",
 59 |      "output_type": "stream",
 60 |      "text": [
 61 |       "tensor([[-0.0178,  1.4081, -0.5201,  0.9674,  1.0631]],\n",
 62 |       "       grad_fn=<EmbeddingBackward>)\n"
 63 |      ]
 64 |     }
 65 |    ],
 66 |    "source": [
 67 |     "from torchnlp.wor"
 68 |    ]
 69 |   },
 70 |   {
 71 |    "cell_type": "code",
 72 |    "execution_count": null,
 73 |    "metadata": {},
 74 |    "outputs": [],
 75 |    "source": []
 76 |   },
 77 |   {
 78 |    "cell_type": "code",
 79 |    "execution_count": null,
 80 |    "metadata": {},
 81 |    "outputs": [],
 82 |    "source": []
 83 |   }
 84 |  ],
 85 |  "metadata": {
 86 |   "kernelspec": {
 87 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
 88 |    "language": "python",
 89 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
 90 |   },
 91 |   "language_info": {
 92 |    "codemirror_mode": {
 93 |     "name": "ipython",
 94 |     "version": 3
 95 |    },
 96 |    "file_extension": ".py",
 97 |    "mimetype": "text/x-python",
 98 |    "name": "python",
 99 |    "nbconvert_exporter": "python",
100 |    "pygments_lexer": "ipython3",
101 |    "version": "3.5.6"
102 |   },
103 |   "latex_envs": {
104 |    "LaTeX_envs_menu_present": true,
105 |    "autoclose": false,
106 |    "autocomplete": true,
107 |    "bibliofile": "biblio.bib",
108 |    "cite_by": "apalike",
109 |    "current_citInitial": 1,
110 |    "eqLabelWithNumbers": true,
111 |    "eqNumInitial": 1,
112 |    "hotkeys": {
113 |     "equation": "Ctrl-E",
114 |     "itemize": "Ctrl-I"
115 |    },
116 |    "labels_anchors": false,
117 |    "latex_user_defs": false,
118 |    "report_style_numbering": false,
119 |    "user_envs_cfg": false
120 |   },
121 |   "varInspector": {
122 |    "cols": {
123 |     "lenName": 16,
124 |     "lenType": 16,
125 |     "lenVar": 40
126 |    },
127 |    "kernels_config": {
128 |     "python": {
129 |      "delete_cmd_postfix": "",
130 |      "delete_cmd_prefix": "del ",
131 |      "library": "var_list.py",
132 |      "varRefreshCmd": "print(var_dic_list())"
133 |     },
134 |     "r": {
135 |      "delete_cmd_postfix": ") ",
136 |      "delete_cmd_prefix": "rm(",
137 |      "library": "var_list.r",
138 |      "varRefreshCmd": "cat(var_dic_list()) "
139 |     }
140 |    },
141 |    "types_to_exclude": [
142 |     "module",
143 |     "function",
144 |     "builtin_function_or_method",
145 |     "instance",
146 |     "_Feature"
147 |    ],
148 |    "window_display": false
149 |   }
150 |  },
151 |  "nbformat": 4,
152 |  "nbformat_minor": 2
153 | }
154 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/.idea/ch10_迁移学习-实战宝可梦精灵.iml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <module type="PYTHON_MODULE" version="4">
 3 |   <component name="NewModuleRootManager">
 4 |     <content url="file://$MODULE_DIR$" />
 5 |     <orderEntry type="jdk" jdkName="Python 3.7 (ch08_CIFAR10_ResNet)" jdkType="Python SDK" />
 6 |     <orderEntry type="sourceFolder" forTests="false" />
 7 |   </component>
 8 |   <component name="TestRunnerService">
 9 |     <option name="projectConfiguration" value="pytest" />
10 |     <option name="PROJECT_TEST_RUNNER" value="pytest" />
11 |   </component>
12 | </module>


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/.idea/dictionaries/szz.xml:
--------------------------------------------------------------------------------
1 | <component name="ProjectDictionaryState">
2 |   <dictionary name="szz" />
3 | </component>


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/.idea/inspectionProfiles/Project_Default.xml:
--------------------------------------------------------------------------------
 1 | <component name="InspectionProjectProfileManager">
 2 |   <profile version="1.0">
 3 |     <option name="myName" value="Project Default" />
 4 |     <inspection_tool class="PyPep8Inspection" enabled="false" level="WEAK WARNING" enabled_by_default="false" />
 5 |     <inspection_tool class="PyPep8NamingInspection" enabled="false" level="WEAK WARNING" enabled_by_default="false" />
 6 |     <inspection_tool class="SpellCheckingInspection" enabled="false" level="TYPO" enabled_by_default="false">
 7 |       <option name="processCode" value="true" />
 8 |       <option name="processLiterals" value="true" />
 9 |       <option name="processComments" value="true" />
10 |     </inspection_tool>
11 |   </profile>
12 | </component>


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/.idea/misc.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="JavaScriptSettings">
4 |     <option name="languageLevel" value="ES6" />
5 |   </component>
6 |   <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.7 (ch08_CIFAR10_ResNet)" project-jdk-type="Python SDK" />
7 | </project>


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/.idea/modules.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="ProjectModuleManager">
4 |     <modules>
5 |       <module fileurl="file://$PROJECT_DIR$/.idea/ch10_迁移学习-实战宝可梦精灵.iml" filepath="$PROJECT_DIR$/.idea/ch10_迁移学习-实战宝可梦精灵.iml" />
6 |     </modules>
7 |   </component>
8 | </project>


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/.idea/vcs.xml:
--------------------------------------------------------------------------------
1 | <?xml version="1.0" encoding="UTF-8"?>
2 | <project version="4">
3 |   <component name="VcsDirectoryMappings">
4 |     <mapping directory="$PROJECT_DIR$/.." vcs="Git" />
5 |   </component>
6 | </project>


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/.ipynb_checkpoints/ch10_迁移学习-实战宝可梦精灵-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# ch10_迁移学习-实战宝可梦精灵"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "## 10.1 Pokemon数据集\n",
 15 |     "\n",
 16 |     "- 数据集内容:\n",
 17 |     " - 皮卡丘:234\n",
 18 |     " - 超梦:239\n",
 19 |     " - 杰尼龟:223\n",
 20 |     " - 小火龙:238\n",
 21 |     " - 妙蛙种子:234\n",
 22 |     "\n",
 23 |     "- 数据集划分:\n",
 24 |     " - Train 60%:138\n",
 25 |     " - Validation 20%:46\n",
 26 |     " - Test 20%:46\n",
 27 |     " "
 28 |    ]
 29 |   },
 30 |   {
 31 |    "cell_type": "markdown",
 32 |    "metadata": {},
 33 |    "source": [
 34 |     "### Steps:\n",
 35 |     "#### 1.Load data\n",
 36 |     "- Inherit from torch.utils.data.Dataset\n",
 37 |     "- \\_\\_len\\_\\_\n",
 38 |     "- \\_\\_getitem\\_\\_\n",
 39 |     " \n",
 40 |     " ```Python\n",
 41 |     "class NumbersDataset(Dataset):\n",
 42 |     "    def __init__(self,training=True):\n",
 43 |     "        if training:\n",
 44 |     "            self.samples = list(range(1,1001))\n",
 45 |     "        else:\n",
 46 |     "            self.samples = list(range(1001,1501))\n",
 47 |     "    \n",
 48 |     "    def __len__(self):\n",
 49 |     "        return len(self.samples)\n",
 50 |     "    \n",
 51 |     "    def __getitem__(self,idx):\n",
 52 |     "        return self.samples[idx]\n",
 53 |     "```\n",
 54 |     "- Preprocessing:\n",
 55 |     " - Image Resize \n",
 56 |     "   - 224x224 for ResNet18\n",
 57 |     " - Data Augmentation\n",
 58 |     "   - Rotate\n",
 59 |     "   - Crop\n",
 60 |     " - Normalize\n",
 61 |     "   - Mean,Std\n",
 62 |     " - ToTensor\n",
 63 |     " \n",
 64 |     "#### 2.Build model\n",
 65 |     "#### 3.Train and Test\n",
 66 |     "#### 4.Transfer Learning\n",
 67 |     "  \n",
 68 |     "  "
 69 |    ]
 70 |   },
 71 |   {
 72 |    "cell_type": "code",
 73 |    "execution_count": null,
 74 |    "metadata": {},
 75 |    "outputs": [],
 76 |    "source": []
 77 |   }
 78 |  ],
 79 |  "metadata": {
 80 |   "kernelspec": {
 81 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
 82 |    "language": "python",
 83 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
 84 |   },
 85 |   "language_info": {
 86 |    "codemirror_mode": {
 87 |     "name": "ipython",
 88 |     "version": 3
 89 |    },
 90 |    "file_extension": ".py",
 91 |    "mimetype": "text/x-python",
 92 |    "name": "python",
 93 |    "nbconvert_exporter": "python",
 94 |    "pygments_lexer": "ipython3",
 95 |    "version": "3.5.6"
 96 |   },
 97 |   "latex_envs": {
 98 |    "LaTeX_envs_menu_present": true,
 99 |    "autoclose": false,
100 |    "autocomplete": true,
101 |    "bibliofile": "biblio.bib",
102 |    "cite_by": "apalike",
103 |    "current_citInitial": 1,
104 |    "eqLabelWithNumbers": true,
105 |    "eqNumInitial": 1,
106 |    "hotkeys": {
107 |     "equation": "Ctrl-E",
108 |     "itemize": "Ctrl-I"
109 |    },
110 |    "labels_anchors": false,
111 |    "latex_user_defs": false,
112 |    "report_style_numbering": false,
113 |    "user_envs_cfg": false
114 |   },
115 |   "varInspector": {
116 |    "cols": {
117 |     "lenName": 16,
118 |     "lenType": 16,
119 |     "lenVar": 40
120 |    },
121 |    "kernels_config": {
122 |     "python": {
123 |      "delete_cmd_postfix": "",
124 |      "delete_cmd_prefix": "del ",
125 |      "library": "var_list.py",
126 |      "varRefreshCmd": "print(var_dic_list())"
127 |     },
128 |     "r": {
129 |      "delete_cmd_postfix": ") ",
130 |      "delete_cmd_prefix": "rm(",
131 |      "library": "var_list.r",
132 |      "varRefreshCmd": "cat(var_dic_list()) "
133 |     }
134 |    },
135 |    "types_to_exclude": [
136 |     "module",
137 |     "function",
138 |     "builtin_function_or_method",
139 |     "instance",
140 |     "_Feature"
141 |    ],
142 |    "window_display": false
143 |   }
144 |  },
145 |  "nbformat": 4,
146 |  "nbformat_minor": 2
147 | }
148 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/__pycache__/pokemon.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/__pycache__/pokemon.cpython-35.pyc


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/__pycache__/pokemon.cpython-37.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/__pycache__/pokemon.cpython-37.pyc


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/__pycache__/resnet.cpython-35.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/__pycache__/resnet.cpython-35.pyc


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/__pycache__/resnet.cpython-37.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/__pycache__/resnet.cpython-37.pyc


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/__pycache__/utils.cpython-37.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/__pycache__/utils.cpython-37.pyc


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/best.mdl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/best.mdl


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/best_for_scratch.mdl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/best_for_scratch.mdl


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/best_for_transfer.mdl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhuozhudd/PyTorch-Course-Note/152d79dc9c6b662f9461bcb06a8afc82dde726f4/ch10_迁移学习-实战宝可梦精灵/best_for_transfer.mdl


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/ch10_迁移学习-实战宝可梦精灵.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# ch10_迁移学习-实战宝可梦精灵"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "markdown",
 12 |    "metadata": {},
 13 |    "source": [
 14 |     "## 10.1 Pokemon数据集\n",
 15 |     "\n",
 16 |     "- 数据集内容:\n",
 17 |     " - 皮卡丘:234\n",
 18 |     " - 超梦:239\n",
 19 |     " - 杰尼龟:223\n",
 20 |     " - 小火龙:238\n",
 21 |     " - 妙蛙种子:234\n",
 22 |     "\n",
 23 |     "- 数据集划分:\n",
 24 |     " - Train 60%:138\n",
 25 |     " - Validation 20%:46\n",
 26 |     " - Test 20%:46\n",
 27 |     " "
 28 |    ]
 29 |   },
 30 |   {
 31 |    "cell_type": "markdown",
 32 |    "metadata": {},
 33 |    "source": [
 34 |     "### Steps:\n",
 35 |     "#### 1.Load data\n",
 36 |     "- Inherit from torch.utils.data.Dataset\n",
 37 |     "- \\_\\_len\\_\\_\n",
 38 |     "- \\_\\_getitem\\_\\_\n",
 39 |     " \n",
 40 |     " ```Python\n",
 41 |     "class NumbersDataset(Dataset):\n",
 42 |     "    def __init__(self,training=True):\n",
 43 |     "        if training:\n",
 44 |     "            self.samples = list(range(1,1001))\n",
 45 |     "        else:\n",
 46 |     "            self.samples = list(range(1001,1501))\n",
 47 |     "    \n",
 48 |     "    def __len__(self):\n",
 49 |     "        return len(self.samples)\n",
 50 |     "    \n",
 51 |     "    def __getitem__(self,idx):\n",
 52 |     "        return self.samples[idx]\n",
 53 |     "```\n",
 54 |     "- Preprocessing:\n",
 55 |     " - Image Resize \n",
 56 |     "   - 224x224 for ResNet18\n",
 57 |     " - Data Augmentation\n",
 58 |     "   - Rotate\n",
 59 |     "   - Crop\n",
 60 |     " - Normalize\n",
 61 |     "   - Mean,Std\n",
 62 |     " - ToTensor\n",
 63 |     " \n",
 64 |     "#### 2.Build model\n",
 65 |     "#### 3.Train and Test\n",
 66 |     "\n",
 67 |     "```Python\n",
 68 |     "for epoch in range(epochs):\n",
 69 |     "    train(train_db):\n",
 70 |     "        if epoch%10 == 0:\n",
 71 |     "            val_acc = evaluate(val_db)\n",
 72 |     "            if val_acc is the best:\n",
 73 |     "                save_checkpoint()\n",
 74 |     "            if out_of_patience():\n",
 75 |     "                break\n",
 76 |     "load_checkpoint()\n",
 77 |     "test_acc = evaluate(test_db)\n",
 78 |     "```\n",
 79 |     "\n",
 80 |     "\n",
 81 |     "#### 4.Transfer Learning\n",
 82 |     "  \n",
 83 |     "  "
 84 |    ]
 85 |   },
 86 |   {
 87 |    "cell_type": "code",
 88 |    "execution_count": 2,
 89 |    "metadata": {},
 90 |    "outputs": [],
 91 |    "source": [
 92 |     "import torch\n",
 93 |     "from torch import optim"
 94 |    ]
 95 |   },
 96 |   {
 97 |    "cell_type": "code",
 98 |    "execution_count": null,
 99 |    "metadata": {},
100 |    "outputs": [],
101 |    "source": [
102 |     "torch.optim.Adam()"
103 |    ]
104 |   }
105 |  ],
106 |  "metadata": {
107 |   "kernelspec": {
108 |    "display_name": "Python 3.5.6 64-bit ('base': conda)",
109 |    "language": "python",
110 |    "name": "python35664bitbaseconda34414b764a4544e4b3502fc9f239efc6"
111 |   },
112 |   "language_info": {
113 |    "codemirror_mode": {
114 |     "name": "ipython",
115 |     "version": 3
116 |    },
117 |    "file_extension": ".py",
118 |    "mimetype": "text/x-python",
119 |    "name": "python",
120 |    "nbconvert_exporter": "python",
121 |    "pygments_lexer": "ipython3",
122 |    "version": "3.5.6"
123 |   },
124 |   "latex_envs": {
125 |    "LaTeX_envs_menu_present": true,
126 |    "autoclose": false,
127 |    "autocomplete": true,
128 |    "bibliofile": "biblio.bib",
129 |    "cite_by": "apalike",
130 |    "current_citInitial": 1,
131 |    "eqLabelWithNumbers": true,
132 |    "eqNumInitial": 1,
133 |    "hotkeys": {
134 |     "equation": "Ctrl-E",
135 |     "itemize": "Ctrl-I"
136 |    },
137 |    "labels_anchors": false,
138 |    "latex_user_defs": false,
139 |    "report_style_numbering": false,
140 |    "user_envs_cfg": false
141 |   },
142 |   "varInspector": {
143 |    "cols": {
144 |     "lenName": 16,
145 |     "lenType": 16,
146 |     "lenVar": 40
147 |    },
148 |    "kernels_config": {
149 |     "python": {
150 |      "delete_cmd_postfix": "",
151 |      "delete_cmd_prefix": "del ",
152 |      "library": "var_list.py",
153 |      "varRefreshCmd": "print(var_dic_list())"
154 |     },
155 |     "r": {
156 |      "delete_cmd_postfix": ") ",
157 |      "delete_cmd_prefix": "rm(",
158 |      "library": "var_list.r",
159 |      "varRefreshCmd": "cat(var_dic_list()) "
160 |     }
161 |    },
162 |    "types_to_exclude": [
163 |     "module",
164 |     "function",
165 |     "builtin_function_or_method",
166 |     "instance",
167 |     "_Feature"
168 |    ],
169 |    "window_display": false
170 |   }
171 |  },
172 |  "nbformat": 4,
173 |  "nbformat_minor": 2
174 | }
175 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/pokemon.py:
--------------------------------------------------------------------------------
  1 | import csv
  2 | import glob
  3 | import os
  4 | import random
  5 | import time
  6 | 
  7 | import torch
  8 | import torchvision
  9 | import visdom
 10 | from PIL import Image
 11 | from torch.utils.data import Dataset, DataLoader
 12 | from torchvision import transforms
 13 | 
 14 | 
 15 | class Pokemon(Dataset):
 16 |     def __init__(self, root, resize, mode):
 17 |         super(Pokemon, self).__init__()
 18 | 
 19 |         self.root = root
 20 |         self.resize = resize
 21 | 
 22 |         self.name2label = {}
 23 |         for name in sorted(os.listdir(os.path.join(root))):
 24 |             if not os.path.isdir(os.path.join(root, name)):
 25 |                 continue
 26 |             self.name2label[name] = len(self.name2label.keys())
 27 | 
 28 |         # print(self.name2label)
 29 |         # image <-> label
 30 |         self.images, self.labels = self.load_csv('images.csv')
 31 | 
 32 |         # 划分数据
 33 |         if mode == 'train':  # train 60% : 0~60%
 34 |             self.images = self.images[:int(0.6 * len(self.images))]
 35 |             self.labels = self.labels[:int(0.6 * len(self.labels))]
 36 | 
 37 |         elif mode == 'val':  # val 20% : 60%~80%
 38 |             self.images = self.images[int(0.6 * len(self.images)):int(0.8 * len(self.images))]
 39 |             self.labels = self.labels[int(0.6 * len(self.labels)):int(0.8 * len(self.labels))]
 40 | 
 41 |         else:  # test 20% : 80%~100%
 42 |             self.images = self.images[int(0.8 * len(self.images)):]
 43 |             self.labels = self.labels[int(0.8 * len(self.labels)):]
 44 | 
 45 |     def load_csv(self, filename):
 46 | 
 47 |         if not os.path.exists(os.path.join(self.root, filename)):
 48 |             images = []
 49 |             for name in self.name2label.keys():
 50 |                 # 'pokemon\\mewtwo\\00001.png'
 51 |                 images += glob.glob(os.path.join(self.root, name, '*.png'))
 52 |                 images += glob.glob(os.path.join(self.root, name, '*.jpg'))
 53 |                 images += glob.glob(os.path.join(self.root, name, '*.jpeg'))
 54 |             # 1165 '../data/pokemon/squirtle/00000170.png'
 55 |             print(len(images), images)
 56 | 
 57 |             random.shuffle(images)
 58 |             with open(os.path.join(self.root, filename), mode='w', newline='') as f:
 59 |                 writer = csv.writer(f)
 60 |                 for img in images:  # '../data/pokemon/squirtle/00000170.png'
 61 |                     name = img.split(os.sep)[-2]
 62 |                     label = self.name2label[name]
 63 |                     # '../data/pokemon/squirtle/00000170.png' , 4
 64 |                     writer.writerow([img, label])
 65 | 
 66 |                 print('writen into csv file:', filename)
 67 | 
 68 |         # read from csv file
 69 |         images, labels = [], []
 70 |         with open(os.path.join(self.root, filename)) as f:
 71 |             reader = csv.reader(f)
 72 |             for row in reader:
 73 |                 img, label = row
 74 |                 label = int(label)
 75 |                 images.append(img)
 76 |                 labels.append(label)
 77 | 
 78 |         assert len(images) == len(labels)
 79 |         return images, labels
 80 | 
 81 |     def __len__(self):
 82 |         return len(self.images)
 83 | 
 84 |     def denormalize(self, x_hat):
 85 |         # 由于visdom接收的图片是0～1，正则化后是-1~1，显示效果不好，所以显示时需要denormalize
 86 |         mean = [0.485, 0.456, 0.406]
 87 |         std = [0.229, 0.224, 0.225]
 88 |         # x_hat = (x-mean)/std
 89 |         # x:[c,h,w]  mean:[3] -> [3,1,1] -> broadcast
 90 |         mean = torch.tensor(mean).unsqueeze(1).unsqueeze(1)
 91 |         std = torch.tensor(std).unsqueeze(1).unsqueeze(1)
 92 |         x = x_hat * std + mean
 93 |         return x
 94 | 
 95 |     def __getitem__(self, idx):
 96 |         # idx : [0~len(images)]
 97 |         # 这里的img只是一个路径
 98 |         img, label = self.images[idx], self.labels[idx]
 99 |         tf = transforms.Compose([
100 |             lambda x: Image.open(x).convert('RGB'),  # 把路径转换为RGB图
101 |             transforms.Resize((int(self.resize * 1.25), int(self.resize * 1.25))),
102 |             transforms.RandomRotation(15),  # 旋转15度
103 |             transforms.CenterCrop(self.resize),  # 中心裁剪
104 |             transforms.ToTensor(),
105 |             transforms.Normalize(mean=[0.485, 0.456, 0.406],
106 |                                  std=[0.229, 0.224, 0.225])
107 |         ])
108 |         img = tf(img)
109 |         label = torch.tensor(label)  # 将label转换为tensor
110 |         return img, label
111 | 
112 | 
def main():
    """Show one training sample, then successive shuffled batches, in visdom."""
    board = visdom.Visdom()

    dataset = Pokemon('../data/pokemon', 224, 'train')
    sample_x, sample_y = next(iter(dataset))
    print('sample: ', sample_x.shape, sample_y.shape, sample_y)
    board.image(dataset.denormalize(sample_x), win='sample_x', opts={'title': 'sample_x'})

    # With batching, every iteration yields 32 images.
    batches = DataLoader(dataset, batch_size=32, shuffle=True)
    for batch_x, batch_y in batches:
        board.images(dataset.denormalize(batch_x), nrow=8, win='batch', opts={'title': 'batch'})
        board.text(str(batch_y.numpy()), win='label', opts={'title': 'batch-y'})
        # Pause so each batch stays visible before it is replaced.
        time.sleep(10)


if __name__ == '__main__':
    main()
131 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/pokemon_useAPI.py:
--------------------------------------------------------------------------------
 1 | import time
 2 | 
 3 | import torchvision
 4 | import visdom
 5 | from torch.utils.data import DataLoader
 6 | from torchvision import transforms
 7 | 
 8 | 
 9 | def main():
10 |     viz = visdom.Visdom()
11 | 
12 |     tf = transforms.Compose([
13 |         transforms.Resize((64, 64)),
14 |         transforms.ToTensor()
15 |     ])
16 |     db = torchvision.datasets.ImageFolder(root='../data/pokemon', transform=tf)
17 | 
18 |     # num_workers=8 8线程加速，让batch_size过大时可以使用
19 |     loader = DataLoader(db, batch_size=32, shuffle=True)
20 |     # num_workers=8 8线程加速，让batch_size过大时可以使用
21 |     # loader = DataLoader(db, batch_size=32, shuffle=True, num_workers=8)
22 | 
23 |     print(db.class_to_idx)  # name2label信息
24 | 
25 |     # 批处理后，每次读取32张图
26 |     for x, y in loader:
27 |         viz.images(x, nrow=8, win='batch', opts=dict(title='batch'))
28 |         viz.text(str(y.numpy()), win='label', opts=dict(title='batch-y'))
29 |         time.sleep(10)
30 |         print('one batch')
31 | 
32 | 
33 | if __name__ == '__main__':
34 |     main()
35 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/resnet.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn
 3 | from torch.nn import functional as F
 4 | 
 5 | 
 6 | class ResBlock(nn.Module):
 7 |     """
 8 |     resnet block
 9 |     """
10 | 
11 |     def __init__(self, channel_in, channel_out, stride=1):
12 |         """
13 | 
14 |         :param channel_in:
15 |         :param channel_out:
16 |         """
17 |         super(ResBlock, self).__init__()
18 |         self.conv1 = nn.Conv2d(channel_in, channel_out, kernel_size=3, stride=stride, padding=1)
19 |         self.bn1 = nn.BatchNorm2d(channel_out)
20 |         self.conv2 = nn.Conv2d(channel_out, channel_out, kernel_size=3, stride=1, padding=1)
21 |         self.bn2 = nn.BatchNorm2d(channel_out)
22 | 
23 |         self.extra = nn.Sequential()
24 |         if channel_out != channel_in:
25 |             # [b,ch_in,h,w] -> [b,ch_out,h,w]
26 |             self.extra = nn.Sequential(
27 |                 nn.Conv2d(channel_in, channel_out, kernel_size=1, stride=stride),
28 |                 nn.BatchNorm2d(channel_out)
29 |             )
30 | 
31 |     def forward(self, x):
32 |         """
33 |         :param x: [b, ch, h, w]
34 |         :return:
35 |         """
36 |         out = F.relu(self.bn1(self.conv1(x)))
37 |         out = self.bn2(self.conv2(out))
38 |         # short cut:
39 |         # extra module : [b,ch_in,h,w] with [b,ch_out,h,w]
40 |         # element - wise add
41 |         out = self.extra(x) + out
42 |         out = F.relu(out)
43 |         return out
44 | 
45 | 
class ResNet18(nn.Module):
    """Small residual CNN: a stem convolution, four ``ResBlock`` stages and a
    linear classifier.

    For a 224x224 input the spatial size shrinks 224 -> 74 -> 25 -> 9 -> 5 -> 3,
    so the classifier sees a [b, 256, 3, 3] feature map.
    """

    def __init__(self, num_class):
        """
        :param num_class: number of output classes (size of the logits vector)
        """
        super(ResNet18, self).__init__()

        # Stem: [b, 3, h, w] -> [b, 16, h/3, w/3]
        self.conv1 = nn.Sequential(
            nn.Conv2d(3, 16, kernel_size=3, stride=3, padding=0),
            nn.BatchNorm2d(16)
        )
        # followed by 4 blocks; each one changes the channels and downsamples
        self.blk1 = ResBlock(16, 32, stride=3)    # [b,16,h,w]  -> [b,32,h/3,w/3]
        self.blk2 = ResBlock(32, 64, stride=3)    # [b,32,h,w]  -> [b,64,h/3,w/3]
        self.blk3 = ResBlock(64, 128, stride=2)   # [b,64,h,w]  -> [b,128,h/2,w/2]
        self.blk4 = ResBlock(128, 256, stride=2)  # [b,128,h,w] -> [b,256,h/2,w/2]

        # The classifier expects a flattened [b, 256, 3, 3] feature map.
        self.outlayer = nn.Linear(256 * 3 * 3, num_class)

    def forward(self, x):
        """
        :param x: image batch [b, 3, h, w]
        :return: class logits [b, num_class]
        """
        x = F.relu(self.conv1(x))
        # [b,16,h,w] -> [b,256,h',w']
        x = self.blk1(x)
        x = self.blk2(x)
        x = self.blk3(x)
        x = self.blk4(x)

        # Pool to the 3x3 map the classifier was sized for. For 224x224
        # inputs the map is already 3x3, so this is an identity there; for
        # other input sizes it keeps the Linear layer usable.
        x = F.adaptive_avg_pool2d(x, 3)
        x = x.view(x.size(0), -1)
        x = self.outlayer(x)

        return x
80 | 
81 | 
def main():
    """Smoke-test ``ResBlock`` and ``ResNet18`` on random inputs and print shapes."""
    block = ResBlock(64, 128)
    block_out = block(torch.randn(2, 64, 224, 224))
    print('block: ', block_out.shape)

    net = ResNet18(5)  # 5 classes
    logits = net(torch.randn(2, 3, 224, 224))
    print('resnet:', logits.shape)

    # Total number of scalar parameters in the model.
    n_params = sum(param.numel() for param in net.parameters())
    print('parameters size: ', n_params)


if __name__ == '__main__':
    main()
99 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/train_scratch.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import optim, nn
 3 | from torch.utils.data import DataLoader
 4 | import visdom
 5 | from pokemon import Pokemon
 6 | from resnet import ResNet18
 7 | 
 8 | batch_size = 256
 9 | lr = 1e-3
10 | epoches = 10
11 | 
12 | device = torch.device('cuda')
13 | torch.manual_seed(1234)
14 | 
15 | train_db = Pokemon('../data/pokemon', 224, mode='train')
16 | val_db = Pokemon('../data/pokemon', 224, mode='val')
17 | test_db = Pokemon('../data/pokemon', 224, mode='test')
18 | train_loader = DataLoader(train_db, batch_size=batch_size, shuffle=True, num_workers=4)
19 | val_loader = DataLoader(val_db, batch_size=batch_size, num_workers=2)
20 | test_loader = DataLoader(test_db, batch_size=batch_size, num_workers=2)
21 | 
22 | viz = visdom.Visdom()
23 | 
24 | 
def evalute(model, loader):
    """Return the classification accuracy of ``model`` over all samples of ``loader``.

    The model is switched to eval mode for the duration of the call, so
    BatchNorm uses its running statistics and is not updated by validation
    data. The previous train/eval mode is restored before returning.

    :param model: network mapping an image batch to logits ``[b, num_class]``
    :param loader: DataLoader yielding ``(x, y)`` batches
    :return: fraction of correctly classified samples in ``[0, 1]``;
        ``0.0`` for an empty dataset
    """
    total = len(loader.dataset)
    if total == 0:
        # Nothing to evaluate; avoid dividing by zero.
        return 0.0

    was_training = model.training
    model.eval()
    correct = 0
    try:
        with torch.no_grad():
            for x, y in loader:
                x, y = x.to(device), y.to(device)
                pred = model(x).argmax(dim=1)
                correct += torch.eq(pred, y).sum().item()
    finally:
        # Hand the model back in the mode the caller had it in.
        model.train(was_training)
    return correct / total
35 | 
36 | 
def main():
    """Train ``ResNet18`` from scratch, keep the best-validation checkpoint
    and report its test accuracy.

    The loss is plotted after every optimisation step and the validation
    accuracy after every epoch (visdom windows ``loss`` and ``val_acc``).
    """
    model = ResNet18(5).to(device)
    optimizer = optim.Adam(model.parameters(), lr=lr)
    criterion = nn.CrossEntropyLoss()

    # Start below any reachable accuracy so the first validation always
    # writes a checkpoint; otherwise the load below could hit a missing or
    # stale file when the accuracy never rises above 0.
    best_acc, best_epoch = -1.0, 0
    global_step = 0
    viz.line([0], [-1], win='loss', opts=dict(title='loss'))
    viz.line([0], [-1], win='val_acc', opts=dict(title='val_acc'))

    for epoch in range(epoches):
        # Make sure BatchNorm is in training mode for the epoch.
        model.train()
        for step, (x, y) in enumerate(train_loader):
            # x: [b, 3, 224, 224], y: [b]
            x, y = x.to(device), y.to(device)
            logits = model(x)
            loss = criterion(logits, y)

            optimizer.zero_grad()
            loss.backward()
            optimizer.step()

            viz.line([loss.item()], [global_step], win='loss', update='append')
            global_step += 1

        # validation (every epoch; raise the modulus to validate less often)
        if epoch % 1 == 0:
            val_acc = evalute(model, val_loader)
            if val_acc > best_acc:
                best_epoch = epoch
                best_acc = val_acc
                torch.save(model.state_dict(), 'best_for_scratch.mdl')  # save the model

            # Plot every validation result, not only the improvements, so
            # the curve also shows plateaus and regressions.
            viz.line([val_acc], [global_step], win='val_acc', update='append')

    print('best acc: ', best_acc, ' best epoch: ', best_epoch)
    model.load_state_dict(torch.load('best_for_scratch.mdl', map_location=device))
    print('loader from ckpt!')

    test_acc = evalute(model, test_loader)
    print('test acc:', test_acc)


if __name__ == '__main__':
    main()
81 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/train_transfer.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | import visdom
 3 | from torch import optim, nn
 4 | from torch.utils.data import DataLoader
 5 | from torchvision.models import resnet18
 6 | 
 7 | from pokemon import Pokemon
 8 | from utils import Flatten
 9 | 
10 | # torchvision中的resnet18自带已经训练好的权重
11 | # from resnet import ResNet18
12 | 
13 | 
# Training hyper-parameters.
batch_size = 32
lr = 1e-3
epoches = 10

# Prefer the GPU, but fall back to the CPU so the script still runs on
# machines without CUDA instead of failing at the first .to(device).
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
torch.manual_seed(1234)

# Train / validation / test splits of the same image folder, resized to 224.
train_db = Pokemon('../data/pokemon', 224, mode='train')
val_db = Pokemon('../data/pokemon', 224, mode='val')
test_db = Pokemon('../data/pokemon', 224, mode='test')
# Only the training data is reshuffled every epoch.
train_loader = DataLoader(train_db, batch_size=batch_size, shuffle=True, num_workers=4)
val_loader = DataLoader(val_db, batch_size=batch_size, num_workers=2)
test_loader = DataLoader(test_db, batch_size=batch_size, num_workers=2)

# visdom client used for the live loss / accuracy curves.
viz = visdom.Visdom()
29 | 
30 | 
def evalute(model, loader):
    """Return the classification accuracy of ``model`` over all samples of ``loader``.

    The model is switched to eval mode for the duration of the call, so
    BatchNorm uses its running statistics and is not updated by validation
    data. The previous train/eval mode is restored before returning.

    :param model: network mapping an image batch to logits ``[b, num_class]``
    :param loader: DataLoader yielding ``(x, y)`` batches
    :return: fraction of correctly classified samples in ``[0, 1]``;
        ``0.0`` for an empty dataset
    """
    total = len(loader.dataset)
    if total == 0:
        # Nothing to evaluate; avoid dividing by zero.
        return 0.0

    was_training = model.training
    model.eval()
    correct = 0
    try:
        with torch.no_grad():
            for x, y in loader:
                x, y = x.to(device), y.to(device)
                pred = model(x).argmax(dim=1)
                correct += torch.eq(pred, y).sum().item()
    finally:
        # Hand the model back in the mode the caller had it in.
        model.train(was_training)
    return correct / total
41 | 
42 | 
def main():
    """Fine-tune an ImageNet-pretrained torchvision ``resnet18`` on the 5
    Pokemon classes, keep the best-validation checkpoint and report its
    test accuracy.

    The loss is plotted after every optimisation step and the validation
    accuracy after every epoch (visdom windows ``loss`` and ``val_acc``).
    """
    trained_model = resnet18(pretrained=True)
    # Transfer learning: reuse every child module of the pretrained network
    # except the last one (its classifier), then attach a new 5-way head.
    # nn.Sequential takes the modules as separate arguments, hence the *.
    model = nn.Sequential(*list(trained_model.children())[:-1],
                          Flatten(),  # [b,512,1,1] -> [b,512]
                          nn.Linear(512, 5)
                          )
    model = model.to(device)

    optimizer = optim.Adam(model.parameters(), lr=lr)
    criterion = nn.CrossEntropyLoss()

    # Start below any reachable accuracy so the first validation always
    # writes a checkpoint; otherwise the load below could hit a missing or
    # stale file when the accuracy never rises above 0.
    best_acc, best_epoch = -1.0, 0
    global_step = 0

    viz.line([0], [-1], win='loss', opts=dict(title='loss'))
    viz.line([0], [-1], win='val_acc', opts=dict(title='val_acc'))

    for epoch in range(epoches):
        # Make sure BatchNorm is in training mode for the epoch.
        model.train()
        for step, (x, y) in enumerate(train_loader):
            # x: [b, 3, 224, 224], y: [b]
            x, y = x.to(device), y.to(device)
            logits = model(x)
            loss = criterion(logits, y)

            optimizer.zero_grad()
            loss.backward()
            optimizer.step()

            viz.line([loss.item()], [global_step], win='loss', update='append')
            global_step += 1

        # validation (every epoch; raise the modulus to validate less often)
        if epoch % 1 == 0:
            val_acc = evalute(model, val_loader)
            if val_acc > best_acc:
                best_epoch = epoch
                best_acc = val_acc
                torch.save(model.state_dict(), 'best_for_transfer.mdl')  # save the model

            # Plot every validation result, not only the improvements, so
            # the curve also shows plateaus and regressions.
            viz.line([val_acc], [global_step], win='val_acc', update='append')

    print('best acc: ', best_acc, ' best epoch: ', best_epoch)
    model.load_state_dict(torch.load('best_for_transfer.mdl', map_location=device))
    print('loader from ckpt!')

    test_acc = evalute(model, test_loader)
    print('test acc:', test_acc)


if __name__ == '__main__':
    main()
98 | 


--------------------------------------------------------------------------------
/ch10_迁移学习-实战宝可梦精灵/utils.py:
--------------------------------------------------------------------------------
 1 | import matplotlib.pyplot as plt
 2 | import torch
 3 | from torch import nn
 4 | 
 5 | 
 6 | class Flatten(nn.Module):
 7 |     def __init__(self):
 8 |         super(Flatten, self).__init__()
 9 | 
10 |     def forward(self, x):
11 |         shape = torch.prod(torch.tensor(x.shape[1:])).item()
12 |         return x.view(-1, shape)
13 | 
14 | 
def plot_image(img, label, name):
    """Show up to the first six images of a batch in a 2x3 grid.

    :param img: image batch indexed as ``img[i][0]`` (first channel of image i)
    :param label: per-image labels; ``label[i].item()`` is shown in the title
    :param name: prefix of every subplot title
    """
    plt.figure()
    # Do not index past the end when the batch holds fewer than six images.
    count = min(6, len(img), len(label))
    for i in range(count):
        plt.subplot(2, 3, i + 1)
        plt.tight_layout()
        # Undo the normalisation (x * 0.3081 + 0.1307) before displaying.
        # 'gray' is the valid colormap name; the former 'grapy' raised.
        plt.imshow(img[i][0] * 0.3081 + 0.1307, cmap='gray', interpolation='none')
        plt.title("{}: {}".format(name, label[i].item()))
        plt.xticks([])
        plt.yticks([])
    plt.show()


--------------------------------------------------------------------------------
/ch11_自编码器 Auto-Encoders/.idea/ch11_自编码器 Auto-Encoders.iml:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="UTF-8"?>
 2 | <module type="PYTHON_MODULE" version="4">
 3 |   <component name="NewModuleRootManager">
 4 |     <content url="file://$MODULE_DIR$" />
 5 |     <orderEntry type="jdk" jdkName="Python 3.7 (ch08_CIFAR10_ResNet)" jdkType="Python SDK" />
 6 |     <orderEntry type="sourceFolder" forTests="false" />
 7 |   </component>
 8 |   <component name="TestRunnerService">
 9 |     <option name="PROJECT_TEST_RUNNER" value="Unittests" />
10 |   </component>
11 | </module>


--------------------------------------------------------------------------------
/ch11_自编码器 Auto-Encoders/.ipynb_checkpoints/11 - Auto-Encoders-checkpoint.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# 11.1 - Auto-Encoder原理\n"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "attachments": {},
 12 |    "cell_type": "markdown",
 13 |    "metadata": {},
 14 |    "source": [
 15 |     "<img src=\"images/1.png\" style=\"zoom:70%\" />\n",
 16 |     "\n",
 17 |     "- 可以将目标输出当作自己本身\n",
 18 |     "- 可以把 Encoder+Code+Decoder 理解成一个神经网络\n",
 19 |     "- 从784维降维到2维，易于可视化\n",
 20 |     "\n",
 21 |     "<br><br>\n",
 22 |     "## How to Train?\n",
 23 |     "- loss function for **binary** inputs?\n",
 24 |     "$$ l \\space (f(x)) = - \\sum_k{x_k \\log(\\hat{x_k}) + (1-x_k) \\log (1-\\hat{x_k}) }$$\n",
 25 |     "Cross-Entropy error function (reconstruction loss)  $\\space \\space f(x) \\equiv \\hat{x}$\n",
 26 |     "<br>\n",
 27 |     "- Loss function for **real-valued** inputs\n",
 28 |     "$$l \\space (f(x)) = \\frac{1}{2} \\sum_k{ (\\hat{x_k} - x_k)^2}$$\n",
 29 |     " - sum of squared differences (reconstruction loss)\n",
 30 |     " - we use a linear activation function at the output\n",
 31 |     "\n",
 32 |     "<br><br>\n",
 33 |     "\n",
 34 |     "## PCA V.S. Auto-Encoders\n",
 35 |     "- PCA, which finds the directions of maximal variance in high-dimensional data, selects only those axes that have the largest variance.\n",
 36 |     "- The linearity of PCA, however, places significant limitations on the kinds of feature dimensions that can be extracted.\n",
 37 |     "<br><br>\n",
 38 |     "#### 降维后再重建的效果图\n",
 39 |     "<img src=\"images/2.png\" style=\"zoom:70%\" />\n",
 40 |     "\n",
 41 |     "<br><br>\n",
 42 |     "\n",
 43 |     "# 11.2 - Auto-Encoders变种\n",
 44 |     "\n",
 45 |     "## 变种一：Denoising AutoEncoders\n",
 46 |     "<img src=\"images/3.png\" style=\"zoom:70%\" />\n",
 47 |     "\n",
 48 |     "<br><br>\n",
 49 |     "## 变种二：Dropout Auto-Encoders\n",
 50 |     "<img src=\"images/4.png\" style=\"zoom:70%\" />\n",
 51 |     "\n",
 52 |     "<br><br>\n",
 53 |     "## 变种三：Adversarial AutoEncoders\n",
 54 |     "- Distribution of hidden code\n",
 55 |     "<img src=\"images/5.png\" style=\"zoom:70%\" />\n",
 56 |     "<br>\n",
 57 |     "- Give more details after GAN\n",
 58 |     "<img src=\"images/6.png\" style=\"zoom:70%\" />\n"
 59 |    ]
 60 |   },
 61 |   {
 62 |    "cell_type": "code",
 63 |    "execution_count": null,
 64 |    "metadata": {},
 65 |    "outputs": [],
 66 |    "source": []
 67 |   },
 68 |   {
 69 |    "cell_type": "code",
 70 |    "execution_count": null,
 71 |    "metadata": {},
 72 |    "outputs": [],
 73 |    "source": []
 74 |   },
 75 |   {
 76 |    "cell_type": "code",
 77 |    "execution_count": null,
 78 |    "metadata": {},
 79 |    "outputs": [],
 80 |    "source": []
 81 |   }
 82 |  ],
 83 |  "metadata": {
 84 |   "kernelspec": {
 85 |    "display_name": "Python 3",
 86 |    "language": "python",
 87 |    "name": "python3"
 88 |   },
 89 |   "language_info": {
 90 |    "codemirror_mode": {
 91 |     "name": "ipython",
 92 |     "version": 3
 93 |    },
 94 |    "file_extension": ".py",
 95 |    "mimetype": "text/x-python",
 96 |    "name": "python",
 97 |    "nbconvert_exporter": "python",
 98 |    "pygments_lexer": "ipython3",
 99 |    "version": "3.7.0"
100 |   },
101 |   "stem_cell": {
102 |    "cell_type": "raw",
103 |    "metadata": {
104 |     "pycharm": {
105 |      "metadata": false
106 |     }
107 |    },
108 |    "source": ""
109 |   },
110 |   "varInspector": {
111 |    "cols": {
112 |     "lenName": 16,
113 |     "lenType": 16,
114 |     "lenVar": 40
115 |    },
116 |    "kernels_config": {
117 |     "python": {
118 |      "delete_cmd_postfix": "",
119 |      "delete_cmd_prefix": "del ",
120 |      "library": "var_list.py",
121 |      "varRefreshCmd": "print(var_dic_list())"
122 |     },
123 |     "r": {
124 |      "delete_cmd_postfix": ") ",
125 |      "delete_cmd_prefix": "rm(",
126 |      "library": "var_list.r",
127 |      "varRefreshCmd": "cat(var_dic_list()) "
128 |     }
129 |    },
130 |    "types_to_exclude": [
131 |     "module",
132 |     "function",
133 |     "builtin_function_or_method",
134 |     "instance",
135 |     "_Feature"
136 |    ],
137 |    "window_display": false
138 |   }
139 |  },
140 |  "nbformat": 4,
141 |  "nbformat_minor": 1
142 | }
143 | 


--------------------------------------------------------------------------------
/ch11_自编码器 Auto-Encoders/11 - Auto-Encoders.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# 11.1 - Auto-Encoder原理\n"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "attachments": {},
 12 |    "cell_type": "markdown",
 13 |    "metadata": {},
 14 |    "source": [
 15 |     "<img src=\"images/1.png\" style=\"zoom:70%\" />\n",
 16 |     "\n",
 17 |     "- 可以将目标输出当作自己本身\n",
 18 |     "- 可以把 Encoder+Code+Decoder 理解成一个神经网络\n",
 19 |     "- 从784维降维到2维，易于可视化\n",
 20 |     "\n",
 21 |     "<br><br>\n",
 22 |     "## How to Train?\n",
 23 |     "- loss function for **binary** inputs?\n",
 24 |     "$$ l \\space (f(x)) = - \\sum_k{x_k \\log(\\hat{x_k}) + (1-x_k) \\log (1-\\hat{x_k}) }$$\n",
 25 |     "Cross-Entropy error function (reconstruction loss)  $\\space \\space f(x) \\equiv \\hat{x}$\n",
 26 |     "<br>\n",
 27 |     "- Loss function for **real-valued** inputs\n",
 28 |     "$$l \\space (f(x)) = \\frac{1}{2} \\sum_k{ (\\hat{x_k} - x_k)^2}$$\n",
 29 |     " - sum of squared differences (reconstruction loss)\n",
 30 |     " - we use a linear activation function at the output\n",
 31 |     "\n",
 32 |     "<br><br>\n",
 33 |     "\n",
 34 |     "## PCA V.S. Auto-Encoders\n",
 35 |     "- PCA, which finds the directions of maximal variance in high-dimensional data, selects only those axes that have the largest variance.\n",
 36 |     "- The linearity of PCA, however, places significant limitations on the kinds of feature dimensions that can be extracted.\n",
 37 |     "<br><br>\n",
 38 |     "#### 降维后再重建的效果图\n",
 39 |     "<img src=\"images/2.png\" style=\"zoom:70%\" />\n",
 40 |     "\n",
 41 |     "<br><br>\n",
 42 |     "\n",
 43 |     "# 11.2 - Auto-Encoders变种\n",
 44 |     "\n",
 45 |     "## 变种一：Denoising AutoEncoders\n",
 46 |     "<img src=\"images/3.png\" style=\"zoom:70%\" />\n",
 47 |     "\n",
 48 |     "<br><br>\n",
 49 |     "## 变种二：Dropout Auto-Encoders\n",
 50 |     "<img src=\"images/4.png\" style=\"zoom:70%\" />\n",
 51 |     "\n",
 52 |     "<br><br>\n",
 53 |     "## 变种三：Adversarial AutoEncoders\n",
 54 |     "- Distribution of hidden code\n",
 55 |     "<img src=\"images/5.png\" style=\"zoom:70%\" />\n",
 56 |     "<br>\n",
 57 |     "- Give more details after GAN\n",
 58 |     "<img src=\"images/6.png\" style=\"zoom:70%\" />\n"
 59 |    ]
 60 |   },
 61 |   {
 62 |    "cell_type": "code",
 63 |    "execution_count": null,
 64 |    "metadata": {},
 65 |    "outputs": [],
 66 |    "source": []
 67 |   },
 68 |   {
 69 |    "cell_type": "code",
 70 |    "execution_count": null,
 71 |    "metadata": {},
 72 |    "outputs": [],
 73 |    "source": []
 74 |   },
 75 |   {
 76 |    "cell_type": "code",
 77 |    "execution_count": null,
 78 |    "metadata": {},
 79 |    "outputs": [],
 80 |    "source": []
 81 |   }
 82 |  ],
 83 |  "metadata": {
 84 |   "kernelspec": {
 85 |    "display_name": "Python 3",
 86 |    "language": "python",
 87 |    "name": "python3"
 88 |   },
 89 |   "language_info": {
 90 |    "codemirror_mode": {
 91 |     "name": "ipython",
 92 |     "version": 3
 93 |    },
 94 |    "file_extension": ".py",
 95 |    "mimetype": "text/x-python",
 96 |    "name": "python",
 97 |    "nbconvert_exporter": "python",
 98 |    "pygments_lexer": "ipython3",
 99 |    "version": "3.7.0"
100 |   },
101 |   "stem_cell": {
102 |    "cell_type": "raw",
103 |    "metadata": {
104 |     "pycharm": {
105 |      "metadata": false
106 |     }
107 |    },
108 |    "source": ""
109 |   },
110 |   "varInspector": {
111 |    "cols": {
112 |     "lenName": 16,
113 |     "lenType": 16,
114 |     "lenVar": 40
115 |    },
116 |    "kernels_config": {
117 |     "python": {
118 |      "delete_cmd_postfix": "",
119 |      "delete_cmd_prefix": "del ",
120 |      "library": "var_list.py",
121 |      "varRefreshCmd": "print(var_dic_list())"
122 |     },
123 |     "r": {
124 |      "delete_cmd_postfix": ") ",
125 |      "delete_cmd_prefix": "rm(",
126 |      "library": "var_list.r",
127 |      "varRefreshCmd": "cat(var_dic_list()) "
128 |     }
129 |    },
130 |    "types_to_exclude": [
131 |     "module",
132 |     "function",
133 |     "builtin_function_or_method",
134 |     "instance",
135 |     "_Feature"
136 |    ],
137 |    "window_display": false
138 |   }
139 |  },
140 |  "nbformat": 4,
141 |  "nbformat_minor": 1
142 | }
143 | 


--------------------------------------------------------------------------------
/ch11_自编码器 Auto-Encoders/ae.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn
 3 | 
 4 | 
 5 | class AE(nn.Module):
 6 | 
 7 |     def __init__(self):
 8 |         super(AE, self).__init__()
 9 | 
10 |         # [b,784] -> [b,20]
11 |         self.encoder = nn.Sequential(
12 |             nn.Linear(784, 256),
13 |             nn.ReLU(),
14 |             nn.Linear(256, 64),
15 |             nn.ReLU(),
16 |             nn.Linear(64, 20),
17 |             nn.ReLU(),
18 |         )
19 |         # [b,20] -> [b,784]
20 |         self.decoder = nn.Sequential(
21 |             nn.Linear(20, 64),
22 |             nn.ReLU(),
23 |             nn.Linear(64, 256),
24 |             nn.ReLU(),
25 |             nn.Linear(256, 784),
26 |             nn.Sigmoid()
27 |         )
28 | 
29 |     def forward(self, x):
30 |         batch_size = x.size(0)
31 |         # flatten
32 |         x = x.view(batch_size, 784)
33 |         # encoder
34 |         x = self.encoder(x)
35 |         # decoder
36 |         x = self.decoder(x)
37 |         # reshape
38 |         x = x.view(batch_size, 1, 28, 28)
39 | 
40 |         return x
41 | 


--------------------------------------------------------------------------------
/ch11_自编码器 Auto-Encoders/ae_train.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch.utils.data import DataLoader
 3 | from torchvision import transforms, datasets
 4 | from torch import nn, optim
 5 | 
 6 | from ae import AE
 7 | from vae import VAE
 8 | import visdom
 9 | 
10 | 
11 | def main():
12 |     mnist_train = datasets.MNIST('./../data', train=True, transform=transforms.Compose([
13 |         transforms.ToTensor()
14 |     ]), download=False)
15 |     mnist_train = DataLoader(mnist_train, batch_size=128, shuffle=True)
16 | 
17 |     mnist_test = datasets.MNIST('../data', train=False, transform=transforms.Compose([
18 |         transforms.ToTensor()
19 |     ]), download=False)
20 |     mnist_test = DataLoader(mnist_test, batch_size=128, shuffle=False)
21 | 
22 |     # 无监督学习，不需要label
23 |     x, _ = iter(mnist_train).next()
24 |     print('x: ', x.shape)
25 | 
26 |     device = torch.device('cuda')
27 | 
28 |     # model = AE().to(device)
29 |     model = VAE().to(device)
30 | 
31 |     print(model)
32 |     criterion = nn.MSELoss()
33 |     optimizer = optim.Adam(model.parameters(), lr=1e-3)
34 | 
35 |     viz = visdom.Visdom()
36 | 
37 |     for epoch in range(100):
38 | 
39 |         for batchidx, (x, _) in enumerate(mnist_train):
40 |             # [b,1,28,28]
41 |             x = x.to(device)
42 | 
43 |             x_hat = model(x)
44 |             loss = criterion(x_hat, x)
45 | 
46 |             # backprop
47 |             optimizer.zero_grad()
48 |             loss.backward()
49 |             optimizer.step()
50 | 
51 |         print('epoch: ', epoch, '  loss:', loss.item())
52 | 
53 |         x, _ = iter(mnist_test).next()
54 |         x = x.to(device)
55 |         with torch.no_grad():
56 |             x_hat = model(x)
57 |         viz.images(x, nrow=8, win='x', opts=dict(title='x'))
58 |         viz.images(x_hat, nrow=8, win='x_hat', opts=dict(title='x_hat'))
59 | 
60 | 
61 | if __name__ == '__main__':
62 |     main()
63 | 


--------------------------------------------------------------------------------
/ch11_自编码器 Auto-Encoders/vae.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch import nn
 3 | import numpy as np
 4 | 
 5 | 
 6 | class VAE(nn.Module):
 7 | 
 8 |     def __init__(self):
 9 |         super(VAE, self).__init__()
10 | 
11 |         # [b,784] -> [b,20]
12 |         # u:[b,10] sigma:[b,10]
13 |         self.encoder = nn.Sequential(
14 |             nn.Linear(784, 256),
15 |             nn.ReLU(),
16 |             nn.Linear(256, 64),
17 |             nn.ReLU(),
18 |             nn.Linear(64, 20),
19 |             nn.ReLU(),
20 |         )
21 |         # [b,20] -> [b,784]
22 |         self.decoder = nn.Sequential(
23 |             nn.Linear(10, 64),
24 |             nn.ReLU(),
25 |             nn.Linear(64, 256),
26 |             nn.ReLU(),
27 |             nn.Linear(256, 784),
28 |             nn.Sigmoid()
29 |         )
30 |         self.criterion = nn.MSELoss()
31 | 
32 |     def forward(self, x):
33 |         batch_size = x.size(0)
34 |         # flatten
35 |         x = x.view(batch_size, 784)
36 |         # encoder
37 |         # [b,20] , including mean and sigma
38 |         h_ = self.encoder(x)
39 |         # [b,20] -> [b,10] and [b,10]
40 |         mu, sigma = h_.chunk(2, dim=1)
41 |         # reparametrize trick, epison~N(0,1)
42 |         h = mu + sigma * torch.randn_like(sigma)
43 |         # decoder
44 |         x_hat = self.decoder(h)
45 |         # reshape
46 |         x_hat = x_hat.view(batch_size, 1, 28, 28)
47 | 
48 |         # kl divergence
49 |         kld = 0.5 * torch.sum(
50 |             torch.pow(mu, 2) +
51 |             torch.pow(sigma, 2) -
52 |             torch.log(1e-8 + torch.pow(sigma, 2)) - 1
53 |         ) / (batch_size*28*28)
54 | 
55 |         return x_hat, kld
56 | 


--------------------------------------------------------------------------------
/ch11_自编码器 Auto-Encoders/vae_train.py:
--------------------------------------------------------------------------------
 1 | import torch
 2 | from torch.utils.data import DataLoader
 3 | from torchvision import transforms, datasets
 4 | from torch import nn, optim
 5 | 
 6 | from vae import VAE
 7 | import visdom
 8 | 
 9 | 
10 | def main():
11 |     mnist_train = datasets.MNIST('./../data', train=True, transform=transforms.Compose([
12 |         transforms.ToTensor()
13 |     ]), download=False)
14 |     mnist_train = DataLoader(mnist_train, batch_size=128, shuffle=True)
15 | 
16 |     mnist_test = datasets.MNIST('../data', train=False, transform=transforms.Compose([
17 |         transforms.ToTensor()
18 |     ]), download=False)
19 |     mnist_test = DataLoader(mnist_test, batch_size=128, shuffle=False)
20 | 
21 |     # 无监督学习，不需要label
22 |     x, _ = iter(mnist_train).next()
23 |     print('x: ', x.shape)
24 | 
25 |     device = torch.device('cuda')
26 | 
27 |     model = VAE().to(device)
28 | 
29 |     print(model)
30 |     criterion = nn.MSELoss()
31 |     optimizer = optim.Adam(model.parameters(), lr=1e-3)
32 | 
33 |     viz = visdom.Visdom()
34 | 
35 |     for epoch in range(100):
36 | 
37 |         for batchidx, (x, _) in enumerate(mnist_train):
38 |             # [b,1,28,28]
39 |             x = x.to(device)
40 | 
41 |             x_hat, kld = model(x)
42 |             loss = criterion(x_hat, x)
43 | 
44 |             if kld is not None:
45 |                 elbo = - loss - 1.0 * kld
46 |                 loss = - elbo
47 | 
48 |             # backprop
49 |             optimizer.zero_grad()
50 |             loss.backward()
51 |             optimizer.step()
52 | 
53 |         print('epoch: ', epoch, '  loss:', loss.item(), 'kld: ',kld.item())
54 | 
55 |         x, _ = iter(mnist_test).next()
56 |         x = x.to(device)
57 |         with torch.no_grad():
58 |             x_hat, kld = model(x)
59 |         viz.images(x, nrow=8, win='x', opts=dict(title='x'))
60 |         viz.images(x_hat, nrow=8, win='x_hat', opts=dict(title='x_hat'))
61 | 
62 | 
63 | if __name__ == '__main__':
64 |     main()
65 | 


--------------------------------------------------------------------------------