Training a Classifier with PyTorch

Posted on 2018-04-29 | Edited on 2018-05-23

We now know how to define a network, compute the loss, and update the network's weights.

What about data?

Generally, the data you work with will be images, text, audio, or video. Python has dedicated libraries for loading such data into NumPy arrays, which can then be converted to torch.Tensor.

  • For images, packages such as Pillow and OpenCV
  • For audio, packages such as SciPy and librosa
  • For text, either raw Python or Cython, or NLTK and spaCy

Specifically for vision, PyTorch has a dedicated package called torchvision. It provides data loaders for common datasets such as ImageNet, CIFAR-10, and MNIST, plus image transformations, through torchvision.datasets and torch.utils.data.DataLoader.

This is a huge convenience and avoids reinventing the wheel.

This post uses the CIFAR-10 dataset, which contains images of ten classes: airplane, automobile, bird, cat, deer, dog, frog, horse, ship, and truck. CIFAR-10 images are a uniform 32 x 32 in size, with three RGB channels.

[Image: sample CIFAR-10 images from each of the ten classes]

Training an image classifier

We need to do the following steps:

  1. Load and normalize the CIFAR-10 training and test sets using torchvision
  2. Define a convolutional neural network
  3. Define a loss function
  4. Train the network on the training data
  5. Test the network on the test data

1. Load and normalize CIFAR-10

import torch
import torchvision
import torchvision.transforms as transforms

torchvision datasets output PILImage images with pixel values in the range [0, 1]. We need to transform them into Tensors normalized to the range [-1, 1]; with mean 0.5 and std 0.5, Normalize maps each value x to (x - 0.5) / 0.5.
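A quick check of what that transform does to the value range (a throwaway sketch, not part of the tutorial flow):

norm = transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
black = torch.zeros(3, 2, 2)          # an all-black image in [0, 1]
white = torch.ones(3, 2, 2)           # an all-white image in [0, 1]
print(norm(black).min().item())       # -1.0
print(norm(white).max().item())       # 1.0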

transform = transforms.Compose(
    [transforms.ToTensor(),
     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])

trainset = torchvision.datasets.CIFAR10(root='./data', train=True,
                                        download=True,
                                        transform=transform)

trainloader = torch.utils.data.DataLoader(trainset, batch_size=4,
                                          shuffle=True,
                                          num_workers=2)

testset = torchvision.datasets.CIFAR10(root='./data', train=False,
                                       download=True,
                                       transform=transform)

testloader = torch.utils.data.DataLoader(testset, batch_size=4,
                                         shuffle=False, num_workers=2)

classes = ('plane', 'car', 'bird', 'cat', 'deer', 'dog', 'frog', 'horse', 'ship', 'truck')

OUT:

Files already downloaded and verified
Files already downloaded and verified

This data is normally downloaded from the internet, but I couldn't download it that way at all, so I got it from Kaggle instead and put it in the ./data folder.

Let's look at some of the images first.

import matplotlib.pyplot as plt
import numpy as np
%matplotlib inline

def imshow(img):
    img = img / 2 + 0.5      # un-normalize from [-1, 1] back to [0, 1]
    npimg = img.numpy()
    plt.imshow(np.transpose(npimg, (1, 2, 0)))

dataiter = iter(trainloader)
images, labels = next(dataiter)

imshow(torchvision.utils.make_grid(images))
print(" ".join('%5s' % classes[labels[j]] for j in range(4)))

OUT:

frog   dog   dog truck

[Image: a grid of the four training images shown above]

2. Define a convolutional neural network

Copy the convolutional neural network from the previous post and change the number of input channels to three.

import torch.nn as nn
import torch.nn.functional as F

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, 6, 5)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(6, 16, 5)
        self.fc1 = nn.Linear(16 * 5 * 5, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)

    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = x.view(-1, 16 * 5 * 5)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = self.fc3(x)
        return x

net = Net()

3. Define a loss function and optimizer

Use cross-entropy loss and SGD with momentum.

import torch.optim as optim

criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(net.parameters(), lr=0.001, momentum=0.9)

4. Train the network

This is when things start to get fun. We simply loop over the data, feed it to the network, and optimize.

for epoch in range(2):

    running_loss = 0.0
    for i, data in enumerate(trainloader, 0):
        inputs, labels = data
        optimizer.zero_grad()

        outputs = net(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        running_loss += loss.item()
        if i % 2000 == 1999:
            print('[%d, %5d] loss: %.3f' % (epoch + 1, i + 1, running_loss / 2000))
            running_loss = 0.0
print('Finished Training')
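At this point it is handy to save the trained weights so you don't have to retrain from scratch; a minimal sketch (the file name cifar_net.pth is just an example):

# save the learned parameters (state_dict) to disk
torch.save(net.state_dict(), './cifar_net.pth')

# later, restore them into a fresh instance of the same architecture
net = Net()
net.load_state_dict(torch.load('./cifar_net.pth'))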

5. Test the network on the test data

We have now trained the network for two passes over the training set, so we should check on the test set whether it has actually learned anything.

dataiter = iter(testloader)
images, labels = next(dataiter)

imshow(torchvision.utils.make_grid(images))
print('GroundTruth: ', ' '.join('%5s' % classes[labels[j]] for j in range(4)))

OUT:
GroundTruth: cat ship ship plane
[Image: a grid of the four test images shown above]

Let's see whether the neural network can recognize them.

outputs = net(images)

The outputs are scores for each of the 10 classes. The higher the score for a class, the more the network thinks the image belongs to that class.
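If you would rather see probabilities than raw scores, you can push the outputs through a softmax; a minimal sketch:

import torch.nn.functional as F

# convert the raw class scores into per-image probabilities that sum to 1
probs = F.softmax(outputs, dim=1)
print(probs.sum(dim=1))  # each row sums to 1.0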

_, predicted = torch.max(outputs, 1)
print('Predicted: ', ' '.join('%5s' % classes[predicted[j]]
                              for j in range(4)))

OUT:
Predicted: dog car truck ship

Well…

Let's take a rough look at how the network performs on each class.

class_correct = list(0. for i in range(10))
class_total = list(0. for i in range(10))
with torch.no_grad():
    for data in testloader:
        images, labels = data
        outputs = net(images)
        _, predicted = torch.max(outputs, 1)
        c = (predicted == labels).squeeze()
        for i in range(4):
            label = labels[i]
            class_correct[label] += c[i].item()
            class_total[label] += 1

for i in range(10):
    print('Accuracy of %5s : %2d %%' % (
        classes[i], 100 * class_correct[i] / class_total[i]))

OUT:
Accuracy of plane : 73 %
Accuracy of car : 44 %
Accuracy of bird : 45 %
Accuracy of cat : 32 %
Accuracy of deer : 26 %
Accuracy of dog : 42 %
Accuracy of frog : 61 %
Accuracy of horse : 75 %
Accuracy of ship : 43 %
Accuracy of truck : 78 %
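For a single headline number, we can also compute the overall accuracy across the whole test set; a minimal sketch in the same style as the loop above:

correct = 0
total = 0
with torch.no_grad():
    for data in testloader:
        images, labels = data
        outputs = net(images)
        _, predicted = torch.max(outputs, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print('Accuracy on the 10000 test images: %d %%' % (100 * correct / total))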

6. Training on the GPU

Well, uh, that's not happening for me: a GT740M just isn't supported…
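For reference, if a CUDA-capable GPU were available, moving the model and the data over would look roughly like this (a sketch of the usual pattern, untested here):

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# move the model's parameters and buffers to the GPU
net.to(device)

# inside the training loop, move each batch as well
inputs, labels = inputs.to(device), labels.to(device)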

Getting Familiar with Torch

Posted on 2018-04-28 | Edited on 2018-04-29
import torch
x = torch.randn(2, 3)
print(x)
x = ((x * 2) / (x - 1))
print(x)
print(x.requires_grad)

# requires_grad used to be a Variable setting; now it is set directly on the tensor
x.requires_grad_(True)
print(x.requires_grad)

y = (x * x).sum()

y.backward()
# y = sum(x^2)
# dy/dx = 2 * x
print(x.grad)
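Since y = sum(x^2), every entry of x.grad should equal 2 * x; a quick sanity check:

# compare the autograd result with the analytic derivative dy/dx = 2 * x
print(torch.allclose(x.grad, 2 * x))  # True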
a = torch.randn(2, 3)
print(a)
b = ((a * 2) / (a - 1))
print(b)
print("a grad is ", a.requires_grad)
print("b grad is ", b.requires_grad)
a.requires_grad_(True)
b.requires_grad_(True)
print("a grad is ", a.requires_grad)
print("b grad is ", b.requires_grad)

c = (b * b).sum()

c.backward()
# b = 2a / (a - 1)
# db/da = -2 / (a - 1)^2
# c = b^2
# dc/db = 2b
print("a_grad = ", a.grad)
print("b_grad = ", b.grad)
tensor([[ 1.3270, -2.5966, -0.1547],
        [ 0.3614,  1.0595,  0.8459]])
tensor([[  8.1156,   1.4439,   0.2679],
        [ -1.1320,  35.5890, -10.9797]])
a grad is  False
b grad is  False
a grad is  True
b grad is  True
a_grad =  None
b_grad =  tensor([[ 16.2312,   2.8879,   0.5359],
        [ -2.2639,  71.1781, -21.9595]])

Note that a_grad is None: b was computed while a still had requires_grad=False, so the graph from a to b was never recorded, and enabling requires_grad afterwards does not rebuild it. Only the path from b to c exists, which is why b.grad is filled in (dc/db = 2b).
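To get a.grad populated all the way back, enable requires_grad on a before building the graph; a minimal sketch:

a = torch.randn(2, 3, requires_grad=True)  # grad enabled before any ops
b = (a * 2) / (a - 1)                      # now recorded in the graph
c = (b * b).sum()
c.backward()
print(a.grad)                              # dc/da, no longer None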
a = torch.ones(2, 3) + 1
print(a)
b = ((a * 2) / (a - 1))
print(b)
print("a grad is ", a.requires_grad)
a.requires_grad_(True)
print("a grad is ", a.requires_grad)

b.backward()

print("a_grad = ", a.grad)
tensor([[ 2.,  2.,  2.],
        [ 2.,  2.,  2.]])
tensor([[ 4.,  4.,  4.],
        [ 4.,  4.,  4.]])
a grad is  False
a grad is  True



---------------------------------------------------------------------------

RuntimeError                              Traceback (most recent call last)

<ipython-input-31-b43c2a9b1b1c> in <module>()
     13 
     14 # c.backward()
---> 15 b.backward()
     16 # b = a*2/(a-1)
     17 #db/da = 2ln(a-1)

RuntimeError: element 0 of tensors does not require grad and does not have a grad_fn
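The error is exactly the problem from before: b was created from a tensor that did not require grad, so b has no grad_fn to backpropagate through, and calling requires_grad_ on a afterwards does not rebuild the graph. On top of that, backward() on a non-scalar tensor needs an explicit gradient argument. A version that works, with both fixes (a sketch):

a = torch.full((2, 3), 2.0, requires_grad=True)  # a leaf tensor of 2s, grad enabled from the start
b = (a * 2) / (a - 1)
b.backward(torch.ones_like(b))                   # non-scalar outputs need a gradient argument
print("a_grad = ", a.grad)                       # -2 / (a - 1)^2 = -2 everywhere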
x = torch.randn(3, requires_grad=True)

y = x * 2

# y.data.norm() computes the norm of y: raise every element to the p-th power,
# sum, then take the p-th root; p=2 by default
while y.data.norm() < 1000:
    y = y * 2

print(y)
gradients = torch.tensor([0.1, 1.0, 0.0001], dtype=torch.float)

# backward(gradients) computes a Jacobian-vector product: each element of x.grad
# is the matching element of gradients multiplied by dy/dx
y.backward(gradients)
print(x.grad)

print(x.requires_grad)
print((x ** 2).requires_grad)
with torch.no_grad():
    print((x ** 2).requires_grad)

print((x ** 2).requires_grad)
tensor([-571.8924,  188.2365, -904.6218])
tensor([  204.8000,  2048.0000,     0.2048])
True
True
False
True
import torch
import torch.nn as nn
import torch.nn.functional as F

class Net(nn.Module):
    # define a network
    def __init__(self):
        super(Net, self).__init__()

        # 1 input image channel, 6 output channels, 5x5 convolution kernel
        self.conv1 = nn.Conv2d(1, 6, 5)
        # 6 input channels, 16 output channels
        self.conv2 = nn.Conv2d(6, 16, 5)

        # an affine layer: y = Wx + b
        self.fc1 = nn.Linear(16 * 5 * 5, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)

    def forward(self, x):
        # max pooling over a 2x2 window
        x = F.max_pool2d(F.relu(self.conv1(x)), (2, 2))

        # if the pooling window is square, a single number is enough
        x = F.max_pool2d(F.relu(self.conv2(x)), 2)

        x = x.view(-1, self.num_flat_features(x))  # flatten the 16 5x5 feature maps into one 400-element vector per sample
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = self.fc3(x)
        return x

    def num_flat_features(self, x):
        size = x.size()[1:]  # product of all dimensions except the batch dimension; e.g. for 3x4x5x6 this returns 4*5*6 = 120
        num_features = 1
        for s in size:
            num_features *= s
        return num_features

net = Net()
print(net)
Net(
  (conv1): Conv2d(1, 6, kernel_size=(5, 5), stride=(1, 1))
  (conv2): Conv2d(6, 16, kernel_size=(5, 5), stride=(1, 1))
  (fc1): Linear(in_features=400, out_features=120, bias=True)
  (fc2): Linear(in_features=120, out_features=84, bias=True)
  (fc3): Linear(in_features=84, out_features=10, bias=True)
)
# inspect the parameters
params = list(net.parameters())
print(len(params))
print(params[2].size())
10
torch.Size([16, 6, 5, 5])

There are 10 parameter tensors because each of the five layers (conv1, conv2, fc1, fc2, fc3) has a weight and a bias; params[2] is conv2's weight, with shape [16, 6, 5, 5].
# feed in some data (a random 1x1x32x32 input)
input = torch.randn(1, 1, 32, 32)
out = net(input)
print(out)
tensor([[-0.0400,  0.0145, -0.0109, -0.0255,  0.0603,  0.0657, -0.0557,
         -0.0260,  0.0959,  0.1870]])
net.zero_grad()
out.backward(torch.randn(1, 10))
output = net(input)
target = torch.arange(1, 11, dtype=torch.float)  # a dummy target
target = target.view(1, -1)
criterion = nn.MSELoss()

loss = criterion(output, target)
print(loss)
tensor(37.9689)
print(loss.grad_fn)  # MSELoss
print(loss.grad_fn.next_functions[0][0])  # Linear (Addmm)
print(loss.grad_fn.next_functions[0][0].next_functions[0][0])  # the op feeding into Linear (here the bias Expand)
<MseLossBackward object at 0x00000275FF44FDA0>
<AddmmBackward object at 0x00000275FF44FBA8>
<ExpandBackward object at 0x00000275FF44FDA0>
net.zero_grad()
print(net.conv1.bias.grad)
loss.backward()
print(net.conv1.bias.grad)
tensor([ 0.,  0.,  0.,  0.,  0.,  0.])
tensor([-0.1013,  0.0209, -0.0838, -0.0878, -0.0151,  0.0398])
# manual SGD: nudge every parameter against its gradient
learning_rate = 0.01
for f in net.parameters():
    f.data.sub_(f.grad.data * learning_rate)
# use the built-in optimizer to update the weights
import torch.optim as optim

# create an optimizer
optimizer = optim.SGD(net.parameters(), lr=0.01)

# in the training loop:
optimizer.zero_grad()
output = net(input)
loss = criterion(output, target)
loss.backward()
optimizer.step()

Setting Up a Blog on GitHub

Posted on 2018-04-27 | Edited on 2018-12-25

Install Node.js

Install Git

Download and install Hexo

Add the NexT theme
