PyTorch -- MNIST Practice -- Clean Version

from __future__ import print_function
import os, sys, argparse
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import datasets, transforms
from torch.autograd import Variable

cuda = torch.cuda.is_available()

# Training settings
parse = argparse.ArgumentParser(description='PyTorch MNIST Example')
parse.add_argument('--batchSize', type=int, default=64, help='input batch size')
parse.add_argument('--testBatchSize', type=int, default=1000, help='input batch size for testing')
parse.add_argument('--trainSize', type=int, default=1000, help='input dataset size (max=60000). Default=1000')
parse.add_argument('--nEpochs', type=int, default=2, help='number of epochs to train')
parse.add_argument('--lr', type=float, default=0.01, help='learning rate. Default=0.01')
parse.add_argument('--momentum', type=float, default=0.5, help='SGD momentum. Default=0.5')
parse.add_argument('--seed', type=int, default=123, help='random seed to use. Default=123')
opt = parse.parse_args()
print(opt)

torch.manual_seed(opt.seed)
if cuda:
    torch.cuda.manual_seed(opt.seed)

print('Current path is:', sys.path[0])
if not os.path.exists('../data'):
    # the MNIST download step is omitted here (see note 2 below)
    print("Data path doesn't exist")

print('===> Loading data')
with open('../data/processed/training.pt', 'rb') as f:
    training_set = torch.load(f)
with open('../data/processed/test.pt', 'rb') as f:
    test_set = torch.load(f)

# reshape the raw images to 1x28x28 and scale pixel values to [0, 1]
training_data = training_set[0].view(-1, 1, 28, 28).float().div(255)
training_data = training_data[:opt.trainSize]
training_labels = training_set[1]
test_data = test_set[0].view(-1, 1, 28, 28).float().div(255)
test_labels = test_set[1]
del training_set
del test_set

# model
print('===> Building model')

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(1, 10, 5)
        self.pool1 = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(10, 20, 5)
        self.pool2 = nn.MaxPool2d(2, 2)
        self.fc1 = nn.Linear(320, 50)
        self.fc2 = nn.Linear(50, 10)
        self.relu = nn.ReLU()
        self.softmax = nn.LogSoftmax()

    def forward(self, x):
        x = self.relu(self.pool1(self.conv1(x)))
        x = self.relu(self.pool2(self.conv2(x)))
        # x.size() is now ([64, 20, 4, 4]): batchSize=64, channels=20, H=W=4
        x = x.view(-1, 320)
        x = self.relu(self.fc1(x))
        x = self.relu(self.fc2(x))
        return self.softmax(x)

model = Net()
if cuda:
    model.cuda()

criterion = nn.NLLLoss()
optimizer = optim.SGD(model.parameters(), lr=opt.lr, momentum=opt.momentum)

def train(epoch):
    # create buffers for one mini-batch
    batch_data = torch.FloatTensor(opt.batchSize, 1, 28, 28)
    batch_targets = torch.LongTensor(opt.batchSize)
    if cuda:
        batch_data, batch_targets = batch_data.cuda(), batch_targets.cuda()
    # create autograd Variables over these buffers
    batch_data, batch_targets = Variable(batch_data), Variable(batch_targets)
    for i in range(0, training_data.size(0) - opt.batchSize + 1, opt.batchSize):
        start, end = i, i + opt.batchSize
        optimizer.zero_grad()
        batch_data.data[:] = training_data[start:end]
        batch_targets.data[:] = training_labels[start:end]
        output = model(batch_data)
        loss = criterion(output, batch_targets)
        loss.backward()
        loss = loss.data[0]
        optimizer.step()
        print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.4f}'
              .format(epoch, end, opt.trainSize, float(end) / opt.trainSize * 100, loss))

def test(epoch):
    # create buffers for one mini-batch
    batch_data = torch.FloatTensor(opt.testBatchSize, 1, 28, 28)
    batch_targets = torch.LongTensor(opt.testBatchSize)
    if cuda:
        batch_data, batch_targets = batch_data.cuda(), batch_targets.cuda()
    # create autograd Variables over these buffers;
    # volatile=True marks them as inference-only, so no history is saved
    batch_data = Variable(batch_data, volatile=True)
    batch_targets = Variable(batch_targets, volatile=True)
    test_loss = 0
    correct = 0
    for i in range(0, test_data.size(0), opt.testBatchSize):
        batch_data.data[:] = test_data[i:i + opt.testBatchSize]
        batch_targets.data[:] = test_labels[i:i + opt.testBatchSize]
        output = model(batch_data)
        test_loss += criterion(output, batch_targets)
        # get the index of the max log-probability
        pred = output.data.max(1)[1]
        correct += pred.long().eq(batch_targets.data.long()).cpu().sum()
        print('correct =', correct)
    test_loss = test_loss.data[0]
    test_loss /= test_data.size(0) / opt.testBatchSize
    print('\nTest Set: Average loss: {:.4f}, Accuracy: {}/{} ({:.0f}%)\n'.format(
        test_loss, correct, test_data.size(0),
        float(correct) / test_data.size(0) * 100))

for epoch in range(1, opt.nEpochs + 1):
    train(epoch)
    test(epoch)

Notes:
1. Add a from __future__ import statement at the top of the code
Since Python 2.1, whenever a new Python feature is incompatible with older versions, it is disabled by default in the older interpreter. To opt in, you import it with this statement. For example, the one we use most often:
from __future__ import print_function
After adding this line under Python 2.7, we can use the Python 3 print function, and the code becomes more robust across versions.
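
For instance, a minimal sketch of what the import changes under Python 2.7 (the printed values are just placeholders):

from __future__ import print_function

# with the import, print is a function, exactly as in Python 3
print('loss:', 0.25)
# keyword arguments such as sep and end also become available
print('epoch', 1, sep=' = ')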

2. The MNIST download step is omitted here:

torch.utils.data.DataLoader(
    datasets.MNIST('../data', train=True, download=True))

The __init__() of the MNIST class in the torchvision code is:

def __init__(self, root, train=True, transform=None, target_transform=None, download=False):

Its parameters:
train: whether to load the training set (True) or the test set (False)
transform: a preprocessing transform applied to each image
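
Putting this together, a minimal sketch of the omitted download call (the ToTensor transform is my addition; the original script instead scales the pixels manually with div(255)):

import torch
from torchvision import datasets, transforms

# downloads MNIST into ../data on the first run, then just loads it
train_loader = torch.utils.data.DataLoader(
    datasets.MNIST('../data', train=True, download=True,
                   transform=transforms.ToTensor()),
    batch_size=64, shuffle=True)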
After downloading, my personal file structure is:
pytorch practise
├── data
│   ├── processed
│   └── raw
└── MNIST
    └── main.py

When loading the data above, adjust the paths to match your own directory layout. A better design would separate these parts into their own modules instead of writing everything in one Python file, as sketched below.
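
For example, a minimal sketch of such a split (the module name data.py and the function load_mnist are hypothetical, not from the original post):

# data.py -- hypothetical module; paths follow the directory structure above
import torch

def load_mnist(root='../data/processed', train_size=1000):
    # load the processed tensors and scale pixels to [0, 1],
    # the same preprocessing the main script applies inline
    with open(root + '/training.pt', 'rb') as f:
        images, labels = torch.load(f)
    data = images.view(-1, 1, 28, 28).float().div(255)
    return data[:train_size], labels[:train_size]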

3. Using view to reshape the input data
x = torch.randn(64, 20, 4, 4)
x = x.view(64,320)
print(x.size())

torch.Size([64, 320])

Using -1 lets the other dimensions be filled in first; whatever size is left over is assigned to that dimension:
x = torch.randn(64, 20, 4, 4)
x = x.view(-1,320)
print(x.size())

torch.Size([64, 320])

Note that view does not store the reshaped data back into the original x; we have to assign the result back to x ourselves, as the sketch below shows.
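
A minimal sketch making this concrete:

import torch

x = torch.randn(64, 20, 4, 4)
x.view(-1, 320)        # returns a new tensor; x itself is unchanged
print(x.size())        # torch.Size([64, 20, 4, 4])
x = x.view(-1, 320)    # assign the result back to keep the reshape
print(x.size())        # torch.Size([64, 320])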
4. Improving accuracy
The accuracy here is only about 10%, i.e. chance level for ten classes. To improve it, increase opt.nEpochs and opt.trainSize, or improve the model itself; one possible change is sketched below.
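
One model-side change worth trying (my assumption, not a fix given in the original post): forward() applies ReLU to the output of fc2 before LogSoftmax, which forces every logit to be non-negative; feeding the raw fc2 logits to LogSoftmax usually trains better:

    def forward(self, x):
        x = self.relu(self.pool1(self.conv1(x)))
        x = self.relu(self.pool2(self.conv2(x)))
        x = x.view(-1, 320)
        x = self.relu(self.fc1(x))
        x = self.fc2(x)  # no ReLU here: logits may be negative
        return self.softmax(x)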
