Current location: Home > Bilibili, Liu Er's PyTorch course: softmax classifier and MNIST implementation - Lecture 9

Bilibili, Liu Er's PyTorch course: softmax classifier and MNIST implementation - Lecture 9

2022-07-06 05:42:00 【Ning Ranye】

Series articles ：

List of articles

softmax classifier
MNIST implementation

softmax classifier

Insert picture description here

Loss function ： Cross entropy

Insert picture description here
Implementing the cross-entropy loss function with NumPy

Insert picture description here
Cross-entropy loss implemented in PyTorch

Insert picture description here

MNIST implementation

Insert picture description here

Imports

import torch
from  torch.utils.data import  DataLoader
from torchvision import datasets,transforms
#  Use relu()
import torch.nn.functional as F
#  Construct optimizer 
import  torch.optim as optim

1- Prepare the data

# 1- Prepare the data 
batch_size = 64
# Preprocessing pipeline: ToTensor converts each PIL image to a tensor, then
# Normalize is applied with the single-channel arguments (0.1307,) and
# (0.3081,).
# The pipeline is bound to its own name (`transform`) so that the imported
# `transforms` module is not overwritten and stays usable afterwards.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.1307,), (0.3081,)),
])
# download=False: nothing is fetched here, so the MNIST files are expected to
# be present under ./datasets/mnist already.
train_dataset = datasets.MNIST(root='./datasets/mnist', train=True,
                               transform=transform,
                               download=False)
test_dataset = datasets.MNIST(root='./datasets/mnist', train=False,
                              transform=transform,
                              download=False)
# Training batches are reshuffled on every pass; test batches keep a fixed
# order.
train_loader = DataLoader(dataset=train_dataset, batch_size=batch_size,
                          shuffle=True)
test_loader = DataLoader(dataset=test_dataset, batch_size=batch_size,
                         shuffle=False)

2- Design the network model

# 2- Design the network model 
class Net(torch.nn.Module):
    """Fully connected classifier: 784 -> 512 -> 256 -> 128 -> 64 -> 10.

    The four hidden layers use ReLU. The output layer is left linear, so
    the forward pass returns raw, unnormalised class scores (logits).
    """

    def __init__(self):
        super(Net, self).__init__()
        self.lay1 = torch.nn.Linear(784, 512)
        self.lay2 = torch.nn.Linear(512, 256)
        self.lay3 = torch.nn.Linear(256, 128)
        self.lay4 = torch.nn.Linear(128, 64)
        self.lay5 = torch.nn.Linear(64, 10)

    def forward(self, x):
        """Return a tensor of shape (N, 10) holding one logit per class.

        Args:
            x: tensor whose elements can be regrouped into rows of 784
                values, e.g. a batch of 1x28x28 images.
        """
        # Flatten every sample into a 784-element row.
        x = x.view(-1, 784)
        x = F.relu(self.lay1(x))
        x = F.relu(self.lay2(x))
        x = F.relu(self.lay3(x))
        x = F.relu(self.lay4(x))
        # No ReLU on the output layer: a cross-entropy criterion applies
        # log-softmax itself and expects unclipped (possibly negative)
        # logits. Clamping them at zero discards information and can stall
        # learning for classes whose score is pushed below zero.
        return self.lay5(x)

3- Build a model 、 Loss function 、 Optimizer

# 3- Construct loss function and optimizer 
# Cross-entropy criterion, the network, and an SGD optimizer over the
# network's parameters (learning rate 0.005, momentum 0.5).
criterion = torch.nn.CrossEntropyLoss()
model = Net()
optimizer = optim.SGD(params=model.parameters(), lr=0.005, momentum=0.5)

4- Training 、 test

# 4- Training test 
def train(epoch):
    """Run one pass over train_loader, updating the model after each batch.

    The mean loss of every 300 consecutive batches is printed.

    Args:
        epoch: zero-based epoch index; shown as epoch + 1 in the log line.
    """
    report_every = 300
    loss_sum = 0.0
    # Count batches from 1 so the counter can be printed as-is.
    for step, (inputs, target) in enumerate(train_loader, start=1):
        optimizer.zero_grad()
        # forward + backward + update
        loss = criterion(model(inputs), target)
        loss.backward()
        optimizer.step()

        loss_sum += loss.item()
        if step % report_every == 0:
            print('[%d, %5d] loss: %.3f' % (epoch + 1, step, loss_sum / report_every))
            loss_sum = 0.0

def test():
    """Evaluate the model on test_loader and print its accuracy.

    The printed value is the percentage of correctly classified samples;
    the %d format truncates it to an integer.
    """
    correct = 0
    total = 0
    # Evaluation needs neither a computation graph nor gradient updates.
    with torch.no_grad():
        # Each batch is a pair: images first, labels second.
        for images, label in test_loader:
            outputs = model(images)
            # torch.max along dim=1 returns (maximum values, their indices);
            # the index of the largest score is the predicted class.
            # `.data` is unnecessary here because gradients are already
            # disabled by the surrounding no_grad() context.
            _, predicted = torch.max(outputs, dim=1)
            total += label.size(0)
            # Element-wise comparison gives a boolean tensor; summing it
            # counts the matches in this batch.
            correct += (predicted == label).sum().item()
    print('Accuracy on test set : %d %%' % (100 * correct / total))

if __name__ == '__main__':
    # Train for ten epochs, evaluating on the test set after each one.
    num_epochs = 10
    for epoch in range(num_epochs):
        train(epoch)
        test()

About (predicted == label).sum():
Each element of predicted is compared with the element of label at the same position, giving True where they match and False where they differ. .sum() then counts the number of True values.
Insert picture description here
Explanation of the assignment inputs, target = data

Complete code

import torch
from  torch.utils.data import  DataLoader
from torchvision import datasets,transforms
#  Use relu()
import torch.nn.functional as F
#  Construct optimizer 
import  torch.optim as optim

# 1- Prepare the data 
batch_size = 64
# Preprocessing pipeline: ToTensor converts each PIL image to a tensor, then
# Normalize is applied with the single-channel arguments (0.1307,) and
# (0.3081,).
# The pipeline is bound to its own name (`transform`) so that the imported
# `transforms` module is not overwritten and stays usable afterwards.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.1307,), (0.3081,)),
])
# download=False: nothing is fetched here, so the MNIST files are expected to
# be present under ./datasets/mnist already.
train_dataset = datasets.MNIST(root='./datasets/mnist', train=True,
                               transform=transform,
                               download=False)
test_dataset = datasets.MNIST(root='./datasets/mnist', train=False,
                              transform=transform,
                              download=False)
# Training batches are reshuffled on every pass; test batches keep a fixed
# order.
train_loader = DataLoader(dataset=train_dataset, batch_size=batch_size,
                          shuffle=True)
test_loader = DataLoader(dataset=test_dataset, batch_size=batch_size,
                         shuffle=False)

# 2- Design the network model 
class Net(torch.nn.Module):
    """Fully connected classifier: 784 -> 512 -> 256 -> 128 -> 64 -> 10.

    The four hidden layers use ReLU. The output layer is left linear, so
    the forward pass returns raw, unnormalised class scores (logits).
    """

    def __init__(self):
        super(Net, self).__init__()
        self.lay1 = torch.nn.Linear(784, 512)
        self.lay2 = torch.nn.Linear(512, 256)
        self.lay3 = torch.nn.Linear(256, 128)
        self.lay4 = torch.nn.Linear(128, 64)
        self.lay5 = torch.nn.Linear(64, 10)

    def forward(self, x):
        """Return a tensor of shape (N, 10) holding one logit per class.

        Args:
            x: tensor whose elements can be regrouped into rows of 784
                values, e.g. a batch of 1x28x28 images.
        """
        # Flatten every sample into a 784-element row.
        x = x.view(-1, 784)
        x = F.relu(self.lay1(x))
        x = F.relu(self.lay2(x))
        x = F.relu(self.lay3(x))
        x = F.relu(self.lay4(x))
        # No ReLU on the output layer: a cross-entropy criterion applies
        # log-softmax itself and expects unclipped (possibly negative)
        # logits. Clamping them at zero discards information and can stall
        # learning for classes whose score is pushed below zero.
        return self.lay5(x)


# 3- Construct loss function and optimizer 
# Cross-entropy criterion, the network, and an SGD optimizer over the
# network's parameters (learning rate 0.005, momentum 0.5).
criterion = torch.nn.CrossEntropyLoss()
model = Net()
optimizer = optim.SGD(params=model.parameters(), lr=0.005, momentum=0.5)
# 4- Training test 
def train(epoch):
    """Run one pass over train_loader, updating the model after each batch.

    The mean loss of every 300 consecutive batches is printed.

    Args:
        epoch: zero-based epoch index; shown as epoch + 1 in the log line.
    """
    report_every = 300
    loss_sum = 0.0
    # Count batches from 1 so the counter can be printed as-is.
    for step, (inputs, target) in enumerate(train_loader, start=1):
        optimizer.zero_grad()
        # forward + backward + update
        loss = criterion(model(inputs), target)
        loss.backward()
        optimizer.step()

        loss_sum += loss.item()
        if step % report_every == 0:
            print('[%d, %5d] loss: %.3f' % (epoch + 1, step, loss_sum / report_every))
            loss_sum = 0.0

def test():
    """Evaluate the model on test_loader and print its accuracy.

    The printed value is the percentage of correctly classified samples;
    the %d format truncates it to an integer.
    """
    correct = 0
    total = 0
    # Evaluation needs neither a computation graph nor gradient updates.
    with torch.no_grad():
        # Each batch is a pair: images first, labels second.
        for images, label in test_loader:
            outputs = model(images)
            # torch.max along dim=1 returns (maximum values, their indices);
            # the index of the largest score is the predicted class.
            # `.data` is unnecessary here because gradients are already
            # disabled by the surrounding no_grad() context.
            _, predicted = torch.max(outputs, dim=1)
            total += label.size(0)
            # Element-wise comparison gives a boolean tensor; summing it
            # counts the matches in this batch.
            correct += (predicted == label).sum().item()
    print('Accuracy on test set : %d %%' % (100 * correct / total))

if __name__ == '__main__':
    # Train for ten epochs, evaluating on the test set after each one.
    num_epochs = 10
    for epoch in range(num_epochs):
        train(epoch)
        test()