# <center>MobileNet - Pytorch

# Step 1: Prepare data

In [1]:
# MobileNet-Pytorch
import argparse 
import torch
import numpy as np
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torch.optim.lr_scheduler import StepLR
from torchvision import datasets, transforms
from torch.autograd import Variable
from torch.utils.data.sampler import SubsetRandomSampler
from sklearn.metrics import accuracy_score
from mobilenets import mobilenet

use_cuda = torch.cuda.is_available()
use_cudause_cud  = torch.cuda.is_available()
dtype = torch.cuda.FloatTensor if use_cuda else torch.FloatTensor

In [2]:
# Train, Validate, Test. Heavily inspired by Kevinzakka https://github.com/kevinzakka/DenseNet/blob/master/data_loader.py

normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406],
                                 std=[0.229, 0.224, 0.225])

valid_size=0.1

# define transforms
valid_transform = transforms.Compose([
        transforms.ToTensor(),
        normalize
])

train_transform = transforms.Compose([
    transforms.RandomCrop(32, padding=4),
    transforms.RandomHorizontalFlip(),
    transforms.ToTensor(),
    normalize
])


# load the dataset
train_dataset = datasets.CIFAR10(root="data", train=True, 
            download=True, transform=train_transform)

valid_dataset = datasets.CIFAR10(root="data", train=True, 
            download=True, transform=valid_transform)

num_train = len(train_dataset)
indices = list(range(num_train))
split = int(np.floor(valid_size * num_train)) #5w张图片的10%用来当做验证集


np.random.seed(42)
np.random.shuffle(indices) # 随机乱序[0,1,...,49999]

train_idx, valid_idx = indices[split:], indices[:split]


train_sampler = SubsetRandomSampler(train_idx) # 这个很有意思
valid_sampler = SubsetRandomSampler(valid_idx)


# ------------------------- 使用不同的批次大小 ------------------------------------
show_step=20  # 批次大，show_step就小点
max_epoch=50  # 训练最大epoch数目
train_loader = torch.utils.data.DataLoader(train_dataset, 
                batch_size=256, sampler=train_sampler)

valid_loader = torch.utils.data.DataLoader(valid_dataset, 
                batch_size=256, sampler=valid_sampler)


test_transform = transforms.Compose([
    transforms.ToTensor(), normalize
])

test_dataset = datasets.CIFAR10(root="data", 
                                train=False, 
                                download=True,transform=test_transform)

test_loader = torch.utils.data.DataLoader(test_dataset, 
                                          batch_size=64, 
                                          shuffle=True)

Files already downloaded and verified
Files already downloaded and verified
Files already downloaded and verified


# Step 2: Model Config

In [5]:
# 32  缩放5次到 1x1@1024 
# From https://github.com/kuangliu/pytorch-cifar 
import torch
import torch.nn as nn
import torch.nn.functional as F


class Block(nn.Module):
    '''Depthwise conv + Pointwise conv'''
    def __init__(self, in_planes, out_planes, stride=1):
        super(Block, self).__init__()
        
        # 分组卷积数=输入通道数
        self.conv1 = nn.Conv2d(in_planes, in_planes, kernel_size=3, stride=stride, padding=1, groups=in_planes, bias=False)
        
        self.bn1 = nn.BatchNorm2d(in_planes)
        
        self.conv2 = nn.Conv2d(in_planes, out_planes, kernel_size=1, stride=1, padding=0, bias=False)
        
        self.bn2 = nn.BatchNorm2d(out_planes)

    def forward(self, x):
        out = F.relu(self.bn1(self.conv1(x)))
        out = F.relu(self.bn2(self.conv2(out)))
        return out


class MobileNet(nn.Module):
    # (128,2) means conv planes=128, conv stride=2, by default conv stride=1
    cfg = [64, (128,2), 128, (256,2), 256, (512,2), 512, 512, 512, 512, 512, (1024,2), 1024]

    def __init__(self, num_classes=10):
        super(MobileNet, self).__init__()
        self.conv1 = nn.Conv2d(3, 32, kernel_size=3, stride=1, padding=1, bias=False)
        
        self.bn1 = nn.BatchNorm2d(32)
        self.layers = self._make_layers(in_planes=32) # 自动化构建层
        self.linear = nn.Linear(1024, num_classes)

    def _make_layers(self, in_planes):
        layers = []
        for x in self.cfg:
            out_planes = x if isinstance(x, int) else x[0]
            stride = 1 if isinstance(x, int) else x[1]
            layers.append(Block(in_planes, out_planes, stride))
            in_planes = out_planes
        return nn.Sequential(*layers)

    def forward(self, x):
        out = F.relu(self.bn1(self.conv1(x)))
        out = self.layers(out)
        out = F.avg_pool2d(out, 2)
        out = out.view(out.size(0), -1)
        out = self.linear(out)
        return out

In [6]:
# From https://github.com/Z0m6ie/CIFAR-10_PyTorch
#model = mobilenet(num_classes=10, large_img=False)

# From https://github.com/kuangliu/pytorch-cifar 
model=MobileNet(10).cuda()

optimizer = optim.Adam(model.parameters(), lr=0.01)
scheduler = StepLR(optimizer, step_size=10, gamma=0.5)
criterion = nn.CrossEntropyLoss()

In [7]:
# Implement validation
def train(epoch):
    model.train()
    #writer = SummaryWriter()
    for batch_idx, (data, target) in enumerate(train_loader):
        if use_cuda:
            data, target = data.cuda(), target.cuda()
        data, target = Variable(data), Variable(target)
        optimizer.zero_grad()
        output = model(data)
        correct = 0
        pred = output.data.max(1, keepdim=True)[1] # get the index of the max log-probability
        correct += pred.eq(target.data.view_as(pred)).sum()
        
        loss = criterion(output, target)
        loss.backward()
        accuracy = 100. * (correct.cpu().numpy()/ len(output))
        optimizer.step()
        if batch_idx % show_step == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}, Accuracy: {:.2f}'.format(
                epoch, batch_idx * len(data), len(train_loader.dataset),
                100. * batch_idx / len(train_loader), loss.item(), accuracy))
            #writer.add_scalar('Loss/Loss', loss.item(), epoch)
            #writer.add_scalar('Accuracy/Accuracy', accuracy, epoch)
    scheduler.step()

In [8]:
def validate(epoch):
    model.eval()
    #writer = SummaryWriter()
    valid_loss = 0
    correct = 0
    for data, target in valid_loader:
        if use_cuda:
            data, target = data.cuda(), target.cuda()
        data, target = Variable(data), Variable(target)
        output = model(data)
        valid_loss += F.cross_entropy(output, target, size_average=False).item() # sum up batch loss
        pred = output.data.max(1, keepdim=True)[1] # get the index of the max log-probability
        correct += pred.eq(target.data.view_as(pred)).sum()

    valid_loss /= len(valid_idx)
    accuracy = 100. * correct.cpu().numpy() / len(valid_idx)
    print('\nValidation set: Average loss: {:.4f}, Accuracy: {}/{} ({:.2f}%)\n'.format(
        valid_loss, correct, len(valid_idx),
        100. * correct / len(valid_idx)))
    #writer.add_scalar('Loss/Validation_Loss', valid_loss, epoch)
    #writer.add_scalar('Accuracy/Validation_Accuracy', accuracy, epoch)
    return valid_loss, accuracy

In [9]:
# Fix best model

def test(epoch):
    model.eval()
    test_loss = 0
    correct = 0
    for data, target in test_loader:
        if use_cuda:
            data, target = data.cuda(), target.cuda()
        data, target = Variable(data), Variable(target)
        output = model(data)
        test_loss += F.cross_entropy(output, target, size_average=False).item() # sum up batch loss
        pred = output.data.max(1, keepdim=True)[1] # get the index of the max log-probability
        correct += pred.eq(target.data.view_as(pred)).cpu().sum()

    test_loss /= len(test_loader.dataset)
    print('\nTest set: Average loss: {:.4f}, Accuracy: {}/{} ({:.2f}%)\n'.format(
        test_loss, correct, len(test_loader.dataset),
        100. * correct.cpu().numpy() / len(test_loader.dataset)))

In [10]:
def save_best(loss, accuracy, best_loss, best_acc):
    if best_loss == None:
        best_loss = loss
        best_acc = accuracy
        file = 'saved_models/best_save_model.p'
        torch.save(model.state_dict(), file)
        
    elif loss < best_loss and accuracy > best_acc:
        best_loss = loss
        best_acc = accuracy
        file = 'saved_models/best_save_model.p'
        torch.save(model.state_dict(), file)
    return best_loss, best_acc

In [11]:
# Fantastic logger for tensorboard and pytorch, 
# run tensorboard by opening a new terminal and run "tensorboard --logdir runs"
# open tensorboard at http://localhost:6006/
from tensorboardX import SummaryWriter
best_loss = None
best_acc = None

import time 
SINCE=time.time()

for epoch in range(max_epoch):
    train(epoch)
    loss, accuracy = validate(epoch)
    best_loss, best_acc = save_best(loss, accuracy, best_loss, best_acc)
    
    NOW=time.time() 
    DURINGS=NOW-SINCE
    SINCE=NOW
    print("the time of this epoch:[{} s]".format(DURINGS))
    
#writer = SummaryWriter()
#writer.export_scalars_to_json("./all_scalars.json")

#writer.close()


Validation set: Average loss: 1.8172, Accuracy: 2090/5000 (41.00%)

the time of this epoch:[19.475614070892334 s]

Validation set: Average loss: 1.2392, Accuracy: 2844/5000 (56.00%)

the time of this epoch:[19.68838405609131 s]

Validation set: Average loss: 1.0994, Accuracy: 3141/5000 (62.00%)

the time of this epoch:[19.884924173355103 s]

Validation set: Average loss: 1.1535, Accuracy: 3164/5000 (63.00%)

the time of this epoch:[19.64325737953186 s]

Validation set: Average loss: 0.7551, Accuracy: 3685/5000 (73.00%)

the time of this epoch:[19.729968070983887 s]

Validation set: Average loss: 0.7003, Accuracy: 3770/5000 (75.00%)

the time of this epoch:[19.7011661529541 s]

Validation set: Average loss: 0.7221, Accuracy: 3808/5000 (76.00%)

the time of this epoch:[19.63713765144348 s]

Validation set: Average loss: 0.7072, Accuracy: 3827/5000 (76.00%)

the time of this epoch:[19.864455938339233 s]

Validation set: Average loss: 0.5856, Accuracy: 3994/5000 (79.00%)

the time of this


Validation set: Average loss: 0.4636, Accuracy: 4214/5000 (84.00%)

the time of this epoch:[19.611411094665527 s]

Validation set: Average loss: 0.4264, Accuracy: 4267/5000 (85.00%)

the time of this epoch:[19.623915195465088 s]

Validation set: Average loss: 0.4920, Accuracy: 4194/5000 (83.00%)

the time of this epoch:[19.641515731811523 s]

Validation set: Average loss: 0.4516, Accuracy: 4238/5000 (84.00%)

the time of this epoch:[19.611614227294922 s]

Validation set: Average loss: 0.4730, Accuracy: 4218/5000 (84.00%)

the time of this epoch:[19.907944202423096 s]

Validation set: Average loss: 0.4217, Accuracy: 4266/5000 (85.00%)

the time of this epoch:[19.584630727767944 s]

Validation set: Average loss: 0.4363, Accuracy: 4274/5000 (85.00%)

the time of this epoch:[19.603719472885132 s]

Validation set: Average loss: 0.4550, Accuracy: 4231/5000 (84.00%)

the time of this epoch:[19.786169052124023 s]

Validation set: Average loss: 0.4243, Accuracy: 4279/5000 (85.00%)

the time of


Validation set: Average loss: 0.3718, Accuracy: 4397/5000 (87.00%)

the time of this epoch:[19.8292133808136 s]

Validation set: Average loss: 0.3749, Accuracy: 4410/5000 (88.00%)

the time of this epoch:[19.576144456863403 s]

Validation set: Average loss: 0.3751, Accuracy: 4404/5000 (88.00%)

the time of this epoch:[19.59357523918152 s]

Validation set: Average loss: 0.3832, Accuracy: 4391/5000 (87.00%)

the time of this epoch:[19.79728364944458 s]

Validation set: Average loss: 0.3632, Accuracy: 4396/5000 (87.00%)

the time of this epoch:[19.55585479736328 s]

Validation set: Average loss: 0.3817, Accuracy: 4410/5000 (88.00%)

the time of this epoch:[19.569167375564575 s]

Validation set: Average loss: 0.4108, Accuracy: 4374/5000 (87.00%)

the time of this epoch:[19.83908247947693 s]

Validation set: Average loss: 0.3776, Accuracy: 4421/5000 (88.00%)

the time of this epoch:[19.571686029434204 s]

Validation set: Average loss: 0.3682, Accuracy: 4433/5000 (88.00%)

the time of this 


Validation set: Average loss: 0.3677, Accuracy: 4435/5000 (88.00%)

the time of this epoch:[19.7981960773468 s]

Validation set: Average loss: 0.3960, Accuracy: 4438/5000 (88.00%)

the time of this epoch:[19.581066608428955 s]

Validation set: Average loss: 0.3812, Accuracy: 4449/5000 (88.00%)

the time of this epoch:[19.617161989212036 s]

Validation set: Average loss: 0.3930, Accuracy: 4465/5000 (89.00%)

the time of this epoch:[19.726255655288696 s]

Validation set: Average loss: 0.4067, Accuracy: 4457/5000 (89.00%)

the time of this epoch:[19.557750701904297 s]

Validation set: Average loss: 0.3978, Accuracy: 4430/5000 (88.00%)

the time of this epoch:[19.84236454963684 s]

Validation set: Average loss: 0.3970, Accuracy: 4434/5000 (88.00%)

the time of this epoch:[19.57187533378601 s]

Validation set: Average loss: 0.3860, Accuracy: 4466/5000 (89.00%)

the time of this epoch:[19.622222423553467 s]

Validation set: Average loss: 0.3959, Accuracy: 4465/5000 (89.00%)

the time of thi


Validation set: Average loss: 0.4292, Accuracy: 4467/5000 (89.00%)

the time of this epoch:[19.828170776367188 s]

Validation set: Average loss: 0.4183, Accuracy: 4469/5000 (89.00%)

the time of this epoch:[19.58849549293518 s]

Validation set: Average loss: 0.4190, Accuracy: 4470/5000 (89.00%)

the time of this epoch:[19.78034210205078 s]

Validation set: Average loss: 0.4315, Accuracy: 4466/5000 (89.00%)

the time of this epoch:[19.586527347564697 s]

Validation set: Average loss: 0.4292, Accuracy: 4476/5000 (89.00%)

the time of this epoch:[19.613239288330078 s]


# Step 3: Test

In [12]:
test(epoch)


Test set: Average loss: 0.4542, Accuracy: 8932/10000 (89.32%)

