In [2]:
import torch 
import torchvision
import torch.nn as nn
import torch.utils.data as data
import numpy as np
import torchvision.transforms as transforms
import torchvision.datasets as dsets
from torch.autograd import Variable

In [3]:
# Draw a random matrix with 5 rows and 3 columns and display it.
x = torch.randn(5, 3)
print(x)


-1.6739  0.7834  0.7146
 0.7311  1.2642  0.4907
-1.0195 -1.9199  1.8519
 0.6640  0.2892 -2.1121
-1.6668 -1.7949 -1.3759
[torch.FloatTensor of size 5x3]



# module = Linear(inputDimension,outputDimension)
### Applies a linear transformation to the incoming data, i.e. $y = Wx + b$.

In [4]:
# Create a linear layer mapping 3 input features to 2 output features.
# Its weight and bias come from the constructor (random parameters); show both.
linear = nn.Linear(in_features=3, out_features=2)
print(linear.weight, linear.bias, sep='\n')

Parameter containing:
 0.3326  0.0637 -0.4364
 0.5296 -0.3063 -0.0562
[torch.FloatTensor of size 2x3]

Parameter containing:
 0.0803
-0.1674
[torch.FloatTensor of size 2]



In [5]:
# Feed x through the linear layer, then show the result followed by the
# layer's own description.
y = linear(Variable(x))
print(y, linear, sep='\n')

Variable containing:
-0.7384 -1.3340
 0.1898 -0.1951
-1.1894 -0.2233
 1.2414  0.2145
 0.0120 -0.4228
[torch.FloatTensor of size 5x2]

Linear (3 -> 2)


In [6]:
# Register a 10 -> 5 linear layer inside an (initially empty) Sequential
# container under the name 'Test'.
Linear = nn.Linear(10, 5)
m = nn.Sequential()
m.add_module('Test', Linear)

In [9]:
# Turn a 2x2 NumPy integer array into a torch tensor and display it.
a = np.array([
    [1, 2],
    [3, 4],
])
b = torch.from_numpy(a)
print(b)


 1  2
 3  4
[torch.LongTensor of size 2x2]



### Documentation: http://pytorch.org/docs/torchvision/transforms.html

In [10]:
# Preprocessing pipeline applied to each input image before training:
# resize -> random horizontal flip -> random 32-pixel crop -> tensor.
#
# `transforms.Scale` was renamed to `transforms.Resize` and subsequently
# removed from torchvision, so use `Resize` when the installed version has it
# and only fall back to `Scale` on old releases that predate the rename.
transform = transforms.Compose([
    (getattr(transforms, 'Resize', None) or transforms.Scale)(40),
    transforms.RandomHorizontalFlip(),
    transforms.RandomCrop(32),
    transforms.ToTensor(),
])

In [11]:
# CIFAR-10 training split stored under ./data/ (download=True asks for the
# files to be fetched), with the preprocessing pipeline attached.
train_dataset = dsets.CIFAR10(
    root='./data/',
    train=True,
    transform=transform,
    download=True,
)

# Indexing the dataset yields one (image, label) pair; show the image size
# and the label.
image, label = train_dataset[0]
print(image.size(), label, sep='\n')

Files already downloaded and verified
torch.Size([3, 32, 32])
6


In [13]:
# Serve the training set as shuffled mini-batches of 100 samples, loaded
# with 2 workers.
train_loader = data.DataLoader(
    train_dataset,
    batch_size=100,
    shuffle=True,
    num_workers=2,
)

In [15]:
# Creating the iterator is what starts the loader's queue and workers.
data_iter = iter(train_loader)

# Fetch a single mini-batch of images and labels.
# Use the built-in next(): the iterator's `.next()` method is a Python 2
# idiom that current DataLoader iterators do not provide, whereas next()
# works on both old and new versions.
images, labels = next(data_iter)

# Typical usage: walk over every mini-batch (the training step goes here).
for images, labels in train_loader:
    pass

In [None]:
# Template for loading a custom dataset.
class CustomDataset(data.Dataset):
    """Skeleton dataset; every method is a placeholder to be filled in."""

    def __init__(self):
        """Prepare the dataset.

        TODO:
            1. Initialize file path or list of file names.
        """

    def __getitem__(self, index):
        """Return the sample stored at ``index``.

        TODO:
            1. Read one data from file (e.g. using numpy.fromfile, PIL.Image.open).
            2. Preprocess the data (e.g. torchvision.Transform).
            3. Return a data pair (e.g. image and label).

        The placeholder implementation returns None.
        """
        return None

    def __len__(self):
        """Return the dataset size (placeholder: change 0 to the real total)."""
        total_size = 0
        return total_size

# The custom dataset plugs straight into torch's prebuilt DataLoader.
# NOTE(review): this rebinds `train_loader`; any loader previously stored
# under that name is replaced -- confirm that is intended.
custom_dataset = CustomDataset()
train_loader = torch.utils.data.DataLoader(
    custom_dataset,
    batch_size=100,
    shuffle=True,
    num_workers=2,
)

In [20]:
# Build a ResNet-18 from torchvision's model collection; pretrained=True
# requests the pretrained weights (downloaded if needed, per the original note).
resnet = torchvision.models.resnet18(pretrained=True)

In [21]:
# Fine-tune only the top layer: switch off gradient tracking for every
# parameter the model currently has.
for param in resnet.parameters():
    param.requires_grad = False

# Swap in a fresh fully connected top layer. It is created after the loop
# above, so that loop never touched its parameters. 100 outputs is just an
# example value.
resnet.fc = nn.Linear(in_features=resnet.fc.in_features, out_features=100)

# Quick check: push a random batch of 10 three-channel 256x256 images through
# the network and confirm the output size.
images = Variable(torch.randn(10, 3, 256, 256))
outputs = resnet(images)
print(outputs.size())   # (10, 100)

torch.Size([10, 100])


In [None]:
# Option 1: serialize the whole model object and read it back.
# NOTE(review): torch.load unpickles the file -- only load files you trust.
torch.save(obj=resnet, f='model.pkl')
model = torch.load(f='model.pkl')

# Option 2 (recommended): serialize only the parameters (state_dict) and
# restore them into the existing model.
torch.save(obj=resnet.state_dict(), f='params.pkl')
resnet.load_state_dict(state_dict=torch.load(f='params.pkl'))

In [22]:
# Three one-element variables that track gradients: x = 3, w = 4, b = 20.
x, w, b = (
    Variable(torch.Tensor([value]), requires_grad=True)
    for value in (3, 4, 20)
)
print(x, w, b)

Variable containing:
 3
[torch.FloatTensor of size 1]
 Variable containing:
 4
[torch.FloatTensor of size 1]
 Variable containing:
 20
[torch.FloatTensor of size 1]



In [23]:
# Forward computation built from the three variables x, w and b.
y = 2 * w * x + b

In [24]:
# Show the forward result (2 * 4 * 3 + 20 = 44 for x = 3, w = 4, b = 20).
print(y)

Variable containing:
 44
[torch.FloatTensor of size 1]



In [25]:
y.backward()   # Compute the partial derivative of y with respect to each of x, w and b.

In [26]:
# Gradients of y = 2*w*x + b at x = 3, w = 4:
#   dy/dx = 2*w = 8,   dy/dw = 2*x = 6,   dy/db = 1
print(x.grad, w.grad, b.grad, sep='\n')

Variable containing:
 8
[torch.FloatTensor of size 1]

Variable containing:
 6
[torch.FloatTensor of size 1]

Variable containing:
 1
[torch.FloatTensor of size 1]



In [27]:
# Random inputs of size 5x3 and random targets of size 5x2.
x, y = Variable(torch.randn(5, 3)), Variable(torch.randn(5, 2))
print('x:', x)
print('y:', y)

# Linear layer mapping 3 input features to 2 outputs; show its parameters.
linear = nn.Linear(in_features=3, out_features=2)
print('w: ', linear.weight)
print('b: ', linear.bias)

x: Variable containing:
-0.1706 -1.9050  1.3719
-0.2103  0.4423 -0.2773
-0.3801 -0.8468  0.2802
-1.0409 -1.5621  1.2274
-0.0432 -0.7304 -1.4813
[torch.FloatTensor of size 5x3]

y: Variable containing:
-0.7187 -0.2424
 0.0461  0.1277
-0.9749  0.2873
-0.0317 -0.2266
 0.2661 -0.8796
[torch.FloatTensor of size 5x2]

w:  Parameter containing:
 0.4473  0.2759 -0.0281
-0.3915  0.4829 -0.0940
[torch.FloatTensor of size 2x3]

b:  Parameter containing:
1.00000e-02 *
  1.7566
  4.0828
[torch.FloatTensor of size 2]



In [28]:
# Loss: mean squared error between predictions and targets.
criterion = nn.MSELoss()
# Optimizer: SGD over the linear layer's parameters with learning rate 0.01.
optimizer = torch.optim.SGD(params=linear.parameters(), lr=0.01)

In [29]:
# Forward pass: run x through the linear layer to get the predictions.
pred = linear(x)

In [30]:
# Measure how far the predictions are from the targets.
loss = criterion(pred, y)
# Print the loss as a plain Python number. `loss.data[0]` only works on old
# PyTorch releases where the loss is a one-element tensor; newer releases
# return a 0-dimensional loss that cannot be indexed and must be read with
# `.item()`. Prefer `.item()` and fall back to the old form when it is absent.
print('loss: ', loss.item() if hasattr(loss, 'item') else loss.data[0])

loss:  0.26969239115715027


In [31]:
# Backward pass: computes the gradients of the loss (read back below via
# linear.weight.grad and linear.bias.grad).
loss.backward()

In [32]:
# Gradients of the loss with respect to the layer's weight and bias.
print('dL/dw: ', linear.weight.grad)
print('dL/db: ', linear.bias.grad)

dL/dw:  Variable containing:
 0.1395  0.2037 -0.0313
 0.0887  0.3324 -0.4969
[torch.FloatTensor of size 2x3]

dL/db:  Variable containing:
-0.1251
-0.0935
[torch.FloatTensor of size 2]



In [33]:
# Perform a single optimization step on the parameters handed to the optimizer.
optimizer.step()

In [34]:
# Re-run the forward pass with the updated parameters and recompute the loss.
pred = linear(x)
loss = criterion(pred, y)
# Print the loss as a plain Python number. `loss.data[0]` only works on old
# PyTorch releases where the loss is a one-element tensor; newer releases
# return a 0-dimensional loss that cannot be indexed and must be read with
# `.item()`. Prefer `.item()` and fall back to the old form when it is absent.
print('loss after 1 step optimization: ',
      loss.item() if hasattr(loss, 'item') else loss.data[0])

loss after 1 step optimization:  0.2652277946472168
