### Layers : Fundamental blocks of Neural Network

In [1]:
import torch
from torch.nn import Linear, ReLU
import torch.nn as nn
import numpy as np
from torch.autograd import Variable



### Linear(in_features,out_features,bias)

定義輸入與輸出的特徵維度:weight 的形狀為 (out_features, in_features),bias 的形狀為 (out_features,)。

In [2]:
# A fully connected layer mapping 10 input features to 5 output features.
# (The layer used to be constructed twice; the first instance was discarded.)
myLayer = Linear(in_features=10, out_features=5, bias=True)
# One random sample: a batch of 1 row with 10 features. Plain tensors can be
# passed to layers directly, so the deprecated Variable wrapper is not needed.
inp = torch.randn(1, 10)
myLayer(inp)

tensor([[-0.1231,  0.0635, -0.3844,  0.0926,  0.3034]],
       grad_fn=<AddmmBackward>)

In [3]:
# Learnable weight matrix of the layer; it is stored as (out_features, in_features), i.e. 5 rows of 10 values here.
myLayer.weight

Parameter containing:
tensor([[ 0.1376,  0.0409,  0.2941,  0.2772,  0.2091, -0.1796,  0.1341,  0.1498,
         -0.1208,  0.0241],
        [ 0.0788, -0.0186, -0.1551,  0.1403, -0.1763, -0.0895,  0.1719,  0.1273,
          0.2864,  0.1432],
        [-0.1036,  0.0280,  0.2013,  0.2118,  0.2831,  0.0381,  0.2777,  0.1796,
         -0.0007,  0.0058],
        [ 0.2078, -0.2720, -0.1966, -0.0131, -0.2251,  0.1215, -0.1393,  0.1918,
         -0.0872,  0.0815],
        [-0.0416, -0.0785,  0.3053,  0.0950, -0.2367,  0.0885,  0.2341,  0.2989,
         -0.1447, -0.2902]], requires_grad=True)

In [4]:
# Learnable bias vector of the layer: one value per output feature (5 here).
myLayer.bias

Parameter containing:
tensor([ 0.0736, -0.0595,  0.0757, -0.3133,  0.1915], requires_grad=True)

### Stacking Linear layers

透過堆疊建立多層神經層:將前一層的輸出作為下一層的輸入。

In [5]:
# Two linear layers chained together: 10 -> 5 -> 2 features.
myLayer1 = Linear(in_features=10, out_features=5)
myLayer2 = Linear(in_features=5, out_features=2)
# The output of the first layer is fed straight into the second one.
myLayer2(myLayer1(inp))

tensor([[ 0.3677, -0.3968]], grad_fn=<AddmmBackward>)

### PyTorch Non-linear Activations

使用兩種呼叫激勵函數的不同方式

In [6]:
# Way 1 - ReLU as a module object: instantiate it once, then call it like a layer.
# torch.tensor with float literals replaces the deprecated Variable(torch.Tensor(...)).
sample_data = torch.tensor([[1.0, 2.0, -1.0, -1.0]])
myRelu = ReLU()
myRelu(sample_data)


tensor([[1., 2., 0., 0.]])

In [7]:
import torch.nn as nn
import torch.nn.functional as F
# Way 2 - ReLU as a plain function: there is no module object to create first.
# torch.tensor with float literals replaces the deprecated Variable(torch.Tensor(...)).
sample_data = torch.tensor([[1.0, 2.0, -1.0, -1.0]])
f = F.relu(sample_data)
f

tensor([[1., 2., 0., 0.]])

### Neural Network 

利用類別建立多層神經網路

In [8]:
class MyFirstNetwork(nn.Module):
    """Two-layer fully connected network: Linear -> ReLU -> Linear -> softmax."""

    def __init__(self, input_size, hidden_size, output_size):
        """Create the two linear layers.

        Args:
            input_size: number of input features of the first layer.
            hidden_size: number of features produced by the first layer and
                consumed by the second.
            output_size: number of features produced by the second layer.
        """
        super().__init__()
        self.layer1 = nn.Linear(input_size, hidden_size)
        self.layer2 = nn.Linear(hidden_size, output_size)

    def layer(self):
        """Return the parameters as ``([weight, bias], [weight, bias])``.

        The first list belongs to ``layer1`` and the second to ``layer2``.
        Entries are the ``.data`` tensors of the parameters, so they are not
        tracked by autograd.
        """
        return tuple(
            [module.weight.data, module.bias.data]
            for module in (self.layer1, self.layer2)
        )

    def forward(self, input):
        """Run the network on ``input`` and return softmax probabilities.

        The softmax is taken over dim 1, so the result holds probabilities,
        not raw scores (logits).
        """
        hidden = F.relu(self.layer1(input))
        scores = self.layer2(hidden)
        return F.softmax(scores, dim=1)

# Input is 112 * 112 * 3 values per sample, the hidden layer has 56 * 56 units,
# and there are 2 outputs.
model = MyFirstNetwork(
    input_size=112 * 112 * 3,
    hidden_size=56 * 56,
    output_size=2,
)
print(model)

MyFirstNetwork(
  (layer1): Linear(in_features=37632, out_features=3136, bias=True)
  (layer2): Linear(in_features=3136, out_features=2, bias=True)
)


### Loss

介紹兩種不同的loss function

In [9]:
# Mean squared error between a random "prediction" and a random target.
loss = nn.MSELoss()
# requires_grad=True makes backward() populate input.grad; tensors take this
# flag directly, so the deprecated Variable wrapper is not needed.
input = torch.randn(3, 5, requires_grad=True)
target = torch.randn(3, 5)
output = loss(input, target)
output.backward()

分類問題常用的loss function: 交叉熵(cross-entropy)

In [10]:
def cross_entropy(true_label, prediction):
    """Binary cross-entropy of a single prediction.

    Args:
        true_label: 1 for the positive class; any other value is treated as
            the negative class.
        prediction: predicted probability of the positive class.

    Returns:
        ``-log(prediction)`` when ``true_label == 1``, otherwise
        ``-log(1 - prediction)``.
    """
    # `log` was never imported in this notebook, so the bare call raised
    # NameError; NumPy is already in scope as `np`.
    if true_label == 1:
        return -np.log(prediction)
    return -np.log(1 - prediction)

### $\mathrm{loss}(x, class) = -x[class] + \log\left(\sum_j \exp(x[j])\right)$

利用上述公式自訂函數與內建函數比較

In [11]:
loss = nn.CrossEntropyLoss()
# Raw scores for 3 samples over 5 classes; requires_grad=True so that
# backward() populates input.grad.
input = torch.randn(3, 5, requires_grad=True)
# One integer class index in [0, 5) per sample. torch.randint draws them
# directly instead of filling an uninitialised LongTensor in place.
target = torch.randint(0, 5, (3,))
output = loss(input, target)
output.backward()
print(output.item())

def CrossEntropyLoss(input, target):
    """Mean cross-entropy loss computed with NumPy.

    Implements ``loss(x, class) = -x[class] + log(sum_j exp(x[j]))`` for every
    row and averages over the rows.

    Args:
        input: 2-D array-like of raw scores, one row per sample and one
            column per class.
        target: 1-D array-like with the integer class index of each row.

    Returns:
        The average loss over all rows as a Python float.

    Raises:
        ValueError: if ``input`` has no rows.
    """
    logits = np.asarray(input, dtype=np.float64)
    labels = np.asarray(target, dtype=np.intp)
    if len(logits) == 0:
        raise ValueError("CrossEntropyLoss needs at least one sample")

    # Log-sum-exp trick: subtracting the row maximum before exponentiating
    # keeps exp() from overflowing on large scores without changing the result.
    row_max = logits.max(axis=1, keepdims=True)
    log_norm = row_max[:, 0] + np.log(np.exp(logits - row_max).sum(axis=1))

    # Score of the true class for every row.
    true_scores = logits[np.arange(len(logits)), labels]
    return float(np.mean(log_norm - true_scores))

# Evaluate the hand-written loss on the same scores and labels as NumPy arrays;
# detach() yields a tensor without autograd tracking so it can be converted.
print(CrossEntropyLoss(input.detach().numpy(), target.detach().numpy()))

2.2556240558624268
2.25562417727857


### Optimizer

利用自訂的 Dataset 類別,將多張圖片包裝成一個可用索引存取的資料集物件。

In [12]:
from glob import glob
from PIL import Image
from torch.utils.data import Dataset
# ### Optimizer
class DogsAndCatsDataset(Dataset):
    """Dataset of image files yielding ``(flattened pixels, label)`` pairs.

    Labels are assigned purely by position: even indices get label 0 and odd
    indices get label 1.
    NOTE(review): this is only meaningful if the sorted file list alternates
    between the two classes - confirm against the data folder.
    """

    def __init__(self, root_dir, size=(112, 112)):
        """
        Args:
            root_dir: glob pattern selecting the image files.
            size: size passed to ``Image.resize`` for every image.
        """
        # glob() makes no ordering guarantee; sorting keeps the
        # index -> file (and therefore index -> label) mapping stable.
        self.files = sorted(glob(root_dir))
        self.size = size
        # Row 0 is the label for even indices, row 1 the label for odd ones.
        self.arr = np.array([[0], [1]], int)

    def __len__(self):
        """Return the number of files matched by the glob pattern."""
        return len(self.files)

    def __getitem__(self, idx):
        """Load image ``idx`` and return ``(input, target)``.

        ``input`` is a float64 tensor of shape (1, number_of_pixel_values) and
        ``target`` is a one-element integer tensor holding the label.
        """
        # The context manager closes the underlying file handle; convert("RGB")
        # guarantees 3 channels even for grayscale or RGBA files.
        with Image.open(self.files[idx]) as image:
            pixels = np.asarray(image.convert("RGB").resize(self.size), float)
        input = torch.from_numpy(pixels.reshape(1, -1))
        target = torch.from_numpy(self.arr[idx % 2])
        return input, target

# Glob pattern for the training images. The absolute path is specific to the
# machine this notebook was written on and must be adapted elsewhere.
dataset = DogsAndCatsDataset(
    "D:/program/vscode_workspace/private/data/dogs-vs-cats/classifier/*.jpg"
)

### Training

In [13]:
import torch.optim as optim
from time import perf_counter
# MyFirstNetwork.forward() already applies softmax, so the model returns
# probabilities. nn.CrossEntropyLoss expects raw scores and applies log-softmax
# itself, which would normalise the outputs twice; NLLLoss on the log of the
# probabilities is the matching loss.
loss_fn = nn.NLLLoss()
# Adam has no `momentum` argument (passing one raises TypeError); its default
# betas=(0.9, 0.999) already use 0.9 for the first-moment average.
optimizer = optim.Adam(model.parameters(), lr=0.0001)
# Inputs are divided by sqrt(3 * 255^2), the same scaling as before.
pixel_scale = (3 * 255.0 ** 2) ** 0.5
# Used for the progress report instead of a hard-coded sample count.
num_samples = len(dataset)
print("Training......")

t1 = perf_counter()
t = t1
model.train()
for i in range(10):
    index = 0
    print("epoch", i)
    for input, target in dataset:
        optimizer.zero_grad()
        output = model(input.float() / pixel_scale)
        # Clamp before the log so a probability that underflows to 0 cannot
        # produce -inf (and NaN gradients).
        loss = loss_fn(torch.log(output.clamp(min=1e-12)), target.long())
        loss.backward()
        optimizer.step()
        index += 1
        # Report progress at most once every 30 seconds.
        if perf_counter() - t > 30:
            t = perf_counter()
            print("  Completion ratio :", str(index * 100.0 / num_samples) + "%")
t2 = perf_counter()

# Summary after training: architecture, parameters of both layers, elapsed time.
print(model)
print("--------------------------------------")
# layer() returns ([weight, bias], [weight, bias]); fetch it once and reuse it.
layer1_params, layer2_params = model.layer()
print("layer1 :", "\nweight :\n", layer1_params[0].numpy(), "\nbias :\n", layer1_params[1].numpy())
print("")
print("layer2 :", "\nweight :\n", layer2_params[0].numpy(), "\nbias :\n", layer2_params[1].numpy())
# t1 / t2 are perf_counter() readings in seconds; report the duration in minutes.
print("time :", str((t2 - t1) / 60.0) + " min")

print("\ntest.....")
test = DogsAndCatsDataset("D:/program/vscode_workspace/private/data/dogs-vs-cats/sample_test/*.jpg")
# The training loop divides every input by sqrt(3 * 255^2); the test inputs
# must be scaled the same way or the model sees values on a different scale.
pixel_scale = (3 * 255.0 ** 2) ** 0.5
model.eval()
# No gradients are needed for prediction, so skip building the autograd graph.
with torch.no_grad():
    output1 = model(test[0][0].float() / pixel_scale)
    output2 = model(test[1][0].float() / pixel_scale)
print(output1)
print(output2)

Training......
epoch 0
  Completion ratio : 81.66666666666667%
MyFirstNetwork(
  (layer1): Linear(in_features=37632, out_features=3136, bias=True)
  (layer2): Linear(in_features=3136, out_features=2, bias=True)
)
--------------------------------------
layer1 : 
weight :
 [[-4.4488120e-03  3.6750795e-04  3.6130946e-03 ... -2.4994789e-03
  -3.7396825e-03 -5.1219594e-03]
 [ 1.8192146e-03 -1.3093352e-03  4.0918863e-03 ... -4.9696737e-03
   2.0432337e-03  5.2238588e-04]
 [ 4.8691293e-04 -3.3613530e-03 -3.0034543e-03 ...  9.9190138e-04
   3.3962082e-03  4.3215160e-03]
 ...
 [ 4.2709708e-03 -1.8750938e-03 -2.8409404e-03 ... -4.9373768e-03
   3.3219832e-03  2.3835062e-03]
 [-2.7655987e-03 -7.8857958e-04  5.0268336e-03 ... -3.7752728e-03
  -4.2670211e-03 -7.7434362e-07]
 [ 2.1146641e-03 -4.9496028e-03 -1.0307432e-03 ...  1.6086708e-03
   1.0586767e-03  2.2468816e-03]] 
bias :
 [ 3.2132133e-03 -2.2570204e-03  6.9759008e-05 ... -3.5398917e-03
 -2.6258430e-03 -4.8018158e-03]

layer2 : 
weight :
 [