### Layers : Fundamental blocks of Neural Network

In [1]:
import torch
from torch.nn import Linear, ReLU, init
import torch.nn as nn
import numpy as np
from torch.autograd import Variable



### Linear(in_features,out_features,bias)

定義 輸入和輸出層的維度(weight的維度)

In [2]:
myLayer = Linear(in_features=10,out_features=5,bias=True)
inp = Variable(torch.randn(1,10))
myLayer = Linear(in_features=10,out_features=5,bias=True) 
myLayer(inp)

tensor([[ 0.2394,  0.1034,  0.1038,  0.5125, -0.3780]],
       grad_fn=<AddmmBackward>)

In [3]:
myLayer.weight

Parameter containing:
tensor([[-0.0450,  0.0352,  0.0770, -0.3095, -0.1850, -0.1519,  0.0235, -0.2627,
         -0.1498,  0.3129],
        [-0.0385, -0.0704,  0.0571, -0.2252,  0.1334,  0.1772,  0.0424,  0.2511,
         -0.2073, -0.2311],
        [-0.2313, -0.2184,  0.2120,  0.1789,  0.2849,  0.0859, -0.2771,  0.0175,
          0.0292, -0.2301],
        [ 0.1921,  0.2942,  0.1756,  0.1878,  0.2019, -0.1106, -0.0392, -0.0559,
          0.0189, -0.2331],
        [-0.2375, -0.1052,  0.0324, -0.1773,  0.2989,  0.0942,  0.2801, -0.1325,
          0.0783, -0.3045]], requires_grad=True)

In [4]:
myLayer.bias

Parameter containing:
tensor([ 0.1704, -0.0005,  0.2180, -0.2556,  0.0230], requires_grad=True)

### Stacking Linear layers

建立多層神經層透過迭代

In [5]:
myLayer1 = Linear(10,5)
myLayer2 = Linear(5,2)
myLayer2(myLayer1(inp))

tensor([[0.0115, 0.1944]], grad_fn=<AddmmBackward>)

### PyTorch Non-linear Activations

使用兩種呼叫激勵函數的不同方式

In [6]:
sample_data = Variable(torch.Tensor([[1,2,-1,-1]])) 
myRelu = ReLU()
myRelu(sample_data)


tensor([[1., 2., 0., 0.]])

In [7]:
import torch.nn as nn
import torch.nn.functional as F
sample_data = Variable(torch.Tensor([[1,2,-1,-1]])) 
f = F.relu(sample_data) # Much simpler.
f

tensor([[1., 2., 0., 0.]])

### Neural Network 

利用類別建立多層神經網路

In [8]:
class MyFirstNetwork(nn.Module):
    def __init__(self,input_size,hidden_size,output_size):
        super(MyFirstNetwork,self).__init__() 
        self.layer1 = nn.Linear(input_size,hidden_size) 
        self.layer2 = nn.Linear(hidden_size,output_size)
        init.xavier_normal(self.layer1.weight)
        init.xavier_normal(self.layer2.weight)
    def layer(self):
        first  = [self.layer1.weight.data,self.layer1.bias.data]
        second = [self.layer2.weight.data,self.layer2.bias.data]
        return first,second
    def forward(self,input): 
        out = self.layer1(input) 
        out = F.relu(out)
        out = self.layer2(out) 
        out = F.softmax(out,dim=1)
        return out

model = MyFirstNetwork(112*112,56*56,2)
model = model.cuda()
print(model)

  
  import sys


MyFirstNetwork(
  (layer1): Linear(in_features=12544, out_features=3136, bias=True)
  (layer2): Linear(in_features=3136, out_features=2, bias=True)
)


### Loss

介紹兩種不同的loss function

In [9]:
loss = nn.MSELoss()
input = Variable(torch.randn(3, 5), requires_grad=True) 
target = Variable(torch.randn(3, 5))
output = loss(input, target)
output.backward()

分類問題常用的loss function: 交叉熵(cross-entropy)

In [10]:
def cross_entropy(true_label, prediction):
    if true_label == 1:
        return -log(prediction)
    else:
        return -log(1 - prediction)

### loss(x,class)=−x[class]+log(∑exp(x[j]))

利用上述公式自訂函數與內建函數比較

In [11]:
loss = nn.CrossEntropyLoss()
input = Variable(torch.randn(3, 5), requires_grad=True) 
target = Variable(torch.LongTensor(3).random_(5)) 
output = loss(input, target)
output.backward()
print(output.data.item())

def CrossEntropyLoss(input,target):
    sum = 0
    for i in range(len(input)):
        tmp = 0
        for j in range(len(input[0])):
            tmp+=np.e**(input[i][j])
        sum+=-input[i][target[i]]+np.log(tmp)
    return float(sum)/len(input)

print(CrossEntropyLoss(input.data.numpy(),target.data.numpy()))

2.02616810798645
2.0261680526688504


### Optimizer

將多個圖形利用自訂的類別建立成一個物件

In [12]:
from glob import glob
from PIL import Image
from torch.utils.data import Dataset
# ### Optimizer
class DogsAndCatsDataset(Dataset):
    def __init__(self,root_dir,size=(112,112)):
        self.files = glob(root_dir)
        self.size = size
        self.arr = np.array([[0],[1]],int)
    def __len__(self):
        return len(self.files)
    def __getitem__(self,idx):
        input = Variable(torch.from_numpy(np.asarray(Image.open(self.files[idx]).resize((self.size)).convert('L'), float).reshape(1,-1)))  
        if(idx%2==0):
            target = Variable(torch.from_numpy(self.arr[0]))
        else:
            target = Variable(torch.from_numpy(self.arr[1])) 
        return input,target

dataset = DogsAndCatsDataset("D:/program/vscode_workspace/private/data/dogs-vs-cats/classifier/*.jpg")
test = DogsAndCatsDataset("D:/program/vscode_workspace/private/data/dogs-vs-cats/sample_test/*.jpg")

### Training

In [13]:
import torch.optim as optim
from time import perf_counter
loss_fn = nn.CrossEntropyLoss()
loss_fn = loss_fn.cuda()
optimizer = optim.Adam(model.parameters(), lr = 0.0001)
t1 = perf_counter()
t  = t1
for i in range(100):
    index = 0
    print("epoch",i)
    for input, target in dataset:
        if torch.cuda.is_available():
            input = Variable(input.cuda())
            target = Variable(target.cuda())
        else:
            input, target = Variable(input), Variable(target)    
        output = model(input.float()/((255.)**2)**0.5)
        optimizer.zero_grad()
        loss = loss_fn(output, target.long())
        loss.backward()
        optimizer.step()
        index+=1
        if(perf_counter()-t > 30):
            t = perf_counter()
            print("  Completion ratio :",str(index*100.0/60)+"%")
    ans=0
    for j in range(10):        
        output = test[j][0].cuda()
        output = model(output.float())
        print(output)
        tmp = output.data.cpu().numpy() 
        print(tmp)
        if(tmp[0][0]>tmp[0][1] and j<5):
            ans+=1
        if(tmp[0][0]<tmp[0][1] and j>=5):
            ans+=1
    print("  accuracy :",str(ans*100/10.)+"%")

        
t2  = perf_counter()

print(model)
print("--------------------------------------")
print("layer1 :","\nweight :\n",model.layer()[0][0].cpu().numpy(),"\nbias :\n",model.layer()[0][1].cpu().numpy())
print("")
print("layer2 :","\nweight :\n",model.layer()[1][0].cpu().numpy(),"\nbias :\n",model.layer()[1][1].cpu().numpy())
print("time :",str((t2-t1)/60.0)+"min")
print("\ntest.....")

epoch 0
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
  accuracy : 50.0%
epoch 1
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
  accuracy : 50.0%
epoch 2
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
  accuracy : 50.0%
epoch 3
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
  accuracy : 50.0%
epoch 4
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
  accuracy : 50.0%
epoch 5
  Completion ratio : 35.0%
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
[[1. 0.]]
  accuracy : 50.0%
epoch 6


KeyboardInterrupt: 