In [2]:
import torch
import torch.nn as nn
import numpy as np

## Objective
- linear ([2.0, 1.0, 0.1]) --> softmax (0.66, 0.24, 0.10) --> crossentropy(y, y_hat)

### Softmax

In [11]:
def softmax_np(x):
    """Compute the softmax of ``x`` along axis 0 with NumPy.

    The maximum along axis 0 is subtracted before exponentiating. Softmax is
    invariant to such a shift, so the result is mathematically unchanged, but
    ``np.exp`` can no longer overflow to ``inf`` (which would turn the output
    into ``nan``) when the scores are large.

    Args:
        x: Array-like of scores. A 1-D input is normalized as a whole; for a
            2-D input every column is normalized independently.

    Returns:
        ``np.ndarray`` with the same shape as ``x`` whose entries along
        axis 0 are non-negative and sum to 1.
    """
    x = np.asarray(x)
    if x.size == 0:
        # Nothing to normalize, and np.max would raise on an empty array.
        return np.exp(x)
    # After the shift the largest exponent is exp(0) == 1.
    shifted = x - np.max(x, axis=0, keepdims=True)
    exps = np.exp(shifted)  # computed once, reused for the normalizer
    return exps / np.sum(exps, axis=0, keepdims=True)

In [12]:
# Example scores (logits), e.g. the raw output of a final linear layer.
x = np.array([2.0, 1.0, 0.1], dtype=float)

# Turn the scores into a probability distribution and show it.
outputs = softmax_np(x)
print('softmax numpy :', outputs)

softmax numpy : [0.65900114 0.24243297 0.09856589]


In [13]:
# The same scores as a torch tensor; dim=0 normalizes over its only axis.
x = torch.tensor([2.0, 1.0, 0.1])
outputs = torch.softmax(x, dim=0)
# This result is produced by torch, so the label says so.
print('softmax torch :', outputs)

softmax numpy : tensor([0.6590, 0.2424, 0.0986])


### Cross-entropy

In [14]:
def cross_entropy(actual, predicted, eps=1e-15):
    """Cross-entropy between target and predicted probabilities.

    Evaluates ``-sum(actual * log(predicted))`` over every element, so for a
    batch of samples the result is the summed (not averaged) loss.

    Args:
        actual: Array-like of target probabilities (for example a one-hot
            vector), broadcastable against ``predicted``.
        predicted: Array-like of predicted probabilities (not raw logits).
        eps: Clipping margin. Predictions are clipped to ``[eps, 1 - eps]``
            before the logarithm so that ``log(0)`` is never evaluated.

    Returns:
        The loss as a NumPy floating-point scalar.
    """
    actual = np.asarray(actual)
    # Clip first: log(0) would give -inf, and 0 * -inf would give nan.
    predicted = np.clip(predicted, eps, 1 - eps)
    return -np.sum(actual * np.log(predicted))

In [15]:
# One-hot target: the true class is index 0.
Y = np.array([1, 0, 0])

# Two candidate probability vectors: the first puts most of its mass on the
# true class, the second puts most of it elsewhere.
Y_pred_good = np.array([0.7, 0.2, 0.1])
Y_pred_bad = np.array([0.1, 0.3, 0.6])

# The better prediction should receive the smaller loss.
l1, l2 = cross_entropy(Y, Y_pred_good), cross_entropy(Y, Y_pred_bad)
print(f'Loss1 numpy: {l1:.4f}')
print(f'Loss2 numpy: {l2:.4f}')

Loss1 numpy: 0.3567
Loss2 numpy: 2.3026


In [16]:
# PyTorch cross-entropy criterion; it is called as loss(input, target).
# reduction='mean' is the library default, written out here for clarity.
loss = nn.CrossEntropyLoss(reduction='mean')

In [22]:
# The target is passed to the criterion as a class index here, not as a
# one-hot vector: label 0 instead of [1, 0, 0].
Y = torch.tensor([0])
print(Y)

# Predictions are raw scores (logits) with one row per sample; no softmax is
# applied beforehand because nn.CrossEntropyLoss does that internally.
Y_pred_good = torch.tensor([[2.0, 1.0, 0.1]])
Y_pred_bad = torch.tensor([[0.5, 2.0, 0.3]])
l1 = loss(Y_pred_good, Y)
l2 = loss(Y_pred_bad, Y)
# These values come from the PyTorch criterion, so the labels say so.
print(f'Loss1 torch: {l1:.4f}')
print(f'Loss2 torch: {l2:.4f}')

tensor([0])
Loss1 numpy: 0.4170
Loss2 numpy: 1.8406


In [23]:
# The predicted class is the position of the largest score along dim 1.
# torch.max over a dim returns (values, indices); only the indices are kept.
predictions1 = torch.max(Y_pred_good, dim=1).indices
predictions2 = torch.max(Y_pred_bad, dim=1).indices
print(f'Actual class:{Y.item()}, Y_pred1: {predictions1.item()}, Y_pred2: {predictions2.item()}')

Actual class:0, Y_pred1: 0, Y_pred2: 1


In [25]:
# Several samples at once: one target class index per row of scores.
Y = torch.tensor([2, 0, 1])

# Scores whose largest entry in every row sits at the target class.
Y_pred_good = torch.tensor([
    [0.1, 0.2, 3.9],
    [1.2, 0.1, 0.3],
    [0.3, 2.2, 0.2],
])

# Scores whose largest entry in every row sits at a wrong class.
Y_pred_bad = torch.tensor([
    [0.9, 0.2, 0.1],
    [0.1, 0.3, 1.5],
    [1.2, 0.2, 0.5],
])

# A single scalar loss is reported for each batch.
l1, l2 = loss(Y_pred_good, Y), loss(Y_pred_bad, Y)
print(f'Batch Loss1: {l1.item():.4f}')
print(f'Batch Loss2: {l2.item():.4f}')

Batch Loss1: 0.2834
Batch Loss2: 1.6418


In [26]:
# Per-sample predicted class: index of the largest score in each row.
# torch.max over a dim returns (values, indices); only the indices are kept.
predictions1 = torch.max(Y_pred_good, dim=1).indices
predictions2 = torch.max(Y_pred_bad, dim=1).indices
print(f'Actual class: {Y}, Y_pred1: {predictions1}, Y_pred2: {predictions2}')

Actual class: tensor([2, 0, 1]), Y_pred1: tensor([2, 0, 1]), Y_pred2: tensor([0, 2, 0])


### Binary Classification

In [28]:
class NeuralNet1(nn.Module):
    """Two-layer network for binary classification.

    Layout: Linear(input_size -> hidden_size) -> ReLU ->
    Linear(hidden_size -> 1) -> sigmoid.
    """

    def __init__(self, input_size, hidden_size):
        """Build the layers.

        Args:
            input_size: Number of input features per sample.
            hidden_size: Number of units in the hidden layer.
        """
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        self.linear2 = nn.Linear(hidden_size, 1)

    def forward(self, x):
        """Return the sigmoid of the single output unit for each sample in ``x``."""
        hidden = self.relu(self.linear1(x))
        logit = self.linear2(hidden)
        # The sigmoid is applied inside the model, so outputs lie in (0, 1).
        return torch.sigmoid(logit)


# The model already applies the sigmoid, so it is paired with nn.BCELoss,
# which takes probabilities as input.
model = NeuralNet1(input_size=28 * 28, hidden_size=5)
criterion = nn.BCELoss()

### Multiclass problem

In [29]:
class NeuralNet2(nn.Module):
    """Two-layer network for multiclass classification.

    Layout: Linear(input_size -> hidden_size) -> ReLU ->
    Linear(hidden_size -> num_classes). The output is left as raw scores.
    """

    def __init__(self, input_size, hidden_size, num_classes):
        """Build the layers.

        Args:
            input_size: Number of input features per sample.
            hidden_size: Number of units in the hidden layer.
            num_classes: Number of output scores per sample.
        """
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        self.linear2 = nn.Linear(hidden_size, num_classes)

    def forward(self, x):
        """Return one raw score per class for each sample in ``x``."""
        hidden = self.relu(self.linear1(x))
        # No softmax here: nn.CrossEntropyLoss applies it internally.
        return self.linear2(hidden)


# Raw scores from the model are paired with nn.CrossEntropyLoss.
model = NeuralNet2(input_size=28 * 28, hidden_size=5, num_classes=3)
criterion = nn.CrossEntropyLoss()