## Softmax

In [1]:
import torch
import torch.nn as nn
import numpy as np

In [2]:
def softmax(x, axis=0):
    """Numerically stable softmax of ``x`` along ``axis``.

    Args:
        x: Array-like of scores.
        axis: Axis along which the scores are normalized. Defaults to 0,
            which matches the original behaviour of this function.

    Returns:
        np.ndarray with the same shape as ``x`` whose entries are positive
        and sum to 1 along ``axis``.
    """
    x = np.asarray(x)
    if x.size == 0:
        # Nothing to normalize; np.max would raise on an empty reduction.
        return np.exp(x)
    # softmax(x) == softmax(x - c) for any constant c. Shifting by the max
    # keeps every exponent <= 0, so np.exp cannot overflow to inf (which
    # would turn the result into nan via inf / inf).
    shifted = x - np.max(x, axis=axis, keepdims=True)
    exps = np.exp(shifted)
    return exps / np.sum(exps, axis=axis, keepdims=True)

In [3]:
# Raw scores [1, 2, 3]; softmax maps them to probabilities that sum to 1.
x = np.arange(1, 4)
outputs = softmax(x)
print('Softmax numpy:', outputs)

Softmax numpy: [0.09003057 0.24472847 0.66524096]


In [8]:
# Same scores as the NumPy example, normalized by PyTorch along dim 0.
x = torch.tensor([1.0, 2.0, 3.0])
outputs = x.softmax(dim=0)
print('Softmax torch:', outputs)

Softmax torch: tensor([0.0900, 0.2447, 0.6652])


## Cross Entropy Loss

In [10]:
def cross_entropy(actual, predicted, eps=1e-15):
    """Cross-entropy between a target distribution and predicted probabilities.

    Computes ``-sum(actual * log(predicted))`` over all elements (the result
    is not divided by the number of samples).

    Args:
        actual: Array-like target distribution, e.g. a one-hot vector.
        predicted: Array-like predicted probabilities, same shape as ``actual``.
        eps: Lower bound applied to ``predicted`` before taking the log.

    Returns:
        The summed cross-entropy loss as a float scalar.
    """
    actual = np.asarray(actual, dtype=float)
    # log(0) is -inf, and 0 * -inf is nan, so an exact-zero probability would
    # poison the whole sum. Flooring at eps keeps the loss finite while
    # leaving any probability >= eps untouched.
    predicted = np.maximum(np.asarray(predicted, dtype=float), eps)
    loss = -np.sum(actual * np.log(predicted))
    return loss

In [11]:
# Ground-truth label as a one-hot vector (class 0 is the true class);
# cross_entropy() multiplies it element-wise with the log-probabilities.
Y = np.asarray([1, 0, 0])

In [12]:
# Predicted class probabilities: the "good" one puts most mass on the true
# class (index 0), the "bad" one puts most mass on index 2.
Y_pred_good = np.array([0.7, 0.2, 0.1])
Y_pred_bad = np.array([0.1, 0.3, 0.6])
l1, l2 = (cross_entropy(Y, probs) for probs in (Y_pred_good, Y_pred_bad))
print('Cross-entropy loss:', l1, l2)

Cross-entropy loss: 0.35667494393873245 2.3025850929940455


In [15]:
# nn.CrossEntropyLoss is fed raw scores (one row per sample) together with
# integer class labels rather than one-hot vectors: one sample, true class 0.
loss = nn.CrossEntropyLoss()
Y = torch.tensor([0])

Y_pred_good = torch.tensor([[2.0, 1.0, 0.1]])  # largest score on class 0
Y_pred_bad = torch.tensor([[0.5, 2.0, 0.3]])   # largest score on class 1

l1, l2 = (loss(scores, Y) for scores in (Y_pred_good, Y_pred_bad))
print('Cross-entropy loss:', l1.item(), l2.item())

Cross-entropy loss: 0.4170299470424652 1.840616226196289


In [19]:
# Reducing with max over dim 1 yields (values, indices); the index of the
# largest score in each row is the predicted class.
_, predictions1 = Y_pred_good.max(dim=1)
_, predictions2 = Y_pred_bad.max(dim=1)
print('Predictions:\n', predictions1.item(),'\n', predictions2.item())

Predictions:
 0 
 1


In [20]:
# 3 samples: one class index per sample, one row of raw scores per sample
Y = torch.tensor([2, 0, 1])

Y_pred_good = torch.tensor([
    [0.1, 1.0, 2.1],
    [2.0, 1.0, 0.1],
    [0.1, 3.0, 0.1],
])
Y_pred_bad = torch.tensor([
    [2.1, 1.0, 0.1],
    [0.1, 1.0, 2.1],
    [0.1, 3.0, 0.1],
])

In [21]:
# Evaluate the same criterion on the 3-sample batch for both sets of scores.
l1, l2 = (loss(scores, Y) for scores in (Y_pred_good, Y_pred_bad))
print('Cross-entropy loss:', l1.item(), l2.item())

Cross-entropy loss: 0.3018244206905365 1.6241613626480103


In [23]:
# Per-row index of the largest score = predicted class for each sample.
_, predictions1 = Y_pred_good.max(dim=1)
_, predictions2 = Y_pred_bad.max(dim=1)
print('Predictions:\n', predictions1,'\n', predictions2)

Predictions:
 tensor([2, 0, 1]) 
 tensor([0, 2, 1])


## Binary Classification

In [24]:
class NeuralNet1(nn.Module):
    """One-hidden-layer network with a single sigmoid output unit."""

    def __init__(self, input_size, hidden_size):
        """Create the layers.

        Args:
            input_size: Number of input features fed to the first linear layer.
            hidden_size: Number of units in the hidden layer.
        """
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        # A single output unit: the network emits one value per sample.
        self.linear2 = nn.Linear(hidden_size, 1)

    def forward(self, x):
        """Run linear -> ReLU -> linear -> sigmoid and return the result."""
        hidden = self.relu(self.linear1(x))
        # Sigmoid at the end squashes the output into (0, 1).
        return torch.sigmoid(self.linear2(hidden))
        
# The model ends in a sigmoid, so it is paired with BCELoss.
criterion = nn.BCELoss()
model = NeuralNet1(input_size=28 * 28, hidden_size=5)

## Multiclass Classification

In [26]:
# Multiclass problem
class NeuralNet2(nn.Module):
    """One-hidden-layer network that outputs one raw score per class."""

    def __init__(self, input_size, hidden_size, num_classes):
        """Create the layers.

        Args:
            input_size: Number of input features fed to the first linear layer.
            hidden_size: Number of units in the hidden layer.
            num_classes: Number of output scores produced per sample.
        """
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        self.linear2 = nn.Linear(hidden_size, num_classes)

    def forward(self, x):
        """Run linear -> ReLU -> linear and return the raw scores."""
        hidden = self.relu(self.linear1(x))
        # No softmax at the end: the output is left un-normalized.
        return self.linear2(hidden)

# The model emits raw scores; CrossEntropyLoss applies the softmax itself.
criterion = nn.CrossEntropyLoss()
model = NeuralNet2(input_size=28 * 28, hidden_size=5, num_classes=3)