In [87]:
import torch
import torch.nn as nn
import numpy as np

In [88]:
def softmax(x, axis=0):
    """Compute a numerically stable softmax of ``x`` along ``axis``.

    The maximum along ``axis`` is subtracted before exponentiating. This
    leaves the result mathematically unchanged (the factor cancels in the
    ratio) but keeps ``np.exp`` from overflowing to ``inf`` for large
    inputs, which would otherwise produce ``nan`` outputs.

    Parameters
    ----------
    x : array_like
        Input scores (logits).
    axis : int, optional
        Axis along which the outputs sum to 1. Defaults to 0.

    Returns
    -------
    numpy.ndarray
        Array with the same shape as ``x`` whose entries along ``axis``
        are non-negative and sum to 1.
    """
    x = np.asarray(x)
    if x.size == 0:
        # np.max has no identity for empty input; there is nothing to normalise.
        return np.exp(x)
    # Shift so the largest exponent is exp(0) == 1.
    shifted = x - np.max(x, axis=axis, keepdims=True)
    exps = np.exp(shifted)
    return exps / np.sum(exps, axis=axis, keepdims=True)

In [89]:
# Three raw scores to be normalised.
x = np.asarray([1, 2, 3])
# Turn the scores into values that sum to 1.
outputs = softmax(x)

print(f"softmax numpy {outputs}")



softmax numpy [0.09003057 0.24472847 0.66524096]


In [90]:
 x = torch.tensor([1, 2, 3], dtype=torch.float32)
outputs = torch.softmax(x, dim=0)

print(f"softmax torch {outputs}")

softmax torch tensor([0.0900, 0.2447, 0.6652])


In [91]:
def cross_entropy(actual, predicted, eps=1e-15):
    """Return the cross-entropy ``-sum(actual * log(predicted))``.

    Predicted values are clipped from below at ``eps`` before the
    logarithm is taken. Without the clip, a predicted value of exactly 0
    gives ``log(0) = -inf``, and ``0 * -inf`` evaluates to ``nan``, so
    even a perfect one-hot prediction such as ``[1, 0, 0]`` would return
    ``nan`` instead of 0.

    Parameters
    ----------
    actual : array_like
        Target distribution (e.g. a one-hot vector).
    predicted : array_like
        Predicted probabilities, same shape as ``actual``.
    eps : float, optional
        Lower bound applied to ``predicted`` before the logarithm.

    Returns
    -------
    float
        The summed cross-entropy over all elements.
    """
    actual = np.asarray(actual, dtype=float)
    # Only the lower bound is clipped; values above eps pass through unchanged.
    predicted = np.clip(np.asarray(predicted, dtype=float), eps, None)
    loss = -np.sum(actual * np.log(predicted))
    return loss

# One-hot target: the true class is index 0.
Y = np.array([1, 0, 0])

# Two candidate probability vectors: one puts most mass on index 0,
# the other puts most mass on index 2.
y_pred_good = np.array([0.7, 0.2, 0.1])
y_pred_bad = np.array([0.1, 0.3, 0.6])

l1 = cross_entropy(actual=Y, predicted=y_pred_good)
l2 = cross_entropy(actual=Y, predicted=y_pred_bad)

print(f"Loss1 numpy: {l1:.4f}")
print(f"Loss2 numpy: {l2:.4f}")

Loss1 numpy: 0.3567
Loss2 numpy: 2.3026


## PyTorch Implementation

In [92]:
# Loss module that is called below with (scores, class indices).
loss = nn.CrossEntropyLoss()

# Target class index for each of the three samples.
Y = torch.tensor([2, 0, 1], dtype=torch.long)

# Scores whose largest entry in every row sits at the target index.
Y_pred_good = torch.tensor(
    [
        [0.1, 1.0, 2.1],
        [2.0, 1.0, 0.1],
        [0.1, 3.0, 0.1],
    ],
    dtype=torch.float,
)
# Scores whose first two rows peak at a non-target index; the third row
# is identical to the one in Y_pred_good.
Y_pred_bad = torch.tensor(
    [
        [2.1, 1.0, 0.1],
        [0.1, 1.0, 2.1],
        [0.1, 3.0, 0.1],
    ],
    dtype=torch.float,
)

l1 = loss(Y_pred_good, Y)
l2 = loss(Y_pred_bad, Y)

print(f"l1: {l1.item()}")
print(f"l2: {l2.item()}")


l1: 0.3018244206905365
l2: 1.6241613626480103


In [93]:
# Predicted class per sample = index of the largest score along dim 1.
# torch.argmax is used rather than unpacking torch.max into `_`, because
# assigning to `_` in a notebook rebinds IPython's "last output" variable.
predictions_1 = torch.argmax(Y_pred_good, dim=1)
predictions_2 = torch.argmax(Y_pred_bad, dim=1)

In [94]:
# Show the predicted class index for each sample under both sets of scores.
print(f"prediction 1: {predictions_1}")
print(f"prediction 2: {predictions_2}")

prediction 1: tensor([2, 0, 1])
prediction 2: tensor([0, 2, 1])


## Multi-class Classification

In [95]:
class MultiClassifier(nn.Module):
    """Feed-forward network: Linear -> ReLU -> Linear.

    The final layer has ``num_classes`` outputs and no activation is
    applied after it, so ``forward`` returns the raw output of that layer.

    Args:
        input_size: Number of input features.
        hidden_size: Number of units in the hidden layer.
        num_classes: Number of output scores.
    """

    def __init__(self, input_size, hidden_size, num_classes):
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        self.linear2 = nn.Linear(hidden_size, num_classes)

    def forward(self, x):
        """Apply linear1, ReLU and linear2 to ``x`` and return the result."""
        hidden = self.relu(self.linear1(x))
        return self.linear2(hidden)


# 28 * 28 = 784 input features, 5 hidden units, 3 output scores.
model = MultiClassifier(
    input_size=28 * 28,
    hidden_size=5,
    num_classes=3,
)
# forward() returns the raw linear2 output (no softmax), which is the
# input form nn.CrossEntropyLoss expects.
criterion = nn.CrossEntropyLoss()

## Binary Classification

In [96]:
class BinaryClassifier(nn.Module):
    """Feed-forward network: Linear -> ReLU -> Linear(1) -> sigmoid.

    The final layer has a single output, and ``forward`` passes it
    through a sigmoid before returning it.

    Args:
        input_size: Number of input features.
        hidden_size: Number of units in the hidden layer.
    """

    def __init__(self, input_size, hidden_size):
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        self.linear2 = nn.Linear(hidden_size, 1)

    def forward(self, x):
        """Return the sigmoid of the single output score computed from ``x``."""
        hidden = self.relu(self.linear1(x))
        score = self.linear2(hidden)
        return torch.sigmoid(score)

# 28 * 28 = 784 input features and 5 hidden units.
model = BinaryClassifier(
    input_size=28 * 28,
    hidden_size=5,
)
# forward() already applies a sigmoid, so its output is in the
# probability form nn.BCELoss takes.
criterion = nn.BCELoss()