## Numpy

In [1]:
import torch
import torch.nn as nn
import numpy as np

In [2]:
def cross_entropy(actual, predicted, eps=1e-15):
    """Return the summed cross-entropy ``-sum(actual * log(predicted))``.

    Args:
        actual: One-hot encoded target(s); any array-like.
        predicted: Predicted probabilities, broadcastable against
            ``actual``; any array-like.
        eps: Lower bound applied to ``predicted`` before the logarithm.
            Keeps exact zeros from producing ``-inf`` (and ``nan`` once
            multiplied by a zero target entry).

    Returns:
        A scalar loss. It is summed, not averaged; for a 2-D batch of
        shape (n_samples, n_classes), divide by ``predicted.shape[0]``
        to obtain the mean loss per sample.
    """
    actual = np.asarray(actual, dtype=float)
    # log(0) = -inf and 0 * -inf = nan, so a perfectly confident prediction
    # like [1, 0, 0] would otherwise yield nan instead of 0.
    predicted = np.clip(np.asarray(predicted, dtype=float), eps, None)
    loss = -np.sum(actual * np.log(predicted))
    return loss # / float(predicted.shape[0])

In [4]:
# Targets are one-hot vectors with one slot per class:
#   class 0 -> [1, 0, 0]
#   class 1 -> [0, 1, 0]
#   class 2 -> [0, 0, 1]

y = np.array([1, 0, 0])  # the true class is 0
y_pred_good = np.array([0.7, 0.2, 0.1])
y_pred_bad = np.array([0.1, 0.3, 0.6])

# Score both predictions against the same target.
l1, l2 = (cross_entropy(y, y_hat) for y_hat in (y_pred_good, y_pred_bad))

print(f'Loss1 numpy: {l1:.4f}')
print(f'Loss2 numpy: {l2:.4f}')

Loss1 numpy: 0.3567
Loss2 numpy: 2.3026


## PyTorch

Careful! <br>
nn.CrossEntropyLoss() combines nn.LogSoftmax and nn.NLLLoss (negative log-likelihood loss) <br><br>
-> Do not add a Softmax in the last layer; the loss applies it internally!

* Y holds integer class indices (one per sample), not one-hot vectors!
* Y_pred holds raw scores (logits) — do not apply Softmax to them!

In [13]:
# Default CrossEntropyLoss: expects raw logits and integer class targets.
loss = nn.CrossEntropyLoss()

# One target class index per sample.
Y = torch.tensor([2, 0, 1])

# Raw scores (logits), n_samples x n_classes = 3 x 3
Y_pred_good = torch.tensor([[0.1, 1.0, 2.1],
                            [2.0, 1.0, 0.1],
                            [0.1, 3.0, 0.1]])
Y_pred_bad = torch.tensor([[0.5, 2.0, 0.3],
                           [0.1, 1.0, 2.1],
                           [0.1, 3.0, 0.1]])

l1 = loss(Y_pred_good, Y)
l2 = loss(Y_pred_bad, Y)

print(f'Loss1 PyTorch: {l1.item():.4f}')
print(f'Loss2 PyTorch: {l2.item():.4f}')

# Predicted class = index of the largest logit in each row (dim=1).
# argmax is used instead of `_, idx = torch.max(...)` so the cell does not
# bind `_`, which would shadow IPython's last-output variable.
prediction1 = torch.argmax(Y_pred_good, dim=1)
prediction2 = torch.argmax(Y_pred_bad, dim=1)

print(prediction1)
print(prediction2)

Loss1 PyTorch: 0.3018
Loss2 PyTorch: 1.5097
tensor([2, 0, 1])
tensor([1, 2, 1])
