# Softmax and Cross-entropy


In [4]:
import torch
import torch.nn as nn
import numpy as np


In [5]:
# Softmax in Numpy
def softmax(x):
    """Return the softmax of ``x`` taken along axis 0.

    Each value is exponentiated and divided by the sum of exponentials
    along axis 0, so every slice along that axis sums to 1.

    Args:
        x: Array-like of scores. For 2-D input each column is normalised
            independently (the reduction runs over axis 0).

    Returns:
        A NumPy array with the same shape as ``x``.
    """
    x = np.asarray(x)
    if x.size == 0:
        # Nothing to normalise; exp() yields the same-shape float result.
        return np.exp(x)
    # Softmax is invariant to adding a constant along the reduced axis.
    # Subtracting the max keeps exp() from overflowing to inf (and the
    # ratio from becoming nan) when the scores are large.
    shifted = x - np.max(x, axis=0, keepdims=True)
    exps = np.exp(shifted)
    return exps / np.sum(exps, axis=0)


# Example input vector; softmax turns it into values that sum to 1.
x = np.array([2.0, 1.0, 0.1])
outputs = softmax(x)
# The largest input (2.0) receives the largest share of the output.
print('Softmax numpy: ', outputs)


Softmax numpy:  [0.65900114 0.24243297 0.09856589]


In [6]:
# Softmax in PyTorch
# torch.tensor() is the documented factory for building a tensor from data;
# for Python floats it produces the same float32 values as torch.Tensor().
x = torch.tensor([2.0, 1.0, 0.1])
# dim=0 normalises over the only axis of this 1-D tensor.
outputs = torch.softmax(x, dim=0)
print('Softmax Tensor: ', outputs)


Softmax Tensor:  tensor([0.6590, 0.2424, 0.0986])


In [7]:
# Cross-Entropy in numpy
def cross_entropy(actual, predicted, eps=1e-12):
    """Return the cross-entropy ``-sum(actual * log(predicted))``.

    Args:
        actual: Array-like of target weights (e.g. a one-hot vector).
        predicted: Array-like of predicted probabilities, same shape as
            ``actual``.
        eps: Lower bound applied to ``predicted`` before taking the log.

    Returns:
        The summed loss as a NumPy scalar. The sum is not divided by the
        number of samples.
    """
    # log(0) is -inf, and 0 * -inf is nan, so a zero probability would make
    # the loss nan even for a perfect one-hot prediction. Clipping from
    # below keeps every term finite without changing non-zero inputs.
    safe_predicted = np.clip(predicted, eps, None)
    loss = -np.sum(actual * np.log(safe_predicted))
    return loss


# One-hot target: only index 0 is non-zero, so only the probability
# predicted at index 0 contributes to the loss.
Y = np.array([1, 0, 0])
# y_good puts 0.7 on index 0; y_bad puts only 0.1 there.
y_good = np.array([0.7, 0.2, 0.1])
y_bad = np.array([0.1, 0.3, 0.6])

l1 = cross_entropy(Y, y_good)
l2 = cross_entropy(Y, y_bad)
# The lower the probability at the target index, the higher the loss.
print(f'Loss1 numpy: {l1:.4f}')
print(f'Loss2 numpy: {l2:.4f}')


Loss1 numpy: 0.3567
Loss2 numpy: 2.3026


In [10]:
# Cross-Entropy in PyTorch
# Multiclass loss criterion (for binary classification use nn.BCELoss()).
loss = nn.CrossEntropyLoss()

# Target class index for each of the 3 samples.
Y = torch.tensor([2, 0, 1])

# Raw scores, one row per sample: n_samples x n_classes = 3 x 3.
y_good = torch.tensor([
    [0.1, 1.0, 2.1],
    [2.0, 1.0, 0.1],
    [2.0, 3.0, 0.1],
])
y_bad = torch.tensor([
    [0.5, 2.0, 0.3],
    [0.5, 2.0, 0.3],
    [3.5, 2.0, 0.3],
])

l1, l2 = loss(y_good, Y), loss(y_bad, Y)
print(f'Loss1 PyTorch: {l1.item():.4f}')
print(f'Loss2 PyTorch: {l2.item():.4f}')

# The predicted class is the column index of the largest score in each row.
predictions1 = torch.argmax(y_good, dim=1)
predictions2 = torch.argmax(y_bad, dim=1)
print(predictions1)
print(predictions2)

# Note: for multiclass classification you do not need to apply softmax
# yourself before computing the loss with nn.CrossEntropyLoss.
# For binary classification, however, you apply a sigmoid at the end.


Loss1 PyTorch: 0.3846
Loss2 PyTorch: 1.8718
tensor([2, 0, 1])
tensor([1, 1, 0])


# Activation Functions


In [None]:
import torch.nn.functional as F

In [None]:
# option1
class NeuralNet(nn.Module):
    """Two-layer network with activations held as ``nn.Module`` attributes.

    Pipeline: Linear(input_size -> hidden_size) -> ReLU ->
    Linear(hidden_size -> 1) -> Sigmoid.

    Args:
        input_size: Number of features expected in the last input dimension.
        hidden_size: Width of the hidden layer.
    """

    def __init__(self, input_size, hidden_size):
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        self.linear2 = nn.Linear(hidden_size, 1)
        self.sigmoid = nn.Sigmoid()

    def forward(self, x):
        """Run ``x`` through the network and return values in (0, 1).

        Each stage must consume the previous stage's output; feeding ``x``
        to every stage would discard the linear layers entirely.
        """
        out = self.linear1(x)
        out = self.relu(out)
        out = self.linear2(out)
        out = self.sigmoid(out)
        return out


# option2
class NeuralNet(nn.Module):
    """Two-layer network that applies activations as functions in ``forward``.

    Pipeline: Linear(input_size -> hidden_size) -> ReLU ->
    Linear(hidden_size -> 1) -> Sigmoid.

    Args:
        input_size: Number of features expected in the last input dimension.
        hidden_size: Width of the hidden layer.
    """

    def __init__(self, input_size, hidden_size):
        super().__init__()
        self.linear1 = nn.Linear(input_size, hidden_size)
        self.linear2 = nn.Linear(hidden_size, 1)

    def forward(self, x):
        """Run ``x`` through the network and return values in (0, 1)."""
        out = torch.relu(self.linear1(x))
        # The second layer must take the hidden activation, not the raw input.
        out = torch.sigmoid(self.linear2(out))
        # Activations not exposed on the torch namespace can be taken from
        # torch.nn.functional instead, e.g. F.leaky_relu().
        return out
