In [1]:
import torch 
import torch.nn as nn 
import numpy as np

### Softmax

#### Numpy

In [2]:
def softmax(x):
  """Return the softmax of `x`, normalised along axis 0.

  The maximum along axis 0 is subtracted before exponentiating. This does not
  change the mathematical result (the factor cancels in the ratio) but keeps
  `np.exp` from overflowing to `inf` -- and the ratio from becoming `nan` --
  when the inputs are large.

  Args:
    x: array-like of scores; normalisation runs over the first axis.

  Returns:
    A NumPy array with the same shape as `x` whose entries along axis 0 are
    non-negative and sum to 1.
  """
  x = np.asarray(x)
  if x.size == 0:
    # Nothing to normalise; np.max would raise on an empty array.
    return np.exp(x)
  shifted = x - np.max(x, axis=0, keepdims=True)
  # Exponentiate once and reuse the result for numerator and denominator.
  exps = np.exp(shifted)
  return exps / np.sum(exps, axis=0, keepdims=True)

# Example scores for three classes; the largest score should receive the
# largest probability.
x = np.array([2.0, 1.0, 0.1])

outputs = softmax(x)
print("Softmax Numpy:{}".format(outputs))

Softmax Numpy:[0.65900114 0.24243297 0.09856589]


#### Pytorch

In [3]:
# Same three scores as the NumPy example, now as a torch tensor.
x1 = torch.tensor([2.0, 1.0, 0.1])

# Normalise over the only dimension (dim=0) using the tensor-method form.
outputs = x1.softmax(dim=0)

print("Softmax Torch:{}".format(outputs))

Softmax Torch:tensor([0.6590, 0.2424, 0.0986])


### Cross-Entropy

Notes:
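  * A good prediction (high probability on the true class) gives a low cross-entropy loss
  * A bad prediction (low probability on the true class) gives a high cross-entropy loss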

#### Numpy

In [4]:
def cross_entropy(actual, predicted, eps=1e-12):
  """Cross-entropy between a target distribution and predicted probabilities.

  Computes `-sum(actual * log(predicted))` over all elements.

  Args:
    actual: array-like of target weights (e.g. a one-hot encoded class).
    predicted: array-like of predicted probabilities, same shape as `actual`.
    eps: lower bound applied to `predicted` before taking the log.

  Returns:
    The summed cross-entropy loss as a scalar.
  """
  actual = np.asarray(actual)
  # Clamp from below: log(0) is -inf, and 0 * -inf is nan, so a predicted
  # probability of exactly 0 would otherwise turn the whole loss into inf/nan
  # (even for a perfect one-hot prediction such as [1, 0, 0]).
  predicted = np.maximum(np.asarray(predicted), eps)

  return -np.sum(actual * np.log(predicted))

# One-hot encoded target: the true class is index 0.
y = np.array([1, 0, 0])

# Two candidate probability vectors: the first puts most of its mass on the
# true class, the second puts most of it elsewhere.
y_pred_good = np.array([0.7, 0.2, 0.1])
y_pred_bad = np.array([0.1, 0.3, 0.6])

# Score both candidates against the same target.
l1, l2 = (cross_entropy(y, pred) for pred in (y_pred_good, y_pred_bad))

print(
    "Loss1 Numpy:{:.4f}".format(l1),
    "Loss2 Numpy:{:.4f}".format(l2),
    sep="\n",
)

Loss1 Numpy:0.3567
Loss2 Numpy:2.3026


#### Pytorch

In [5]:
# Criterion that takes raw scores (logits) and integer class targets.
# "mean" is the library default reduction; it is spelled out for readers.
loss = nn.CrossEntropyLoss(reduction="mean")

In [6]:
# Targets for 3 samples, given as integer class indices (not one-hot vectors).
y = torch.tensor([2, 0, 1])

# Raw scores (logits), shape nsamples * nclasses = 3*3.
# In the "good" batch the largest score of every row sits at the target index;
# in the "bad" batch the first two rows favour a wrong class.
y_pred_good = torch.tensor([[0.3, 1.0, 2.0], [2.0, 1.0, 0.1], [0.1, 3.0, 0.1]])
y_pred_bad = torch.tensor([[2.1, 1.0, 0.1], [2.0, 1.0, 2.3], [0.1, 3.0, 0.1]])

l1 = loss(y_pred_good, y)
l2 = loss(y_pred_bad, y)

# These losses come from PyTorch, so label them as such (the labels previously
# said "Numpy"). .item() unwraps the 0-dim tensor into a plain Python float.
print("Loss1 Torch:{:.4f}".format(l1.item()))
print("Loss2 Torch:{:.4f}".format(l2.item()))

Loss1 Numpy:0.3200
Loss2 Numpy:1.1627


In [7]:
# Predicted class = index of the largest score in each row (dim=1).
# Tensor.max(dim=...) yields (values, indices); only the indices are needed.
_, prediction1 = y_pred_good.max(dim=1)
_, prediction2 = y_pred_bad.max(dim=1)

print(prediction1, prediction2, sep="\n")

tensor([2, 0, 1])
tensor([0, 2, 1])


### Multiclass problem

In [12]:
class NNet2(nn.Module):
  """Small fully connected classifier: Linear -> ReLU -> Linear.

  The forward pass returns raw class scores (logits); softmax is not applied
  inside the network.
  """

  def __init__(self, input_size, hidden_size, num_classes):
    """Build the two linear layers and the activation between them.

    Args:
      input_size: number of input features per sample.
      hidden_size: number of units in the hidden layer.
      num_classes: number of output scores per sample.
    """
    super().__init__()
    self.linear1 = nn.Linear(input_size, hidden_size)
    self.relu = nn.ReLU()
    self.linear2 = nn.Linear(hidden_size, num_classes)

  def forward(self, x):
    """Map a batch of inputs to one raw score per class."""
    hidden = self.relu(self.linear1(x))
    # Deliberately no softmax here: the output stays as unnormalised scores.
    return self.linear2(hidden)

In [13]:
# nn.CrossEntropyLoss applies the softmax step itself, which is why the model
# is left to output raw scores.
criterion = nn.CrossEntropyLoss()

# 28*28 input features, a 5-unit hidden layer and 3 output classes.
model = NNet2(
    input_size=28 * 28,
    hidden_size=5,
    num_classes=3,
)