In [3]:
import torch
import torch.nn as nn
import torch.nn.functional as F

In [1]:
# Hyperparameters

# Model geometry: the recurrent layers consume `input_size` features per time
# step, and the classifier head is sized for `sequence_length` time steps.
input_size, sequence_length = 28, 28
hidden_size, num_layers = 256, 2
num_classes = 10

# Optimisation / training-loop settings.
num_epochs = 3
batch_size = 64
learning_rate = 0.005

In [4]:
# Recurrent Neural Network (many-to-one)

class RNN(nn.Module):
    """Many-to-one vanilla RNN classifier.

    Runs a stacked ``nn.RNN`` over the input sequence, flattens the hidden
    states of every time step into one vector per sample, and maps that
    vector to class scores with a single linear layer.

    Args:
        input_size: Number of features per time step.
        hidden_size: Number of features in each recurrent hidden state.
        num_layers: Number of stacked recurrent layers.
        num_classes: Number of scores produced per sample.
        seq_len: Number of time steps per input sequence; it sizes the linear
            layer. When ``None``, the module-level ``sequence_length`` is used.
    """

    def __init__(self, input_size, hidden_size, num_layers, num_classes, seq_len=None):
        super().__init__()
        if seq_len is None:
            # Backward-compatible fallback to the notebook-level hyperparameter.
            seq_len = sequence_length
        self.hidden_size = hidden_size
        self.num_layers = num_layers
        self.rnn = nn.RNN(input_size, hidden_size, num_layers, batch_first=True)
        # The head sees the hidden states of all time steps concatenated.
        self.fc = nn.Linear(hidden_size * seq_len, num_classes)

    def forward(self, x):
        """Compute class scores for a batch of sequences.

        Args:
            x: Tensor of shape (batch, seq_len, input_size).

        Returns:
            Tensor of shape (batch, num_classes).
        """
        # Initial hidden state, created on the same device/dtype as the input
        # so the module does not depend on a global `device` variable.
        h0 = torch.zeros(
            self.num_layers,
            x.size(0),
            self.hidden_size,
            device=x.device,
            dtype=x.dtype,
        )

        # Forward propagate: nn.RNN expects (input, h_0), in that order.
        out, _ = self.rnn(x, h0)  # out: (batch, seq_len, hidden_size)
        out = out.reshape(out.shape[0], -1)

        # Decode the flattened hidden states into class scores.
        return self.fc(out)

In [5]:
# Recurrent neural network with GRU (many-to-one)

class GRU(nn.Module):
    """Many-to-one GRU classifier.

    Runs a stacked ``nn.GRU`` over the input sequence, flattens the hidden
    states of every time step into one vector per sample, and maps that
    vector to class scores with a single linear layer.

    Args:
        input_size: Number of features per time step.
        hidden_size: Number of features in each recurrent hidden state.
        num_layers: Number of stacked recurrent layers.
        num_classes: Number of scores produced per sample.
        seq_len: Number of time steps per input sequence; it sizes the linear
            layer. When ``None``, the module-level ``sequence_length`` is used.
    """

    def __init__(self, input_size, hidden_size, num_layers, num_classes, seq_len=None):
        super().__init__()
        if seq_len is None:
            # Backward-compatible fallback to the notebook-level hyperparameter.
            seq_len = sequence_length
        self.hidden_size = hidden_size
        self.num_layers = num_layers
        self.gru = nn.GRU(input_size, hidden_size, num_layers, batch_first=True)
        # The head sees the hidden states of all time steps concatenated.
        self.fc = nn.Linear(hidden_size * seq_len, num_classes)

    def forward(self, x):
        """Compute class scores for a batch of sequences.

        Args:
            x: Tensor of shape (batch, seq_len, input_size).

        Returns:
            Tensor of shape (batch, num_classes).
        """
        # Initial hidden state (a GRU has no separate cell state), created on
        # the input's device/dtype instead of relying on a global `device`.
        h0 = torch.zeros(
            self.num_layers,
            x.size(0),
            self.hidden_size,
            device=x.device,
            dtype=x.dtype,
        )

        # Forward propagate: nn.GRU expects (input, h_0), in that order.
        out, _ = self.gru(x, h0)  # out: (batch, seq_len, hidden_size)
        out = out.reshape(out.shape[0], -1)

        # Decode the flattened hidden states into class scores.
        return self.fc(out)

In [None]:
# Recurrent neural network with LSTM (many-to-one)

class LSTM(nn.Module):
    """Many-to-one LSTM classifier.

    Runs a stacked ``nn.LSTM`` over the input sequence, flattens the hidden
    states of every time step into one vector per sample, and maps that
    vector to class scores with a single linear layer.

    Args:
        input_size: Number of features per time step.
        hidden_size: Number of features in each hidden/cell state.
        num_layers: Number of stacked recurrent layers.
        num_classes: Number of scores produced per sample.
        seq_len: Number of time steps per input sequence; it sizes the linear
            layer. When ``None``, the module-level ``sequence_length`` is used.
    """

    def __init__(self, input_size, hidden_size, num_layers, num_classes, seq_len=None):
        # Zero-argument super(): the original named a different class here,
        # which makes construction fail.
        super().__init__()
        if seq_len is None:
            # Backward-compatible fallback to the notebook-level hyperparameter.
            seq_len = sequence_length
        self.hidden_size = hidden_size
        self.num_layers = num_layers
        self.lstm = nn.LSTM(input_size, hidden_size, num_layers, batch_first=True)
        # The head sees the hidden states of all time steps concatenated.
        self.fc = nn.Linear(hidden_size * seq_len, num_classes)

    def forward(self, x):
        """Compute class scores for a batch of sequences.

        Args:
            x: Tensor of shape (batch, seq_len, input_size).

        Returns:
            Tensor of shape (batch, num_classes).
        """
        # Initial hidden and cell states, created on the input's device/dtype
        # instead of relying on a global `device` variable.
        state_shape = (self.num_layers, x.size(0), self.hidden_size)
        h0 = torch.zeros(state_shape, device=x.device, dtype=x.dtype)
        c0 = torch.zeros(state_shape, device=x.device, dtype=x.dtype)

        # Forward propagate
        out, _ = self.lstm(x, (h0, c0))  # out: (batch, seq_len, hidden_size)
        out = out.reshape(out.shape[0], -1)

        # Decode the flattened hidden states into class scores.
        return self.fc(out)