In [23]:
import torch
import torch.nn as nn
import torchvision
import torchvision.transforms as transforms
import torch.optim as optim

In [25]:
# Run on the GPU when CUDA is usable; otherwise fall back to the CPU.
device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')

In [57]:
# Hyperparameters for the toy next-word model.
embedding_dim = 10     # size of each word embedding vector
hidden_size = 16       # width of the RNN hidden state
num_layers = 1         # number of stacked RNN layers
learning_rate = 0.001  # Adam step size
num_epochs = 50        # optimisation steps over the single training example
SEED = 42              # fixed RNG seed so parameter initialisation is repeatable

# NOTE: `vocab_size` and `TextRNN` are defined in the data-preparation /
# model-definition cell; that cell has to be executed before this one.

# Seed before constructing the model: the embedding, RNN and linear weights are
# drawn randomly, so without a fixed seed every run trains from a different start.
torch.manual_seed(SEED)

model = TextRNN(vocab_size, embedding_dim, hidden_size, num_layers).to(device)
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

In [31]:
sentence = "the cat is sleeping"
words = sentence.split()

# Create a vocabulary.
# Sort the unique words so the word -> index mapping is the same on every run;
# iterating a bare set of strings follows hash order, which Python randomises
# per process, so list(set(words)) could assign different indices each restart.
vocab = sorted(set(words))
word_to_idx = {word: idx for idx, word in enumerate(vocab)}
idx_to_word = {idx: word for word, idx in word_to_idx.items()}
vocab_size = len(vocab)

# Prepare input and target: the first three words are the context,
# the fourth word is the label to predict.
input_words = words[:3]
target_word = words[3]

input_indices = [word_to_idx[w] for w in input_words]
target_index = word_to_idx[target_word]

# Wrap in an outer list so the input has a leading batch dimension: shape (1, 3).
input_tensor = torch.tensor([input_indices], dtype=torch.long, device=device)
# One class index per batch element: shape (1,).
target_tensor = torch.tensor([target_index], dtype=torch.long, device=device)

#  Define RNN model
class TextRNN(nn.Module):
    """Embedding -> RNN -> linear classifier that scores the next token.

    Args:
        vocab_size: number of distinct token ids; also the size of the output layer.
        embedding_dim: dimensionality of each token embedding.
        hidden_size: width of the RNN hidden state.
        num_layers: number of stacked RNN layers.
    """

    def __init__(self, vocab_size, embedding_dim, hidden_size, num_layers):
        super().__init__()
        self.embedding = nn.Embedding(vocab_size, embedding_dim)
        self.rnn = nn.RNN(embedding_dim, hidden_size, num_layers, batch_first=True)
        self.fc = nn.Linear(hidden_size, vocab_size)

    def forward(self, x):
        """Return unnormalised scores over the vocabulary for each sequence.

        Args:
            x: integer token ids of shape (batch, seq_len).

        Returns:
            Tensor of shape (batch, vocab_size) computed from the last time step.
        """
        x = self.embedding(x)  # (batch, seq_len, embed_dim)
        # Build the zero initial state from the module's own configuration and
        # the input's device/dtype rather than from notebook-level globals, so
        # the model works for any constructor arguments and wherever it lives.
        h0 = torch.zeros(
            self.rnn.num_layers,
            x.size(0),
            self.rnn.hidden_size,
            device=x.device,
            dtype=x.dtype,
        )
        out, _ = self.rnn(x, h0)  # out: (batch, seq_len, hidden_size)
        out = out[:, -1, :]  # keep only the last time step
        return self.fc(out)  # map to vocab size


In [59]:
# Fit the model on the single (input, target) pair, reporting the loss every 10th epoch.
for epoch in range(num_epochs):
    model.train()

    # Drop gradients left over from the previous step before computing new ones.
    optimizer.zero_grad()

    outputs = model(input_tensor)
    loss = criterion(outputs, target_tensor)
    loss.backward()
    optimizer.step()

    # Only every 10th completed epoch is logged.
    if (epoch + 1) % 10 != 0:
        continue
    print(f'Epoch [{epoch+1}/{num_epochs}], Loss: {loss.item():.4f}')

Epoch [10/50], Loss: 0.8387
Epoch [20/50], Loss: 0.5693
Epoch [30/50], Loss: 0.3850
Epoch [40/50], Loss: 0.2645
Epoch [50/50], Loss: 0.1884


In [61]:
# Test: predict the next word for the training context.
# Gradients are not needed here, so the forward pass runs under no_grad.
with torch.no_grad():
    output = model(input_tensor)
    # Index of the highest-scoring vocabulary entry for the single batch element.
    predicted_idx = output.argmax(dim=1).item()

predicted_word = idx_to_word[predicted_idx]
print(f'Predicted word: {predicted_word}')

Predicted word: sleeping
