<a href="https://colab.research.google.com/github/fathima6610/base/blob/main/RNN.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
import numpy as np
from keras.models import Sequential
from keras.layers import SimpleRNN, Dense, Embedding
from keras.preprocessing.text import Tokenizer
from keras.preprocessing.sequence import pad_sequences
from keras.utils import set_random_seed
from keras.utils import to_categorical

# Generating some example sequential data
sentences = ['I love learning','I love python','I hate school',
             'Recurrent Neural Networks are powerful']
# Tokenizing the words
tokenizer = Tokenizer()
tokenizer.fit_on_texts(sentences)
total_words = len(tokenizer.word_index) + 1

# Creating input sequences and their corresponding next words
input_sequences = []
for sentence in sentences:
    tokenized_sentence = tokenizer.texts_to_sequences([sentence])[0]
    for i in range(1, len(tokenized_sentence)):
        n_gram_sequence = tokenized_sentence[:i+1]
        input_sequences.append(n_gram_sequence)

# Padding sequences for consistent input size
max_sequence_length = max([len(seq) for seq in input_sequences])
input_sequences = pad_sequences(input_sequences, maxlen=max_sequence_length, padding='pre')

# Creating input and output data
X, y = input_sequences[:, :-1], input_sequences[:, -1]
y = to_categorical(y, num_classes=total_words)

# Building a simple RNN model
model = Sequential()
model.add(Embedding(input_dim=total_words, output_dim=50, input_length=max_sequence_length-1))
model.add(SimpleRNN(100, return_sequences=True))
model.add(SimpleRNN(100))
model.add(Dense(total_words, activation='softmax'))

# Compiling the model
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Training the model
model.fit(X, y, epochs=50, verbose=2)


Epoch 1/50
1/1 - 4s - loss: 2.4875 - accuracy: 0.1000 - 4s/epoch - 4s/step
Epoch 2/50
1/1 - 0s - loss: 2.3953 - accuracy: 0.3000 - 15ms/epoch - 15ms/step
Epoch 3/50
1/1 - 0s - loss: 2.3079 - accuracy: 0.3000 - 15ms/epoch - 15ms/step
Epoch 4/50
1/1 - 0s - loss: 2.2226 - accuracy: 0.3000 - 15ms/epoch - 15ms/step
Epoch 5/50
1/1 - 0s - loss: 2.1390 - accuracy: 0.3000 - 14ms/epoch - 14ms/step
Epoch 6/50
1/1 - 0s - loss: 2.0581 - accuracy: 0.3000 - 14ms/epoch - 14ms/step
Epoch 7/50
1/1 - 0s - loss: 1.9813 - accuracy: 0.3000 - 14ms/epoch - 14ms/step
Epoch 8/50
1/1 - 0s - loss: 1.9088 - accuracy: 0.3000 - 20ms/epoch - 20ms/step
Epoch 9/50
1/1 - 0s - loss: 1.8377 - accuracy: 0.3000 - 23ms/epoch - 23ms/step
Epoch 10/50
1/1 - 0s - loss: 1.7642 - accuracy: 0.4000 - 17ms/epoch - 17ms/step
Epoch 11/50
1/1 - 0s - loss: 1.6877 - accuracy: 0.4000 - 17ms/epoch - 17ms/step
Epoch 12/50
1/1 - 0s - loss: 1.6115 - accuracy: 0.4000 - 14ms/epoch - 14ms/step
Epoch 13/50
1/1 - 0s - loss: 1.5409 - accuracy: 0.400

<keras.src.callbacks.History at 0x7af5583ab6d0>

In [3]:
# Generating text using the trained model
seed_text = input("Enter the starting word: ")
next_words = int(input("Enter how many words to predict: "))

for _ in range(next_words):
    tokenized_seed = tokenizer.texts_to_sequences([seed_text])[0]
    tokenized_seed = pad_sequences([tokenized_seed], maxlen=max_sequence_length-1, padding='pre')
    predicted_word_index = np.argmax(model.predict(tokenized_seed), axis=-1)
    predicted_word = tokenizer.index_word[predicted_word_index[0]]
    seed_text += " " + predicted_word

print(seed_text)

Enter the starting word: 2
Enter how many words to predict: 1
2 love
