In [27]:
import numpy as np
import pandas as pd
from sklearn.preprocessing import LabelEncoder, StandardScaler
from sklearn.model_selection import train_test_split
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import LSTM, Dense
from tensorflow.keras.utils import to_categorical


In [28]:
# Load dataset
df = pd.read_csv('Dataset_timeseries.csv')

In [32]:

# Encode the class labels
label_encoder = LabelEncoder()
df['Number'] = label_encoder.fit_transform(df['Number'])

# Normalize the 'sopas' column
scaler = StandardScaler()
df['SOPAS'] = scaler.fit_transform(df[['SOPAS']])

In [34]:
sequence_length = 604  # Given length of each example

# Calculate the number of complete sequences
num_complete_sequences = len(df) // sequence_length

# Trim the DataFrame to have a multiple of sequence_length rows
df = df.iloc[:num_complete_sequences * sequence_length]

# Reshape the data into sequences
X = df[['SOPAS']].values.reshape(-1, sequence_length, 1)
y = df['Number'].values[::sequence_length]

# One-hot encode the labels
y = to_categorical(y)

# Split into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)


In [43]:
from tensorflow.keras.layers import Dropout

model = Sequential()
model.add(LSTM(30, activation='relu', input_shape=(sequence_length, 1)))
model.add(Dropout(0.2))  # Add dropout layer with 20% dropout rate
model.add(Dense(15, activation='relu'))
model.add(Dropout(0.2))  # Add another dropout layer
model.add(Dense(y.shape[1], activation='softmax'))

model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])


In [44]:
history = model.fit(X_train, y_train, epochs=20, batch_size=32, validation_data=(X_test, y_test))

# Evaluate the model
loss, accuracy = model.evaluate(X_test, y_test)
print(f"Test Accuracy: {accuracy}")

# Plot training history
import matplotlib.pyplot as plt

# Plot training & validation accuracy values
plt.figure(figsize=(12, 6))
plt.plot(history.history['accuracy'], label='Train Accuracy')
plt.plot(history.history['val_accuracy'], label='Val Accuracy')
plt.title('Model accuracy')
plt.ylabel('Accuracy')
plt.xlabel('Epoch')
plt.legend(loc='upper left')
plt.show()

# Plot training & validation loss values
plt.figure(figsize=(12, 6))
plt.plot(history.history['loss'], label='Train Loss')
plt.plot(history.history['val_loss'], label='Val Loss')
plt.title('Model loss')
plt.ylabel('Loss')
plt.xlabel('Epoch')
plt.legend(loc='upper left')
plt.show()


Epoch 1/20
[1m9/9[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m6s[0m 276ms/step - accuracy: 0.0789 - loss: 1.4173 - val_accuracy: 0.1618 - val_loss: 1.3897
Epoch 2/20
[1m9/9[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 215ms/step - accuracy: 0.2919 - loss: 1.3786 - val_accuracy: 0.3235 - val_loss: 1.3565
Epoch 3/20
[1m9/9[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 231ms/step - accuracy: 0.5352 - loss: 1.3313 - val_accuracy: 0.3529 - val_loss: 1.3248
Epoch 4/20
[1m9/9[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 238ms/step - accuracy: 0.5258 - loss: 1.2895 - val_accuracy: 0.3382 - val_loss: 1.2912
Epoch 5/20
[1m9/9[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 220ms/step - accuracy: 0.5187 - loss: 1.2264 - val_accuracy: 0.3382 - val_loss: 1.2504
Epoch 6/20
[1m9/9[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 221ms/step - accuracy: 0.4337 - loss: nan - val_accuracy: 0.5588 - val_loss: nan
Epoch 7/20
[1m9/9[0m [32m━━━━━━━━━━━━━━━━━━