# LSTM

Test of simple MLP models with different amount of neurons, hidden layers and size of input vector

## Load Data

In [222]:
import torch
from torch.utils.data import Dataset, DataLoader, random_split
import torch.nn as nn

import pandas as pd
import numpy as np

from tqdm import tqdm

import plotly.express as px
from torch.optim import Adam


import matplotlib.pyplot as plt

In [223]:
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

In [224]:
df = pd.read_csv("data_N_6000_noise_level_0.05.csv")
df['Time'] = 1
# df_diff = pd.DataFrame(df.iloc[1:].values - df.iloc[:-1].values, columns=["dt", "dx", "dy", "dz"])

In [225]:
# df_diff.head(10)

In [226]:
class SequentDataset(Dataset):
    def __init__(self, dataframe: pd.DataFrame, n_dots=1, n_dot_parameters=4):
        self.n_dot_parameters = n_dot_parameters
        self.n_dots = n_dots
        self.X_, self.y_ = self.__make_stack(dataframe)
        print(self.X_.shape)
        print(self.y_.shape)

    def __len__(self):
        return len(self.X_)

    def __getitem__(self, idx):
        return self.X_[idx], self.y_[idx]

    def __make_stack(self, df: pd.DataFrame):
        seq_amount = df.shape[0] - 2 * self.n_dots - 1
        X = torch.zeros((seq_amount, self.n_dots, self.n_dot_parameters), dtype=torch.float32)
        y = torch.zeros((seq_amount, self.n_dots, self.n_dot_parameters), dtype=torch.float32)
        for i in range(seq_amount):
            X[i, :, :] = torch.reshape(torch.tensor(df.values[i:i+self.n_dots, :], dtype=torch.float32), (1, self.n_dots, self.n_dot_parameters))
            y[i, :, :] = torch.reshape(torch.tensor(df.values[i+1:i+1+self.n_dots, :], dtype=torch.float32), (1, self.n_dots, self.n_dot_parameters))

        # stacks = [[df.iloc[:-self.n_dots]]] + [df.iloc[i:].values if (self.n_dots == i) else df.iloc[i:-(self.n_dots - i)].values for i in range(1, self.n_dots + 1)]
        return (X, y)

In [227]:
N_DOTS = 100
BATCH_SIZE = 16
N_DOT_PARAMETERS = 4
N_LSTM_LAYERS = 1

In [228]:
# dataset = SequentDataset(df_diff[0:5000], n_dots=N_DOTS, n_dot_parameters=N_DOT_PARAMETERS)
# test = SequentDataset(df_diff[5000:6000], n_dots=N_DOTS, n_dot_parameters=N_DOT_PARAMETERS)
dataset = SequentDataset(df[0:5000], n_dots=N_DOTS, n_dot_parameters=N_DOT_PARAMETERS)
test = SequentDataset(df[5000:6000], n_dots=N_DOTS, n_dot_parameters=N_DOT_PARAMETERS)

torch.Size([4799, 100, 4])
torch.Size([4799, 100, 4])
torch.Size([799, 100, 4])
torch.Size([799, 100, 4])


In [229]:
dataset[0]

(tensor([[ 1.0000e+00, -1.0888e+00, -1.8649e+00,  1.9545e+00],
         [ 1.0000e+00, -1.0216e+00, -1.7815e+00,  2.0276e+00],
         [ 1.0000e+00, -1.0424e+00, -1.8584e+00,  2.0272e+00],
         [ 1.0000e+00, -1.0288e+00, -1.8702e+00,  1.9862e+00],
         [ 1.0000e+00, -1.0438e+00, -1.8642e+00,  2.0225e+00],
         [ 1.0000e+00, -1.0778e+00, -1.8049e+00,  2.0375e+00],
         [ 1.0000e+00, -1.0461e+00, -1.8762e+00,  1.9884e+00],
         [ 1.0000e+00, -1.0479e+00, -1.8682e+00,  2.0233e+00],
         [ 1.0000e+00, -1.0967e+00, -1.8871e+00,  2.0040e+00],
         [ 1.0000e+00, -1.0816e+00, -1.8685e+00,  1.9764e+00],
         [ 1.0000e+00, -1.0826e+00, -1.8953e+00,  1.9638e+00],
         [ 1.0000e+00, -1.1065e+00, -1.9204e+00,  1.9312e+00],
         [ 1.0000e+00, -1.0289e+00, -1.9056e+00,  1.9660e+00],
         [ 1.0000e+00, -1.1181e+00, -1.8694e+00,  1.9205e+00],
         [ 1.0000e+00, -1.0807e+00, -1.9166e+00,  1.9936e+00],
         [ 1.0000e+00, -1.0872e+00, -1.9414e+00,  1.903

In [230]:
train_data, val_data = random_split(dataset,[0.8,0.2])

train_loader = DataLoader(train_data, batch_size=N_DOTS, shuffle=True)
val_loader = DataLoader(val_data, batch_size=N_DOTS, shuffle=False)
test_loader = DataLoader(test, batch_size=N_DOTS, shuffle=False)

## Create Model

In [231]:
class LSTMModel(nn.Module):
    def __init__(self, input_size=4, hidden_layer_size=100, output_size=4, num_layers=10):
        super(LSTMModel, self).__init__()
        self.hidden_layer_size = hidden_layer_size
        self.num_layers = num_layers

        # Define the LSTM layer
        self.lstm = nn.LSTM(input_size, hidden_layer_size, num_layers, batch_first=True)

        # Define the output layer
        self.linear = nn.Linear(hidden_layer_size, output_size)

    def forward(self, x):
        x = x.to(device)
        batch_size = x.size(0)
        self.h = torch.zeros(self.num_layers, batch_size, self.hidden_layer_size).requires_grad_()
        self.h = self.h.to(device)
        self.c = torch.zeros(self.num_layers, batch_size, self.hidden_layer_size).requires_grad_()
        self.c = self.c.to(device)
        out, _ = self.lstm(x, (self.h, self.c))

        # print(out.size())

        # Pass through fully connected layer
        out = self.linear(out)  # We want the output corresponding to the last time step
        return out


In [232]:
model = LSTMModel(input_size=N_DOT_PARAMETERS, num_layers=N_LSTM_LAYERS).to(device)

# loss_model = nn.MSELoss(reduction='mean')
loss_model = nn.L1Loss(reduction='mean')

opt = Adam(model.parameters(), lr=0.001)
lr_scheduler = torch.optim.lr_scheduler.StepLR(opt, step_size=10, gamma=0.95)

In [209]:
EPOCH = 250
train_losses = []
val_losses = []

for epoch in range(EPOCH):

    # Обучение
    model.train()
    train_loss = []
    for X, y in train_loader:
        X = X.to(device)
        y = y.to(device)

        y_pred = model(X)
        loss = loss_model(y_pred, y)
        train_loss.append(loss.item())

        opt.zero_grad()
        loss.backward()

        opt.step()
        mean_train_loss = sum(train_loss)/len(train_loss)
        # train_loop.set_description(f"Epoch [{epoch+1}/{EPOCH}], train_loss = {mean_train_loss:.4f}")

    train_losses.append(mean_train_loss)

    # Валидация
    model.eval()
    with torch.no_grad():
        val_loss = []
        for X, y in val_loader:
            X = X.to(device)
            y = y.to(device)
            pred = model(X)
            loss = loss_model(pred, y)
            val_loss.append(loss.item())

        mean_val_loss = sum(val_loss)/len(val_loss)
        val_losses.append(mean_val_loss)

    lr_scheduler.step()
    lr = lr_scheduler.get_last_lr()
    print(f"Epoch [{epoch+1}/{EPOCH}], train_loss = {mean_train_loss:.4f}, val_loss = {mean_val_loss:.4f}")

Epoch [1/250], train_loss = 0.9620, val_loss = 0.3732
Epoch [2/250], train_loss = 0.2028, val_loss = 0.1176
Epoch [3/250], train_loss = 0.0916, val_loss = 0.0747
Epoch [4/250], train_loss = 0.0683, val_loss = 0.0626
Epoch [5/250], train_loss = 0.0593, val_loss = 0.0581
Epoch [6/250], train_loss = 0.0545, val_loss = 0.0526
Epoch [7/250], train_loss = 0.0510, val_loss = 0.0516
Epoch [8/250], train_loss = 0.0488, val_loss = 0.0480
Epoch [9/250], train_loss = 0.0467, val_loss = 0.0457
Epoch [10/250], train_loss = 0.0447, val_loss = 0.0442
Epoch [11/250], train_loss = 0.0440, val_loss = 0.0436
Epoch [12/250], train_loss = 0.0424, val_loss = 0.0413
Epoch [13/250], train_loss = 0.0410, val_loss = 0.0409
Epoch [14/250], train_loss = 0.0401, val_loss = 0.0393
Epoch [15/250], train_loss = 0.0393, val_loss = 0.0386
Epoch [16/250], train_loss = 0.0382, val_loss = 0.0376
Epoch [17/250], train_loss = 0.0376, val_loss = 0.0369
Epoch [18/250], train_loss = 0.0368, val_loss = 0.0367
Epoch [19/250], tra

In [218]:
start, _  = test[0]
# print(start.size())
# start = torch.reshape(start, (1, start.size(0)))
predictions = []
model.eval()

for X, y in train_loader:
    with torch.no_grad():
        for i in range(N_DOTS, 500):
            y_pred = model(X)
            predictions.append(y_pred[0, -1, :])
            X[0, :-1, :] = X.clone()[0, 1:, :]
            X[0, -1, :] = y_pred[0, -1, :]

    break

In [211]:
len(predictions)

400

In [219]:
p_x = pd.DataFrame(np.vstack(list(map(lambda x: x.cpu().detach().numpy(), predictions))), columns=["Time", "X", "Y", "Z"])
_, y  = test[:500]
p_y = pd.DataFrame(y.cpu().detach().numpy()[:, 0, :], columns=["Time", "X", "Y", "Z"])

# p_x = p_x.cumsum()
# p_y = p_y.cumsum()

In [220]:
p_x["C"] = "Predict"
p_y["C"] = "True"
p_z = pd.DataFrame(start, columns=["Time", "X", "Y", "Z"])
p_z["C"] = "Start"
d = pd.concat([p_x,p_y, p_z],axis=0)


In [221]:
fig = px.line_3d(d, x="X", y="Y", z="Z", color='C',markers=0)
# fig = px.scatter_3d(data, x="X", y="Y", z="Z")
fig.show()