In [1]:
#@title Packages

import pandas as pd
import numpy as np
import random
import math
from sklearn import preprocessing
from sklearn.preprocessing import MinMaxScaler
from sklearn.metrics import mean_squared_error  
import tensorflow as tf
from tensorflow.keras.models import Sequential, Model
from tensorflow.keras.layers import LSTM, Dense, Dropout, BatchNormalization, GRU, Bidirectional, Input, Attention, Concatenate, GlobalAveragePooling1D, LeakyReLU
from tensorflow.keras.callbacks import EarlyStopping, LearningRateScheduler
from tensorflow.keras.regularizers import l2
from tensorflow.keras.optimizers import Adam, RMSprop, SGD, Adagrad, Adadelta
from tensorflow.keras.losses import MeanSquaredError, MeanAbsoluteError, MeanAbsolutePercentageError, Huber
from tensorflow.keras.backend import sqrt, mean, square
from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score
import matplotlib.pyplot as plt 

2025-02-20 02:08:45.398202: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


In [2]:
#@tile Read and Prepare Data

def read_prepare_data(symbol):
    #read
    data = pd.read_csv('/Users/pedroalexleite/Desktop/Tese/Dados/dataset4.csv')
    train =  pd.read_csv('/Users/pedroalexleite/Desktop/Tese/Dados/train.csv')
    test =  pd.read_csv('/Users/pedroalexleite/Desktop/Tese/Dados/test.csv')
    
    #we're going to use only one symbol
    data = data[data['Symbol'] == symbol].copy()
    train = train[train['Symbol'] == symbol].copy()
    test = test[test['Symbol'] == symbol].copy()
    
    #we're going to use only the price variable
    data = data[['Date', 'Simple Moving Average', 'Moving Average Convergence Divergence', 'Average Directional Movement Index', 
                 'Middle Band', 'Average True Range', 'Relative Strength Index', 'Stochastic Oscillator K', 'Commodity Channel Index',
                 'Rate of Change', 'On Balance Volume', 'Chaikin AD Line', 'Chaikin AD Oscillator', 'Parabolic SAR', 'Linear Regression',
                 'Aroon Oscillator', 'Money Flow Index', 'Close']].copy()
    train = train[['Date', 'Simple Moving Average', 'Moving Average Convergence Divergence', 'Average Directional Movement Index', 
                 'Middle Band', 'Average True Range', 'Relative Strength Index', 'Stochastic Oscillator K', 'Commodity Channel Index',
                 'Rate of Change', 'On Balance Volume', 'Chaikin AD Line', 'Chaikin AD Oscillator', 'Parabolic SAR', 'Linear Regression',
                 'Aroon Oscillator', 'Money Flow Index', 'Close']].copy()
    test = test[['Date', 'Simple Moving Average', 'Moving Average Convergence Divergence', 'Average Directional Movement Index', 
                 'Middle Band', 'Average True Range', 'Relative Strength Index', 'Stochastic Oscillator K', 'Commodity Channel Index',
                 'Rate of Change', 'On Balance Volume', 'Chaikin AD Line', 'Chaikin AD Oscillator', 'Parabolic SAR', 'Linear Regression',
                 'Aroon Oscillator', 'Money Flow Index', 'Close']].copy()
    
    #set date as index
    data.set_index('Date', inplace=True)
    train.set_index('Date', inplace=True)
    test.set_index('Date', inplace=True)

    #normalize
    scaler = MinMaxScaler(feature_range=(-1, 1))
    train = pd.DataFrame(scaler.fit_transform(train), columns=train.columns, index=train.index)
    test = pd.DataFrame(scaler.transform(test), columns=test.columns, index=test.index)
    data = pd.DataFrame(scaler.transform(data), columns=data.columns, index=data.index) 

    return scaler, data, train, test

scaler, data, train, test = read_prepare_data('AAPL')

#verify
#print(data.head())
#print(data.index)   
#print(data.columns)

In [3]:
#@title Create Dataset

def create_dataset(dataframe, look_back):
    dataset = dataframe.values
    dataX, dataY = [], []
    for i in range(len(dataset)-look_back-1):
        a = dataset[i:(i+look_back)]
        dataX.append(a)
        dataY.append(dataset[i + look_back, -1]) 
        
    return np.array(dataX), np.array(dataY)

In [4]:
#@title Reshape

def reshape(train, test, look_back):
    trainX, trainY = create_dataset(train, look_back)
    testX, testY = create_dataset(test, look_back)
    trainX = np.reshape(trainX, (trainX.shape[0], trainX.shape[1], trainX.shape[2]))
    testX = np.reshape(testX, (testX.shape[0], testX.shape[1], testX.shape[2]))

    return trainX, trainY, testX, testY

In [5]:
#@title Forecast

def forecast_values(testY, look_back, horizon, model, last_sequence):
    testY_copy = testY.copy()
    last_sequence = last_sequence.copy()
    
    for val in range(0, horizon+1):
        a = last_sequence[-look_back:]
        a = np.reshape(a, (1, look_back, last_sequence.shape[-1]))
        a_predict = model.predict(a, verbose=0)[0]
        new_row = last_sequence[-1:].copy()
        new_row[0, -1] = a_predict  
        last_sequence = np.vstack([last_sequence, new_row])
        testY_copy = np.append(testY_copy, a_predict)
    
    forecast = testY_copy[len(testY)+1:]
    return forecast

In [6]:
#@title Auxiliary Function

def predict_forecast_plot(data, train, test, trainX, trainY, testX, testY, nepochs, look_back, horizon, plot_predictions, model):
    #make predictions
    trainPredict = model.predict(trainX)
    testPredict = model.predict(testX)
    
    #forecast (get the last sequence from testX for forecasting)
    last_sequence = testX[-1]
    forecast = forecast_values(testY, look_back, horizon, model, last_sequence)

    #invert predictions - need to handle multivariate data
    dummy = np.zeros((len(trainPredict), train.shape[1]))
    dummy[:, -1] = trainPredict.flatten() 
    trainPredict = scaler.inverse_transform(dummy)[:, -1]
    
    dummy = np.zeros((len(trainY), train.shape[1]))
    dummy[:, -1] = trainY.flatten()
    trainY = scaler.inverse_transform(dummy)[:, -1]
    
    dummy = np.zeros((len(testPredict), train.shape[1]))
    dummy[:, -1] = testPredict.flatten()
    testPredict = scaler.inverse_transform(dummy)[:, -1]
    
    dummy = np.zeros((len(testY), train.shape[1]))
    dummy[:, -1] = testY.flatten()
    testY = scaler.inverse_transform(dummy)[:, -1]
    
    dummy = np.zeros((len(forecast), train.shape[1]))
    dummy[:, -1] = forecast.flatten()
    forecast = scaler.inverse_transform(dummy)[:, -1]

    #calculate root mean squared error
    trainScore = np.sqrt(mean_squared_error(trainY, trainPredict))
    print('Train Score: %.2f RMSE' % (trainScore))
    testScore = np.sqrt(mean_squared_error(testY, testPredict))
    print('Test Score: %.2f RMSE' % (testScore))

    #plot predictions
    if plot_predictions==True: 
        # Get the original Close prices
        original_data = scaler.inverse_transform(data)[:, -1]
        
        #shift train predictions for plotting
        trainPredictPlot = np.empty_like(original_data)
        trainPredictPlot[:] = np.nan
        trainPredictPlot[look_back:len(trainPredict)+look_back] = trainPredict
        
        #shift test predictions for plotting
        testPredictPlot = np.empty_like(original_data)
        testPredictPlot[:] = np.nan
        testPredictPlot[len(trainPredict)+(look_back*2)+1:len(original_data)-1] = testPredict
        
        #shift forecast for plotting
        forecastPlot = np.empty((len(original_data) + len(forecast),))
        forecastPlot[:] = np.nan
        forecastPlot[len(original_data):] = forecast
        
        #plot baseline, predictions and forecast
        plt.figure(figsize=(15,7))
        plt.plot(original_data, label='actual')
        plt.plot(trainPredictPlot, label='train set')
        plt.plot(testPredictPlot, label='test set')
        plt.plot(forecastPlot, label='forecast')
        plt.legend()
        plt.show()

    return testScore

In [7]:
#@title Models

def list_models(look_back, trainX):
    layers = [1, 2]
    neurons = [8, 16, 32, 64, 128, 256, 512]
    dropouts = [0.1, 0.2]
    models = []
    configurations = []
    
    for num_layers in layers:
        for num_neurons in neurons:
            for dropout_rate in dropouts:
                model = Sequential()

                model.add(LSTM(num_neurons, input_shape=(trainX.shape[1], trainX.shape[2]), return_sequences=(num_layers > 1)))
                model.add(Dropout(dropout_rate))
                
                for layer_idx in range(1, num_layers):
                    model.add(LSTM(num_neurons, return_sequences=(layer_idx < num_layers - 1)))
                    model.add(Dropout(dropout_rate))
                
                model.add(Dense(1))
                
                model.compile(loss='mean_squared_error', optimizer='adam')
                
                models.append(model)
                configurations.append({
                    "layers": num_layers,
                    "neurons": num_neurons,
                    "dropout": dropout_rate
                })
    
    return models, configurations

look_back = 60
trainX, trainY, testX, testY = reshape(train, test, look_back)
models, configurations = list_models(look_back, trainX)

print("Configurations:")
for idx, config in enumerate(configurations, start=1):
    print(f"Model {idx}: Layers={config['layers']}, Neurons={config['neurons']}, Dropout={config['dropout']}")

  super().__init__(**kwargs)


Configurations:
Model 1: Layers=1, Neurons=512, Dropout=0.1
Model 2: Layers=1, Neurons=1024, Dropout=0.1
Model 3: Layers=1, Neurons=2048, Dropout=0.1
Model 4: Layers=2, Neurons=512, Dropout=0.1
Model 5: Layers=2, Neurons=1024, Dropout=0.1
Model 6: Layers=2, Neurons=2048, Dropout=0.1


In [None]:
#@title Train and Predict (Find the Optimal Model)

def optimal_model(models, configurations, data, train, test, look_back=1, nepochs=10, horizon=10, plot_predictions=False):
    results = []

    for idx, (model, config) in enumerate(zip(models, configurations), start=1):
        print(f"Training Model {idx}: Layers={config['layers']}, Neurons={config['neurons']}, Dropout={config['dropout']}")
        
        #reshape
        trainX, trainY, testX, testY = reshape(train, test, look_back)

        #fit
        model.fit(trainX, trainY, epochs=nepochs, batch_size=1, verbose=1)

        #predict, foecast and plot
        testScore =  predict_forecast_plot(data, train, test, trainX, trainY, testX, testY, nepochs, look_back, horizon, plot_predictions, model)

        #append results
        results.append({
            "model_index": idx,
            "configuration": config,
            "test_score": testScore
        })

    return results

def calculate_average_results(models, configurations, data, train, test, look_back=1, nepochs=10, horizon=10, runs=10):
    all_results = []

    for run in range(runs):
        print(f"Run {run + 1}/{runs}")
        results = optimal_model(models, configurations, data, train, test, look_back, nepochs, horizon)
        all_results.extend(results)

    #aggregate results by model
    average_results = {}
    for result in all_results:
        model_idx = result["model_index"]
        if model_idx not in average_results:
            average_results[model_idx] = {
                "configuration": result["configuration"],
                "test_scores": []
            }
        average_results[model_idx]["test_scores"].append(result["test_score"])

    #calculate average train and test scores
    for model_idx, scores in average_results.items():
        test_avg = np.mean(scores["test_scores"])
        average_results[model_idx]["test_score_avg"] = test_avg

    return average_results

models, configurations= list_models(60, trainX)
average_results = calculate_average_results(models, configurations, data, train, test, look_back=60, nepochs=50, horizon=10, runs=5)

for model_idx, scores in average_results.items():
    print(f"Model {model_idx}:")
    print(f"  Configuration: {scores['configuration']}")
    print(f"  Average Test Score: {scores['test_score_avg']:.2f}") 

Run 1/1
Training Model 1: Layers=1, Neurons=512, Dropout=0.1
Epoch 1/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m93s[0m 113ms/step - loss: 0.0252
Epoch 2/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m92s[0m 112ms/step - loss: 0.0087
Epoch 3/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m93s[0m 114ms/step - loss: 0.0080
Epoch 4/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m91s[0m 111ms/step - loss: 0.0080
Epoch 5/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m92s[0m 113ms/step - loss: 0.0066
Epoch 6/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m92s[0m 113ms/step - loss: 0.0072
Epoch 7/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m85s[0m 105ms/step - loss: 0.0056
Epoch 8/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m83s[0m 102ms/step - loss: 0.0057
Epoch 9/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m86s[0m 106ms/step - loss: 0.0053
Epo

  new_row[0, -1] = a_predict


Train Score: 2.37 RMSE
Test Score: 14.13 RMSE
Training Model 2: Layers=1, Neurons=1024, Dropout=0.1
Epoch 1/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m449s[0m 550ms/step - loss: 0.0409
Epoch 2/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m447s[0m 549ms/step - loss: 0.0101
Epoch 3/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m451s[0m 553ms/step - loss: 0.0093
Epoch 4/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m451s[0m 553ms/step - loss: 0.0103
Epoch 5/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m449s[0m 551ms/step - loss: 0.0068
Epoch 6/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m453s[0m 555ms/step - loss: 0.4570
Epoch 7/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m452s[0m 555ms/step - loss: 0.2028
Epoch 8/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m453s[0m 555ms/step - loss: 0.1929
Epoch 9/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37

  new_row[0, -1] = a_predict


Train Score: 3.48 RMSE
Test Score: 33.64 RMSE
Training Model 3: Layers=1, Neurons=2048, Dropout=0.1
Epoch 1/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1876s[0m 2s/step - loss: 0.0662
Epoch 2/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1882s[0m 2s/step - loss: 0.1035
Epoch 3/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1883s[0m 2s/step - loss: 0.7963
Epoch 4/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1882s[0m 2s/step - loss: 0.3291
Epoch 5/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1882s[0m 2s/step - loss: 0.4477
Epoch 6/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1884s[0m 2s/step - loss: 0.3272
Epoch 7/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1881s[0m 2s/step - loss: 0.3969
Epoch 8/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1901s[0m 2s/step - loss: 0.2824
Epoch 9/50
[1m815/815[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1876s

In [None]:
#@title Train and Predict

def model(data, train, test, look_back=1, nepochs=10, horizon=10, plot_predictions=False):
    #reshape
    trainX, trainY, testX, testY = reshape(train, test, look_back)

    #create the network
    model = Sequential()
    model.add(LSTM(16, input_shape=(trainX.shape[1], trainX.shape[2])))
    model.add(Dropout(0.1))
    model.add(Dense(1))
    model.compile(loss='mean_squared_error', optimizer='adam')
    #model.summary()

    #fit
    model.fit(trainX, trainY, epochs=nepochs, batch_size=1, verbose=1)

    #predict, forecast and plot
    testScore = predict_forecast_plot(data, train, test, trainX, trainY, testX, testY, nepochs, look_back, horizon, plot_predictions, model)
    
    return testScore

#model(data, train, test, look_back=60, nepochs=50, horizon=10, plot_predictions=True)

In [None]:
#@title Run the Model Several Times

n_runs = 50
rmse_results = []
for i in range(n_runs):
    print(f"Running iteration {i+1}/{n_runs}...")
    test_rmse = model(data, train, test, look_back=60, nepochs=50, horizon=10, plot_predictions=False)  
    rmse_results.append(test_rmse)

rmse_results = np.array(rmse_results)
print("All RMSE results:", rmse_results)
print(f"Mean RMSE: {np.mean(rmse_results):.2f}")
print(f"Standard Deviation: {np.std(rmse_results):.2f}")

In [None]:
#@title Train and Predict (Model Early Stop)

def model_early_stop(data, train, test, look_back=1, nepochs=10, horizon=10, plot_predictions=False):
    #reshape
    trainX, trainY, testX, testY = reshape(train, test, look_back)

    #create the LSTM network
    model = Sequential()
    model.add(LSTM(16, input_shape=(trainX.shape[1], trainX.shape[2])))
    model.add(Dropout(0.1))
    model.add(Dense(1))
    model.compile(loss='mean_squared_error', optimizer='adam')
    #model.summary()

    #early stopping
    early_stop = EarlyStopping(monitor='val_loss', patience=10, restore_best_weights=True)
    
    #fit
    model.fit(trainX, trainY, epochs=nepochs, batch_size=1, verbose=1, validation_data=(testX, testY), callbacks=[early_stop])

    #predict, forecast and plot
    testScore =  predict_forecast_plot(data, train, test, trainX, trainY, testX, testY, nepochs, look_back, horizon, plot_predictions, model)
    
    return testScore