# <font color='blue'>Data Science Challenge @ ITA 2022</font>
# <font color='blue'>Equipe DIOMGIS</font>

## <font color='blue'>1ª Fase</font>

### <font color='blue'>Predição de pregões futuros de ativos que compõem o índice SP500.</font>

![title](data/image/logo.jpeg)

In [None]:
# Report the version of the Python interpreter running this notebook
from platform import python_version
print('Versão da Linguagem Python Usada Neste Jupyter Notebook:', python_version())

In [None]:
# Instala o pacote watermark. 
# Esse pacote é usado para gravar as versões de outros pacotes usados neste jupyter notebook.
!pip install -q -U watermark

In [None]:
# Bibliotecas e Frameworks

import numpy as np
import pandas as pd
import pandas_datareader.data as web
import tensorflow as tf
from tensorflow import keras
from keras.layers import LSTM, Dense, Dropout
from keras.models import Sequential
from keras.optimizers import *
from keras.callbacks import TensorBoard, EarlyStopping, ReduceLROnPlateau, TerminateOnNaN
from keras.wrappers.scikit_learn import KerasRegressor
from keras.losses import MeanSquaredError
from tensorboard import notebook
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
from sklearn.pipeline import Pipeline
from sklearn.model_selection import GridSearchCV
from sklearn.metrics import mean_squared_error, make_scorer
import matplotlib.pyplot as plt
import seaborn as sns
import warnings
from time import time
from datetime import datetime
import os

In [None]:
# Versions of the packages used in this notebook

%reload_ext watermark
%watermark -a "Equipe DIOMGIS" --iversions

In [None]:
# Notebook-wide plotting, logging and warning configuration.
sns.set_style('whitegrid')
# NOTE(review): TensorFlow has already been imported by the time this runs; the
# variable may need to be set before that import to take effect — confirm.
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
%matplotlib inline
# Hide FutureWarning / DeprecationWarning messages for the rest of the notebook.
warnings.filterwarnings("ignore", category=FutureWarning)
warnings.filterwarnings("ignore", category=DeprecationWarning)
# Default matplotlib figure size as (width, height).
plt.rcParams['figure.figsize'] = (15, 10)

In [None]:
# Confirm that TensorFlow can reach a GPU; abort the notebook otherwise.

device_name = tf.test.gpu_device_name()
if device_name:
    print('Found GPU at: {}'.format(device_name))
else:
    raise SystemError('GPU device not found')

In [None]:
# Estado da GPU

!nvidia-smi

In [None]:
# Fixed training parameters

verbose = 2           # verbosity passed to Keras, the callbacks and scikit-learn
seed = 25             # seed for the random number generators
steps = 30            # number of past closes fed to the network per sample
epochs = 2000         # maximum number of training epochs
batch_size = 32       # mini-batch size used when fitting
nKFold = 5            # number of cross-validation folds in the grid search
logRetPeriod = 20     # lag, in rows, used when computing the log-return
graphic = False       # when True, a price chart is saved for every asset
downloadData = False  # when True, prices are downloaded instead of read from disk

# Seed both NumPy and TensorFlow: seeding NumPy alone leaves weight
# initialisation and dropout unseeded, so runs would not be repeatable.
np.random.seed(seed)
tf.random.set_seed(seed)

In [None]:
# Days to forecast: every weekday from 2022-10-24 to 2022-11-18 (20 sessions),
# kept as 'YYYY-MM-DD' strings.
forecast = pd.bdate_range(start='2022-10-24', end='2022-11-18').strftime('%Y-%m-%d').tolist()

In [None]:
# Ticker symbols grouped by sector. The keys are sector names; the values are
# the tickers of that sector. The lists are flattened into `ativos` further down.
setores = {
    'Industrials': ['MMM', 'AOS', 'ALK', 'ALLE', 'AAL', 'AME', 'BA',
                    'CHRW', 'CARR', 'CAT', 'CTAS', 'CPRT', 'CSGP',
                    'CSX', 'CMI', 'DE', 'DAL', 'DOV', 'ETN', 'EMR',
                    'EFX', 'EXPD', 'FAST', 'FDX', 'FTV', 'FBHS',
                    'GNRC', 'GD', 'GE', 'HON', 'HWM', 'HII', 'IEX',
                    'ITW', 'IR', 'JBHT', 'J', 'JCI', 'LHX', 'LDOS',
                    'LMT', 'MAS', 'NDSN', 'NSC', 'NOC', 'ODFL',
                    'OTIS', 'PCAR', 'PH', 'PNR', 'PWR', 'RTX', 'RSG',
                    'RHI', 'ROK', 'ROL', 'SNA', 'LUV', 'SWK', 'TXT',
                    'TT', 'TDG', 'UNP', 'UAL', 'UPS', 'URI', 'VRSK',
                    'WAB', 'WM', 'GWW', 'XYL'],
    
    'HealthCare': ['ABT', 'ABBV', 'ABMD', 'A', 'ALGN', 'ABC', 'AMGN',
                   'BAX', 'BDX', 'BIO', 'TECH', 'BIIB', 'BSX', 'BMY',
                   'CAH', 'CTLT', 'CNC', 'CRL', 'CI', 'COO', 'CVS',
                   'DHR', 'DVA', 'XRAY', 'DXCM', 'EW', 'ELV', 'LLY',
                   'GILD', 'HCA', 'HSIC', 'HOLX', 'HUM', 'IDXX',
                   'ILMN', 'INCY', 'ISRG', 'IQV', 'JNJ', 'LH', 'MCK',
                   'MDT', 'MRK', 'MTD', 'MRNA', 'MOH', 'OGN', 'PKI',
                   'PFE', 'DGX', 'REGN', 'RMD', 'STE', 'SYK', 'TFX',
                   'TMO', 'UNH', 'UHS', 'VRTX', 'VTRS', 'WAT',
                   'WST', 'ZBH', 'ZTS'],
    
    'InformationTechnology': ['ACN', 'ADBE', 'ADP', 'AKAM', 'AMD', 'APH',
                              'ADI', 'ANSS', 'AAPL', 'AMAT', 'ANET', 'ADSK',
                              'AVGO', 'BR', 'CDNS', 'CDW', 'CDAY', 'CSCO',
                              'CTSH', 'GLW', 'DXC', 'ENPH', 'EPAM', 'FFIV',
                              'FIS', 'FISV', 'FLT', 'FTNT', 'IT', 'GPN',
                              'HPE', 'HPQ', 'IBM', 'INTC', 'INTU', 'JKHY',
                              'JNPR', 'KEYS', 'KLAC', 'LRCX', 'MA', 'MCHP',
                              'MU', 'MSFT', 'MPWR', 'MSI', 'NTAP', 'NLOK',
                              'NVDA', 'NXPI', 'ON', 'ORCL', 'PAYX', 'PAYC',
                              'PYPL', 'PTC', 'QRVO', 'QCOM', 'ROP', 'CRM',
                              'STX', 'NOW', 'SWKS', 'SEDG', 'SNPS', 'TEL',
                              'TDY', 'TER', 'TXN', 'TRMB', 'TYL', 'VRSN',
                              'V', 'WDC', 'ZBRA'],
    
    'CommunicationServices': ['ATVI', 'GOOGL', 'GOOG', 'T', 'CHTR', 'CMCSA',
                              'DISH', 'DIS', 'EA', 'FOXA', 'FOX', 'IPG', 'LYV',
                              'LUMN', 'MTCH', 'META', 'NFLX', 'NWSA', 'NWS',
                              'OMC', 'PARA', 'TMUS', 'TTWO', 'TWTR', 'VZ', 'WBD'],
    
    'ConsumerStaples': ['ADM', 'MO', 'BF.B', 'CPB', 'CHD', 'CLX', 'KO', 'CL',
                        'CAG', 'STZ', 'COST', 'EL', 'GIS', 'HSY', 'HRL', 'K',
                        'KDP', 'KMB', 'KHC', 'KR', 'LW', 'MKC', 'TAP', 'MDLZ',
                        'MNST', 'PEP', 'PM', 'PG', 'SJM', 'SYY', 'TSN', 'WBA',
                        'WMT'],
    
    'ConsumerDiscretionary': ['AAP', 'AMZN', 'APTV', 'AZO', 'BBWI',
                              'BBY', 'BKNG', 'BWA', 'CZR', 'KMX', 'CCL',
                              'CMG', 'DHI', 'DRI', 'DG', 'DLTR',
                              'DPZ', 'EBAY', 'ETSY', 'EXPE', 'F',
                              'GRMN', 'GM', 'GPC', 'HAS', 'HLT', 'HD',
                              'LVS', 'LEN', 'LKQ', 'LOW', 'MAR', 'MCD',
                              'MGM', 'MHK', 'NWL', 'NKE', 'NCLH', 'NVR',
                              'ORLY', 'POOL', 'PHM', 'RL', 'ROST', 'RCL',
                              'SBUX', 'TPR', 'TGT', 'TSLA', 'TJX',
                              'TSCO', 'ULTA', 'VFC', 'WHR', 'WYNN', 'YUM'],
    
    'Utilities': ['AES', 'LNT', 'AEE', 'AEP', 'AWK', 'ATO', 'CNP',
                  'CMS', 'ED', 'CEG', 'D', 'DTE', 'DUK', 'EIX',
                  'ETR', 'EVRG', 'ES', 'EXC', 'FE', 'NEE', 'NI',
                  'NRG', 'PCG', 'PNW', 'PPL', 'PEG', 'SRE', 'SO',
                  'WEC', 'XEL'],
    
    'Financials': ['AFL', 'ALL', 'AXP', 'AIG', 'AMP', 'AON', 'AJG',
                   'AIZ', 'BAC', 'WRB', 'BRK.B', 'BLK', 'BK', 'BRO',
                   'COF', 'CBOE', 'SCHW', 'CB', 'CINF', 'C', 'CFG',
                   'CME', 'CMA', 'DFS', 'RE', 'FDS', 'FITB', 'FRC',
                   'BEN', 'GL', 'GS', 'HIG', 'HBAN', 'ICE', 'IVZ',
                   'JPM', 'KEY', 'LNC', 'L', 'MTB', 'MKTX', 'MMC',
                   'MET', 'MCO', 'MS', 'MSCI', 'NDAQ', 'NTRS', 'PNC',
                   'PFG', 'PGR', 'PRU', 'RJF', 'RF', 'SPGI', 'SBNY',
                   'STT', 'SIVB', 'SYF', 'TROW', 'TRV', 'TFC',
                   'USB', 'WFC', 'WTW', 'ZION',  'NLSN'],
    
    'Materials': ['APD', 'ALB', 'AMCR', 'AVY', 'BALL', 'CE', 'CF',
                  'CTVA', 'DOW', 'DD', 'EMN', 'ECL', 'FMC', 'FCX',
                  'IP', 'IFF', 'LIN', 'LYB', 'MLM', 'MOS', 'NEM',
                  'NUE', 'PKG', 'PPG', 'SEE', 'SHW', 'VMC', 'WRK'],
    
    'RealEstate': ['ARE', 'AMT', 'AVB', 'BXP', 'CPT', 'CBRE', 'CCI',
                   'DLR', 'EQIX', 'EQR', 'ESS', 'EXR', 'FRT', 'PEAK',
                   'HST', 'INVH', 'IRM', 'KIM', 'MAA', 'PLD', 'PSA',
                   'O', 'REG', 'SBAC', 'SPG', 'UDR', 'VTR', 'VICI',
                   'VNO', 'WELL', 'WY'],
    
    'Energy': ['APA','BKR', 'CVX', 'COP', 'CTRA', 'DVN', 'FANG', 'EOG',
               'EQT', 'XOM', 'HAL', 'HES', 'KMI', 'MRO', 'MPC', 'OXY',
               'OKE', 'PSX', 'PXD', 'SLB', 'VLO', 'WMB']
}

In [None]:
# Flatten the per-sector ticker lists into a single alphabetically sorted list.
ativos = sorted(ticker for empresas in setores.values() for ticker in empresas)

### Download dos Dados

In [None]:
# Either download the daily closing prices from Yahoo Finance and save them to
# disk, or load previously saved CSV files, depending on `downloadData`.
if downloadData:

    start_date = "2017-10-21"
    end_date = "2022-10-21"

    # Closing values of the S&P 500 index itself.
    data = web.DataReader(name = '^GSPC', data_source = 'yahoo', start = start_date, end = end_date)
    SP500_index = pd.DataFrame(data['Close']).reset_index().rename(columns={'Close': 'SP500', 'Date': 'Dia'})

    # These tickers are requested with a dash in place of the dot used in `ativos`.
    download_symbols = {'BF.B': 'BF-B', 'BRK.B': 'BRK-B'}

    # Collect one 'Close' series per asset and join them in a single concat,
    # instead of re-copying the growing frame on every iteration.
    closes = []
    for ativo in ativos:
        data = web.DataReader(name = download_symbols.get(ativo, ativo),
                              data_source = 'yahoo', start = start_date, end = end_date)
        closes.append(data['Close'])

    SP500_close = pd.concat(closes, axis = 1)
    # Columns keep the original (dotted) ticker names, in the order of `ativos`.
    SP500_close.columns = ativos
    SP500_close = SP500_close.reset_index().rename(columns={'Date': 'Dia'})

    outdir = './data/{}-{}'.format(start_date, end_date)

    # makedirs also creates './data' when it is missing and does not fail when
    # the folder already exists.
    os.makedirs(outdir, exist_ok = True)

    SP500_close.to_csv(path_or_buf = os.path.join(outdir, 'SP500_close'), index = False)
    SP500_index.to_csv(path_or_buf = os.path.join(outdir, 'SP500_index'), index = False)

else:

    # NOTE(review): the download branch writes into a dated sub-folder of
    # './data', while this branch reads from 'data/' directly — confirm the
    # files are expected to be copied there by hand.
    SP500_close = pd.read_csv('data/SP500_close')
    SP500_index = pd.read_csv('data/SP500_index')

## Pré-Processamento dos Dados

In [None]:
def generatorTimeframeTable(table, ativo, n_steps = None):
    """Build the sliding-window table of one price column.

    Row ``r`` of the result holds ``n_steps + 1`` consecutive values of
    ``table[ativo]``, starting at position ``r``. The columns are named
    ``'Close-<n_steps>'`` ... ``'Close-0'``, so ``'Close-0'`` is the newest
    value of each window.

    Parameters
    ----------
    table : pandas.DataFrame
        Frame whose first column holds the day of each row and which contains
        the column `ativo`.
    ativo : str
        Name of the column to window.
    n_steps : int, optional
        Number of past values per window. Defaults to the notebook-level
        `steps`.

    Returns
    -------
    pandas.DataFrame
        ``len(table) - n_steps`` rows of float64 values, indexed by the day of
        the newest value of each window (index name ``'Dia'``).

    Raises
    ------
    ValueError
        If the column has fewer than `n_steps` values.
    """
    if n_steps is None:
        n_steps = steps

    closes = table[ativo].to_numpy(dtype = 'float64')
    n_rows = len(closes) - n_steps
    if n_rows < 0:
        raise ValueError('column {!r} has {} rows, fewer than the {} steps required'
                         .format(ativo, len(closes), n_steps))

    nameColumns = ['Close-{}'.format(i) for i in range(n_steps, -1, -1)]

    # positions[r, c] == r + c, so indexing with it yields every window in a
    # single vectorized operation (no per-cell .iloc assignment).
    positions = np.arange(n_rows)[:, None] + np.arange(n_steps + 1)[None, :]
    windows = closes[positions]

    # Each window is labelled with the day of its newest value.
    timeIndex = pd.Index(table.iloc[n_steps:, 0].to_numpy(), name = "Dia")

    return pd.DataFrame(windows, columns = nameColumns, index = timeIndex)

In [None]:
def createTrainScaler(df):
    """Fit a StandardScaler that scales every column by the last column's statistics.

    The last column of `df` is replicated once per column of `df`, so the
    fitted scaler holds the same mean and standard deviation for every feature.

    The replicated frame reuses the column labels of `df`. Fitting on columns
    that all carry the last column's label would make the scaler remember
    feature names that differ from the ones it is later asked to transform.

    Parameters
    ----------
    df : pandas.DataFrame
        Window table; its last column provides the scaling statistics.

    Returns
    -------
    sklearn.preprocessing.StandardScaler
        Scaler fitted on the replicated last column, with one feature per
        column of `df`.
    """
    last_column = df.iloc[:, [-1]].to_numpy()

    # One vectorized replication instead of concatenating in a loop.
    trainScaler = pd.DataFrame(np.repeat(last_column, df.shape[1], axis = 1),
                               columns = df.columns,
                               index = df.index)

    scaler = StandardScaler()
    scaler.fit(trainScaler)

    return scaler

In [None]:
def Preprocessingdata(steps, df, ativos):
    """Turn price columns into standardized training and validation arrays.

    For each asset, the sliding-window table is built, rows containing NaN are
    dropped, and the table is standardized with a scaler fitted on that asset.
    The per-asset arrays are stacked, the last column becomes the target, and
    the rows are split 80/20 without shuffling.

    Parameters
    ----------
    steps : int
        Number of time steps per sample, used to reshape the inputs.
        NOTE(review): the windows are built by generatorTimeframeTable, which
        is called without a window length here, so this value must agree with
        the notebook-level `steps` — confirm.
    df : pandas.DataFrame
        Price table passed on to generatorTimeframeTable.
    ativos : iterable of str
        Columns of `df` to include.

    Returns
    -------
    list
        ``[X_treino, X_teste, y_treino, y_teste]``; the X arrays have shape
        ``(n_samples, steps, 1)``.

    Raises
    ------
    ValueError
        If `ativos` is empty.
    """
    aux = []

    for ativo in ativos:
        trainDataAtivo = generatorTimeframeTable(df, ativo).dropna(axis = 0)

        # Z-score: each asset is standardized with its own scaler.
        scaler = createTrainScaler(trainDataAtivo)
        aux.append(scaler.transform(trainDataAtivo))

    if not aux:
        raise ValueError('ativos must contain at least one asset')

    trainData = np.concatenate(aux, axis = 0)

    # Every column but the last is an input; the last one is the target.
    X = trainData[:, :-1]
    y = trainData[:, -1]

    # Split between training and validation, keeping the row order.
    X_treino, X_teste, y_treino, y_teste = train_test_split(X, y, test_size = 0.2, shuffle = False)

    X_treino = X_treino.reshape((-1, steps, 1))
    X_teste = X_teste.reshape((-1, steps, 1))

    return [X_treino, X_teste, y_treino, y_teste]

In [None]:
# Training and validation arrays built from the S&P 500 index series only.
X_treino, X_teste, y_treino, y_teste = Preprocessingdata(steps = steps,
                                                         df = SP500_index,
                                                         ativos = ['SP500'])

## Construção, Treinamento e Avaliação do Modelo Piloto

In [None]:
# Callbacks used during training

# TensorBoard logs go to a folder named after the current day, month and time.
tensorboard = TensorBoard(
    log_dir="logs/{}".format(datetime.now().strftime('%d-%B-%Ih%Mmin')))

# Early stopping watches the validation loss and restores the best weights.
earlystop = EarlyStopping(
    monitor='val_loss',
    patience=20,
    min_delta=0,
    restore_best_weights=True,
    verbose = verbose)

# Learning-rate reduction watches the training loss.
reduce_lr = ReduceLROnPlateau(
    monitor='loss',
    mode="min",
    factor=0.2,
    patience=3,
    min_delta=0.0001,
    min_lr=0,
    verbose = verbose)

callbacks = [tensorboard, earlystop, reduce_lr, TerminateOnNaN()]

In [None]:
def create_model(optimizer, layers, n_lstm, dropoutFoward):
    """Build and compile the stacked LSTM regressor.

    The network is: one input LSTM, then `layers` repetitions of
    (Dropout, LSTM), then a final LSTM that returns only its last output,
    then a single linear Dense unit. It is compiled with mean squared error.

    Parameters
    ----------
    optimizer : Keras optimizer passed to ``model.compile``.
    layers : int
        Number of (Dropout, LSTM) pairs between the first and last LSTM.
    n_lstm : int
        Number of units of every LSTM layer.
    dropoutFoward : float
        Rate of each Dropout layer.

    Returns
    -------
    The compiled ``Sequential`` model, taking inputs of shape ``(steps, 1)``.
    """

    def lstm_layer(return_sequences, **extra):
        # All LSTM layers share the same units and activations.
        return LSTM(n_lstm,
                    activation = 'tanh',
                    recurrent_activation = 'sigmoid',
                    return_sequences = return_sequences,
                    **extra)

    model = Sequential()

    # Input layer
    model.add(lstm_layer(True, input_shape = (steps, 1)))

    # Optional middle layers
    for _ in range(layers):
        model.add(Dropout(dropoutFoward))
        model.add(lstm_layer(True))

    # Last recurrent layer collapses the sequence, then the linear output unit.
    model.add(lstm_layer(False))
    model.add(Dense(1, activation = 'linear'))

    model.compile(loss = MeanSquaredError(), optimizer = optimizer)

    return model

In [None]:
# Model: scikit-learn compatible wrapper around `create_model`

model = KerasRegressor(
    build_fn = create_model,
    callbacks = callbacks,
    verbose = verbose,
)

In [None]:
# Pipeline with the Keras regressor as its single step, named "model"

estimator = Pipeline(steps = [("model", model)], verbose = verbose)

In [None]:
# Parameter definitions for the grid search

# Optimizers: every candidate shares the same learning rate.
learning_rate = 0.01

opt_SGD = SGD(learning_rate = learning_rate, momentum = 0.0, nesterov = False)

opt_RMSprop = RMSprop(learning_rate = learning_rate, rho = 0.9, momentum = 0.0,
                      epsilon = 1e-07, centered = False)

opt_Adam = Adam(learning_rate = learning_rate, beta_1 = 0.9, beta_2 = 0.999,
                epsilon = 1e-07, amsgrad = False)

opt_Adadelta = Adadelta(learning_rate = learning_rate, rho = 0.95, epsilon = 1e-07)

opt_Adagrad = Adagrad(learning_rate = learning_rate, initial_accumulator_value = 0.1,
                      epsilon = 1e-07)

opt_Adamax = Adamax(learning_rate = learning_rate, beta_1 = 0.9, beta_2 = 0.999,
                    epsilon = 1e-07)

opt_Nadam = Nadam(learning_rate = learning_rate, beta_1 = 0.9, beta_2 = 0.999,
                  epsilon = 1e-07)

opt_Ftrl = Ftrl(learning_rate = learning_rate,
                learning_rate_power = -0.5,
                initial_accumulator_value = 0.1,
                l1_regularization_strength = 0.0,
                l2_regularization_strength = 0.0,
                l2_shrinkage_regularization_strength = 0.0,
                beta = 0.0)

# Keys carry the "model__" prefix so the pipeline routes them to its "model" step.
params_grid = {
    # Available: [opt_SGD, opt_RMSprop, opt_Adam, opt_Adadelta, opt_Adagrad, opt_Adamax, opt_Nadam, opt_Ftrl]
    'model__optimizer': [opt_Adadelta],
    # Middle LSTM layers; the model always has two more (the first and the last).
    'model__layers': [1],
    'model__n_lstm': [160],
    'model__dropoutFoward': [0],
}

In [None]:
# Grid search with cross-validation
# Parallel options left disabled: n_jobs = -2 (keeps one processor free),
# pre_dispatch = '2*n_jobs'.

grid = GridSearchCV(
    estimator = estimator,
    param_grid = params_grid,
    scoring = 'neg_root_mean_squared_error',
    cv = nKFold,
    refit = True,
    return_train_score = False,
    verbose = verbose,
)

In [None]:
# Monitoramento de Otimização

# tensorboard --logdir logs
# notebook.display(port=6006, height=1000)

In [None]:
# Training

# Fit-time arguments; the "model__" prefix routes them to the pipeline's
# "model" step.
fit_params = dict(
    model__batch_size = batch_size,
    model__epochs = epochs,
    model__verbose = verbose,
    model__validation_data = (X_teste, y_teste),
    model__shuffle = False,
    model__validation_steps = None,
    model__validation_freq = 1,
)

grid_result = grid.fit(X_treino, y_treino, **fit_params)

### Avaliação do Modelo

In [None]:
# GridSearchCV results: one row per parameter combination, indexed and ordered
# by rank. Ranking follows the GridSearchCV metric: neg_root_mean_squared_error.

(
    pd.concat(
        [
            pd.DataFrame(grid.cv_results_)[['rank_test_score', 'mean_test_score', 'mean_fit_time']],
            pd.DataFrame(grid.cv_results_['params']),
        ],
        axis=1,
        join='inner',
    )
    .set_index('rank_test_score')
    .sort_values('rank_test_score')
)

In [None]:
# Best parameter combination and the corresponding fitted estimator.
best_params = grid.best_params_
best_model = grid.best_estimator_

# Scores on the training and validation arrays.
# NOTE(review): the scores are negated before printing, presumably because the
# wrapper reports the negative of the loss — confirm.
scoreTrain = best_model.score(X_treino, y_treino)
scoreTest = best_model.score(X_teste, y_teste)

print(
    '\n\nErro quadrático médio em dados de treinamento: {:.5f}\n\nErro quadrático médio em dados de validação: {:.5f}\n\n'
    .format(-scoreTrain, -scoreTest)
)

In [None]:
def fillTableFrame(ativo, tablePrevision, table = SP500_close):
    """Forecast one asset recursively and return its extended window table.

    The window table of `ativo` is standardized, then one row is appended per
    day in `forecast`: each new row is the previous row shifted by one position
    with the model's prediction as its newest value. The whole table is then
    converted back to prices.

    Parameters
    ----------
    ativo : str
        Column of `table` to forecast.
    tablePrevision : pandas.DataFrame
        Forecast table, modified in place: when `ativo` is in the notebook-level
        `ativos`, its cells for the forecast days receive the predicted closes.
    table : pandas.DataFrame, optional
        Price table with the days in the first column. Defaults to the
        `SP500_close` object bound when this function was defined.

    Returns
    -------
    pandas.DataFrame
        Window table in price units with a datetime index: the historical rows
        followed by one row per forecast day.
    """
    history = generatorTimeframeTable(table, ativo)
    nameColumns = list(history.columns)

    scaler = createTrainScaler(history)
    standardized = scaler.transform(history)

    # Collect the new rows in a list and stack them once, instead of re-copying
    # the whole table with pd.concat for every forecast day.
    blocks = [standardized]
    window = standardized[-1]

    for _ in forecast:

        # Drop the oldest value; the remaining `steps` values feed the model.
        current_info = window[1:]

        standardCurrentInfo = current_info.reshape(1, steps, 1).astype('float32')

        current_forecast = best_model.predict(standardCurrentInfo, verbose=False).reshape(1,)

        window = np.concatenate((current_info, current_forecast), axis = 0)
        blocks.append(window.reshape(1, -1))

    index_data = pd.to_datetime(list(history.index) + list(forecast))

    # Back from z-scores to prices.
    prices = scaler.inverse_transform(np.concatenate(blocks, axis = 0))

    TimeframeTable = pd.DataFrame(prices, columns = nameColumns, index = index_data)

    # Fill the forecast table with the predicted closes of this asset.
    if ativo in ativos:
        for day in forecast:
            tablePrevision.loc[day, ativo] = TimeframeTable.loc[day, 'Close-0']

    return TimeframeTable

In [None]:
# Fills the log-return table and generates the charts

def fillPrediction(tableLogRet, tablePrevision, ativos):
    """Forecast every asset, fill the log-return table and optionally save charts.

    Parameters
    ----------
    tableLogRet : pandas.DataFrame
        Log-return table, modified in place. Its last ``len(forecast)`` rows
        receive, for each asset, ``log(close[t] / close[t - logRetPeriod])``.
        Rows are addressed by integer label, so the frame is expected to carry
        a default 0..n-1 index.
    tablePrevision : pandas.DataFrame
        Forecast table, passed on to fillTableFrame, which fills it in place.
    ativos : iterable of str
        Assets to process.

    Returns
    -------
    None

    Notes
    -----
    When the notebook-level `graphic` flag is on, one chart per asset is saved
    under a single './graphics/score-...' folder. The folder is named once per
    call, so a run that crosses a minute boundary does not scatter its charts
    over several folders.
    """
    lengthTable = len(tableLogRet)
    horizon = len(forecast)

    outdir = None
    if graphic:
        outdir = './graphics/score-{:.4f}-{}'.format(-scoreTest, datetime.now().strftime('%d-%B-%Ih%Mmin'))
        # makedirs also creates './graphics' when it is missing.
        os.makedirs(outdir, exist_ok = True)

    for ativo in ativos:

        TimeframeSPAux = fillTableFrame(ativo, tablePrevision)

        # Chart: history in blue, forecast in red.
        if graphic:
            fig, ax = plt.subplots()
            ax.plot(TimeframeSPAux.index[:-horizon], TimeframeSPAux.iloc[:-horizon, -1], linewidth=1.0, c = 'b')
            ax.plot(TimeframeSPAux.index[-horizon:], TimeframeSPAux.iloc[-horizon:, -1], linewidth=1.0, c = 'r', ls = '-')
            ax.legend(['Atual', 'Previsão'])
            ax.set_title('Preço de Fechamento - {}'.format(ativo))
            ax.set(xlabel='Tempo (ano)', ylabel='Preço ($)')
            nameGraphic = '{}-{}.jpg'.format(ativo, datetime.now().strftime('%d-%B-%Ih%Mmin'))
            fullname = os.path.join(outdir, nameGraphic)
            plt.savefig(fullname)
            plt.close(fig)

        # Log-return of each forecast day. The window table has `steps` fewer
        # rows than the log-return table, hence the offset in the positions.
        for n in range(horizon):
            position = lengthTable - steps - n - 1
            tableLogRet.loc[lengthTable-n-1, ativo] = \
            np.log(TimeframeSPAux.iloc[position, -1] / TimeframeSPAux.iloc[position-logRetPeriod, -1])

In [None]:
# Create the forecast table: the historical closes followed by one empty row
# per forecast day, indexed by date.

update = (
    pd.DataFrame(index = pd.to_datetime(forecast), columns = ativos)
    .reset_index()
    .rename(columns={'index': 'Dia'})
)

tablePrevision = pd.concat([SP500_close, update], axis = 0, ignore_index = True)
tablePrevision = tablePrevision.set_index('Dia')
tablePrevision.index = pd.to_datetime(tablePrevision.index)

In [None]:
# Create the empty log-return table: one row per historical day plus one per
# forecast day, one column per asset.

# pd.concat replaces Series.append, which recent pandas versions no longer provide.
index_data = pd.to_datetime(pd.concat([SP500_close['Dia'], pd.Series(forecast)]))

tableLogRet = pd.DataFrame(index = index_data,
                           columns = ativos).reset_index().rename(columns={'index': 'Dia'})

# The 'Dia' column is stored as day/month text.
tableLogRet['Dia'] = tableLogRet['Dia'].apply(lambda date: date.strftime('%d/%m'))

In [None]:
# Forecast every asset, filling both tables in place.
fillPrediction(tableLogRet = tableLogRet,
               tablePrevision = tablePrevision,
               ativos = ativos)

In [None]:
# Display the log-return table.
tableLogRet

In [None]:
# Display the forecast table.
tablePrevision

### Métricas

In [None]:
# Save the forecast table

outdirP = './previsao/score-{:.4f}-{}'.format(-scoreTest, datetime.now().strftime('%d-%B-%Ih%Mmin'))

# makedirs also creates './previsao' when it is missing and does not fail when
# the folder already exists.
os.makedirs(outdirP, exist_ok = True)

nameTableP = 'predicao.csv'

fullnameP = os.path.join(outdirP, nameTableP)

tablePrevision.to_csv(fullnameP, index = True, decimal = '.', sep=',')

In [None]:
# Save the deliverable log-return table in the expected format

outdirLR = './logRetorno/score-{:.4f}-{}'.format(-scoreTest, datetime.now().strftime('%d-%B-%Ih%Mmin'))

# makedirs also creates './logRetorno' when it is missing and does not fail
# when the folder already exists.
os.makedirs(outdirLR, exist_ok = True)

nameTableLR = 'predicao.csv'

fullnameLR = os.path.join(outdirLR, nameTableLR)

# Only the forecast rows (the last len(forecast) rows) are exported.
tableLogRet.iloc[-len(forecast):, :].to_csv(fullnameLR, index = False, decimal = '.', sep=',')