## Data Mining - Mineração de Dados para o Mercado Financeiro

### Seleção dos dados brutos

In [1]:
# Importação das bibliotecas básicas
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

In [2]:
# Load the Bovespa index dataset from a semicolon-separated, UTF-8 encoded CSV file
df = pd.read_csv(
    'DADOS_IBOV_JAN_2020_2021.csv',
    sep=';',
    encoding='utf-8',
)

In [3]:
# Preview the first three rows of the raw frame
df.head(n=3)

Unnamed: 0,Data,LastPrice,Volume,BOVA11,Close_VALE,Close_ITUB,Close_PETR,Close_B3SA,Close_BBDC,Close_PETR.1,...,Power_BRML,Power_CRFB,Power_TAEE,Power_BRKM,Power_EMBR,Power_MULT,Power_CPFE,Power_MRVE,Power_MRFG,Power_ENBR
0,2020.01.02 09:00:00,117000.0,140,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
1,2020.01.02 09:01:00,117020.0,53,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2,2020.01.02 09:02:00,117025.0,72,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264


In [4]:
# The "re" (regular expression) module is used to normalise column names:
# separator characters are removed and the result is lower-cased.
import re
def corrige_colunas(col_name):
    """Return ``col_name`` with "_", "|" and " " removed, in lower case.

    Example: ``"Close_VALE"`` becomes ``"closevale"``.
    """
    # Inside a character class "|" is a literal pipe (not alternation), so the
    # pattern matches any single underscore, pipe or space character.
    sem_separadores = re.sub(r"[_| ]", "", col_name)
    return sem_separadores.lower()

In [5]:
# Normalise every column name of the frame with corrige_colunas
df.columns = df.columns.map(corrige_colunas)

In [6]:
# Preview the first three rows after the column names were normalised
df.head(n=3)

Unnamed: 0,data,lastprice,volume,bova11,closevale,closeitub,closepetr,closeb3sa,closebbdc,closepetr.1,...,powerbrml,powercrfb,powertaee,powerbrkm,powerembr,powermult,powercpfe,powermrve,powermrfg,powerenbr
0,2020.01.02 09:00:00,117000.0,140,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
1,2020.01.02 09:01:00,117020.0,53,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2,2020.01.02 09:02:00,117025.0,72,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264


In [7]:
# Show the names of all columns as a plain Python list
df.columns.tolist()

['data',
 'lastprice',
 'volume',
 'bova11',
 'closevale',
 'closeitub',
 'closepetr',
 'closeb3sa',
 'closebbdc',
 'closepetr.1',
 'closeabev',
 'closewege',
 'closemglu',
 'closeitsa',
 'closegndi',
 'closebbas',
 'closesuzb',
 'closentco',
 'closerent',
 'closejbss',
 'closelren',
 'closeggbr',
 'closebbdc.1',
 'closeugpa',
 'closebrdt',
 'closeradl',
 'closecsna',
 'closevvar',
 'closerail',
 'closeklbn',
 'closeeqtl',
 'closebpac',
 'closelame',
 'closebbse',
 'closevivt',
 'closehapv',
 'closeenev',
 'closebrfs',
 'closebrap',
 'closesanb',
 'closesbsp',
 'closecmig',
 'closeccro',
 'closebtow',
 'closehype',
 'closetots',
 'closeelet',
 'closeengi',
 'closepcar',
 'closeazul',
 'closesula',
 'closetims',
 'closeegie',
 'closecsan',
 'closeyduq',
 'closeprio',
 'closeirbr',
 'closequal',
 'closelcam',
 'closecple',
 'closecogn',
 'closegoau',
 'closeelet.1',
 'closeusim',
 'closeflry',
 'closecyre',
 'closebrml',
 'closecrfb',
 'closetaee',
 'closebrkm',
 'closeembr',
 'closemult

In [8]:
# Inspect the data type of each column
df.dtypes

data          object
lastprice    float64
volume         int64
bova11       float64
closevale    float64
              ...   
powermult    float64
powercpfe    float64
powermrve    float64
powermrfg    float64
powerenbr    float64
Length: 810, dtype: object

In [9]:
# Convert the 'data' column from text to datetime64.
# The timestamps are written as 'YYYY.MM.DD HH:MM:SS' (e.g. '2020.01.02 09:00:00'),
# so the format is stated explicitly instead of being left to inference.
df['data'] = pd.to_datetime(df['data'], format='%Y.%m.%d %H:%M:%S')

In [10]:
# Check the column data types again (the 'data' column is now datetime64)
df.dtypes

data         datetime64[ns]
lastprice           float64
volume                int64
bova11              float64
closevale           float64
                  ...      
powermult           float64
powercpfe           float64
powermrve           float64
powermrfg           float64
powerenbr           float64
Length: 810, dtype: object

In [11]:
# Count the missing values in each column
df.isna().sum()

data         0
lastprice    0
volume       0
bova11       0
closevale    0
            ..
powermult    0
powercpfe    0
powermrve    0
powermrfg    0
powerenbr    0
Length: 810, dtype: int64

In [12]:
# Use the 'data' (timestamp) column as the row index of the frame
df = df.set_index(keys='data')

In [13]:
# Preview the first three rows of the frame, now indexed by 'data'
df.head(n=3)

Unnamed: 0_level_0,lastprice,volume,bova11,closevale,closeitub,closepetr,closeb3sa,closebbdc,closepetr.1,closeabev,...,powerbrml,powercrfb,powertaee,powerbrkm,powerembr,powermult,powercpfe,powermrve,powermrfg,powerenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,117000.0,140,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2020-01-02 09:01:00,117020.0,53,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2020-01-02 09:02:00,117025.0,72,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264


In [14]:
# Print every column name next to its positional index, so that the
# positions of the columns can be looked up.
for posicao, nome_coluna in enumerate(df.columns):
    print(f'{posicao} -> {nome_coluna}')

0 -> lastprice
1 -> volume
2 -> bova11
3 -> closevale
4 -> closeitub
5 -> closepetr
6 -> closeb3sa
7 -> closebbdc
8 -> closepetr.1
9 -> closeabev
10 -> closewege
11 -> closemglu
12 -> closeitsa
13 -> closegndi
14 -> closebbas
15 -> closesuzb
16 -> closentco
17 -> closerent
18 -> closejbss
19 -> closelren
20 -> closeggbr
21 -> closebbdc.1
22 -> closeugpa
23 -> closebrdt
24 -> closeradl
25 -> closecsna
26 -> closevvar
27 -> closerail
28 -> closeklbn
29 -> closeeqtl
30 -> closebpac
31 -> closelame
32 -> closebbse
33 -> closevivt
34 -> closehapv
35 -> closeenev
36 -> closebrfs
37 -> closebrap
38 -> closesanb
39 -> closesbsp
40 -> closecmig
41 -> closeccro
42 -> closebtow
43 -> closehype
44 -> closetots
45 -> closeelet
46 -> closeengi
47 -> closepcar
48 -> closeazul
49 -> closesula
50 -> closetims
51 -> closeegie
52 -> closecsan
53 -> closeyduq
54 -> closeprio
55 -> closeirbr
56 -> closequal
57 -> closelcam
58 -> closecple
59 -> closecogn
60 -> closegoau
61 -> closeelet.1
62 -> closeusim
63

In [15]:
# Extract the closing-price data by slicing columns by position:
# positions 2 to 74, i.e. 'bova11' followed by the close* columns.
df_close = df.iloc[:, 2:75]

In [16]:
# Preview the first three rows of the closing-price slice
df_close.head(n=3)

Unnamed: 0_level_0,bova11,closevale,closeitub,closepetr,closeb3sa,closebbdc,closepetr.1,closeabev,closewege,closemglu,...,closebrml,closecrfb,closetaee,closebrkm,closeembr,closemult,closecpfe,closemrve,closemrfg,closeenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:01:00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:02:00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [17]:
# Put the 'lastprice' column side by side with the closing-price frame.
# Any 'lastprice' column already present is dropped first, so re-running
# this cell does not stack a duplicate copy of it.
df_close = pd.concat(
    [df['lastprice'], df_close.drop(columns='lastprice', errors='ignore')],
    axis=1,
)
df_close.head(3)

Unnamed: 0_level_0,lastprice,bova11,closevale,closeitub,closepetr,closeb3sa,closebbdc,closepetr.1,closeabev,closewege,...,closebrml,closecrfb,closetaee,closebrkm,closeembr,closemult,closecpfe,closemrve,closemrfg,closeenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,117000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:01:00,117020.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:02:00,117025.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [18]:
# The dependent variable of this study is 'lastprice'.
# Second positional slice: positions 75 to 146, the per-ticker volume* columns.
df_volumem = df.iloc[:, 75:147]
df_volumem.head(n=3)

Unnamed: 0_level_0,volumevale,volumeitub,volumepetr,volumeb3sa,volumebbdc,volumepetr.1,volumeabev,volumewege,volumemglu,volumeitsa,...,volumebrml,volumecrfb,volumetaee,volumebrkm,volumeembr,volumemult,volumecpfe,volumemrve,volumemrfg,volumeenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:01:00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:02:00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [19]:
# Put the index-level 'volume' column side by side with the volume frame.
# Any 'volume' column already present is dropped first, so re-running this
# cell does not stack a duplicate copy of it.
df_volumem = pd.concat(
    [df['volume'], df_volumem.drop(columns='volume', errors='ignore')],
    axis=1,
)
df_volumem.head(3)

Unnamed: 0_level_0,volume,volumevale,volumeitub,volumepetr,volumeb3sa,volumebbdc,volumepetr.1,volumeabev,volumewege,volumemglu,...,volumebrml,volumecrfb,volumetaee,volumebrkm,volumeembr,volumemult,volumecpfe,volumemrve,volumemrfg,volumeenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,140,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:01:00,53,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2020-01-02 09:02:00,72,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [20]:
# Positional slice: positions 147 to 160, the fourteen columns running
# from 'probsubir' to 'problongosobe'.
df_prob = df.iloc[:, 147:161]
df_prob.head(n=3)

Unnamed: 0_level_0,probsubir,probsubircorr,probsubirpondpesos,probsubirpondcorrpessos,indc,indv,powerc,powerv,probcurtoc,probmedioc,problongoc,probcurtosobe,probmediosobe,problongosobe
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
2020-01-02 09:00:00,0.413,0.411,0.311,0.325,5.0,6.0,11.642,-58.525,0.25,0.155,0.448,0.347,0.222,0.479
2020-01-02 09:01:00,0.413,0.375,0.311,0.333,5.0,6.0,11.642,-58.525,0.25,0.155,0.448,0.347,0.222,0.479
2020-01-02 09:02:00,0.413,0.25,0.311,0.0,5.0,6.0,11.642,-58.525,0.25,0.155,0.448,0.347,0.222,0.479


In [21]:
# Put 'lastprice' side by side with the probability/indicator frame.
# Any 'lastprice' column already present is dropped first, so re-running
# this cell does not stack a duplicate copy of it.
df_prob = pd.concat(
    [df['lastprice'], df_prob.drop(columns='lastprice', errors='ignore')],
    axis=1,
)
df_prob.head(3)

Unnamed: 0_level_0,lastprice,probsubir,probsubircorr,probsubirpondpesos,probsubirpondcorrpessos,indc,indv,powerc,powerv,probcurtoc,probmedioc,problongoc,probcurtosobe,probmediosobe,problongosobe
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
2020-01-02 09:00:00,117000.0,0.413,0.411,0.311,0.325,5.0,6.0,11.642,-58.525,0.25,0.155,0.448,0.347,0.222,0.479
2020-01-02 09:01:00,117020.0,0.413,0.375,0.311,0.333,5.0,6.0,11.642,-58.525,0.25,0.155,0.448,0.347,0.222,0.479
2020-01-02 09:02:00,117025.0,0.413,0.25,0.311,0.0,5.0,6.0,11.642,-58.525,0.25,0.155,0.448,0.347,0.222,0.479


In [22]:
# Positional slice: positions 665 to 736, the per-ticker hurst* columns.
df_hurst = df.iloc[:, 665:737]
df_hurst.head(n=3)

Unnamed: 0_level_0,hurstvale,hurstitub,hurstpetr,hurstb3sa,hurstbbdc,hurstpetr.1,hurstabev,hurstwege,hurstmglu,hurstitsa,...,hurstbrml,hurstcrfb,hursttaee,hurstbrkm,hurstembr,hurstmult,hurstcpfe,hurstmrve,hurstmrfg,hurstenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,0.399463,0.520877,0.508757,0.644406,0.445753,0.495473,0.560413,0.525755,0.522074,0.518396,...,0.576707,0.582902,0.464416,0.512689,0.499057,0.54102,0.509332,0.585283,0.488627,0.479591
2020-01-02 09:01:00,0.399463,0.520877,0.508757,0.644406,0.445753,0.495473,0.560413,0.525755,0.522074,0.518396,...,0.576707,0.582902,0.464416,0.512689,0.499057,0.54102,0.509332,0.585283,0.488627,0.479591
2020-01-02 09:02:00,0.399463,0.520877,0.508757,0.644406,0.445753,0.495473,0.560413,0.525755,0.522074,0.518396,...,0.576707,0.582902,0.464416,0.512689,0.499057,0.54102,0.509332,0.585283,0.488627,0.479591


In [23]:
# Put 'lastprice' side by side with the hurst* frame.
# Any 'lastprice' column already present is dropped first, so re-running
# this cell does not stack a duplicate copy of it.
df_hurst = pd.concat(
    [df['lastprice'], df_hurst.drop(columns='lastprice', errors='ignore')],
    axis=1,
)
df_hurst.head(3)

Unnamed: 0_level_0,lastprice,hurstvale,hurstitub,hurstpetr,hurstb3sa,hurstbbdc,hurstpetr.1,hurstabev,hurstwege,hurstmglu,...,hurstbrml,hurstcrfb,hursttaee,hurstbrkm,hurstembr,hurstmult,hurstcpfe,hurstmrve,hurstmrfg,hurstenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,117000.0,0.399463,0.520877,0.508757,0.644406,0.445753,0.495473,0.560413,0.525755,0.522074,...,0.576707,0.582902,0.464416,0.512689,0.499057,0.54102,0.509332,0.585283,0.488627,0.479591
2020-01-02 09:01:00,117020.0,0.399463,0.520877,0.508757,0.644406,0.445753,0.495473,0.560413,0.525755,0.522074,...,0.576707,0.582902,0.464416,0.512689,0.499057,0.54102,0.509332,0.585283,0.488627,0.479591
2020-01-02 09:02:00,117025.0,0.399463,0.520877,0.508757,0.644406,0.445753,0.495473,0.560413,0.525755,0.522074,...,0.576707,0.582902,0.464416,0.512689,0.499057,0.54102,0.509332,0.585283,0.488627,0.479591


In [24]:
# Positional slice: from position 737 to the last column, the per-ticker
# power* columns.
df_power = df.iloc[:, 737:]
df_power.head(n=3)

Unnamed: 0_level_0,powervale,poweritub,powerpetr,powerb3sa,powerbbdc,powerpetr.1,powerabev,powerwege,powermglu,poweritsa,...,powerbrml,powercrfb,powertaee,powerbrkm,powerembr,powermult,powercpfe,powermrve,powermrfg,powerenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,-3.62577,-1.854003,0.510349,-99.192203,1.536298,-10.323456,-3.672887,13.916746,-10.307105,4.47438,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2020-01-02 09:01:00,-3.62577,-1.854003,0.510349,-99.192203,1.536298,-10.323456,-3.672887,13.916746,-10.307105,4.47438,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2020-01-02 09:02:00,-3.62577,-1.854003,0.510349,-99.192203,1.536298,-10.323456,-3.672887,13.916746,-10.307105,4.47438,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264


In [25]:
# Put 'lastprice' side by side with the power* frame.
# Any 'lastprice' column already present is dropped first, so re-running
# this cell does not stack a duplicate copy of it.
df_power = pd.concat(
    [df['lastprice'], df_power.drop(columns='lastprice', errors='ignore')],
    axis=1,
)
df_power.head(3)

Unnamed: 0_level_0,lastprice,powervale,poweritub,powerpetr,powerb3sa,powerbbdc,powerpetr.1,powerabev,powerwege,powermglu,...,powerbrml,powercrfb,powertaee,powerbrkm,powerembr,powermult,powercpfe,powermrve,powermrfg,powerenbr
data,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2020-01-02 09:00:00,117000.0,-3.62577,-1.854003,0.510349,-99.192203,1.536298,-10.323456,-3.672887,13.916746,-10.307105,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2020-01-02 09:01:00,117020.0,-3.62577,-1.854003,0.510349,-99.192203,1.536298,-10.323456,-3.672887,13.916746,-10.307105,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264
2020-01-02 09:02:00,117025.0,-3.62577,-1.854003,0.510349,-99.192203,1.536298,-10.323456,-3.672887,13.916746,-10.307105,...,-4.289072,3.623279,11.529932,21.974516,3.138655,13.196638,3.231047,10.351668,11.907891,13.964264


## Salvar dados da seleção

In [26]:
# Write the closing-price selection (with its 'data' index) to a CSV file
df_close.to_csv(path_or_buf='D_CLOSE.csv')

In [27]:
# Write the volume selection (with its 'data' index) to a CSV file
df_volumem.to_csv(path_or_buf='D_VOLUMEM.csv')

In [28]:
# Write the remaining selections to CSV files, one file per frame
df_prob.to_csv(path_or_buf='D_PROB.csv')
df_hurst.to_csv(path_or_buf='D_HURST.csv')
df_power.to_csv(path_or_buf='D_POWER.csv')