<h1>Limpeza de dados XBT para inserção no MongoDB</h1>
<br>
Este notebook foi criado por <b>Bruno da Silva Andrade</b>. Aqui irei criar a rotina de limpeza e estruturação dos dados para a inserção no banco de dados MongoDB.

In [23]:
import numpy as np
import matplotlib.pyplot as plt
import codecs 
import json

<h2>Definindo estruturas de colunas</h2>
<b>Tipo 1 de dado</b>
<br>
<p>Num Data Fields   :  5<br>
Field1            :  Time (sec)<br>
Field2            :  Resistance (ohms)<br>
Field3            :  Depth (m)<br>
Field4            :  Temperature (°C)<br>
Field5            :  Sound Velocity (m/s)</p>

<b>Tipo 2 de dado</b><br>
<br>
Num Data Fields   :  3<br>
Field1            :  Depth (m)<br>
Field2            :  Temperature (°C)<br>
Field3            :  Sound Velocity (m/s)<br>

In [24]:
# Record layout for the 3-column file. This definition was missing, so `form`
# raised NameError on a fresh kernel. The column order (depth, temperature,
# sound velocity) follows the labels used when these records are printed
# further down in the notebook.
dtype = [('depth', 'f4'), ('temperature', 'f4'), ('vel', 'f4')]

# Record layout for the 5-column file.
dtype2 = [('time', 'f4'), ('resistance', 'f4'), ('depth', 'f4'), ('temperature', 'f4'), ('vel', 'f4')]

# Keyword arguments forwarded to np.genfromtxt: which columns to read and the
# structured dtype used to name and type them.
form = dict(usecols=(0, 1, 2), dtype=dtype)
form1 = dict(usecols=(0, 1, 2, 3, 4), dtype=dtype2)

# skip_header drops the leading non-data lines of each file.
# NOTE(review): 32 and 45 are presumably the lengths of each file's EDF header
# block -- confirm against the files if they are ever re-exported.
xbt_raw = np.genfromtxt('./data/XBT1.EDF', skip_header=32, **form)
xbt_raw2 = np.genfromtxt('./data/XBT2.EDF', skip_header=45, **form1)


<h2>Exibindo dados do dataset em seu formato bruto</h2>

In [25]:
# Display the structured array read from ./data/XBT1.EDF (columns 0-2 of the file).
xbt_raw

array([(  0. , 21.2 , 1519.2 ), (  0.7, 21.16, 1519.1 ),
       (  1.3, 21.15, 1519.09), (  2. , 21.15, 1519.09),
       (  2.7, 21.14, 1519.09), (  3.3, 21.14, 1519.1 ),
       (  4. , 21.14, 1519.1 ), (  4.7, 21.14, 1519.11),
       (  5.4, 21.14, 1519.12), (  6. , 21.14, 1519.14),
       (  6.7, 21.14, 1519.14), (  7.4, 21.13, 1519.14),
       (  8. , 21.14, 1519.16), (  8.7, 21.14, 1519.17),
       (  9.4, 21.13, 1519.17), ( 10. , 21.13, 1519.17),
       ( 10.7, 21.13, 1519.18), ( 11.4, 21.13, 1519.19),
       ( 12. , 21.13, 1519.21), ( 12.7, 21.13, 1519.22),
       ( 13.4, 21.13, 1519.24), ( 14. , 21.13, 1519.25),
       ( 14.7, 21.13, 1519.26), ( 15.4, 21.13, 1519.27),
       ( 16. , 21.13, 1519.28), ( 16.7, 21.13, 1519.29),
       ( 17.4, 21.13, 1519.3 ), ( 18. , 21.13, 1519.31),
       ( 18.7, 21.13, 1519.33), ( 19.4, 21.13, 1519.34),
       ( 20.1, 21.13, 1519.35), ( 20.7, 21.13, 1519.36),
       ( 21.4, 21.13, 1519.37), ( 22.1, 21.13, 1519.38),
       ( 22.7, 21.13, 1519.39),

In [26]:
# Display the structured array read from ./data/XBT2.EDF (columns 0-4 of the file).
xbt_raw2

array([( 0.1, 5530.981,   0.67, 22.71, 1528.71),
       ( 0.2, 5550.41 ,   1.34, 22.63, 1528.52),
       ( 0.3, 5558.083,   2.01, 22.6 , 1528.45),
       ( 0.4, 5561.029,   2.68, 22.59, 1528.43),
       ( 0.5, 5560.842,   3.34, 22.59, 1528.44),
       ( 0.6, 5561.597,   4.01, 22.59, 1528.45),
       ( 0.7, 5561.891,   4.68, 22.59, 1528.46),
       ( 0.8, 5561.374,   5.35, 22.59, 1528.47),
       ( 0.9, 5561.605,   6.02, 22.59, 1528.48),
       ( 1. , 5561.549,   6.69, 22.59, 1528.49),
       ( 1.1, 5561.772,   7.36, 22.59, 1528.5 ),
       ( 1.2, 5561.558,   8.03, 22.59, 1528.52),
       ( 1.3, 5561.629,   8.69, 22.59, 1528.53),
       ( 1.4, 5562.229,   9.36, 22.59, 1528.53),
       ( 1.5, 5562.307,  10.03, 22.59, 1528.54),
       ( 1.6, 5562.167,  10.7 , 22.59, 1528.55),
       ( 1.7, 5562.321,  11.37, 22.59, 1528.56),
       ( 1.8, 5563.007,  12.04, 22.58, 1528.57),
       ( 1.9, 5563.491,  12.7 , 22.58, 1528.57),
       ( 2. , 5564.979,  13.37, 22.58, 1528.57),
       ( 2.1, 5565.0

<h2>Colocando os datasets em formato JSON para posterior inserção no banco</h2>

In [27]:
# Print every record of the 3-column dataset as a JSON-like object.
# NOTE(review): the text is emitted through print(), so each value is followed
# by a space and each object by a trailing comma -- it is not strict JSON yet.
for row in xbt_raw:
    depth, temperature, sound_velocity = row[0], row[1], row[2]
    print(
        '{\n\t"depth":', depth,
        ',\n\t"temperature":', temperature,
        ',\n\t"sound_velocity":', sound_velocity,
        '\n},',
    )

{
	"depth": 0.0 ,
	"temperature": 21.2 ,
	"sound_velocity": 1519.2 
},
{
	"depth": 0.7 ,
	"temperature": 21.16 ,
	"sound_velocity": 1519.1 
},
{
	"depth": 1.3 ,
	"temperature": 21.15 ,
	"sound_velocity": 1519.09 
},
{
	"depth": 2.0 ,
	"temperature": 21.15 ,
	"sound_velocity": 1519.09 
},
{
	"depth": 2.7 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.09 
},
{
	"depth": 3.3 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.1 
},
{
	"depth": 4.0 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.1 
},
{
	"depth": 4.7 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.11 
},
{
	"depth": 5.4 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.12 
},
{
	"depth": 6.0 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.14 
},
{
	"depth": 6.7 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.14 
},
{
	"depth": 7.4 ,
	"temperature": 21.13 ,
	"sound_velocity": 1519.14 
},
{
	"depth": 8.0 ,
	"temperature": 21.14 ,
	"sound_velocity": 1519.16 
},
{
	"depth": 8.7 ,
	"temperature": 21.14 ,
	"sound_veloci

},
{
	"depth": 273.8 ,
	"temperature": 14.34 ,
	"sound_velocity": 1503.25 
},
{
	"depth": 274.5 ,
	"temperature": 14.34 ,
	"sound_velocity": 1503.25 
},
{
	"depth": 275.1 ,
	"temperature": 14.33 ,
	"sound_velocity": 1503.23 
},
{
	"depth": 275.8 ,
	"temperature": 14.32 ,
	"sound_velocity": 1503.22 
},
{
	"depth": 276.4 ,
	"temperature": 14.32 ,
	"sound_velocity": 1503.21 
},
{
	"depth": 277.1 ,
	"temperature": 14.31 ,
	"sound_velocity": 1503.18 
},
{
	"depth": 277.7 ,
	"temperature": 14.3 ,
	"sound_velocity": 1503.16 
},
{
	"depth": 278.4 ,
	"temperature": 14.28 ,
	"sound_velocity": 1503.13 
},
{
	"depth": 279.0 ,
	"temperature": 14.27 ,
	"sound_velocity": 1503.08 
},
{
	"depth": 279.7 ,
	"temperature": 14.23 ,
	"sound_velocity": 1502.99 
},
{
	"depth": 280.3 ,
	"temperature": 14.2 ,
	"sound_velocity": 1502.89 
},
{
	"depth": 281.0 ,
	"temperature": 14.17 ,
	"sound_velocity": 1502.79 
},
{
	"depth": 281.6 ,
	"temperature": 14.14 ,
	"sound_velocity": 1502.7 
},
{
	"depth": 282.3 ,
	"tem

	"temperature": 10.36 ,
	"sound_velocity": 1493.52 
},
{
	"depth": 515.8 ,
	"temperature": 10.35 ,
	"sound_velocity": 1493.49 
},
{
	"depth": 516.4 ,
	"temperature": 10.34 ,
	"sound_velocity": 1493.48 
},
{
	"depth": 517.1 ,
	"temperature": 10.34 ,
	"sound_velocity": 1493.47 
},
{
	"depth": 517.7 ,
	"temperature": 10.33 ,
	"sound_velocity": 1493.48 
},
{
	"depth": 518.3 ,
	"temperature": 10.33 ,
	"sound_velocity": 1493.47 
},
{
	"depth": 519.0 ,
	"temperature": 10.33 ,
	"sound_velocity": 1493.46 
},
{
	"depth": 519.6 ,
	"temperature": 10.32 ,
	"sound_velocity": 1493.47 
},
{
	"depth": 520.2 ,
	"temperature": 10.32 ,
	"sound_velocity": 1493.46 
},
{
	"depth": 520.9 ,
	"temperature": 10.3 ,
	"sound_velocity": 1493.41 
},
{
	"depth": 521.5 ,
	"temperature": 10.23 ,
	"sound_velocity": 1493.17 
},
{
	"depth": 522.1 ,
	"temperature": 10.17 ,
	"sound_velocity": 1492.97 
},
{
	"depth": 522.8 ,
	"temperature": 10.33 ,
	"sound_velocity": 1493.55 
},
{
	"depth": 523.4 ,
	"temperature": 10.29 ,
	"

In [28]:
# Print every record of the 5-column dataset as a JSON-like object.
# NOTE(review): the text is emitted through print(), so each value is followed
# by a space and each object by a trailing comma -- it is not strict JSON yet.
for row in xbt_raw2:
    time_s, resistance, depth = row[0], row[1], row[2]
    temperature, sound_velocity = row[3], row[4]
    print(
        '{\n\t"time":', time_s,
        ',\n\t"resistance":', resistance,
        ',\n\t"depth":', depth,
        ',\n\t"temperature":', temperature,
        ',\n\t"sound_velocity":', sound_velocity,
        '\n},',
    )

{
	"time": 0.1 ,
	"resistance": 5530.981 ,
	"depth": 0.67 ,
	"temperature": 22.71 ,
	"sound_velocity": 1528.71 
},
{
	"time": 0.2 ,
	"resistance": 5550.41 ,
	"depth": 1.34 ,
	"temperature": 22.63 ,
	"sound_velocity": 1528.52 
},
{
	"time": 0.3 ,
	"resistance": 5558.083 ,
	"depth": 2.01 ,
	"temperature": 22.6 ,
	"sound_velocity": 1528.45 
},
{
	"time": 0.4 ,
	"resistance": 5561.029 ,
	"depth": 2.68 ,
	"temperature": 22.59 ,
	"sound_velocity": 1528.43 
},
{
	"time": 0.5 ,
	"resistance": 5560.842 ,
	"depth": 3.34 ,
	"temperature": 22.59 ,
	"sound_velocity": 1528.44 
},
{
	"time": 0.6 ,
	"resistance": 5561.597 ,
	"depth": 4.01 ,
	"temperature": 22.59 ,
	"sound_velocity": 1528.45 
},
{
	"time": 0.7 ,
	"resistance": 5561.891 ,
	"depth": 4.68 ,
	"temperature": 22.59 ,
	"sound_velocity": 1528.46 
},
{
	"time": 0.8 ,
	"resistance": 5561.374 ,
	"depth": 5.35 ,
	"temperature": 22.59 ,
	"sound_velocity": 1528.47 
},
{
	"time": 0.9 ,
	"resistance": 5561.605 ,
	"depth": 6.02 ,
	"temperature": 22.59 

	"resistance": 6244.578 ,
	"depth": 128.3 ,
	"temperature": 20.0 ,
	"sound_velocity": 1523.61 
},
{
	"time": 19.4 ,
	"resistance": 6243.88 ,
	"depth": 128.96 ,
	"temperature": 20.01 ,
	"sound_velocity": 1523.63 
},
{
	"time": 19.5 ,
	"resistance": 6243.446 ,
	"depth": 129.62 ,
	"temperature": 20.01 ,
	"sound_velocity": 1523.65 
},
{
	"time": 19.6 ,
	"resistance": 6242.941 ,
	"depth": 130.28 ,
	"temperature": 20.01 ,
	"sound_velocity": 1523.66 
},
{
	"time": 19.7 ,
	"resistance": 6242.938 ,
	"depth": 130.94 ,
	"temperature": 20.01 ,
	"sound_velocity": 1523.67 
},
{
	"time": 19.8 ,
	"resistance": 6242.719 ,
	"depth": 131.6 ,
	"temperature": 20.01 ,
	"sound_velocity": 1523.69 
},
{
	"time": 19.9 ,
	"resistance": 6242.597 ,
	"depth": 132.26 ,
	"temperature": 20.01 ,
	"sound_velocity": 1523.7 
},
{
	"time": 20.0 ,
	"resistance": 6241.881 ,
	"depth": 132.92 ,
	"temperature": 20.01 ,
	"sound_velocity": 1523.72 
},
{
	"time": 20.1 ,
	"resistance": 6241.718 ,
	"depth": 133.58 ,
	"temperature": 