In [15]:
import pandas as pd
import re
from sqlalchemy import *
from sqlalchemy.ext.automap import automap_base
from sqlalchemy.orm import Session
from flask import Flask, jsonify

In [16]:
# Engine for the bundled SQLite file; SQL statement echoing stays off.
engine = create_engine(
    "sqlite:///db/belly_button_biodiversity.sqlite",
    echo=False,
)

In [17]:
# Reflect the existing database schema into automapped ORM classes.
Base = automap_base()
# NOTE(review): `reflect=True` is flagged as deprecated from SQLAlchemy 1.4 on
# (`autoload_with=engine` replaces it) - confirm the installed version before changing.
Base.prepare(engine, reflect=True)

# Expose one mapped class per table under a short module-level name.
Metadata, Otu, Samples = (
    Base.classes.samples_metadata,
    Base.classes.otu,
    Base.classes.samples,
)

# Open the ORM session used by the query cells below.
session = Session(bind=engine)

In [18]:
# Build a schema inspector on the engine; later cells reuse `inspector`
# to list the columns of each table.
inspector = inspect(engine)
# Bare last expression so the notebook displays the table names.
inspector.get_table_names()

['otu', 'samples', 'samples_metadata']

In [19]:
# List every column of the `samples` table as "<name> <type>".
columns = inspector.get_columns("samples")
for column in columns:
    print(column["name"], column["type"])

otu_id INTEGER
BB_940 INTEGER
BB_941 INTEGER
BB_943 INTEGER
BB_944 INTEGER
BB_945 INTEGER
BB_946 INTEGER
BB_947 INTEGER
BB_948 INTEGER
BB_949 INTEGER
BB_950 INTEGER
BB_952 INTEGER
BB_953 INTEGER
BB_954 INTEGER
BB_955 INTEGER
BB_956 INTEGER
BB_958 INTEGER
BB_959 INTEGER
BB_960 INTEGER
BB_961 INTEGER
BB_962 INTEGER
BB_963 INTEGER
BB_964 INTEGER
BB_966 INTEGER
BB_967 INTEGER
BB_968 INTEGER
BB_969 INTEGER
BB_970 INTEGER
BB_971 INTEGER
BB_972 INTEGER
BB_973 INTEGER
BB_974 INTEGER
BB_975 INTEGER
BB_978 INTEGER
BB_1233 INTEGER
BB_1234 INTEGER
BB_1235 INTEGER
BB_1236 INTEGER
BB_1237 INTEGER
BB_1238 INTEGER
BB_1242 INTEGER
BB_1243 INTEGER
BB_1246 INTEGER
BB_1253 INTEGER
BB_1254 INTEGER
BB_1258 INTEGER
BB_1259 INTEGER
BB_1260 INTEGER
BB_1264 INTEGER
BB_1265 INTEGER
BB_1273 INTEGER
BB_1275 INTEGER
BB_1276 INTEGER
BB_1277 INTEGER
BB_1278 INTEGER
BB_1279 INTEGER
BB_1280 INTEGER
BB_1281 INTEGER
BB_1282 INTEGER
BB_1283 INTEGER
BB_1284 INTEGER
BB_1285 INTEGER
BB_1286 INTEGER
BB_1287 INTEGER
BB_1288 IN

In [20]:
# Peek at the first row of `samples`.
# Engine.execute() ("connectionless" execution) is deprecated in SQLAlchemy 1.4
# and removed in 2.0, so the query runs on an explicit connection that is
# released as soon as the rows have been fetched.
with engine.connect() as conn:
    samples_preview = conn.execute(text('SELECT * FROM samples LIMIT 1')).fetchall()

# Bare last expression so the notebook displays the fetched rows.
samples_preview

[(1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0)]

In [21]:
# List every column of the `otu` table as "<name> <type>".
columns = inspector.get_columns("otu")
for column in columns:
    print(column["name"], column["type"])

otu_id INTEGER
lowest_taxonomic_unit_found TEXT


In [22]:
# Peek at the first ten rows of `otu`.
# Engine.execute() ("connectionless" execution) is deprecated in SQLAlchemy 1.4
# and removed in 2.0, so the query runs on an explicit connection that is
# released as soon as the rows have been fetched.
with engine.connect() as conn:
    otu_preview = conn.execute(text('SELECT * FROM otu LIMIT 10')).fetchall()

# Bare last expression so the notebook displays the fetched rows.
otu_preview

[(1, 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus'),
 (2, 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus'),
 (3, 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Natronorubrum'),
 (4, 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 (5, 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 (6, 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 (7, 'Bacteria'),
 (8, 'Bacteria'),
 (9, 'Bacteria'),
 (10, 'Bacteria')]

In [23]:
# List every column of the `samples_metadata` table as "<name> <type>".
columns = inspector.get_columns("samples_metadata")
for column in columns:
    print(column["name"], column["type"])

SAMPLEID INTEGER
EVENT TEXT
ETHNICITY TEXT
GENDER TEXT
AGE INTEGER
WFREQ INTEGER
BBTYPE TEXT
LOCATION TEXT
COUNTRY012 TEXT
ZIP012 INTEGER
COUNTRY1319 TEXT
ZIP1319 INTEGER
DOG TEXT
CAT TEXT
IMPSURFACE013 INTEGER
NPP013 FLOAT
MMAXTEMP013 FLOAT
PFC013 FLOAT
IMPSURFACE1319 INTEGER
NPP1319 FLOAT
MMAXTEMP1319 FLOAT
PFC1319 FLOAT


In [24]:
# Peek at the first ten sample ids in `samples_metadata`.
# Engine.execute() ("connectionless" execution) is deprecated in SQLAlchemy 1.4
# and removed in 2.0, so the query runs on an explicit connection that is
# released as soon as the rows have been fetched.
with engine.connect() as conn:
    sample_id_preview = conn.execute(
        text('SELECT SAMPLEID FROM samples_metadata LIMIT 10')
    ).fetchall()

# Bare last expression so the notebook displays the fetched rows.
sample_id_preview

[(940,),
 (941,),
 (943,),
 (944,),
 (945,),
 (946,),
 (947,),
 (948,),
 (949,),
 (950,)]

In [26]:
# Fetch every SAMPLEID; each result row holds that single value.
# `Metadata` is the mapped class for `samples_metadata` bound during reflection.
sample_names = (
    session
    .query(Metadata.SAMPLEID)
    .all()
)

In [31]:
# Turn each one-column result row into a "BB_<SAMPLEID>" label.
["BB_{}".format(sample_id) for (sample_id,) in sample_names]

['BB_940',
 'BB_941',
 'BB_943',
 'BB_944',
 'BB_945',
 'BB_946',
 'BB_947',
 'BB_948',
 'BB_949',
 'BB_950',
 'BB_952',
 'BB_953',
 'BB_954',
 'BB_955',
 'BB_956',
 'BB_958',
 'BB_959',
 'BB_960',
 'BB_961',
 'BB_962',
 'BB_963',
 'BB_964',
 'BB_966',
 'BB_967',
 'BB_968',
 'BB_969',
 'BB_970',
 'BB_971',
 'BB_972',
 'BB_973',
 'BB_974',
 'BB_975',
 'BB_978',
 'BB_1233',
 'BB_1234',
 'BB_1235',
 'BB_1236',
 'BB_1237',
 'BB_1238',
 'BB_1242',
 'BB_1243',
 'BB_1246',
 'BB_1253',
 'BB_1254',
 'BB_1258',
 'BB_1259',
 'BB_1260',
 'BB_1264',
 'BB_1265',
 'BB_1273',
 'BB_1275',
 'BB_1276',
 'BB_1277',
 'BB_1278',
 'BB_1279',
 'BB_1280',
 'BB_1281',
 'BB_1282',
 'BB_1283',
 'BB_1284',
 'BB_1285',
 'BB_1286',
 'BB_1287',
 'BB_1288',
 'BB_1289',
 'BB_1290',
 'BB_1291',
 'BB_1292',
 'BB_1293',
 'BB_1294',
 'BB_1295',
 'BB_1296',
 'BB_1297',
 'BB_1298',
 'BB_1308',
 'BB_1309',
 'BB_1310',
 'BB_1374',
 'BB_1415',
 'BB_1439',
 'BB_1441',
 'BB_1443',
 'BB_1486',
 'BB_1487',
 'BB_1489',
 'BB_1490',
 

In [32]:
# Fetch the taxonomy description of every OTU; each result row holds that single value.
# `Otu` is the mapped class for the `otu` table bound during reflection.
otu_descs = (
    session
    .query(Otu.lowest_taxonomic_unit_found)
    .all()
)

In [35]:
# Unwrap the one-column result rows into a flat list of descriptions.
[description for (description,) in otu_descs]

['Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus',
 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus',
 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Natronorubrum',
 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter',
 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter',
 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bact

In [42]:
# Query (not yet executed) for the metadata record of sample 970.
# `Metadata` is the mapped class for `samples_metadata` bound during reflection.
metadata_sample = (
    session
    .query(Metadata)
    .filter(Metadata.SAMPLEID == int('970'))
)

# Indexing the query fetches the first matching record; show its id.
metadata_sample[0].SAMPLEID

970

In [44]:
# First result row of the WFREQ column for sample 970.
# `Metadata` is the mapped class for `samples_metadata` bound during reflection.
(
    session
    .query(Metadata.WFREQ)
    .filter(Metadata.SAMPLEID == int('970'))
)[0]

(0)

In [63]:

# Sample column to extract; every statement below derives from this one name
# instead of repeating the literal.
sample = 'BB_970'

# Column names cannot be passed as bound SQL parameters, so the name is checked
# against the reflected `samples` schema before it is placed in the statement.
sample_columns = {col['name'] for col in inspector.get_columns('samples')} - {'otu_id'}
if sample not in sample_columns:
    raise ValueError('Unknown sample column: {!r}'.format(sample))

# Read the OTU ids together with the counts stored in the chosen sample column;
# the double quotes mark the validated name as an identifier.
result_df = pd.read_sql('SELECT otu_id, "{}" FROM samples'.format(sample), session.bind)
# Pin the column labels explicitly so the lookups below do not depend on how
# the driver names the selected expression.
result_df.columns = ['otu_id', sample]
# Largest counts first.
result_df = result_df.sort_values(by=sample, ascending=False)
otu_list = result_df['otu_id'].tolist()
sample_value = result_df[sample].tolist()
# Two parallel lists: otu_ids[i] has the value sample_values[i].
result = {
    'otu_ids': otu_list,
    'sample_values': sample_value
}
result

{'otu_ids': [1795,
  3360,
  3544,
  3288,
  3541,
  1724,
  1408,
  3030,
  3581,
  1929,
  3511,
  1651,
  1352,
  1652,
  3120,
  3378,
  922,
  3312,
  944,
  1720,
  3543,
  3042,
  3537,
  2859,
  1645,
  3561,
  2447,
  2446,
  2448,
  2453,
  2449,
  2450,
  2454,
  2455,
  2451,
  2445,
  2456,
  2444,
  2443,
  2452,
  2437,
  2442,
  2428,
  2417,
  2418,
  2419,
  2420,
  2421,
  2422,
  2423,
  2424,
  2425,
  2426,
  2427,
  2429,
  2441,
  2430,
  2431,
  2432,
  2433,
  2434,
  2435,
  2436,
  2458,
  2438,
  2439,
  2440,
  2457,
  2463,
  2459,
  2503,
  2491,
  2492,
  2493,
  2494,
  2495,
  2496,
  2497,
  2498,
  2499,
  2500,
  2501,
  2502,
  2504,
  2489,
  2505,
  2506,
  2507,
  2508,
  2509,
  2510,
  2511,
  2512,
  2513,
  2514,
  2515,
  2516,
  2490,
  2488,
  2460,
  2473,
  2461,
  2462,
  2415,
  2464,
  2465,
  2466,
  2467,
  2468,
  2469,
  2470,
  2471,
  2472,
  2474,
  2487,
  2475,
  2476,
  2477,
  2478,
  2479,
  2480,
  2481,
  2482,
  2483,