In [103]:
# Python SQL toolkit and Object Relational Mapper
import sqlalchemy
from sqlalchemy.ext.automap import automap_base
from sqlalchemy import Column, Integer, String
from sqlalchemy.ext.declarative import declarative_base
from sqlalchemy.sql.expression import cast
from sqlalchemy import create_engine, inspect, func
from sqlalchemy.orm import Session, aliased
from datetime import datetime
import numpy as np
import pandas as pd


In [105]:
Base = declarative_base()


In [106]:
# Create an engine for the `belly_button_biodiversity.sqlite` database
### BEGIN SOLUTION
engine = create_engine("sqlite:///belly_button_biodiversity.sqlite", echo=False)
### END SOLUTION

In [107]:
# Use the Inspector to explore the database and print the table names
### BEGIN SOLUTION
inspector = inspect(engine)
inspector.get_table_names()
### END SOLUTION

['otu', 'samples', 'samples_metadata']

In [108]:
# Use Inspector to print the column names and types
### BEGIN SOLUTION
columns = inspector.get_columns('otu')
for c in columns:
    print(c['name'], c["type"])
### END SOLUTION

otu_id INTEGER
lowest_taxonomic_unit_found TEXT


In [109]:
engine.execute('SELECT * FROM otu LIMIT 10').fetchall()

[(1, 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus'),
 (2, 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus'),
 (3, 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Natronorubrum'),
 (4, 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 (5, 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 (6, 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 (7, 'Bacteria'),
 (8, 'Bacteria'),
 (9, 'Bacteria'),
 (10, 'Bacteria')]

In [110]:
columns = inspector.get_columns('samples')
for c in columns:
    print(c['name'], c["type"])

otu_id INTEGER
BB_940 INTEGER
BB_941 INTEGER
BB_943 INTEGER
BB_944 INTEGER
BB_945 INTEGER
BB_946 INTEGER
BB_947 INTEGER
BB_948 INTEGER
BB_949 INTEGER
BB_950 INTEGER
BB_952 INTEGER
BB_953 INTEGER
BB_954 INTEGER
BB_955 INTEGER
BB_956 INTEGER
BB_958 INTEGER
BB_959 INTEGER
BB_960 INTEGER
BB_961 INTEGER
BB_962 INTEGER
BB_963 INTEGER
BB_964 INTEGER
BB_966 INTEGER
BB_967 INTEGER
BB_968 INTEGER
BB_969 INTEGER
BB_970 INTEGER
BB_971 INTEGER
BB_972 INTEGER
BB_973 INTEGER
BB_974 INTEGER
BB_975 INTEGER
BB_978 INTEGER
BB_1233 INTEGER
BB_1234 INTEGER
BB_1235 INTEGER
BB_1236 INTEGER
BB_1237 INTEGER
BB_1238 INTEGER
BB_1242 INTEGER
BB_1243 INTEGER
BB_1246 INTEGER
BB_1253 INTEGER
BB_1254 INTEGER
BB_1258 INTEGER
BB_1259 INTEGER
BB_1260 INTEGER
BB_1264 INTEGER
BB_1265 INTEGER
BB_1273 INTEGER
BB_1275 INTEGER
BB_1276 INTEGER
BB_1277 INTEGER
BB_1278 INTEGER
BB_1279 INTEGER
BB_1280 INTEGER
BB_1281 INTEGER
BB_1282 INTEGER
BB_1283 INTEGER
BB_1284 INTEGER
BB_1285 INTEGER
BB_1286 INTEGER
BB_1287 INTEGER
BB_1288 IN

In [111]:
engine.execute('SELECT * FROM samples LIMIT 1').fetchall()

[(1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0)]

In [112]:
columns = inspector.get_columns('Samples_metadata')
for c in columns:
    print(c['name'], c["type"])

SAMPLEID INTEGER
EVENT TEXT
ETHNICITY TEXT
GENDER TEXT
AGE INTEGER
WFREQ INTEGER
BBTYPE TEXT
LOCATION TEXT
COUNTRY012 TEXT
ZIP012 INTEGER
COUNTRY1319 TEXT
ZIP1319 INTEGER
DOG TEXT
CAT TEXT
IMPSURFACE013 INTEGER
NPP013 FLOAT
MMAXTEMP013 FLOAT
PFC013 FLOAT
IMPSURFACE1319 INTEGER
NPP1319 FLOAT
MMAXTEMP1319 FLOAT
PFC1319 FLOAT


In [113]:
engine.execute('SELECT * FROM Samples_metadata LIMIT 5').fetchall()

[(940, 'BellyButtonsScienceOnline', 'Caucasian', 'F', 24, 2, 'I', 'Beaufort/NC', 'usa', 22306, 'usa', 22306, 'no', 'no', 8852, 37.17222214, 54.5, 0.0, 1, 0.0, 33.99000168, 25.5),
 (941, '0', 'Caucasian/Midleastern', 'F', 34, 1, 'I', 'Chicago/IL', '0', 0, '0', 0, '0', '0', 0, 0.0, 0.0, 0.0, 0, 0.0, 0.0, 0.0),
 (943, 'BellyButtonsScienceOnline', 'Caucasian', 'F', 49, 1, 'I', 'Omaha/NE', '0', 0, '0', 0, '0', '0', 0, 0.0, 0.0, 0.0, 0, 0.0, 0.0, 0.0),
 (944, 'BellyButtonsScienceOnline', 'European', 'M', 44, 1, 'I', 'NewHaven/CT', 'usa', 7079, 'usa', 8822, 'no', 'yes', 0, 35.81666565, 16.0, 0.0, 0, 6567.0, 32.40333176, 28.5),
 (945, 'BellyButtonsScienceOnline', 'Caucasian', 'F', 48, 1, 'I', 'Philidelphia/PA', 'usa', 84404, 'usa', 96025, 'no', 'no', 0, 37.78333282, 4.0, 0.0, 0, 5613.0, 33.63444519, 24.0)]

In [114]:
# Declare a Base using `automap_base()`
Base = automap_base()

In [115]:
# Use the Base class to reflect the database tables
Base.prepare(engine, reflect=True)

In [116]:
# Print all of the classes mapped to the Base
Base.classes.keys()

['otu', 'samples', 'samples_metadata']

In [117]:
Otu = Base.classes.otu

In [118]:
Samples=Base.classes.samples

In [119]:
Samples_metadata = Base.classes.samples_metadata

In [120]:
# Create a session
session = Session(engine)

In [121]:
sampleId_result=Samples.__table__.columns.keys()
sampleId_result

['otu_id',
 'BB_940',
 'BB_941',
 'BB_943',
 'BB_944',
 'BB_945',
 'BB_946',
 'BB_947',
 'BB_948',
 'BB_949',
 'BB_950',
 'BB_952',
 'BB_953',
 'BB_954',
 'BB_955',
 'BB_956',
 'BB_958',
 'BB_959',
 'BB_960',
 'BB_961',
 'BB_962',
 'BB_963',
 'BB_964',
 'BB_966',
 'BB_967',
 'BB_968',
 'BB_969',
 'BB_970',
 'BB_971',
 'BB_972',
 'BB_973',
 'BB_974',
 'BB_975',
 'BB_978',
 'BB_1233',
 'BB_1234',
 'BB_1235',
 'BB_1236',
 'BB_1237',
 'BB_1238',
 'BB_1242',
 'BB_1243',
 'BB_1246',
 'BB_1253',
 'BB_1254',
 'BB_1258',
 'BB_1259',
 'BB_1260',
 'BB_1264',
 'BB_1265',
 'BB_1273',
 'BB_1275',
 'BB_1276',
 'BB_1277',
 'BB_1278',
 'BB_1279',
 'BB_1280',
 'BB_1281',
 'BB_1282',
 'BB_1283',
 'BB_1284',
 'BB_1285',
 'BB_1286',
 'BB_1287',
 'BB_1288',
 'BB_1289',
 'BB_1290',
 'BB_1291',
 'BB_1292',
 'BB_1293',
 'BB_1294',
 'BB_1295',
 'BB_1296',
 'BB_1297',
 'BB_1298',
 'BB_1308',
 'BB_1309',
 'BB_1310',
 'BB_1374',
 'BB_1415',
 'BB_1439',
 'BB_1441',
 'BB_1443',
 'BB_1486',
 'BB_1487',
 'BB_1489',
 '

In [122]:
sampleId_result.pop(0)
sampleId_result

['BB_940',
 'BB_941',
 'BB_943',
 'BB_944',
 'BB_945',
 'BB_946',
 'BB_947',
 'BB_948',
 'BB_949',
 'BB_950',
 'BB_952',
 'BB_953',
 'BB_954',
 'BB_955',
 'BB_956',
 'BB_958',
 'BB_959',
 'BB_960',
 'BB_961',
 'BB_962',
 'BB_963',
 'BB_964',
 'BB_966',
 'BB_967',
 'BB_968',
 'BB_969',
 'BB_970',
 'BB_971',
 'BB_972',
 'BB_973',
 'BB_974',
 'BB_975',
 'BB_978',
 'BB_1233',
 'BB_1234',
 'BB_1235',
 'BB_1236',
 'BB_1237',
 'BB_1238',
 'BB_1242',
 'BB_1243',
 'BB_1246',
 'BB_1253',
 'BB_1254',
 'BB_1258',
 'BB_1259',
 'BB_1260',
 'BB_1264',
 'BB_1265',
 'BB_1273',
 'BB_1275',
 'BB_1276',
 'BB_1277',
 'BB_1278',
 'BB_1279',
 'BB_1280',
 'BB_1281',
 'BB_1282',
 'BB_1283',
 'BB_1284',
 'BB_1285',
 'BB_1286',
 'BB_1287',
 'BB_1288',
 'BB_1289',
 'BB_1290',
 'BB_1291',
 'BB_1292',
 'BB_1293',
 'BB_1294',
 'BB_1295',
 'BB_1296',
 'BB_1297',
 'BB_1298',
 'BB_1308',
 'BB_1309',
 'BB_1310',
 'BB_1374',
 'BB_1415',
 'BB_1439',
 'BB_1441',
 'BB_1443',
 'BB_1486',
 'BB_1487',
 'BB_1489',
 'BB_1490',
 

In [123]:
Otu_result=session.query(Otu.lowest_taxonomic_unit_found).all()
Otu_result

[('Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus'),
 ('Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus'),
 ('Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Natronorubrum'),
 ('Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 ('Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 ('Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 ('Bacteria'),
 

In [124]:
Otu_result= list(np.ravel(Otu_result))
Otu_result

['Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus',
 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Halococcus',
 'Archaea;Euryarchaeota;Halobacteria;Halobacteriales;Halobacteriaceae;Natronorubrum',
 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter',
 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter',
 'Archaea;Euryarchaeota;Methanobacteria;Methanobacteriales;Methanobacteriaceae;Methanobrevibacter',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bacteria',
 'Bact

In [125]:
metadata_results = session.query(Samples_metadata.AGE, Samples_metadata.BBTYPE,
        Samples_metadata.ETHNICITY,
        Samples_metadata.GENDER,
        Samples_metadata.LOCATION,
        Samples_metadata.SAMPLEID).all()
        

In [126]:
metadata_results

[(24, 'I', 'Caucasian', 'F', 'Beaufort/NC', 940),
 (34, 'I', 'Caucasian/Midleastern', 'F', 'Chicago/IL', 941),
 (49, 'I', 'Caucasian', 'F', 'Omaha/NE', 943),
 (44, 'I', 'European', 'M', 'NewHaven/CT', 944),
 (48, 'I', 'Caucasian', 'F', 'Philidelphia/PA', 945),
 (42, 'I', 'Caucasian', 'F', 'Deerfield/MA', 946),
 (49, 'I', 'Caucasian', 'M', 'ChapelHill/NC', 947),
 (20, 'I', 'Caucasian', 'M', 'ChapelHill/NC', 948),
 (51, 'I', 'Caucasian', 'F', 'Durham/NC', 949),
 (51, 'I', 'Caucasian', 'M', 'NewYork/NY', 950),
 (51, 'I', 'Caucasian', 'F', 'Seattle/WA', 952),
 (38, 'I', 'Caucasian', 'F', 'Chicago/IL', 953),
 (26, 'I', 'Caucasian', 'M', 'NewYork/NY', 954),
 (27, 'I', 'Caucasian', 'F', 'NewYork/NY', 955),
 (16, 'I', 'Caucasian', 'M', 'Jacksonville/NC', 956),
 (43, 'I', 'Caucasian', 'M', 'Wilmington/NC', 958),
 (40, 'I', 'Caucasian', 'M', 'Carrboro/NC', 959),
 (48, 'I', 'Caucasian', 'M', 'Lexington/NC', 960),
 (35, 'i', 'Caucasian', 'F', 'Edmonton,AB', 961),
 (56, 'i', 'Caucasian', 'F', 'Wash

In [127]:
metadata = []
for samples in metadata_results:
        metadata_dict = {}
        metadata_dict["AGE"] = samples[0]
        metadata_dict["BBTYPE"] = samples[1]
        metadata_dict["ETHNICITY"] = samples[2]
        metadata_dict["GENDER"] = samples[3]
        metadata_dict["LOCATION"] = samples[4]
        metadata_dict["SAMPLEID"] = samples[5]
        
        metadata.append(metadata_dict)
metadata    

[{'AGE': 24,
  'BBTYPE': 'I',
  'ETHNICITY': 'Caucasian',
  'GENDER': 'F',
  'LOCATION': 'Beaufort/NC',
  'SAMPLEID': 940},
 {'AGE': 34,
  'BBTYPE': 'I',
  'ETHNICITY': 'Caucasian/Midleastern',
  'GENDER': 'F',
  'LOCATION': 'Chicago/IL',
  'SAMPLEID': 941},
 {'AGE': 49,
  'BBTYPE': 'I',
  'ETHNICITY': 'Caucasian',
  'GENDER': 'F',
  'LOCATION': 'Omaha/NE',
  'SAMPLEID': 943},
 {'AGE': 44,
  'BBTYPE': 'I',
  'ETHNICITY': 'European',
  'GENDER': 'M',
  'LOCATION': 'NewHaven/CT',
  'SAMPLEID': 944},
 {'AGE': 48,
  'BBTYPE': 'I',
  'ETHNICITY': 'Caucasian',
  'GENDER': 'F',
  'LOCATION': 'Philidelphia/PA',
  'SAMPLEID': 945},
 {'AGE': 42,
  'BBTYPE': 'I',
  'ETHNICITY': 'Caucasian',
  'GENDER': 'F',
  'LOCATION': 'Deerfield/MA',
  'SAMPLEID': 946},
 {'AGE': 49,
  'BBTYPE': 'I',
  'ETHNICITY': 'Caucasian',
  'GENDER': 'M',
  'LOCATION': 'ChapelHill/NC',
  'SAMPLEID': 947},
 {'AGE': 20,
  'BBTYPE': 'I',
  'ETHNICITY': 'Caucasian',
  'GENDER': 'M',
  'LOCATION': 'ChapelHill/NC',
  'SAMPLEID'

In [128]:
WQREF_results= session.query(Samples_metadata.SAMPLEID, Samples_metadata.WFREQ).all()
WQREF_list= []

for result in WQREF_results:
    row = {"SAMPLEID":"WQREF"}
    row["SAMPLEID"] = result[0]
    row["WQREF"] = float(result[1])
    WQREF_list.append(row)
WQREF_list        

[{'SAMPLEID': 940, 'WQREF': 2.0},
 {'SAMPLEID': 941, 'WQREF': 1.0},
 {'SAMPLEID': 943, 'WQREF': 1.0},
 {'SAMPLEID': 944, 'WQREF': 1.0},
 {'SAMPLEID': 945, 'WQREF': 1.0},
 {'SAMPLEID': 946, 'WQREF': 3.0},
 {'SAMPLEID': 947, 'WQREF': 6.0},
 {'SAMPLEID': 948, 'WQREF': 0.0},
 {'SAMPLEID': 949, 'WQREF': 3.0},
 {'SAMPLEID': 950, 'WQREF': 5.0},
 {'SAMPLEID': 952, 'WQREF': 7.0},
 {'SAMPLEID': 953, 'WQREF': 2.0},
 {'SAMPLEID': 954, 'WQREF': 7.0},
 {'SAMPLEID': 955, 'WQREF': 7.0},
 {'SAMPLEID': 956, 'WQREF': 7.0},
 {'SAMPLEID': 958, 'WQREF': 5.0},
 {'SAMPLEID': 959, 'WQREF': 5.0},
 {'SAMPLEID': 960, 'WQREF': 7.0},
 {'SAMPLEID': 961, 'WQREF': 4.0},
 {'SAMPLEID': 962, 'WQREF': 1.0},
 {'SAMPLEID': 963, 'WQREF': 3.5},
 {'SAMPLEID': 964, 'WQREF': 7.0},
 {'SAMPLEID': 966, 'WQREF': 0.0},
 {'SAMPLEID': 967, 'WQREF': 1.0},
 {'SAMPLEID': 968, 'WQREF': 6.0},
 {'SAMPLEID': 969, 'WQREF': 7.0},
 {'SAMPLEID': 970, 'WQREF': 0.0},
 {'SAMPLEID': 971, 'WQREF': 1.0},
 {'SAMPLEID': 972, 'WQREF': 7.0},
 {'SAMPLEID': 

In [140]:
  
df_data = pd.read_csv("belly_button_biodiversity_samples.csv"  , encoding="iso-8859-1", low_memory=False)

In [138]:
df_data.head()

Unnamed: 0,otu_id,BB_940,BB_941,BB_943,BB_944,BB_945,BB_946,BB_947,BB_948,BB_949,...,BB_1562,BB_1563,BB_1564,BB_1572,BB_1573,BB_1574,BB_1576,BB_1577,BB_1581,BB_1601
0,1,0.0,0,0,0,0,0,0,0.0,0,...,0,0,0,0,0,0,0,0,0,0
1,2,0.0,0,0,0,0,0,0,0.0,0,...,0,0,0,0,0,0,0,0,0,0
2,3,0.0,0,0,0,0,0,0,0.0,0,...,0,0,0,0,0,0,0,0,0,0
3,4,0.0,0,0,0,0,0,0,0.0,0,...,0,0,0,0,0,0,0,0,0,0
4,5,0.0,0,0,0,0,0,0,0.0,0,...,0,0,0,0,0,0,0,0,0,0


In [155]:
col_list= list(df_data)
col_list.remove('otu_id')
col_list

df_data['eachID_total_sample_value'] = df_data[col_list].sum(axis=1)
df_data.head()



Unnamed: 0,otu_id,BB_940,BB_941,BB_943,BB_944,BB_945,BB_946,BB_947,BB_948,BB_949,...,BB_1572,BB_1573,BB_1574,BB_1576,BB_1577,BB_1581,BB_1601,sample_value,total_sample_value,eachID_total_sample_value
1794,1795,10.0,40,2,11,141,2,102,8.0,3,...,26,3,14,1,130,176,97,36192.0,54288.0,108576.0
921,922,1.0,27,1,278,129,1,45,185.0,1,...,0,92,13,0,152,0,10,20156.0,30234.0,60468.0
943,944,19.0,178,0,8,274,7,135,9.0,4,...,13,0,15,0,3,1,25,11752.0,17628.0,35256.0
2418,2419,13.0,162,0,0,110,36,412,55.0,8,...,2,5,16,0,0,0,22,8590.0,12885.0,25770.0
1166,1167,163.0,24,0,0,32,217,27,18.0,0,...,93,0,14,0,0,0,73,8488.0,12732.0,25464.0


In [156]:
df_data = df_data.sort_values('eachID_total_sample_value', ascending=False)
df_data.head()

Unnamed: 0,otu_id,BB_940,BB_941,BB_943,BB_944,BB_945,BB_946,BB_947,BB_948,BB_949,...,BB_1572,BB_1573,BB_1574,BB_1576,BB_1577,BB_1581,BB_1601,sample_value,total_sample_value,eachID_total_sample_value
1794,1795,10.0,40,2,11,141,2,102,8.0,3,...,26,3,14,1,130,176,97,36192.0,54288.0,108576.0
921,922,1.0,27,1,278,129,1,45,185.0,1,...,0,92,13,0,152,0,10,20156.0,30234.0,60468.0
943,944,19.0,178,0,8,274,7,135,9.0,4,...,13,0,15,0,3,1,25,11752.0,17628.0,35256.0
2418,2419,13.0,162,0,0,110,36,412,55.0,8,...,2,5,16,0,0,0,22,8590.0,12885.0,25770.0
1166,1167,163.0,24,0,0,32,217,27,18.0,0,...,93,0,14,0,0,0,73,8488.0,12732.0,25464.0


In [157]:
sample_value_list=[]
for sample in sampleId_result:
    sample_value_dict={}
    sample_df = df_data.sort_values(sample, ascending=False)
    otu_id= sample_df["otu_id"].tolist()
    sample_value= sample_df[sample].tolist()
        
    sample_value_dict= {"otu_ids": otu_id, "sample_values": sample_value}
    sample_value_list.append(sample_value_dict)
sample_value_list[0]


{'otu_ids': [1167,
  2859,
  482,
  2264,
  41,
  1189,
  352,
  189,
  2318,
  1977,
  3450,
  874,
  1959,
  2191,
  1950,
  2077,
  2275,
  2184,
  944,
  2244,
  2811,
  2024,
  2419,
  2782,
  165,
  2247,
  2011,
  2396,
  830,
  1795,
  2964,
  2722,
  307,
  2908,
  2178,
  1193,
  2039,
  2167,
  1208,
  1274,
  2739,
  2737,
  2186,
  2335,
  907,
  1962,
  1314,
  833,
  2936,
  2483,
  513,
  2188,
  1232,
  2110,
  2065,
  2291,
  1498,
  1503,
  2342,
  2491,
  2546,
  170,
  1505,
  159,
  121,
  725,
  2350,
  259,
  357,
  2235,
  340,
  1960,
  258,
  1968,
  412,
  1169,
  2475,
  2571,
  342,
  1497,
  1947,
  866,
  2542,
  386,
  1179,
  1174,
  328,
  42,
  39,
  564,
  2229,
  1984,
  2136,
  373,
  2473,
  794,
  2795,
  24,
  226,
  22,
  593,
  19,
  361,
  2423,
  2165,
  2068,
  1576,
  821,
  2829,
  414,
  2334,
  407,
  1159,
  2873,
  3439,
  154,
  122,
  3427,
  185,
  2750,
  359,
  246,
  81,
  198,
  922,
  381,
  881,
  2968,
  2549,
  2837,
  11,