In [1]:
import warnings   
# Install a blanket "ignore" filter so no warnings are shown from here on.
warnings.simplefilter("ignore") 
import matplotlib as mpl
import matplotlib.pyplot as plt
import pylab
%matplotlib notebook

import calour as cl
import numpy as np
import pandas as pd

from scipy.stats import sem
import pickle
# 40 equals the stdlib logging.ERROR level; presumably this restricts calour's
# log output to errors and above -- TODO confirm against the calour docs.
cl.set_log_level(40) 

## DME

In [2]:
# Load the seven DME series used by the DME figure: x-values (ss_*), three
# y-series (otu_*) and their three error-bar series (err_*).
# NOTE: pickle.load can run arbitrary code -- only open trusted result files.
with open('../results_all/dme_subsample.pkl', 'rb') as pkl_file:
    (
        ss_dme,
        otu_ds_dme, otu_bh_dme, otu_fbh_dme,
        err_ds_dme, err_bh_dme, err_fbh_dme,
    ) = pickle.load(pkl_file)

In [3]:
# DME figure: one error-bar curve per method (DS, FBH, BH) against the
# subsample size, saved as a PDF.
ds_dme = plt.figure(figsize=(7, 5))
ax_dme = ds_dme.gca()  # draw on this figure's own axes, not pyplot's "current" one

ax_dme.errorbar(ss_dme, otu_ds_dme, yerr=err_ds_dme, color='red', label='DS')
ax_dme.errorbar(ss_dme, otu_fbh_dme, yerr=err_fbh_dme, color='orange', label='FBH')
ax_dme.errorbar(ss_dme, otu_bh_dme, yerr=err_bh_dme, color='blue', label='BH')
ax_dme.legend(loc='center left', frameon=False)

ax_dme.set_xlabel('Sub sample size', fontsize=20)
ax_dme.set_ylabel('Bacterial taxa detected', fontsize=20)

# Dashed green horizontal line at the maximum of the BH curve, from x=7.1 to x=16.
# Style is given by keywords only: the former 'k-' format string (black, solid)
# contradicted both linestyle='--' and color='green'.
bh_peak_dme = np.max(otu_bh_dme)
ax_dme.plot([7.1, 16], [bh_peak_dme, bh_peak_dme], lw=2, linestyle='--', color='green')

ax_dme.set_xticks(np.arange(2, 18, 2))
# tick_params documents labeltop/labelright as booleans. The legacy string 'off'
# is a non-empty (truthy) value that newer Matplotlib releases no longer
# translate to False, so pass real booleans to keep these labels hidden.
ax_dme.tick_params(labeltop=False, labelright=False, labelsize=15)

ds_dme.tight_layout()
ds_dme.savefig('../figures/ds_dme.pdf', dpi=300)

<IPython.core.display.Javascript object>

In [18]:
# statistics
# Maximum of the BH curve, followed by the relative change (in percent) of the
# hard-coded sample count 7 versus 16 (BH) and 9 (FBH).
# The three counts are literals -- presumably read off the DME figure; confirm.
peak_bh_dme = np.max(otu_bh_dme)
n_ds_dme, n_bh_dme, n_fbh_dme = 7, 16, 9

print('significant taxa: %s' % peak_bh_dme)
print('samples compared to BH: %s' % ((n_ds_dme - n_bh_dme) / n_bh_dme * 100))
print('samples compared to FBH: %s' % ((n_ds_dme - n_fbh_dme) / n_fbh_dme * 100))

significant taxa: 72.48
samples compared to BH: -56.25
samples compared to FBH: -22.22222222222222


## UKT

In [4]:
# Load the seven UKT series used by the UKT figure: x-values (ss_*), three
# y-series (otu_*) and their three error-bar series (err_*).
# NOTE: pickle.load can run arbitrary code -- only open trusted result files.
with open('../results_all/ukt_subsample_B700.pkl', 'rb') as pkl_file:
    (
        ss_ukt,
        otu_ds_ukt, otu_bh_ukt, otu_fbh_ukt,
        err_ds_ukt, err_bh_ukt, err_fbh_ukt,
    ) = pickle.load(pkl_file)

In [5]:
# Largest error-bar value of the UKT DS series.
max_err_ds_ukt = max(err_ds_ukt)
print(max_err_ds_ukt)

4.41995340172


In [6]:
# UKT figure: one error-bar curve per method (DS, FBH, BH) against the
# subsample size, saved as a PDF.
ds_ukt = plt.figure(figsize=(7, 5))
ax_ukt = ds_ukt.gca()  # draw on this figure's own axes, not pyplot's "current" one

ax_ukt.errorbar(ss_ukt, otu_ds_ukt, yerr=err_ds_ukt, color='red', label='DS')
# Fix: the FBH curve previously reused the BH error bars (yerr=err_bh_ukt).
ax_ukt.errorbar(ss_ukt, otu_fbh_ukt, yerr=err_fbh_ukt, color='orange', label='FBH')
ax_ukt.errorbar(ss_ukt, otu_bh_ukt, yerr=err_bh_ukt, color='blue', label='BH')

ax_ukt.set_xlabel('Sub sample size', fontsize=20)
ax_ukt.set_ylabel('Bacterial taxa detected', fontsize=20)

# Dashed green horizontal line at the maximum of the BH curve, from x=83 to x=100.
# Style is given by keywords only: the former 'k-' format string (black, solid)
# contradicted both linestyle='--' and color='green'.
bh_peak_ukt = np.max(otu_bh_ukt)
ax_ukt.plot([83, 100], [bh_peak_ukt, bh_peak_ukt], lw=2, linestyle='--', color='green')

ax_ukt.set_xticks(np.arange(10, 110, 20))
# tick_params documents labeltop/labelright as booleans. The legacy string 'off'
# is a non-empty (truthy) value that newer Matplotlib releases no longer
# translate to False, so pass real booleans to keep these labels hidden.
ax_ukt.tick_params(labeltop=False, labelright=False, labelsize=15)

ds_ukt.tight_layout()
ds_ukt.savefig('../figures/ds_ukt.pdf', dpi=300)

<IPython.core.display.Javascript object>

In [19]:
# statistics
# Maximum of the BH curve, followed by the relative change (in percent) of the
# hard-coded sample count 83 versus 100 (BH) and 93 (FBH).
# The three counts are literals -- presumably read off the UKT figure; confirm.
peak_bh_ukt = np.max(otu_bh_ukt)
n_ds_ukt, n_bh_ukt, n_fbh_ukt = 83, 100, 93

print('significant taxa: %s' % peak_bh_ukt)
print('samples compared to BH: %s' % ((n_ds_ukt - n_bh_ukt) / n_bh_ukt * 100))
print('samples compared to FBH: %s' % ((n_ds_ukt - n_fbh_ukt) / n_fbh_ukt * 100))

significant taxa: 61.44
samples compared to BH: -17.0
samples compared to FBH: -10.75268817204301


## DIBD

In [7]:
# Load the seven DIBD series used by the DIBD figure: x-values (ss_*), three
# y-series (otu_*) and their three error-bar series (err_*).
# NOTE: pickle.load can run arbitrary code -- only open trusted result files.
with open('../results_all/dibd_subsample.pkl', 'rb') as pkl_file:
    (
        ss_dibd,
        otu_ds_dibd, otu_bh_dibd, otu_fbh_dibd,
        err_ds_dibd, err_bh_dibd, err_fbh_dibd,
    ) = pickle.load(pkl_file)

In [8]:
# Largest error-bar value of the DIBD DS series.
max_err_ds_dibd = max(err_ds_dibd)
print(max_err_ds_dibd)

1.43375610396


In [9]:
# DIBD figure: one error-bar curve per method (DS, FBH, BH) against the
# subsample size, saved as a PDF.
ds_dibd = plt.figure(figsize=(7, 5))
ax_dibd = ds_dibd.gca()  # draw on this figure's own axes, not pyplot's "current" one

ax_dibd.errorbar(ss_dibd, otu_ds_dibd, yerr=err_ds_dibd, color='red', label='DS')
ax_dibd.errorbar(ss_dibd, otu_fbh_dibd, yerr=err_fbh_dibd, color='orange', label='FBH')
ax_dibd.errorbar(ss_dibd, otu_bh_dibd, yerr=err_bh_dibd, color='blue', label='BH')

ax_dibd.set_xlabel('Sub sample size', fontsize=20)
ax_dibd.set_ylabel('Bacterial taxa detected', fontsize=20)

# Dashed green horizontal line at the maximum of the BH curve, from x=42 to x=65.
# Style is given by keywords only: the former 'k-' format string (black, solid)
# contradicted both linestyle='--' and color='green'.
bh_peak_dibd = np.max(otu_bh_dibd)
ax_dibd.plot([42, 65], [bh_peak_dibd, bh_peak_dibd], lw=2, linestyle='--', color='green')

ax_dibd.set_xticks(np.arange(0, 70, 10))
# tick_params documents labeltop/labelright as booleans. The legacy string 'off'
# is a non-empty (truthy) value that newer Matplotlib releases no longer
# translate to False, so pass real booleans to keep these labels hidden.
ax_dibd.tick_params(labeltop=False, labelright=False, labelsize=15)

ds_dibd.tight_layout()
ds_dibd.savefig('../figures/ds_dibd.pdf', dpi=300)

<IPython.core.display.Javascript object>

In [20]:
# statistics
# Maximum of the BH curve, followed by the relative change (in percent) of the
# hard-coded sample count 42 versus 65 (BH) and 45 (FBH).
# The three counts are literals -- presumably read off the DIBD figure; confirm.
peak_bh_dibd = np.max(otu_bh_dibd)
n_ds_dibd, n_bh_dibd, n_fbh_dibd = 42, 65, 45

print('significant taxa: %s' % peak_bh_dibd)
print('samples compared to BH: %s' % ((n_ds_dibd - n_bh_dibd) / n_bh_dibd * 100))
print('samples compared to FBH: %s' % ((n_ds_dibd - n_fbh_dibd) / n_fbh_dibd * 100))

significant taxa: 86.08
samples compared to BH: -35.38461538461539
samples compared to FBH: -6.666666666666667


## GCD

In [10]:
# Load the seven GCD series used by the GCD figure: x-values (ss_*), three
# y-series (otu_*) and their three error-bar series (err_*).
# NOTE: pickle.load can run arbitrary code -- only open trusted result files.
with open('../results_all/gcd_subsample.pkl', 'rb') as pkl_file:
    (
        ss_gcd,
        otu_ds_gcd, otu_bh_gcd, otu_fbh_gcd,
        err_ds_gcd, err_bh_gcd, err_fbh_gcd,
    ) = pickle.load(pkl_file)

In [11]:
# GCD figure: one error-bar curve per method (DS, FBH, BH) against the
# subsample size, saved as a PDF.
ds_gcd = plt.figure(figsize=(7, 5))
ax_gcd = ds_gcd.gca()  # draw on this figure's own axes, not pyplot's "current" one

ax_gcd.errorbar(ss_gcd, otu_ds_gcd, yerr=err_ds_gcd, color='red', label='DS')
ax_gcd.errorbar(ss_gcd, otu_fbh_gcd, yerr=err_fbh_gcd, color='orange', label='FBH')
ax_gcd.errorbar(ss_gcd, otu_bh_gcd, yerr=err_bh_gcd, color='blue', label='BH')
ax_gcd.legend(loc='lower right', frameon=False)

ax_gcd.set_xlabel('Sub sample size', fontsize=20)
ax_gcd.set_ylabel('Bacterial taxa detected', fontsize=20)

# Dashed green horizontal line at the maximum of the BH curve, from x=265 to x=320.
# Style is given by keywords only: the former 'k-' format string (black, solid)
# contradicted both linestyle='--' and color='green'.
bh_peak_gcd = np.max(otu_bh_gcd)
ax_gcd.plot([265, 320], [bh_peak_gcd, bh_peak_gcd], lw=2, linestyle='--', color='green')

ax_gcd.set_xticks(np.arange(20, 340, 40))
# tick_params documents labeltop/labelright as booleans. The legacy string 'off'
# is a non-empty (truthy) value that newer Matplotlib releases no longer
# translate to False, so pass real booleans to keep these labels hidden.
ax_gcd.tick_params(labeltop=False, labelright=False, labelsize=15)

ds_gcd.tight_layout()
ds_gcd.savefig('../figures/ds_gcd.pdf', dpi=300)

<IPython.core.display.Javascript object>

In [21]:
# statistics
# Maximum of the BH curve, followed by the relative change (in percent) of the
# hard-coded sample count 270 versus 320 (BH) and 280 (FBH).
# NOTE(review): the reference line in the GCD figure cell starts at x=265,
# whereas 270 is used here -- confirm which value is intended.
peak_bh_gcd = np.max(otu_bh_gcd)
n_ds_gcd, n_bh_gcd, n_fbh_gcd = 270, 320, 280

print('significant taxa: %s' % peak_bh_gcd)
print('samples compared to BH: %s' % ((n_ds_gcd - n_bh_gcd) / n_bh_gcd * 100))
print('samples compared to FBH: %s' % ((n_ds_gcd - n_fbh_gcd) / n_fbh_gcd * 100))

significant taxa: 716.85
samples compared to BH: -15.625
samples compared to FBH: -3.571428571428571


## American Gut

## Antibiotic history

In [12]:
# Load the seven AGA series used by the AGA figure: x-values (ss_*), three
# y-series (otu_*) and their three error-bar series (err_*).
# NOTE: pickle.load can run arbitrary code -- only open trusted result files.
with open('../results_all/aga_subsample.pkl', 'rb') as pkl_file:
    (
        ss_aga,
        otu_ds_aga, otu_bh_aga, otu_fbh_aga,
        err_ds_aga, err_bh_aga, err_fbh_aga,
    ) = pickle.load(pkl_file)

In [13]:
# AGA figure: one error-bar curve per method (DS, FBH, BH) against the
# subsample size, saved as a PDF.
ds_aga = plt.figure(figsize=(7, 5))
ax_aga = ds_aga.gca()  # draw on this figure's own axes, not pyplot's "current" one

ax_aga.errorbar(ss_aga, otu_ds_aga, yerr=err_ds_aga, color='red', label='DS')
ax_aga.errorbar(ss_aga, otu_fbh_aga, yerr=err_fbh_aga, color='orange', label='FBH')
ax_aga.errorbar(ss_aga, otu_bh_aga, yerr=err_bh_aga, color='blue', label='BH')

ax_aga.set_xlabel('Sub sample size', fontsize=20)
ax_aga.set_ylabel('Bacterial taxa detected', fontsize=20)

# Dashed green horizontal line at the maximum of the BH curve, from x=58 to x=120.
# Style is given by keywords only: the former 'k-' format string (black, solid)
# contradicted both linestyle='--' and color='green'.
bh_peak_aga = np.max(otu_bh_aga)
ax_aga.plot([58, 120], [bh_peak_aga, bh_peak_aga], lw=2, linestyle='--', color='green')

ax_aga.set_xticks(np.arange(20, 140, 20))
# tick_params documents labeltop/labelright as booleans. The legacy string 'off'
# is a non-empty (truthy) value that newer Matplotlib releases no longer
# translate to False, so pass real booleans to keep these labels hidden.
ax_aga.tick_params(labeltop=False, labelright=False, labelsize=15)

ds_aga.tight_layout()
# Fix: this previously called ds_ukt.savefig(...), which wrote the UKT figure
# to the AGA file name instead of the figure built in this cell.
ds_aga.savefig('../figures/ds_aga.pdf', dpi=300)

<IPython.core.display.Javascript object>

In [22]:
# statistics
# Maximum of the BH curve, followed by the relative change (in percent) of the
# hard-coded sample count 58 versus 120 (BH) and 60 (FBH).
# The three counts are literals -- presumably read off the AGA figure; confirm.
peak_bh_aga = np.max(otu_bh_aga)
n_ds_aga, n_bh_aga, n_fbh_aga = 58, 120, 60

print('significant taxa: %s' % peak_bh_aga)
print('samples compared to BH: %s' % ((n_ds_aga - n_bh_aga) / n_bh_aga * 100))
print('samples compared to FBH: %s' % ((n_ds_aga - n_fbh_aga) / n_fbh_aga * 100))

significant taxa: 215.17
samples compared to BH: -51.66666666666667
samples compared to FBH: -3.3333333333333335


## Plant numbers

In [14]:
# Load the seven AGP series used by the AGP figure: x-values (ss_*), three
# y-series (otu_*) and their three error-bar series (err_*).
# NOTE: pickle.load can run arbitrary code -- only open trusted result files.
with open('../results_all/agp_subsample_v2.pkl', 'rb') as pkl_file:
    (
        ss_agp,
        otu_ds_agp, otu_bh_agp, otu_fbh_agp,
        err_ds_agp, err_bh_agp, err_fbh_agp,
    ) = pickle.load(pkl_file)

In [15]:
# AGP figure: one error-bar curve per method (DS, FBH, BH) against the
# subsample size, saved as a PDF.
ds_agp = plt.figure(figsize=(7, 5))
ax_agp = ds_agp.gca()  # draw on this figure's own axes, not pyplot's "current" one

ax_agp.errorbar(ss_agp, otu_ds_agp, yerr=err_ds_agp, color='red', label='DS')
ax_agp.errorbar(ss_agp, otu_fbh_agp, yerr=err_fbh_agp, color='orange', label='FBH')
ax_agp.errorbar(ss_agp, otu_bh_agp, yerr=err_bh_agp, color='blue', label='BH')

ax_agp.set_xlabel('Sub sample size', fontsize=20)
ax_agp.set_ylabel('Bacterial taxa detected', fontsize=20)

# Dashed green horizontal line at the maximum of the BH curve, from x=80 to x=200.
# Style is given by keywords only: the former 'k-' format string (black, solid)
# contradicted both linestyle='--' and color='green'.
bh_peak_agp = np.max(otu_bh_agp)
ax_agp.plot([80, 200], [bh_peak_agp, bh_peak_agp], lw=2, linestyle='--', color='green')

ax_agp.set_xticks(np.arange(40, 220, 40))
# tick_params documents labeltop/labelright as booleans. The legacy string 'off'
# is a non-empty (truthy) value that newer Matplotlib releases no longer
# translate to False, so pass real booleans to keep these labels hidden.
ax_agp.tick_params(labeltop=False, labelright=False, labelsize=15)

ds_agp.tight_layout()
ds_agp.savefig('../figures/ds_agp.pdf', dpi=300)

<IPython.core.display.Javascript object>

In [23]:
# statistics
# Maximum of the BH curve, followed by the relative change (in percent) of the
# hard-coded sample count 80 versus 200 (BH) and 90 (FBH).
# The three counts are literals -- presumably read off the AGP figure; confirm.
peak_bh_agp = np.max(otu_bh_agp)
n_ds_agp, n_bh_agp, n_fbh_agp = 80, 200, 90

print('significant taxa: %s' % peak_bh_agp)
print('samples compared to BH: %s' % ((n_ds_agp - n_bh_agp) / n_bh_agp * 100))
print('samples compared to FBH: %s' % ((n_ds_agp - n_fbh_agp) / n_fbh_agp * 100))

significant taxa: 102.12
samples compared to BH: -60.0
samples compared to FBH: -11.11111111111111
