### This script:
- performs rarefaction
- calculates alpha diversity for each subject
- calculates the correlation between alpha diversity and time
- creates a rarefied feature table
#### Needs to be run in an environment with QIIME 2 installed

In [2]:
import pandas as pd

In [8]:
# Input files used throughout the notebook: the feature table (TSV) and the
# sample metadata that goes with it.
ftable_file = "550_feces.tsv"
metadata_file = "feces_metadata.tsv"

In [11]:
# Feature table: feces samples only, mislabeled samples already removed.
# pd.read_table parses tab-separated text by default.
df = pd.read_table(ftable_file)
# Sample metadata with the same restriction (feces only, no mislabeled samples).
metadata = pd.read_table(metadata_file)

In [16]:
# Build a QIIME 2 artifact (.qza) from the TSV feature table in two steps:
#   1) TSV  -> BIOM (HDF5) with `biom convert`
#   2) BIOM -> FeatureTable[Frequency] artifact with `qiime tools import`
!biom convert -i 550_feces.tsv -o converted_table.biom --to-hdf5

# The leading `!` is required: without it the kernel parses the command as
# Python and the cell fails with a SyntaxError instead of running QIIME 2.
!qiime tools import \
  --input-path converted_table.biom \
  --type 'FeatureTable[Frequency]' \
  --input-format BIOMV210Format \
  --output-path 550_feces.qza

In [17]:
# Summarize the imported feature table, annotated with the sample metadata
!qiime feature-table summarize \
    --m-sample-metadata-file feces_metadata.tsv \
    --i-table 550_feces.qza \
    --o-visualization summary.qzv

[32mSaved Visualization to: summary.qzv[0m


In [18]:
# Filter the representative sequences against the feces feature table
# (rep_seqs.qza + 550_feces.qza -> feces_res_seqs.qza)
!qiime feature-table filter-seqs \
    --i-table 550_feces.qza \
    --i-data rep_seqs.qza \
    --o-filtered-data feces_res_seqs.qza

[32mSaved FeatureData[Sequence] to: feces_res_seqs.qza[0m


In [19]:
# Output folder for the alignment and tree artifacts.
# -p makes the cell safe to re-run when the folder already exists.
%mkdir -p phylogeny

In [21]:
# Phylogeny: align the filtered representative sequences, mask the alignment,
# and build unrooted and rooted trees (all written under phylogeny/).
# The input is the file written by the filter-seqs cell, which is named
# feces_res_seqs.qza; the previously referenced feces_rep_seqs.qza is not
# produced anywhere in this notebook, so a fresh run could not find it.
!qiime phylogeny align-to-tree-mafft-fasttree \
--i-sequences feces_res_seqs.qza \
--o-alignment phylogeny/aligned-rep-seqs.qza \
--o-masked-alignment phylogeny/masked-aligned-rep-seqs.qza \
--o-tree phylogeny/unrooted-tree.qza \
--o-rooted-tree phylogeny/rooted-tree.qza

[32mSaved FeatureData[AlignedSequence] to: phylogeny/aligned-rep-seqs.qza[0m
[32mSaved FeatureData[AlignedSequence] to: phylogeny/masked-aligned-rep-seqs.qza[0m
[32mSaved Phylogeny[Unrooted] to: phylogeny/unrooted-tree.qza[0m
[32mSaved Phylogeny[Rooted] to: phylogeny/rooted-tree.qza[0m


In [38]:
# Alpha-rarefaction curves, explored between depths 10711 and 41122
!qiime diversity alpha-rarefaction \
    --i-table 550_feces.qza \
    --p-min-depth 10711 \
    --p-max-depth 41122 \
    --m-metadata-file feces_metadata.tsv \
    --o-visualization alpha_rarefaction_curves.qzv

[32mSaved Visualization to: alpha_rarefaction_curves.qzv[0m


In [40]:
# Core diversity metrics for all samples at a sampling depth of 16000.
# Writes the rarefied table, alpha-diversity vectors, distance matrices and
# PCoA results into core-metrics-results/.
!qiime diversity core-metrics-phylogenetic \
    --i-table 550_feces.qza \
    --i-phylogeny phylogeny/rooted-tree.qza \
    --m-metadata-file feces_metadata.tsv \
    --p-sampling-depth 16000 \
    --output-dir core-metrics-results

[32mSaved FeatureTable[Frequency] to: core-metrics-results/rarefied_table.qza[0m
[32mSaved SampleData[AlphaDiversity] to: core-metrics-results/faith_pd_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: core-metrics-results/observed_features_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: core-metrics-results/shannon_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: core-metrics-results/evenness_vector.qza[0m
[32mSaved DistanceMatrix to: core-metrics-results/unweighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: core-metrics-results/weighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: core-metrics-results/jaccard_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: core-metrics-results/bray_curtis_distance_matrix.qza[0m
[32mSaved PCoAResults to: core-metrics-results/unweighted_unifrac_pcoa_results.qza[0m
[32mSaved PCoAResults to: core-metrics-results/weighted_unifrac_pcoa_results.qza[0m
[32mSaved PCoAResults to: core

In [48]:
# Output folder for the group-significance visualizations.
# -p makes the cell safe to re-run when the folder already exists.
%mkdir -p plots

In [49]:
# Faith's PD: alpha-diversity group significance (comparison between the two subjects)
!qiime diversity alpha-group-significance \
    --m-metadata-file feces_metadata.tsv \
    --i-alpha-diversity core-metrics-results/faith_pd_vector.qza \
    --o-visualization plots/faith-pd-group-significance.qzv

[32mSaved Visualization to: plots/faith-pd-group-significance.qzv[0m


In [50]:
# Shannon: alpha-diversity group significance, same comparison as for Faith's PD
!qiime diversity alpha-group-significance \
    --m-metadata-file feces_metadata.tsv \
    --i-alpha-diversity core-metrics-results/shannon_vector.qza \
    --o-visualization plots/shannon-group-significance.qzv

[32mSaved Visualization to: plots/shannon-group-significance.qzv[0m


## Alpha diversity for each subject separately

In [79]:
# Write one single-column ID file per sex (header: sample_name). These files
# are passed to `qiime feature-table filter-samples` to split the table.
for sex in ('female', 'male'):
    ids_to_keep = metadata.loc[metadata['sex'] == sex, 'sample_name']
    ids_to_keep.to_csv(f'{sex}_to_keep.tsv', sep='\t', index=False)

In [81]:
# Keep only the samples listed in female_to_keep.tsv
!qiime feature-table filter-samples \
    --m-metadata-file female_to_keep.tsv \
    --i-table 550_feces.qza \
    --o-filtered-table female_filtered.qza

[32mSaved FeatureTable[Frequency] to: female_filtered.qza[0m


In [82]:
# Keep only the samples listed in male_to_keep.tsv
!qiime feature-table filter-samples \
    --m-metadata-file male_to_keep.tsv \
    --i-table 550_feces.qza \
    --o-filtered-table male_filtered.qza

[32mSaved FeatureTable[Frequency] to: male_filtered.qza[0m


### This cell creates the rarefied table `rarefied_table.qza` for the male subject

In [86]:
# Core metrics - male subject, at a sampling depth of 16000.
# The filter-samples cell writes male_filtered.qza to the working directory,
# so the table is read from there; the male_metrics/male_filtered.qza path used
# before only existed if the file had been moved by hand.
# mkdir -p ensures the parent folder of --output-dir exists on a fresh run.
!mkdir -p male_metrics
!qiime diversity core-metrics-phylogenetic \
  --i-phylogeny phylogeny/rooted-tree.qza \
  --i-table male_filtered.qza \
  --p-sampling-depth 16000 \
  --m-metadata-file feces_metadata.tsv \
  --output-dir male_metrics/core-metrics-results

[32mSaved FeatureTable[Frequency] to: male_metrics/core-metrics-results/rarefied_table.qza[0m
[32mSaved SampleData[AlphaDiversity] to: male_metrics/core-metrics-results/faith_pd_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: male_metrics/core-metrics-results/observed_features_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: male_metrics/core-metrics-results/shannon_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: male_metrics/core-metrics-results/evenness_vector.qza[0m
[32mSaved DistanceMatrix to: male_metrics/core-metrics-results/unweighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: male_metrics/core-metrics-results/weighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: male_metrics/core-metrics-results/jaccard_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: male_metrics/core-metrics-results/bray_curtis_distance_matrix.qza[0m
[32mSaved PCoAResults to: male_metrics/core-metrics-results/unweighted_unifrac_pcoa_res

### This cell creates the rarefied table `rarefied_table.qza` for the female subject

In [87]:
# Core metrics - female subject, at a sampling depth of 16000.
# The filter-samples cell writes female_filtered.qza to the working directory,
# so the table is read from there; the female_metrics/female_filtered.qza path
# used before only existed if the file had been moved by hand.
# mkdir -p ensures the parent folder of --output-dir exists on a fresh run.
!mkdir -p female_metrics
!qiime diversity core-metrics-phylogenetic \
  --i-phylogeny phylogeny/rooted-tree.qza \
  --i-table female_filtered.qza \
  --p-sampling-depth 16000 \
  --m-metadata-file feces_metadata.tsv \
  --output-dir female_metrics/core-metrics-results

[32mSaved FeatureTable[Frequency] to: female_metrics/core-metrics-results/rarefied_table.qza[0m
[32mSaved SampleData[AlphaDiversity] to: female_metrics/core-metrics-results/faith_pd_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: female_metrics/core-metrics-results/observed_features_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: female_metrics/core-metrics-results/shannon_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: female_metrics/core-metrics-results/evenness_vector.qza[0m
[32mSaved DistanceMatrix to: female_metrics/core-metrics-results/unweighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: female_metrics/core-metrics-results/weighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: female_metrics/core-metrics-results/jaccard_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: female_metrics/core-metrics-results/bray_curtis_distance_matrix.qza[0m
[32mSaved PCoAResults to: female_metrics/core-metrics-results/unweigh

In [88]:
# Shannon diversity vs. sample metadata - male subject
!qiime diversity alpha-correlation \
    --m-metadata-file feces_metadata.tsv \
    --i-alpha-diversity male_metrics/core-metrics-results/shannon_vector.qza \
    --o-visualization male_metrics/shannon_cor.qzv

# Shannon diversity vs. sample metadata - female subject
!qiime diversity alpha-correlation \
    --m-metadata-file feces_metadata.tsv \
    --i-alpha-diversity female_metrics/core-metrics-results/shannon_vector.qza \
    --o-visualization female_metrics/shannon_cor.qzv

[32mSaved Visualization to: male_metrics/shannon_cor.qzv[0m


In [None]:
# Observed-features alpha diversity (all samples) vs. sample metadata.
# Fixes: the command needs the `!` shell escape (it is a SyntaxError as plain
# Python), and correlation_analysis/ is not created by any cell shown in this
# notebook, so it is created here before QIIME 2 writes into it.
# NOTE(review): this is the only cell that reads 550_metadata.txt rather than
# feces_metadata.tsv - confirm that this file is the intended one.
!mkdir -p correlation_analysis
!qiime diversity alpha-correlation \
--i-alpha-diversity core-metrics-results/observed_features_vector.qza \
--m-metadata-file 550_metadata.txt \
--o-visualization correlation_analysis/observed_features_corr.qzv

In [89]:
# Faith's PD vs. sample metadata - male subject
!qiime diversity alpha-correlation \
    --m-metadata-file feces_metadata.tsv \
    --i-alpha-diversity male_metrics/core-metrics-results/faith_pd_vector.qza \
    --o-visualization male_metrics/faith_cor.qzv

# Faith's PD vs. sample metadata - female subject
!qiime diversity alpha-correlation \
    --m-metadata-file feces_metadata.tsv \
    --i-alpha-diversity female_metrics/core-metrics-results/faith_pd_vector.qza \
    --o-visualization female_metrics/faith_cor.qzv

[32mSaved Visualization to: male_metrics/faith_cor.qzv[0m
