# Qiime2 Pipeline (Version 2018.2)

## Import Sequences and create quality-score plot visualizations

In [None]:
# For every dataset: import the per-sample FASTQ files as a QIIME 2 artifact (.qza),
# then build the interactive quality-score summary (.qzv) used to pick DADA2 trim/truncate settings.

# Song (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path SongBact-seqs/ \
  --output-path SongBact.qza

!qiime demux summarize \
  --i-data SongBact.qza \
  --o-visualization SongBact.qzv


# Yao (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path YaoBact-seqs/ \
  --output-path yaobact.qza

!qiime demux summarize \
  --i-data yaobact.qza \
  --o-visualization yaobact.qzv


# Dai2017 (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path Dai2017-seqs/ \
  --output-path Dai2017.qza

!qiime demux summarize \
  --i-data Dai2017.qza \
  --o-visualization Dai2017.qzv


# Imparato (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path imparato-seqs/ \
  --output-path imparato.qza

!qiime demux summarize \
  --i-data imparato.qza \
  --o-visualization imparato.qzv


# Dai2016 (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path Dai2016-seqs/ \
  --output-path Dai2016.qza

!qiime demux summarize \
  --i-data Dai2016.qza \
  --o-visualization Dai2016.qzv


# Wu (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path wu-seqs/ \
  --output-path wu.qza

!qiime demux summarize \
  --i-data wu.qza \
  --o-visualization wu.qzv


# Whitman (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path whitman-seqs/ \
  --output-path whitman.qza

!qiime demux summarize \
  --i-data whitman.qza \
  --o-visualization whitman.qzv


# Ye (paired-end)
!qiime tools import \
  --type 'SampleData[PairedEndSequencesWithQuality]' \
  --source-format CasavaOneEightSingleLanePerSampleDirFmt \
  --input-path Ye-seqs/ \
  --output-path Ye.qza

!qiime demux summarize \
  --i-data Ye.qza \
  --o-visualization Ye.qzv


# Nielsen: the only single-end dataset; imported from a manifest file instead of a Casava directory
!qiime tools import \
  --type 'SampleData[SequencesWithQuality]' \
  --source-format SingleEndFastqManifestPhred33 \
  --input-path Nielsen2014-manifest.csv \
  --output-path Nielsen2014-demux.qza

!qiime demux summarize \
  --i-data Nielsen2014-demux.qza \
  --o-visualization Nielsen2014.qzv

## View visualizations

In [None]:
# View the quality-score visualizations one at a time:
# keep exactly one `qiime tools view` line uncommented per run of this cell,
# then comment it out again and uncomment the next dataset.

!qiime tools view SongBact.qzv

#!qiime tools view yaobact.qzv

#!qiime tools view Dai2017.qzv

#!qiime tools view imparato.qzv

#!qiime tools view Dai2016.qzv

#!qiime tools view wu.qzv

#!qiime tools view whitman.qzv

#!qiime tools view Ye.qzv

#!qiime tools view Nielsen2014.qzv

## Quality control using DADA2 and generate OTU table
#### Each dataset went through trimming and truncating optimization to allow for best sequence retention
#### Noisy sequences were trimmed off the beginning of the reads, and most datasets were truncated where sequences consistently dropped below a quality score of 35; Whitman and Ye were exceptions.

In [None]:
# Song: DADA2 denoising of the paired-end reads.
# trim-left-* removes noisy bases from the start of the forward/reverse reads;
# trunc-len-* truncates each read where quality drops off.
# NOTE(review): --p-n-threads 0 is only set for this dataset; presumably "use all available cores" -- confirm against the q2-dada2 docs.
!qiime dada2 denoise-paired --verbose \
  --i-demultiplexed-seqs SongBact.qza \
  --o-table Song-bact-table \
  --o-representative-sequences song-bact-rep-seqs \
  --p-n-threads 0 \
  --p-trim-left-f 25 \
  --p-trim-left-r 26 \
  --p-trunc-len-f 297 \
  --p-trunc-len-r 210

# Create visualizations for the OTU table and the representative sequences
!qiime feature-table summarize \
  --i-table Song-bact-table.qza \
  --o-visualization Song-bact-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data song-bact-rep-seqs.qza \
  --o-visualization song-bact-rep-seqs.qzv

# View both visualizations.
# The rep-seqs file name must match the tabulate-seqs output above (song-bact-rep-seqs.qzv).
!qiime tools view Song-bact-table.qzv
!qiime tools view song-bact-rep-seqs.qzv

In [None]:
# Yao: DADA2 denoising of the paired-end reads (trim the read starts, truncate the low-quality tails)
!qiime dada2 denoise-paired \
  --i-demultiplexed-seqs yaobact.qza \
  --p-trim-left-f 22 \
  --p-trim-left-r 26 \
  --p-trunc-len-f 268 \
  --p-trunc-len-r 204 \
  --o-table yaobact-table \
  --o-representative-sequences yaobact-rep-seqs \
  --verbose

# Summarize the resulting OTU table and tabulate the representative sequences
!qiime feature-table summarize \
  --i-table yaobact-table.qza \
  --o-visualization yaobact-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data yaobact-rep-seqs.qza \
  --o-visualization yaobact-rep-seqs.qzv

# Open both visualizations
!qiime tools view yaobact-table.qzv
!qiime tools view yaobact-rep-seqs.qzv

In [None]:
# Dai2017: DADA2 denoising of the paired-end reads.
# The input must be spelled exactly as the import step wrote it (Dai2017.qza, capital D);
# a lower-case name fails on case-sensitive filesystems.
!qiime dada2 denoise-paired --verbose \
  --i-demultiplexed-seqs Dai2017.qza \
  --o-table dai2017-table \
  --o-representative-sequences dai2017-rep-seqs \
  --p-trim-left-f 25 \
  --p-trim-left-r 26 \
  --p-trunc-len-f 286 \
  --p-trunc-len-r 200

# Create visualizations for the OTU table and the representative sequences
!qiime feature-table summarize \
  --i-table dai2017-table.qza \
  --o-visualization dai2017-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data dai2017-rep-seqs.qza \
  --o-visualization dai2017-rep-seqs.qzv

# View both visualizations
!qiime tools view dai2017-table.qzv
!qiime tools view dai2017-rep-seqs.qzv

In [None]:
# Imparato: DADA2 denoising of the paired-end reads (trim the read starts, truncate the low-quality tails)
!qiime dada2 denoise-paired \
  --i-demultiplexed-seqs imparato.qza \
  --p-trim-left-f 25 \
  --p-trim-left-r 25 \
  --p-trunc-len-f 243 \
  --p-trunc-len-r 228 \
  --o-table imparato-table \
  --o-representative-sequences imparato-rep-seqs \
  --verbose

# Summarize the resulting OTU table and tabulate the representative sequences
!qiime feature-table summarize \
  --i-table imparato-table.qza \
  --o-visualization imparato-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data imparato-rep-seqs.qza \
  --o-visualization imparato-rep-seqs.qzv

# Open both visualizations
!qiime tools view imparato-table.qzv
!qiime tools view imparato-rep-seqs.qzv

In [None]:
# Dai2016: DADA2 denoising of the paired-end reads (trim the read starts, truncate the low-quality tails)
!qiime dada2 denoise-paired \
  --i-demultiplexed-seqs Dai2016.qza \
  --p-trim-left-f 22 \
  --p-trim-left-r 26 \
  --p-trunc-len-f 200 \
  --p-trunc-len-r 210 \
  --o-table Dai2016-table \
  --o-representative-sequences Dai2016-rep-seqs \
  --verbose

# Summarize the resulting OTU table and tabulate the representative sequences
!qiime feature-table summarize \
  --i-table Dai2016-table.qza \
  --o-visualization Dai2016-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data Dai2016-rep-seqs.qza \
  --o-visualization Dai2016-rep-seqs.qzv

# Open both visualizations
!qiime tools view Dai2016-table.qzv
!qiime tools view Dai2016-rep-seqs.qzv

In [None]:
# Wu: DADA2 denoising of the paired-end reads (trim the read starts, truncate the low-quality tails)
!qiime dada2 denoise-paired \
  --i-demultiplexed-seqs wu.qza \
  --p-trim-left-f 26 \
  --p-trim-left-r 26 \
  --p-trunc-len-f 270 \
  --p-trunc-len-r 230 \
  --o-table wu-table \
  --o-representative-sequences wu-rep-seqs \
  --verbose

# Summarize the resulting OTU table and tabulate the representative sequences
!qiime feature-table summarize \
  --i-table wu-table.qza \
  --o-visualization wu-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data wu-rep-seqs.qza \
  --o-visualization wu-rep-seqs.qzv

# Open both visualizations
!qiime tools view wu-table.qzv
!qiime tools view wu-rep-seqs.qzv

In [None]:
# Whitman: DADA2 denoising of the paired-end reads.
# One of the two datasets whose truncation did not follow the "quality score below 35" rule.
!qiime dada2 denoise-paired \
  --i-demultiplexed-seqs whitman.qza \
  --p-trim-left-f 5 \
  --p-trim-left-r 5 \
  --p-trunc-len-f 275 \
  --p-trunc-len-r 200 \
  --o-table whitman-table \
  --o-representative-sequences whitman-rep-seqs \
  --verbose

# Summarize the resulting OTU table and tabulate the representative sequences
!qiime feature-table summarize \
  --i-table whitman-table.qza \
  --o-visualization whitman-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data whitman-rep-seqs.qza \
  --o-visualization whitman-rep-seqs.qzv

# Open both visualizations
!qiime tools view whitman-table.qzv
!qiime tools view whitman-rep-seqs.qzv

In [None]:
# Ye: DADA2 denoising of the paired-end reads; outputs carry a "-v3" suffix.
# One of the two datasets whose truncation did not follow the "quality score below 35" rule.
!qiime dada2 denoise-paired \
  --i-demultiplexed-seqs Ye.qza \
  --p-trim-left-f 6 \
  --p-trim-left-r 6 \
  --p-trunc-len-f 290 \
  --p-trunc-len-r 269 \
  --o-table Ye-table-v3 \
  --o-representative-sequences Ye-rep-seqs-v3 \
  --verbose

# Summarize the resulting OTU table and tabulate the representative sequences
!qiime feature-table summarize \
  --i-table Ye-table-v3.qza \
  --o-visualization Ye-table-v3.qzv

!qiime feature-table tabulate-seqs \
  --i-data Ye-rep-seqs-v3.qza \
  --o-visualization Ye-rep-seqs-v3.qzv

# Open both visualizations
!qiime tools view Ye-table-v3.qzv
!qiime tools view Ye-rep-seqs-v3.qzv

In [None]:
# Nielsen: single-end dataset, so denoise-single is used with one trim/truncate pair
!qiime dada2 denoise-single \
  --i-demultiplexed-seqs Nielsen2014-demux.qza \
  --p-trim-left 9 \
  --p-trunc-len 70 \
  --o-table Nielsen2014-table \
  --o-representative-sequences Nielsen2014-rep-seqs \
  --verbose

# Summarize the resulting OTU table and tabulate the representative sequences
!qiime feature-table summarize \
  --i-table Nielsen2014-table.qza \
  --o-visualization Nielsen2014-table.qzv

!qiime feature-table tabulate-seqs \
  --i-data Nielsen2014-rep-seqs.qza \
  --o-visualization Nielsen2014-rep-seqs.qzv

# Open both visualizations
!qiime tools view Nielsen2014-table.qzv
!qiime tools view Nielsen2014-rep-seqs.qzv

# Taxonomy assignment

Download the Silva_132 zip file ( https://www.arb-silva.de/download/archive/qiime ) and train the classifier on the primers used for each set of samples.

A classifier is trained for each distinct primer combination. Where datasets used modified versions of the same primer pair, the most ambiguous (most degenerate) version is used (e.g. for 515F/907R, the Whitman primer sequences).

Dai2016- 515F GTGCCAGCMGCCGCGGTAA ; 806R GGACTACHVGGGTWTCTAAT  

Dai2017- 338F ACTCCTACGGGAGGCAGCA ; 806R GGACTACHVGGGTWTCTAAT

Song- 338F ACTCCTACGGGAGGCAGCA ; 806R GGACTACHVGGGTWTCTAAT

Wu- 338F ACTCCTACGGGAGGCAGCAG ; 806R GGACTACHVGGGTWTCTAAT 

Imparato- 341F CCTAYGGGRBGCASCAG ; 806R GGACTACNNGGGTATCTAAT 

Whitman- 515F GTGYCAGCMGCMGCGGTRA ; 907R CCGYCCAATTYMTTTRAGTTT

Yao- 515F GTGCCAGCMGCCGCGG ; 907R CCGTCAATTCMTTTRAGTTT

Ye - 27F AGAGTTTGATCMTGGCTCAG ; 519R GWATTACCGCGGCKGCTG

Nielsen - 515F GTGCCAGCMGCCGCGGTAA ; 806R GGACTACHVGGGTWTCTAAT

In [None]:
# Bring the Silva 132 reference into QIIME 2 as two artifacts:
# the 99% reference sequences and the matching taxonomy (majority taxonomy, 7 levels).

# Reference sequences
!qiime tools import \
  --input-path silva132_99.fna \
  --output-path silva132_99.qza \
  --type 'FeatureData[Sequence]'

# Reference taxonomy (headerless TSV)
!qiime tools import \
  --input-path majority_taxonomy_7_levels.txt \
  --output-path ref-taxonomy.qza \
  --type 'FeatureData[Taxonomy]' \
  --source-format HeaderlessTSVTaxonomyFormat

### Train Silva132 classifier to each primer pair

In [None]:
## This step sometimes freezes up, so it is best to run each primer pair one at a time.
# For every primer pair: (1) extract the amplicon region from the Silva 132 reference
# sequences, (2) fit a naive Bayes classifier on the extracted reads and reference taxonomy.

# 515f and 806r
!qiime feature-classifier extract-reads \
  --i-sequences silva132_99.qza \
  --p-f-primer GTGCCAGCMGCCGCGGTAA \
  --p-r-primer GGACTACHVGGGTWTCTAAT \
  --o-reads 515f-806r-ref-seqs.qza

!qiime feature-classifier fit-classifier-naive-bayes --verbose \
  --i-reference-reads 515f-806r-ref-seqs.qza \
  --i-reference-taxonomy ref-taxonomy.qza \
  --o-classifier 515f-806r-classifier.qza

# 338f and 806r
!qiime feature-classifier extract-reads \
  --i-sequences silva132_99.qza \
  --p-f-primer ACTCCTACGGGAGGCAGCA \
  --p-r-primer GGACTACHVGGGTWTCTAAT \
  --o-reads 338f-806r-ref-seqs.qza

!qiime feature-classifier fit-classifier-naive-bayes \
  --i-reference-reads 338f-806r-ref-seqs.qza \
  --i-reference-taxonomy ref-taxonomy.qza \
  --o-classifier 338f-806r-classifier.qza

# 341f and 806r
!qiime feature-classifier extract-reads \
  --i-sequences silva132_99.qza \
  --p-f-primer CCTAYGGGRBGCASCAG \
  --p-r-primer GGACTACNNGGGTATCTAAT \
  --o-reads 341f-806r-ref-seqs.qza

!qiime feature-classifier fit-classifier-naive-bayes \
  --i-reference-reads 341f-806r-ref-seqs.qza \
  --i-reference-taxonomy ref-taxonomy.qza \
  --o-classifier 341f-806r-classifier.qza

# 515f and 907r (Whitman primer sequences, the more ambiguous of the 515f/907r variants)
# The reverse-primer option must be exactly --p-r-primer; stray characters in the flag
# name (especially a backtick, which the shell treats as command substitution) break the command.
!qiime feature-classifier extract-reads \
  --i-sequences silva132_99.qza \
  --p-f-primer GTGYCAGCMGCMGCGGTRA \
  --p-r-primer CCGYCCAATTYMTTTRAGTTT \
  --o-reads 515f-907r-ref-seqs.qza

!qiime feature-classifier fit-classifier-naive-bayes \
  --i-reference-reads 515f-907r-ref-seqs.qza \
  --i-reference-taxonomy ref-taxonomy.qza \
  --o-classifier 515f-907r-classifier.qza

# 27f and 519r
!qiime feature-classifier extract-reads \
  --i-sequences silva132_99.qza \
  --p-f-primer AGAGTTTGATCMTGGCTCAG \
  --p-r-primer GWATTACCGCGGCKGCTG \
  --o-reads 27f-519r-ref-seqs.qza

!qiime feature-classifier fit-classifier-naive-bayes \
  --i-reference-reads 27f-519r-ref-seqs.qza \
  --i-reference-taxonomy ref-taxonomy.qza \
  --o-classifier 27f-519r-classifier.qza

### Classify representative sequences

In [None]:
## Classification can hang as well -- run the datasets below one at a time.
# Each dataset's representative sequences are classified with the classifier
# trained on the primer pair that dataset was amplified with.

# Dai2016 (515f/806r)
!qiime feature-classifier classify-sklearn \
  --i-reads Dai2016-rep-seqs.qza \
  --i-classifier 515f-806r-classifier.qza \
  --o-classification Dai2016-taxonomy.qza

# Dai2017 (338f/806r)
!qiime feature-classifier classify-sklearn \
  --i-reads dai2017-rep-seqs.qza \
  --i-classifier 338f-806r-classifier.qza \
  --o-classification dai2017-taxonomy.qza

# Song (338f/806r)
!qiime feature-classifier classify-sklearn \
  --i-reads song-bact-rep-seqs.qza \
  --i-classifier 338f-806r-classifier.qza \
  --o-classification song-bact-taxonomy.qza

# Wu (338f/806r)
!qiime feature-classifier classify-sklearn \
  --i-reads wu-rep-seqs.qza \
  --i-classifier 338f-806r-classifier.qza \
  --o-classification wu-taxonomy.qza

# Imparato (341f/806r)
!qiime feature-classifier classify-sklearn \
  --i-reads imparato-rep-seqs.qza \
  --i-classifier 341f-806r-classifier.qza \
  --o-classification imparato-taxonomy.qza

# Whitman (515f/907r)
!qiime feature-classifier classify-sklearn \
  --i-reads whitman-rep-seqs.qza \
  --i-classifier 515f-907r-classifier.qza \
  --o-classification whitman-taxonomy.qza

# Yao (515f/907r)
!qiime feature-classifier classify-sklearn \
  --i-reads yaobact-rep-seqs.qza \
  --i-classifier 515f-907r-classifier.qza \
  --o-classification yao-taxonomy.qza

# Ye (27f/519r)
!qiime feature-classifier classify-sklearn \
  --i-reads Ye-rep-seqs-v3.qza \
  --i-classifier 27f-519r-classifier.qza \
  --o-classification ye-taxonomy-v3.qza

# Nielsen (515f/806r)
!qiime feature-classifier classify-sklearn \
  --i-reads Nielsen2014-rep-seqs.qza \
  --i-classifier 515f-806r-classifier.qza \
  --o-classification Nielsen2014-taxonomy.qza

## Export representative sequences, taxonomy, OTU table, and metadata to create a .biom file to use for data analysis

In [None]:
## Dai2016

# Make a new directory to export the files to.
# The name must match the --output-dir used below (capital "D"); a lower-case
# name would create a second, unused directory on case-sensitive filesystems.
!mkdir Dai2016_OTU_table

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export Dai2016-table.qza --output-dir Dai2016_OTU_table
!qiime tools export Dai2016-rep-seqs.qza --output-dir Dai2016_OTU_table
!qiime tools export Dai2016-taxonomy.qza --output-dir Dai2016_OTU_table
!cp dai2016-metadata.txt Dai2016_OTU_table/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
!ls Dai2016_OTU_table/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i Dai2016_OTU_table/feature-table.biom \
  -o Dai2016_OTU_table/feature-table-metaD.biom \
  -m Dai2016_OTU_table/dai2016-metadata.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i Dai2016_OTU_table/feature-table-metaD.biom \
  -o Dai2016_OTU_table/feature-table-metaD-tax.biom \
  --observation-metadata-fp Dai2016_OTU_table/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom
!biom summarize-table \
  -i Dai2016_OTU_table/feature-table-metaD-tax.biom \
  -o Dai2016_OTU_table/feature-table-metaD-tax-summary.txt

!head -20 Dai2016_OTU_table/feature-table-metaD-tax-summary.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i Dai2016_OTU_table/feature-table-metaD-tax.biom \
  -o Dai2016_OTU_table/feature-table-metaD-tax_json.biom \
  --table-type="OTU table" \
  --to-json

In [None]:
## Dai2017

# Make a new directory to export the files to
!mkdir Dai2017_OTU_table

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export dai2017-table.qza --output-dir Dai2017_OTU_table
!qiime tools export dai2017-rep-seqs.qza --output-dir Dai2017_OTU_table
!qiime tools export dai2017-taxonomy.qza --output-dir Dai2017_OTU_table
!cp dai2017-metadata.txt Dai2017_OTU_table/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
# (explicit "!" so the listing does not depend on IPython automagic, matching the other cells)
!ls Dai2017_OTU_table/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i Dai2017_OTU_table/feature-table.biom \
  -o Dai2017_OTU_table/feature-table-metaD.biom \
  -m Dai2017_OTU_table/dai2017-metadata.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i Dai2017_OTU_table/feature-table-metaD.biom \
  -o Dai2017_OTU_table/feature-table-metaD-tax.biom \
  --observation-metadata-fp Dai2017_OTU_table/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom
!biom summarize-table \
  -i Dai2017_OTU_table/feature-table-metaD-tax.biom \
  -o Dai2017_OTU_table/feature-table-metaD-tax-summary.txt

!head -20 Dai2017_OTU_table/feature-table-metaD-tax-summary.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i Dai2017_OTU_table/feature-table-metaD-tax.biom \
  -o Dai2017_OTU_table/feature-table-metaD-tax_json.biom \
  --table-type="OTU table" \
  --to-json

In [None]:
## Song
# Files derived from the song-meta-assume.txt metadata carry an "-assume" suffix.

# Make a new directory to export the files to
!mkdir Song_OTU_table

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export Song-bact-table.qza --output-dir Song_OTU_table
!qiime tools export song-bact-rep-seqs.qza --output-dir Song_OTU_table
!qiime tools export song-bact-taxonomy.qza --output-dir Song_OTU_table

!cp song-meta-assume.txt Song_OTU_table/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
!ls Song_OTU_table/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i Song_OTU_table/feature-table.biom \
  -o Song_OTU_table/feature-table-metaD-assume.biom \
  -m Song_OTU_table/song-meta-assume.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i Song_OTU_table/feature-table-metaD-assume.biom \
  -o Song_OTU_table/feature-table-metaD-tax-assume.biom \
  --observation-metadata-fp Song_OTU_table/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom
!biom summarize-table \
  -i Song_OTU_table/feature-table-metaD-tax-assume.biom \
  -o Song_OTU_table/feature-table-metaD-tax-summary-assume.txt

# Read back the file that summarize-table just wrote (note the "-assume" suffix)
!head -20 Song_OTU_table/feature-table-metaD-tax-summary-assume.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i Song_OTU_table/feature-table-metaD-tax-assume.biom \
  -o Song_OTU_table/feature-table-metaD-tax-assume_json.biom \
  --table-type="OTU table" \
  --to-json

In [None]:
## Wu

# Make a new directory to export the files to
!mkdir Wu_OTU_table

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export wu-table.qza --output-dir Wu_OTU_table
!qiime tools export wu-rep-seqs.qza --output-dir Wu_OTU_table
!qiime tools export wu-taxonomy.qza --output-dir Wu_OTU_table

!cp wu-metadata.txt Wu_OTU_table/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
# (the listing command was missing under this comment; added to match the other datasets)
!ls Wu_OTU_table/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i Wu_OTU_table/feature-table.biom \
  -o Wu_OTU_table/feature-table-metaD.biom \
  -m Wu_OTU_table/wu-metadata.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i Wu_OTU_table/feature-table-metaD.biom \
  -o Wu_OTU_table/feature-table-metaD-tax.biom \
  --observation-metadata-fp Wu_OTU_table/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom
!biom summarize-table \
  -i Wu_OTU_table/feature-table-metaD-tax.biom \
  -o Wu_OTU_table/feature-table-metaD-tax-summary.txt

!head -20 Wu_OTU_table/feature-table-metaD-tax-summary.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i Wu_OTU_table/feature-table-metaD-tax.biom \
  -o Wu_OTU_table/feature-table-metaD-tax_json.biom \
  --table-type="OTU table" \
  --to-json

In [None]:
## Imparato

# Directory that will receive all exported files
!mkdir Imparato_OTU_table

# Export the three artifacts (OTU table, representative sequences, taxonomy) into it,
# then copy the sample metadata (.txt) alongside them
!qiime tools export imparato-table.qza --output-dir Imparato_OTU_table
!qiime tools export imparato-rep-seqs.qza --output-dir Imparato_OTU_table
!qiime tools export imparato-taxonomy.qza --output-dir Imparato_OTU_table
!cp imparato-metadata.txt Imparato_OTU_table/

# List the directory: expect the exported sequences, taxonomy.tsv, feature-table.biom, and the metadata .txt
!ls Imparato_OTU_table/

# Step 1: attach the sample metadata to the exported feature table
!biom add-metadata \
  -m Imparato_OTU_table/imparato-metadata.txt \
  -i Imparato_OTU_table/feature-table.biom \
  -o Imparato_OTU_table/feature-table-metaD.biom

# Step 2: attach the taxonomy as observation metadata
!biom add-metadata \
  --observation-metadata-fp Imparato_OTU_table/taxonomy.tsv \
  --observation-header OTUID,taxonomy \
  --sc-separated taxonomy \
  -i Imparato_OTU_table/feature-table-metaD.biom \
  -o Imparato_OTU_table/feature-table-metaD-tax.biom

# Step 3: sanity check -- summarize the annotated table and look at the top of the summary
!biom summarize-table \
  -i Imparato_OTU_table/feature-table-metaD-tax.biom \
  -o Imparato_OTU_table/feature-table-metaD-tax-summary.txt

!head -20 Imparato_OTU_table/feature-table-metaD-tax-summary.txt

# Step 4: write a JSON-format copy of the .biom for use with the phyloseq package
!biom convert \
  --to-json \
  --table-type="OTU table" \
  -i Imparato_OTU_table/feature-table-metaD-tax.biom \
  -o Imparato_OTU_table/feature-table-metaD-tax_json.biom


In [None]:
## Whitman
# Files derived from the metadata step onward carry an "-ncbiID" suffix.

# Make a new directory to export the files to
!mkdir Whitman_OTU_table

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export whitman-table.qza --output-dir Whitman_OTU_table
!qiime tools export whitman-rep-seqs.qza --output-dir Whitman_OTU_table
!qiime tools export whitman-taxonomy.qza --output-dir Whitman_OTU_table

!cp whitman-metadata.txt Whitman_OTU_table/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
!ls Whitman_OTU_table/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i Whitman_OTU_table/feature-table.biom \
  -o Whitman_OTU_table/feature-table-metaD-ncbiID.biom \
  -m Whitman_OTU_table/whitman-metadata.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i Whitman_OTU_table/feature-table-metaD-ncbiID.biom \
  -o Whitman_OTU_table/feature-table-metaD-tax-ncbiID.biom \
  --observation-metadata-fp Whitman_OTU_table/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom
!biom summarize-table \
  -i Whitman_OTU_table/feature-table-metaD-tax-ncbiID.biom \
  -o Whitman_OTU_table/feature-table-metaD-tax-summary-ncbiID.txt

# Read back the file that summarize-table just wrote (note the "-ncbiID" suffix)
!head -20 Whitman_OTU_table/feature-table-metaD-tax-summary-ncbiID.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i Whitman_OTU_table/feature-table-metaD-tax-ncbiID.biom \
  -o Whitman_OTU_table/feature-table-metaD-tax_json-ncbiID.biom \
  --table-type="OTU table" \
  --to-json

In [None]:
## Yao

# Make a new directory to export the files to
!mkdir YaoBact_OTU_table

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export yaobact-table.qza --output-dir YaoBact_OTU_table
!qiime tools export yaobact-rep-seqs.qza --output-dir YaoBact_OTU_table
!qiime tools export yao-taxonomy.qza --output-dir YaoBact_OTU_table

!cp Yao-metadata.txt YaoBact_OTU_table/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
!ls YaoBact_OTU_table/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i YaoBact_OTU_table/feature-table.biom \
  -o YaoBact_OTU_table/feature-table-metaD.biom \
  -m YaoBact_OTU_table/Yao-metadata.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i YaoBact_OTU_table/feature-table-metaD.biom \
  -o YaoBact_OTU_table/feature-table-metaD-tax.biom \
  --observation-metadata-fp YaoBact_OTU_table/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom.
# Summarize the taxonomy-annotated table (-tax.biom) so the check covers both metadata steps.
!biom summarize-table \
  -i YaoBact_OTU_table/feature-table-metaD-tax.biom \
  -o YaoBact_OTU_table/feature-table-metaD-tax-summary.txt

!head -20 YaoBact_OTU_table/feature-table-metaD-tax-summary.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i YaoBact_OTU_table/feature-table-metaD-tax.biom \
  -o YaoBact_OTU_table/feature-table-metaD-tax_json.biom \
  --table-type="OTU table" \
  --to-json

In [None]:
## Ye

# Make a new directory to export the files to
!mkdir Ye_OTU_table-v3

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export Ye-table-v3.qza --output-dir Ye_OTU_table-v3
!qiime tools export Ye-rep-seqs-v3.qza --output-dir Ye_OTU_table-v3
!qiime tools export ye-taxonomy-v3.qza --output-dir Ye_OTU_table-v3

!cp Ye-metadata.txt Ye_OTU_table-v3/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
!ls Ye_OTU_table-v3/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i Ye_OTU_table-v3/feature-table.biom \
  -o Ye_OTU_table-v3/feature-table-metaD.biom \
  -m Ye_OTU_table-v3/Ye-metadata.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i Ye_OTU_table-v3/feature-table-metaD.biom \
  -o Ye_OTU_table-v3/feature-table-metaD-tax.biom \
  --observation-metadata-fp Ye_OTU_table-v3/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom.
# Summarize the taxonomy-annotated table (-tax.biom) so the check covers both metadata steps.
!biom summarize-table \
  -i Ye_OTU_table-v3/feature-table-metaD-tax.biom \
  -o Ye_OTU_table-v3/feature-table-metaD-tax-summary.txt

!head -20 Ye_OTU_table-v3/feature-table-metaD-tax-summary.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i Ye_OTU_table-v3/feature-table-metaD-tax.biom \
  -o Ye_OTU_table-v3/feature-table-metaD-tax_json.biom \
  --table-type="OTU table" \
  --to-json

In [None]:
## Nielsen

# Make a new directory to export the files to
!mkdir Nielsen2014_OTU_table

# Export OTU table, representative sequences, and taxonomy; copy metadata (.txt)
!qiime tools export Nielsen2014-table.qza --output-dir Nielsen2014_OTU_table
!qiime tools export Nielsen2014-rep-seqs.qza --output-dir Nielsen2014_OTU_table
!qiime tools export Nielsen2014-taxonomy.qza --output-dir Nielsen2014_OTU_table

!cp Nielsen2014-metadata2.txt Nielsen2014_OTU_table/

# Check the files in the directory; should have dna-sequences.fasta, taxonomy.tsv, feature-table.biom, and the metadata .txt
!ls Nielsen2014_OTU_table/

# Add the sample information from the metadata file to feature-table.biom
!biom add-metadata \
  -i Nielsen2014_OTU_table/feature-table.biom \
  -o Nielsen2014_OTU_table/feature-table-metaD.biom \
  -m Nielsen2014_OTU_table/Nielsen2014-metadata2.txt

# Add the taxonomy as observation metadata
!biom add-metadata \
  -i Nielsen2014_OTU_table/feature-table-metaD.biom \
  -o Nielsen2014_OTU_table/feature-table-metaD-tax.biom \
  --observation-metadata-fp Nielsen2014_OTU_table/taxonomy.tsv \
  --sc-separated taxonomy \
  --observation-header OTUID,taxonomy

# Check your work: write a summary text file and view it to make sure the information was saved to the .biom.
# Summarize the taxonomy-annotated table (-tax.biom) so the check covers both metadata steps.
!biom summarize-table \
  -i Nielsen2014_OTU_table/feature-table-metaD-tax.biom \
  -o Nielsen2014_OTU_table/feature-table-metaD-tax-summary.txt

!head -20 Nielsen2014_OTU_table/feature-table-metaD-tax-summary.txt

# Convert the .biom to JSON format to work with the phyloseq package
!biom convert \
  -i Nielsen2014_OTU_table/feature-table-metaD-tax.biom \
  -o Nielsen2014_OTU_table/feature-table-metaD-tax_json.biom \
  --table-type="OTU table" \
  --to-json