In [10]:
# importing all required packages & notebook extensions at the start of the notebook
import os
import biom
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import pandas as pd
import qiime2 as q2
from qiime2 import Visualization
%matplotlib inline

In [11]:
# directory paths reused by the cells of this notebook
# (relative paths: they resolve against the kernel's working directory)
raw_data_dir = "../data/raw"
data_dir = "../data/processed"  # metadata tables and core-metrics results are read from / written to here
vis_dir = "../results"

In [25]:
# Load the saved weighted UniFrac Emperor visualization (.qzv); as the last
# expression in the cell it is shown as the cell output.
Visualization.load(f"{data_dir}/core-metrics-results-bt/weighted_unifrac_emperor.qzv")

In [6]:
# Load the saved Bray-Curtis Emperor visualization (.qzv); as the last
# expression in the cell it is shown as the cell output.
Visualization.load(f"{data_dir}/core-metrics-results-bt/bray_curtis_emperor.qzv")

In [33]:
# Write a copy of the metadata in which every missing value is replaced by 0.
# The result, metadata_fillna.tsv, is the metadata file passed to the
# `qiime diversity adonis` and Recovery_Day beta-correlation cells.
# NOTE(review): fillna(0) applies to all columns, so blanks in text columns
# also become 0 - confirm this is intended.
md = pd.read_csv(f"{data_dir}/metadata.tsv", sep='\t').fillna(0)
md.to_csv(f"{data_dir}/metadata_fillna.tsv", sep='\t', index=False)

In [34]:
! qiime diversity adonis \
--i-distance-matrix $data_dir/core-metrics-results-bt/weighted_unifrac_distance_matrix.qza \
--m-metadata-file $data_dir/metadata_fillna.tsv \
--p-formula Cohort_Number*Stool_Consistency*Patient_Sex*Sample_Day*Recovery_Day \
--o-visualization $data_dir/core-metrics-results-bt/weighted_unifrac_adonis.qzv

[32mSaved Visualization to: ../data/processed/core-metrics-results-bt/weighted_unifrac_adonis.qzv[0m
[0m

In [35]:
# Display the adonis result written by the preceding `qiime diversity adonis` cell.
Visualization.load(f"{data_dir}/core-metrics-results-bt/weighted_unifrac_adonis.qzv")

In [13]:
# Add a categorical label column derived from the numeric cohort code and save
# the result as metadata_binned.tsv (used by the beta-group-significance cell).
# Series.map leaves any Cohort_Number value other than 1 or 2 as NaN.
cohort_labels = {1: 'Abduction', 2: 'Recovery'}
metadata = pd.read_csv(f"{data_dir}/metadata.tsv", sep='\t').assign(
    Cohort_Number_Bin=lambda frame: frame['Cohort_Number'].map(cohort_labels)
)
metadata.to_csv(f"{data_dir}/metadata_binned.tsv", sep='\t', index=False)

In [10]:
# Test whether weighted UniFrac distances differ between the groups in the
# Cohort_Number_Bin column of metadata_binned.tsv; --p-pairwise additionally
# requests pairwise group comparisons. The result is saved as a .qzv.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results-bt/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/metadata_binned.tsv \
    --m-metadata-column Cohort_Number_Bin \
    --p-pairwise \
    --o-visualization $data_dir/core-metrics-results-bt/weighted_unifrac-Cohort-number-significance.qzv

[32mSaved Visualization to: ../data/processed/core-metrics-results-bt/weighted_unifrac-Cohort-number-significance.qzv[0m
[0m

In [14]:
# Display the group-significance result for Cohort_Number_Bin.
Visualization.load(f"{data_dir}/core-metrics-results-bt/weighted_unifrac-Cohort-number-significance.qzv")

In [27]:
# Correlate the weighted UniFrac distance matrix with the Cohort_Number column
# of metadata.tsv and save a Mantel scatter plot.
# --p-intersect-ids: keep only the sample IDs shared by the distance matrix and the metadata.
# NOTE: spearman.qza is the --o-metadata-distance-matrix output, i.e. the
# distance matrix derived from the metadata column, not a correlation table.
! qiime diversity beta-correlation \
    --i-distance-matrix $data_dir/core-metrics-results-bt/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/metadata.tsv \
    --m-metadata-column Cohort_Number \
    --p-intersect-ids \
    --o-metadata-distance-matrix $data_dir/core-metrics-results-bt/beta-correlation/spearman.qza \
    --o-mantel-scatter-visualization $data_dir/core-metrics-results-bt/beta-correlation/scatter-plot.qzv

[32mSaved DistanceMatrix to: ../data/processed/core-metrics-results-bt/beta-correlation/spearman.qza[0m
[32mSaved Visualization to: ../data/processed/core-metrics-results-bt/beta-correlation/scatter-plot.qzv[0m
[0m

In [29]:
# Display the Mantel scatter plot for Cohort_Number.
Visualization.load(f"{data_dir}/core-metrics-results-bt/beta-correlation/scatter-plot.qzv")

In [38]:
# Correlate the weighted UniFrac distance matrix with the Sample_Day column
# of metadata.tsv and save a Mantel scatter plot.
# --p-intersect-ids: keep only the sample IDs shared by the distance matrix and the metadata.
# NOTE: spearman-sample-day.qza is the --o-metadata-distance-matrix output,
# i.e. the distance matrix derived from the metadata column.
! qiime diversity beta-correlation \
    --i-distance-matrix $data_dir/core-metrics-results-bt/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/metadata.tsv \
    --m-metadata-column Sample_Day \
    --p-intersect-ids \
    --o-metadata-distance-matrix $data_dir/core-metrics-results-bt/beta-correlation/spearman-sample-day.qza \
    --o-mantel-scatter-visualization $data_dir/core-metrics-results-bt/beta-correlation/scatter-plot-sample-day.qzv

[32mSaved DistanceMatrix to: ../data/processed/core-metrics-results-bt/beta-correlation/spearman-sample-day.qza[0m
[32mSaved Visualization to: ../data/processed/core-metrics-results-bt/beta-correlation/scatter-plot-sample-day.qzv[0m
[0m

In [39]:
# Display the Mantel scatter plot for Sample_Day.
Visualization.load(f"{data_dir}/core-metrics-results-bt/beta-correlation/scatter-plot-sample-day.qzv")

In [41]:
# Correlate the weighted UniFrac distance matrix with the Recovery_Day column
# and save a Mantel scatter plot.
# Unlike the Cohort_Number and Sample_Day runs, this one reads
# metadata_fillna.tsv, so missing Recovery_Day values enter the test as 0.
# --p-intersect-ids: keep only the sample IDs shared by the distance matrix and the metadata.
# NOTE: spearman-recov-day.qza is the --o-metadata-distance-matrix output,
# i.e. the distance matrix derived from the metadata column.
! qiime diversity beta-correlation \
    --i-distance-matrix $data_dir/core-metrics-results-bt/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/metadata_fillna.tsv \
    --m-metadata-column Recovery_Day \
    --p-intersect-ids \
    --o-metadata-distance-matrix $data_dir/core-metrics-results-bt/beta-correlation/spearman-recov-day.qza \
    --o-mantel-scatter-visualization $data_dir/core-metrics-results-bt/beta-correlation/scatter-plot-recov-day.qzv

[32mSaved DistanceMatrix to: ../data/processed/core-metrics-results-bt/beta-correlation/spearman-recov-day.qza[0m
[32mSaved Visualization to: ../data/processed/core-metrics-results-bt/beta-correlation/scatter-plot-recov-day.qzv[0m
[0m

In [42]:
# Display the Mantel scatter plot for Recovery_Day.
Visualization.load(f"{data_dir}/core-metrics-results-bt/beta-correlation/scatter-plot-recov-day.qzv")

In [None]:
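# Interpretation of the beta-correlation (Mantel) results above: Cohort_Number and
# Sample_Day each show a weak positive correlation with the weighted UniFrac distances.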