# Beta diversity

In [2]:
import os
import pandas as pd
import qiime2 as q2
from skbio import OrdinationResults
from qiime2 import Visualization
from seaborn import scatterplot

%matplotlib inline

In [3]:
# Root folder for every input and output path used by the cells in this notebook.
data_dir = 'Alien_data'

In [3]:
# Summarize the filtered feature table together with the sample metadata.
# This writes a visualization (feature_table.qzv); it does not create a new table.
! qiime feature-table summarize \
  --i-table $data_dir/table-filtered.qza \
  --m-sample-metadata-file $data_dir/sample_metadata.tsv \
  --o-visualization $data_dir/feature_table.qzv

[32mSaved Visualization to: Alien_data/feature_table.qzv[0m
[0m

In [23]:
# Display the feature-table summary written by the summarize command.
# NOTE(review): the recorded output of this cell is a ValueError saying the file
# does not exist, although the summarize output reports saving it; re-run the
# notebook in order to refresh this output.
Visualization.load(f'{data_dir}/feature_table.qzv')

ValueError: Alien_data/feature_table.qzv does not exist.

In [7]:
# Core phylogenetic diversity metrics with the SEPP tree at sampling depth 3000.
# Outputs (rarefied table, alpha-diversity vectors, distance matrices, PCoA
# results) are written to core-metrics-results.
! qiime diversity core-metrics-phylogenetic \
  --i-table $data_dir/table-filtered.qza \
  --i-phylogeny $data_dir/sepp-tree.qza \
  --m-metadata-file $data_dir/sample_metadata.tsv \
  --p-sampling-depth 3000 \
  --output-dir $data_dir/core-metrics-results

[32mSaved FeatureTable[Frequency] to: Alien_data/core-metrics-results/rarefied_table.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/faith_pd_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/observed_features_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/shannon_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/evenness_vector.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/unweighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/weighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/jaccard_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/bray_curtis_distance_matrix.qza[0m
[32mSaved PCoAResults to: Alien_data/core-metrics-results/unweighted_unifrac_pcoa_results.qza[0m
[32mSa

In [32]:
# Core phylogenetic diversity metrics with the raxml-cat-bootstrap-rooted tree at
# sampling depth 3000; same table and metadata as the SEPP run.
# Outputs are written to core-metrics-results-2.
! qiime diversity core-metrics-phylogenetic \
  --i-table $data_dir/table-filtered.qza \
  --i-phylogeny $data_dir/raxml-cat-bootstrap-rooted.qza \
  --m-metadata-file $data_dir/sample_metadata.tsv \
  --p-sampling-depth 3000 \
  --output-dir $data_dir/core-metrics-results-2

[32mSaved FeatureTable[Frequency] to: Alien_data/core-metrics-results-2/rarefied_table.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-2/faith_pd_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-2/observed_features_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-2/shannon_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-2/evenness_vector.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-2/unweighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-2/weighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-2/jaccard_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-2/bray_curtis_distance_matrix.qza[0m
[32mSaved PCoAResults to: Alien_data/core-metrics-results-2/unweighted_unifrac_pcoa_res

In [34]:
# Core phylogenetic diversity metrics with the raxml-cat-bootstrap-rooted tree at
# sampling depth 2000; outputs are written to core-metrics-results-3.
# Author's note: a sampling depth of 2000 is chosen (no significant differences).
# NOTE(review): the beta-group-significance cells further down read their
# distance matrices from core-metrics-results (SEPP tree, depth 3000), not from
# this run -- confirm which run is the intended final one.
! qiime diversity core-metrics-phylogenetic \
  --i-table $data_dir/table-filtered.qza \
  --i-phylogeny $data_dir/raxml-cat-bootstrap-rooted.qza \
  --m-metadata-file $data_dir/sample_metadata.tsv \
  --p-sampling-depth 2000 \
  --output-dir $data_dir/core-metrics-results-3

[32mSaved FeatureTable[Frequency] to: Alien_data/core-metrics-results-3/rarefied_table.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-3/faith_pd_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-3/observed_features_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-3/shannon_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results-3/evenness_vector.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-3/unweighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-3/weighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-3/jaccard_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results-3/bray_curtis_distance_matrix.qza[0m
[32mSaved PCoAResults to: Alien_data/core-metrics-results-3/unweighted_unifrac_pcoa_res

## Unweighted UniFrac: Emperor PCoA plots and group-significance tests

In [36]:
# View the unweighted UniFrac Emperor PCoA plot (SEPP tree, sampling depth 3000).
Visualization.load(f'{data_dir}/core-metrics-results/unweighted_unifrac_emperor.qzv')

In [37]:
# View the unweighted UniFrac Emperor PCoA plot
# (raxml-cat-bootstrap-rooted tree, sampling depth 3000).
Visualization.load(f'{data_dir}/core-metrics-results-2/unweighted_unifrac_emperor.qzv')

In [38]:
# View the unweighted UniFrac Emperor PCoA plot
# (raxml-cat-bootstrap-rooted tree, sampling depth 2000).
Visualization.load(f'{data_dir}/core-metrics-results-3/unweighted_unifrac_emperor.qzv')

In [9]:
#Beta -- disease comparison
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/unweighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column disease \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/uw_unifrac-env-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/uw_unifrac-env-significance.qzv[0m
[0m

In [15]:
# Display the unweighted UniFrac group-significance result for the disease column.
Visualization.load(f'{data_dir}/Unifrac_output/uw_unifrac-env-significance.qzv')

In [17]:
# Beta -- categorical_time_relative_to_engraftment comparison on the unweighted
# UniFrac distances from core-metrics-results, with pairwise tests.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/unweighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column categorical_time_relative_to_engraftment \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/uw_unifrac-categorical_time-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/uw_unifrac-categorical_time-significance.qzv[0m
[0m

In [18]:
# Display the unweighted UniFrac group-significance result for categorical time.
Visualization.load(f'{data_dir}/Unifrac_output/uw_unifrac-categorical_time-significance.qzv')

In [19]:
# Beta -- hct_source comparison on the unweighted UniFrac distances from
# core-metrics-results, with pairwise tests.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/unweighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column hct_source \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/uw_unifrac-hct_source-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/uw_unifrac-hct_source-significance.qzv[0m
[0m

In [20]:
# Display the unweighted UniFrac group-significance result for hct_source.
Visualization.load(f'{data_dir}/Unifrac_output/uw_unifrac-hct_source-significance.qzv')

In [21]:
# Beta -- stool_consistency comparison on the unweighted UniFrac distances from
# core-metrics-results, with pairwise tests.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/unweighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column stool_consistency \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/uw_unifrac-stool_consistency-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/uw_unifrac-stool_consistency-significance.qzv[0m
[0m

In [22]:
# Display the unweighted UniFrac group-significance result for stool_consistency.
Visualization.load(f'{data_dir}/Unifrac_output/uw_unifrac-stool_consistency-significance.qzv')

In [22]:
# NOTE(review): this cell repeats the preceding load of the same file and can be
# removed without losing any result.
Visualization.load(f'{data_dir}/Unifrac_output/uw_unifrac-stool_consistency-significance.qzv')

In [52]:
# Beta -- alleged_abduction comparison on the unweighted UniFrac distances from
# core-metrics-results, with pairwise tests.
# Unlike the other comparisons, this one reads ed-sample_metadata.tsv
# (presumably an edited metadata file that carries the alleged_abduction
# column -- TODO confirm).
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/unweighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/ed-sample_metadata.tsv \
    --m-metadata-column alleged_abduction \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/uw_unifrac-alleged_abduction-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/uw_unifrac-alleged_abduction-significance.qzv[0m
[0m

In [53]:
# Display the unweighted UniFrac group-significance result for alleged_abduction
# (the uw_unifrac-... file, not the weighted_unifrac-... one of the same column).
Visualization.load(f'{data_dir}/Unifrac_output/uw_unifrac-alleged_abduction-significance.qzv')

## Weighted UniFrac: Emperor PCoA plots and group-significance tests

In [40]:
# View the weighted UniFrac Emperor PCoA plot (SEPP tree, sampling depth 3000).
Visualization.load(f'{data_dir}/core-metrics-results/weighted_unifrac_emperor.qzv')

In [41]:
# View the weighted UniFrac Emperor PCoA plot
# (raxml-cat-bootstrap-rooted tree, sampling depth 3000).
Visualization.load(f'{data_dir}/core-metrics-results-2/weighted_unifrac_emperor.qzv')

In [42]:
# View the weighted UniFrac Emperor PCoA plot
# (raxml-cat-bootstrap-rooted tree, sampling depth 2000).
Visualization.load(f'{data_dir}/core-metrics-results-3/weighted_unifrac_emperor.qzv')

In [13]:
# Beta -- disease comparison on the weighted UniFrac distances from
# core-metrics-results (SEPP tree, sampling depth 3000), with pairwise tests.
# NOTE(review): the output name uses "wed_" and "env", while the other weighted
# cells use "weighted_unifrac-<column>"; the following load cell reads this
# exact name, so rename both together if the name is normalized.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column disease \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/wed_unifrac-env-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/wed_unifrac-env-significance.qzv[0m
[0m

In [43]:
# Display the weighted UniFrac group-significance result for the disease column.
Visualization.load(f'{data_dir}/Unifrac_output/wed_unifrac-env-significance.qzv')

In [44]:
# Beta -- categorical_time_relative_to_engraftment comparison on the weighted
# UniFrac distances from core-metrics-results, with pairwise tests.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column categorical_time_relative_to_engraftment \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/weighted_unifrac-categorical_time-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/weighted_unifrac-categorical_time-significance.qzv[0m
[0m

In [45]:
# Display the weighted UniFrac group-significance result for categorical time.
Visualization.load(f'{data_dir}/Unifrac_output/weighted_unifrac-categorical_time-significance.qzv')

In [46]:
# Beta -- hct_source comparison on the weighted UniFrac distances from
# core-metrics-results, with pairwise tests.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column hct_source \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/weighted_unifrac-hct_source-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/weighted_unifrac-hct_source-significance.qzv[0m
[0m

In [47]:
# Display the weighted UniFrac group-significance result for hct_source.
Visualization.load(f'{data_dir}/Unifrac_output/weighted_unifrac-hct_source-significance.qzv')

In [48]:
# Beta -- stool_consistency comparison on the weighted UniFrac distances from
# core-metrics-results, with pairwise tests.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column stool_consistency \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/weighted_unifrac-stool_consistency-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/weighted_unifrac-stool_consistency-significance.qzv[0m
[0m

In [49]:
# Display the weighted UniFrac group-significance result for stool_consistency.
Visualization.load(f'{data_dir}/Unifrac_output/weighted_unifrac-stool_consistency-significance.qzv')

In [50]:
# Beta -- alleged_abduction comparison on the weighted UniFrac distances from
# core-metrics-results, with pairwise tests.
# Unlike the other comparisons, this one reads ed-sample_metadata.tsv
# (presumably an edited metadata file that carries the alleged_abduction
# column -- TODO confirm).
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/ed-sample_metadata.tsv \
    --m-metadata-column alleged_abduction \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/weighted_unifrac-alleged_abduction-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/weighted_unifrac-alleged_abduction-significance.qzv[0m
[0m

In [51]:
# Display the weighted UniFrac group-significance result for alleged_abduction.
Visualization.load(f'{data_dir}/Unifrac_output/weighted_unifrac-alleged_abduction-significance.qzv')