# Beta diversity

In [2]:
import os
import pandas as pd
import qiime2 as q2
from skbio import OrdinationResults
from qiime2 import Visualization
from seaborn import scatterplot

%matplotlib inline

In [3]:
# Directory holding the inputs and outputs used by the cells below; it is
# interpolated into the shell commands as `$data_dir` and into f-string paths.
data_dir = 'Alien_data'

In [3]:
# Summarize the filtered feature table, together with the sample metadata,
# into a visualization (`feature_table.qzv`). This does not create a new
# feature table; it only writes the summary visualization.
! qiime feature-table summarize \
  --i-table $data_dir/table-filtered.qza \
  --m-sample-metadata-file $data_dir/sample_metadata.tsv \
  --o-visualization $data_dir/feature_table.qzv

[32mSaved Visualization to: Alien_data/feature_table.qzv[0m
[0m

In [4]:
# Load the feature-table summary visualization; as the last expression of the
# cell it is displayed inline.
Visualization.load(f'{data_dir}/feature_table.qzv')

In [7]:
# Run the phylogenetic core diversity metrics on the filtered table using the
# `sepp-tree.qza` phylogeny. The output directory `core-metrics-results/`
# receives the rarefied table, the alpha-diversity vectors, the distance
# matrices and the PCoA results (see the recorded output below).
# A sampling depth of 3000 is used here.
# TODO: discuss which sampling depth is the best one to choose.
! qiime diversity core-metrics-phylogenetic \
  --i-table $data_dir/table-filtered.qza \
  --i-phylogeny $data_dir/sepp-tree.qza \
  --m-metadata-file $data_dir/sample_metadata.tsv \
  --p-sampling-depth 3000 \
  --output-dir $data_dir/core-metrics-results

[32mSaved FeatureTable[Frequency] to: Alien_data/core-metrics-results/rarefied_table.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/faith_pd_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/observed_features_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/shannon_vector.qza[0m
[32mSaved SampleData[AlphaDiversity] to: Alien_data/core-metrics-results/evenness_vector.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/unweighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/weighted_unifrac_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/jaccard_distance_matrix.qza[0m
[32mSaved DistanceMatrix to: Alien_data/core-metrics-results/bray_curtis_distance_matrix.qza[0m
[32mSaved PCoAResults to: Alien_data/core-metrics-results/unweighted_unifrac_pcoa_results.qza[0m
[32mSa

In [None]:
# Same core-metrics run as the previous cell (same table, metadata and
# sampling depth of 3000), but using the `raxml-cat-bootstrap-rooted.qza`
# phylogeny instead of `sepp-tree.qza`, and writing to a separate output
# directory, `core-metrics-results-2/`.
# NOTE(review): this cell has no execution count or recorded output, and the
# cells shown after it read only from `core-metrics-results/` -- confirm
# whether this alternative run is still needed.
# TODO: discuss which sampling depth is the best one to choose.
! qiime diversity core-metrics-phylogenetic \
  --i-table $data_dir/table-filtered.qza \
  --i-phylogeny $data_dir/raxml-cat-bootstrap-rooted.qza \
  --m-metadata-file $data_dir/sample_metadata.tsv \
  --p-sampling-depth 3000 \
  --output-dir $data_dir/core-metrics-results-2

## Unweighted UniFrac (`unweighted_unifrac_emperor`)

In [7]:
# View the unweighted UniFrac PCoA plot stored in
# `core-metrics-results/unweighted_unifrac_emperor.qzv`.
Visualization.load(f'{data_dir}/core-metrics-results/unweighted_unifrac_emperor.qzv')

In [9]:
#Beta -- disease comparison
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/unweighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column disease \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/uw_unifrac-env-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/uw_unifrac-env-significance.qzv[0m
[0m

In [10]:
# Display the unweighted UniFrac group-significance visualization saved at
# `Unifrac_output/uw_unifrac-env-significance.qzv`.
Visualization.load(f'{data_dir}/Unifrac_output/uw_unifrac-env-significance.qzv')

In [11]:
#Beta -- alleged_abduction comparison
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/unweighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column alleged_abduction \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/uw_unifrac-env-significance.qzv

Usage: [94mqiime diversity beta-group-significance[0m [OPTIONS]

  Determine whether groups of samples are significantly different from one
  another using a permutation-based statistical test.

[1mInputs[0m:
  [94m[4m--i-distance-matrix[0m ARTIFACT
    [32mDistanceMatrix[0m     Matrix of distances between pairs of samples.
                                                                    [35m[required][0m
[1mParameters[0m:
  [94m[4m--m-metadata-file[0m METADATA
  [94m[4m--m-metadata-column[0m COLUMN  [32mMetadataColumn[Categorical][0m
                       Categorical sample metadata column.          [35m[required][0m
  [94m--p-method[0m TEXT [32mChoices('permanova', 'anosim', 'permdisp')[0m
                       The group significance test to be applied.
                                                        [35m[default: 'permanova'][0m
  [94m--p-pairwise[0m / [94m--p-no-pairwise[0m
                       Perform pairwise tests between all pairs

## Weighted UniFrac (`weighted_unifrac_emperor`)

In [12]:
# View the weighted UniFrac PCoA plot stored in
# `core-metrics-results/weighted_unifrac_emperor.qzv`.
Visualization.load(f'{data_dir}/core-metrics-results/weighted_unifrac_emperor.qzv')

In [13]:
# Beta diversity -- disease comparison (weighted UniFrac).
# Tests whether samples grouped by the `disease` metadata column differ from
# one another, using the command's default method (PERMANOVA) and additionally
# running pairwise tests between all pairs of groups (`--p-pairwise`).
# The visualization is written to `Unifrac_output/wed_unifrac-env-significance.qzv`;
# the `Unifrac_output/` directory is assumed to exist already.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column disease \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/wed_unifrac-env-significance.qzv

[32mSaved Visualization to: Alien_data/Unifrac_output/wed_unifrac-env-significance.qzv[0m
[0m

In [14]:
# Display the weighted UniFrac group-significance visualization saved at
# `Unifrac_output/wed_unifrac-env-significance.qzv`.
Visualization.load(f'{data_dir}/Unifrac_output/wed_unifrac-env-significance.qzv')

In [11]:
# Beta diversity -- alleged_abduction comparison (weighted UniFrac).
# Tests whether samples grouped by the `alleged_abduction` metadata column
# differ from one another (default method: PERMANOVA), with pairwise tests
# between all pairs of groups.
# The output file uses the `weighted_` prefix, whereas the weighted disease
# comparison uses `wed_`; the two results therefore live in different files.
# NOTE(review): the recorded output for this cell is the command's usage text
# rather than a "Saved Visualization" line, so the run apparently did not
# succeed; the error message itself is not visible. Confirm that
# `alleged_abduction` is a usable categorical column in sample_metadata.tsv.
! qiime diversity beta-group-significance \
    --i-distance-matrix $data_dir/core-metrics-results/weighted_unifrac_distance_matrix.qza \
    --m-metadata-file $data_dir/sample_metadata.tsv \
    --m-metadata-column alleged_abduction \
    --p-pairwise \
    --o-visualization $data_dir/Unifrac_output/weighted_unifrac-env-significance.qzv

Usage: [94mqiime diversity beta-group-significance[0m [OPTIONS]

  Determine whether groups of samples are significantly different from one
  another using a permutation-based statistical test.

[1mInputs[0m:
  [94m[4m--i-distance-matrix[0m ARTIFACT
    [32mDistanceMatrix[0m     Matrix of distances between pairs of samples.
                                                                    [35m[required][0m
[1mParameters[0m:
  [94m[4m--m-metadata-file[0m METADATA
  [94m[4m--m-metadata-column[0m COLUMN  [32mMetadataColumn[Categorical][0m
                       Categorical sample metadata column.          [35m[required][0m
  [94m--p-method[0m TEXT [32mChoices('permanova', 'anosim', 'permdisp')[0m
                       The group significance test to be applied.
                                                        [35m[default: 'permanova'][0m
  [94m--p-pairwise[0m / [94m--p-no-pairwise[0m
                       Perform pairwise tests between all pairs