#### This analysis is performed under the "q2-boots-2024.5.beta" environment.

In [1]:
import os
import pandas as pd
import qiime2 as q2

In [2]:
# Root of the thesis working directory; every {path} in the shell cells below expands to this value.
# Set the MSCTHESIS_WRKDIR environment variable to run the notebook on another machine;
# when it is unset, the original location is used unchanged.
path = os.environ.get(
    "MSCTHESIS_WRKDIR",
    "/Users/cheesemania/PycharmProjects/mscthesis_wrkdir",
)

#### Tested resampling counts of n = 5, 10, 20, 50 and 100.
#### There was no difference in the number of samples, and no obvious difference in the pairwise group significance of observed features.

#### n = 50 was chosen to balance robustness against run time and computational resources.

In [36]:
# Final feature table of case-control samples
# Observed features
!qiime boots alpha \
    --i-table {path}/src-analysis/feature-table/health-disease-case-control/case_control_feature_table_remove_h1n1.qza \
    --p-sampling-depth 3000 \
    --p-metric 'observed_features' \
    --p-n 50 \
    --p-no-replacement \
    --p-average-method 'median' \
    --o-average-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/observed_features_vector.qza

# "Median" is generally preferred if your dataset is prone to outliers or has a skewed distribution, as it provides a more robust measure of central tendency.

[32mSaved SampleData[AlphaDiversity] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/observed_features_vector.qza[0m
[0m

In [37]:
# Observed features
!qiime diversity alpha-group-significance \
    --i-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/observed_features_vector.qza \
    --m-metadata-file {path}/metadata/case_control_metadata_remove_h1n1.tsv \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/observed-features-group-significance.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/observed-features-group-significance.qzv[0m
[0m

In [38]:
# Final feature table of case-control samples
# Shannon entropy
!qiime boots alpha \
    --i-table {path}/src-analysis/feature-table/health-disease-case-control/case_control_feature_table_remove_h1n1.qza \
    --p-sampling-depth 3000 \
    --p-metric 'shannon' \
    --p-n 50 \
    --p-no-replacement \
    --p-average-method 'median' \
    --o-average-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/shannon_vector.qza

[32mSaved SampleData[AlphaDiversity] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/shannon_vector.qza[0m
[0m

In [39]:
# Shannon entropy
!qiime diversity alpha-group-significance \
    --i-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/shannon_vector.qza \
    --m-metadata-file {path}/metadata/case_control_metadata_remove_h1n1.tsv \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/shannon-group-significance.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-non-filtered/shannon-group-significance.qzv[0m
[0m

### Filtering non-resident fungi out of the final (original) non-rarefied feature table

In [40]:
# Filter non-resident fungi from case_control_feature_table_remove_h1n1_filtered1_table (filtered1: excluding four projects with small sample sizes)
!qiime feature-table filter-features \
    --i-table {path}/src-analysis/feature-table/health-disease-case-control/case_control_feature_table_remove_h1n1_filtered1.qza \
    --m-metadata-file {path}/metadata/fungal-traits/non-resident_ids.tsv \
    --p-exclude-ids True \
    --o-filtered-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/case_control_filt_nonresident_feature_table.qza

[32mSaved FeatureTable[Frequency] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/case_control_filt_nonresident_feature_table.qza[0m
[0m

In [41]:
!qiime feature-table summarize \
    --i-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/case_control_filt_nonresident_feature_table.qza \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/case_control_filt_nonresident_feature_table.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/case_control_filt_nonresident_feature_table.qzv[0m
[0m

In [42]:
# Observed features
!qiime boots alpha \
    --i-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/case_control_filt_nonresident_feature_table.qza \
    --p-sampling-depth 3000 \
    --p-metric 'observed_features' \
    --p-n 50 \
    --p-no-replacement \
    --p-average-method 'median' \
    --o-average-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/observed_features_vector.qza

[32mSaved SampleData[AlphaDiversity] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/observed_features_vector.qza[0m
[0m

In [43]:
# Observed features
!qiime diversity alpha-group-significance \
    --i-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/observed_features_vector.qza \
    --m-metadata-file {path}/metadata/case_control_metadata_remove_h1n1_filtered1.tsv \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/observed-features-group-significance.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/observed-features-group-significance.qzv[0m
[0m

In [44]:
# Shannon entropy
!qiime boots alpha \
    --i-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/case_control_filt_nonresident_feature_table.qza \
    --p-sampling-depth 3000 \
    --p-metric 'shannon' \
    --p-n 50 \
    --p-no-replacement \
    --p-average-method 'median' \
    --o-average-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/shannon_vector.qza

[32mSaved SampleData[AlphaDiversity] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/shannon_vector.qza[0m
[0m

In [45]:
# Shannon entropy
!qiime diversity alpha-group-significance \
    --i-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/shannon_vector.qza \
    --m-metadata-file {path}/metadata/case_control_metadata_remove_h1n1_filtered1.tsv \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/shannon-group-significance.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-filt-nonresident/shannon-group-significance.qzv[0m
[0m

### Subsetting the final (original) non-rarefied feature table to only non-resident fungi

In [46]:
# Retain only non-resident fungi in the case_control_feature_table_remove_h1n1_filtered1_table (filtered1: excluding four projects with small sample sizes)
!qiime feature-table filter-features \
    --i-table {path}/src-analysis/feature-table/health-disease-case-control/case_control_feature_table_remove_h1n1_filtered1.qza \
    --m-metadata-file {path}/metadata/fungal-traits/non-resident_ids.tsv \
    --p-exclude-ids False \
    --o-filtered-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/case_control_nonresident_feature_table.qza

[32mSaved FeatureTable[Frequency] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/case_control_nonresident_feature_table.qza[0m
[0m

In [47]:
!qiime feature-table summarize \
    --i-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/case_control_nonresident_feature_table.qza \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/case_control_nonresident_feature_table.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/case_control_nonresident_feature_table.qzv[0m
[0m

In [48]:
# Observed features
!qiime boots alpha \
    --i-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/case_control_nonresident_feature_table.qza \
    --p-sampling-depth 3000 \
    --p-metric 'observed_features' \
    --p-n 50 \
    --p-no-replacement \
    --p-average-method 'median' \
    --o-average-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/observed_features_vector.qza

[32mSaved SampleData[AlphaDiversity] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/observed_features_vector.qza[0m
[0m

In [49]:
# Observed features
!qiime diversity alpha-group-significance \
    --i-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/observed_features_vector.qza \
    --m-metadata-file {path}/metadata/case_control_metadata_remove_h1n1_filtered1.tsv \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/observed-features-group-significance.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/observed-features-group-significance.qzv[0m
[0m

In [50]:
# Shannon entropy
!qiime boots alpha \
    --i-table {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/case_control_nonresident_feature_table.qza \
    --p-sampling-depth 3000 \
    --p-metric 'shannon' \
    --p-n 50 \
    --p-no-replacement \
    --p-average-method 'median' \
    --o-average-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/shannon_vector.qza

[32mSaved SampleData[AlphaDiversity] to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/shannon_vector.qza[0m
[0m

In [51]:
# Shannon entropy
!qiime diversity alpha-group-significance \
    --i-alpha-diversity {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/shannon_vector.qza \
    --m-metadata-file {path}/metadata/case_control_metadata_remove_h1n1_filtered1.tsv \
    --o-visualization {path}/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/shannon-group-significance.qzv

[32mSaved Visualization to: /Users/cheesemania/PycharmProjects/mscthesis_wrkdir/src-analysis/diversity-analysis/q2-boots/n50/alpha-diversity-results-nonresident/shannon-group-significance.qzv[0m
[0m