### import packages

In [1]:
import os
import pandas as pd
from qiime2 import Visualization
import matplotlib.pyplot as plt

%matplotlib inline

### creating data directory 

In [2]:
# Directory used below for the downloaded inputs and the QIIME 2 outputs.
data_dir = 'CE'

# exist_ok=True keeps the cell idempotent on re-runs without a separate
# isdir() check, and avoids the check-then-create race of the two-step form.
os.makedirs(data_dir, exist_ok=True)

In [3]:
# List the regular files (not directories) in the current working directory.
print(list(filter(os.path.isfile, os.listdir('.'))))

['CE_file_downloads.ipynb', '1CheezEyez draft.ipynb', 'metadata.ipynb', 'README.md', '.gitignore']


### qza file download (large file — no need to re-run once it has been downloaded)

In [4]:
! wget -nv -O $data_dir/cheese-single-end-demux.qza 'https://polybox.ethz.ch/index.php/s/2AYhc9EgbtA7wsE/download'

2022-10-12 09:33:12 URL:https://polybox.ethz.ch/index.php/s/2AYhc9EgbtA7wsE/download [959420090/959420090] -> "CE/cheese-single-end-demux.qza" [1]


In [5]:
! ls -1 $data_dir

cheese-single-end-demux.qza


### tsv file download

In [5]:
! wget -nv -O $data_dir/food-metadata.tsv 'https://polybox.ethz.ch/index.php/s/nEd4l5CWGWGEtae/download'

2022-10-12 09:33:24 URL:https://polybox.ethz.ch/index.php/s/nEd4l5CWGWGEtae/download [42810/42810] -> "CE/food-metadata.tsv" [1]


In [7]:
! ls -1 $data_dir

cheese-single-end-demux.qza
food-metadata.tsv


In [7]:
# Load the tab-separated sample metadata; the first column becomes the index.
metadata_path = f'{data_dir}/food-metadata.tsv'
df_meta = pd.read_csv(metadata_path, index_col=0, sep='\t')

### Denoising

Visual summary of the unmodified (not yet denoised) QIIME 2 artifact:

In [11]:
! qiime demux summarize \
    --i-data $data_dir/cheese-single-end-demux.qza \
    --o-visualization $data_dir/cheese-single-end-demux.qzv

[32mSaved Visualization to: CE/cheese-single-end-demux.qzv[0m
[0m

In [12]:
# Display the demux summary; the last expression is rendered as cell output.
demux_qzv_path = f'{data_dir}/cheese-single-end-demux.qzv'
Visualization.load(demux_qzv_path)

Denoising:
    --p-trunc-len: reads are truncated to 100 bp, and reads shorter than this length are discarded (TODO: consider a different truncation length; the maximum read length is 101 bp)

In [10]:
! qiime dada2 denoise-single \
    --i-demultiplexed-seqs $data_dir/cheese-single-end-demux.qza \
    --p-trunc-len 100 \
    --p-n-threads 3 \
    --o-table $data_dir/dada2_table.qza \
    --o-representative-sequences $data_dir/dada2_rep_set.qza \
    --o-denoising-stats $data_dir/dada2_stats.qza

[32mSaved FeatureTable[Frequency] to: CE/dada2_table.qza[0m
[32mSaved FeatureData[Sequence] to: CE/dada2_rep_set.qza[0m
[32mSaved SampleData[DADA2Stats] to: CE/dada2_stats.qza[0m
[0m

Inspect denoising stats:

In [13]:
! qiime metadata tabulate \
    --m-input-file $data_dir/dada2_stats.qza \
    --o-visualization $data_dir/dada2_stats.qzv

[32mSaved Visualization to: CE/dada2_stats.qzv[0m
[0m

In [14]:
# Display the tabulated DADA2 statistics as the cell output.
stats_qzv_path = f'{data_dir}/dada2_stats.qzv'
Visualization.load(stats_qzv_path)

Visualize feature table: