# Generation of count matrices

Count matrices are generated using the kallisto | bustools workflow (via the `kb-python` command-line tool).

The raw scRNA-Seq files (fastq.gz) are in "./kallisto_bustools/raw_data/".

The count matrices are stored in "./kallisto_bustools/".

# Prepare a mouse RNA velocity index for pseudoalignment.

In [None]:
# Install kb-python; the `kb ref` / `kb count` commands in the %%bash cells of this
# notebook come from this package.
# NOTE(review): the version is not pinned, so a re-run may pick up a newer release
# than the one this analysis was produced with — consider `kb-python==<version>`.
!pip install kb-python

In [None]:
%%bash
# Download the Ensembl release-98 mouse (GRCm38) primary-assembly genome FASTA and
# the matching GTF annotation into kallisto_bustools/, then decompress them.

# Abort on the first failing command so a failed download is never silently
# followed by later steps.
set -euo pipefail

# A %%bash cell runs as one shell process, so the directory is changed exactly once;
# a second `cd kallisto_bustools/` would look for kallisto_bustools/kallisto_bustools/.
cd kallisto_bustools/

for url in \
    ftp://ftp.ensembl.org/pub/release-98/fasta/mus_musculus/dna/Mus_musculus.GRCm38.dna.primary_assembly.fa.gz \
    ftp://ftp.ensembl.org/pub/release-98/gtf/mus_musculus/Mus_musculus.GRCm38.98.gtf.gz
do
    archive="${url##*/}"        # file-name component of the URL
    unpacked="${archive%.gz}"   # name of the file gunzip produces

    # Skip files that are already unpacked so the cell can be re-run safely.
    if [ -e "$unpacked" ]; then
        echo "Already present, skipping: $unpacked"
        continue
    fi

    # -O overwrites any partial archive left by an interrupted earlier attempt.
    wget -O "$archive" "$url"
    gunzip "$archive"
done

In [None]:
%%bash
# Build the mouse RNA velocity reference (kb "lamanno" workflow) from the genome
# FASTA and GTF read from kallisto_bustools/.
# Output paths passed to kb: index.idx, t2g.txt, cdna.fa, intron.fa,
# spliced_t2c.txt and unspliced_t2c.txt (existing copies are overwritten).

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb ref \
    --workflow lamanno \
    --overwrite \
    -i index.idx \
    -g t2g.txt \
    -f1 cdna.fa \
    -f2 intron.fa \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    Mus_musculus.GRCm38.dna.primary_assembly.fa \
    Mus_musculus.GRCm38.98.gtf

# Generate a count matrix for each sample.

### T0_1

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=T0_1_S9

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### T0_2

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=T0_2_S10

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### DMSO_2h

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=DMSO_2h_S11

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### N6_2h

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=N6_2h_S12

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### DMSO_24h

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=DMSO_24h_S13

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### N6_24h

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=N6_24h_S14

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### DMSO_48h

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=DMSO_48h_S15

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### N6_48h

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
sample=N6_48h_S16

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### DMSO_d7

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
# NOTE(review): the section heading calls this sample DMSO_d7 while the FASTQ
# prefix and output directory are 1_CpG_S3 — confirm the mapping is intended.
sample=1_CpG_S3

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz

### N6_d7

In [None]:
%%bash
# Run `kb count` (lamanno workflow, 10xv3 technology, bustools filtering, h5ad
# export) on every FASTQ in raw_data/ whose name starts with the sample prefix;
# results go to kallisto_bustools/<sample>/.
# NOTE(review): the section heading calls this sample N6_d7 while the FASTQ
# prefix and output directory are 2_N6_S2 — confirm the mapping is intended.
sample=2_N6_S2

# Leave with cd's own exit status if the working directory is missing.
cd kallisto_bustools/ || exit

kb count \
    --workflow lamanno \
    --filter bustools \
    --h5ad \
    --overwrite \
    -x 10xv3 \
    -i index.idx \
    -g t2g.txt \
    -c1 spliced_t2c.txt \
    -c2 unspliced_t2c.txt \
    -t 2 \
    -m 64G \
    -o "$sample" \
    raw_data/"$sample"*.fastq.gz