**RNA Sequencing Analysis**

**UNZIP data**

```
# Decompress every .gz archive below the current directory, in place.
# gunzip writes the output next to the archive, so no target directory is
# passed (a directory operand only triggers "is a directory -- ignored").
# -exec ... {} + hands the paths to gunzip directly, so names containing
# spaces or backslashes are not mangled by a shell read loop.
find . -type f -name '*.gz' -exec gunzip -- {} +
```

**Move all the files from inside the subfolders into the current directory**

```
# Pull every .fq file out of its subfolder into the current directory.
#   -mindepth 2  skips files that already live here (mv would otherwise fail
#                with "are the same file").
#   mv -n        never overwrites: if two subfolders hold a file with the same
#                name, the second one stays where it is (and its folder is
#                therefore not removed below), instead of silently replacing
#                the first.
find . -mindepth 2 -type f -name '*.fq' -exec mv -n -- {} . \;
# Remove the directories left empty by the move, deepest first.
# -mindepth 1 keeps find from attempting `rmdir .` on the working directory.
find . -mindepth 1 -depth -type d -empty -exec rmdir -- {} \;
```

**Rename the files**

```
# Remove the fixed string "-1a_HV2WVDSXX_L2" from file names.
# Only names that actually contain the string are touched; looping over every
# entry would run `mv x x` on the rest and fail with "are the same file".
for file in *-1a_HV2WVDSXX_L2*; do
  [ -e "$file" ] || continue  # glob matched nothing: the literal pattern is left over
  mv -- "$file" "${file/-1a_HV2WVDSXX_L2/}"
done
```

**Create a sample description file**


# Build alignment.csv: a header row, then one row per FASTQ under raw_files/.
# Each row is "<absolute path>,<sample id>", where the sample id is the first
# "_S<digits>_" token found in the path. A path without such a token is
# written unchanged, i.e. with no description column.
{
  printf '%s\n' 'samplename,description'
  for f in raw_files/*fq*; do
    [ -e "$f" ] || continue  # no FASTQ present: skip the unexpanded glob pattern
    readlink -f -- "$f" | perl -pe 's/(.*?_(S[0-9]+)_.*)/$1,$2/'
  done
} > alignment.csv

Edit alignment.csv remotely

**Download the reference genome**

```
# Download the Ensembl release-96 human cDNA FASTA and GTF annotation into
# reference/, where the transcriptome_fasta / transcriptome_gtf paths of
# O2.yaml expect them, then decompress them.
# wget -P saves into reference/ without changing the working directory, so
# later steps still run from the project root.
mkdir -p reference
wget -P reference ftp://ftp.ensembl.org/pub/release-96/fasta/homo_sapiens/cdna/Homo_sapiens.GRCh38.cdna.all.fa.gz
wget -P reference ftp://ftp.ensembl.org/pub/release-96/gtf/homo_sapiens/Homo_sapiens.GRCh38.96.gtf.gz
# Decompress only the downloaded archives, not every entry in the working directory.
gunzip -- reference/*.gz
```

**Prepare the O2.yaml file**

```
# bcbio sample template; passed to `bcbio_nextgen.py -w template` together
# with alignment.csv and the raw_files/ folder in the next step.
details:
  - analysis: RNA-seq
    # NOTE(review): the Ensembl GTF below may name chromosomes without the
    # "chr" prefix; confirm it is compatible with the hg38 build.
    genome_build: hg38
    algorithm:
      # Uncompressed Ensembl release-96 cDNA FASTA and GTF fetched in the
      # "Download the reference genome" step (absolute paths on the cluster).
      transcriptome_fasta: /n/scratch2/ajit/duvelisib/RNASEQ/reference/Homo_sapiens.GRCh38.cdna.all.fa
      transcriptome_gtf: /n/scratch2/ajit/duvelisib/RNASEQ/reference/Homo_sapiens.GRCh38.96.gtf
      aligner: hisat2
      strandedness: unstranded
      # Enables the optional bcbiornaseq tool, configured in the block below.
      tools_on: [bcbiornaseq]
      bcbiornaseq:
          organism: homo sapiens
upload:
  # NOTE(review): relative path, presumably resolved against the directory
  # bcbio is run from (alignment/work in the submit step); confirm.
  dir: ../final
```

**Initiate bcbio**

```
# Load the cluster's bcbio environment module into this shell.
module load bcbio/latest
# NOTE(review): presumably cleared so user-level Python packages cannot
# shadow the ones bundled with bcbio; confirm.
unset PYTHONPATH
# Generate the project from the template (O2.yaml), the sample sheet
# (alignment.csv) and the input folder. The submit step expects the result
# under alignment/ (alignment/work and alignment/config/alignment.yaml).
bcbio_nextgen.py -w template O2.yaml alignment.csv raw_files/
```

**Submit Job to O2**

```
# Run interactively: move into the work directory of the generated project
# and create the submission script in an editor.
cd alignment/work
vim submit_bcbio.sh

# ---- contents of submit_bcbio.sh: from the '#!/bin/sh' line down to the
# ---- bcbio_nextgen.py command (the shebang must be the first line of the file)
#!/bin/sh
#SBATCH -p long
#SBATCH -J bcbio_O2              
#SBATCH -o run.o
#SBATCH -e run.e
#SBATCH -t 7-00:00
#SBATCH --cpus-per-task=3
#SBATCH --mem=150G
#SBATCH --mail-type=END         # Type of email notification- BEGIN,END,FAIL,ALL
#SBATCH --mail-user=ajitj_nirmal@dfci.harvard.edu   # Email to which notifications will be sent

# Put the bcbio tools directory first on PATH for the batch job.
export PATH=/n/app/bcbio/tools/bin:$PATH
# Run the generated project config; the -s/-q/-r values repeat the scheduler
# (slurm), partition (long) and time limit (7-00:00) requested in the header.
bcbio_nextgen.py ../config/alignment.yaml \
    -n 24 -t ipython -s slurm -q long -r t=7-00:00 --timeout 2000

# ---- end of submit_bcbio.sh; run interactively to queue the job
sbatch submit_bcbio.sh
```

----