# Coverage of fragments in STARR-seq results
- depth in bedgraph format
- depth per base

**Set environment**

In [1]:
source ../config_duke.sh

You are on Duke Server: DCC
BASE DIRECTORY:     /work/kk319
WORK DIRECTORY:     /work/kk319/out/CombEffect_STARR
LOG  DIRECTORY:     /work/kk319/out/CombEffect_STARR/log
PATH OF SOURCE:     /work/kk319/source
PATH OF EXECUTABLE: /work/kk319/exe
PATH OF ANNOTATION: /work/kk319/annotation



## Get coverage of all chromosomes

**RUN**

In [2]:
source ../config_duke.sh
source ../load_module_bedtools.sh

sbatch -p scavenger \
    --array 0-23 \
    --mem 8G \
    -o ${FD_LOG}/coverage_perbase_chrom.%a.txt \
    <<'EOF'
#!/bin/bash
### set directories & global variables
source ../config_duke.sh
CHROMS=($(seq 1 22) X Y)
CHROM=chr${CHROMS[${SLURM_ARRAY_TASK_ID}]}
TARGET=${CHROM}

### set input and output
FD_BEDS=($(ls -d ${FD_WRK}/data/*/))
FN_BED=${CHROM}.bed

FD_GEN=${FD_ANN}/genome/hg38
FN_GEN=hg38.chrom.sizes.${CHROM}

### print start message
echo "Slurm Array Index: " ${SLURM_ARRAY_TASK_ID}

### loop through each sample and count each fragment of a chromosome
echo "RUN: loop through samples; count fragment"

for FD_BED in ${FD_BEDS[@]}; do
    SAMPLE=$(basename ${FD_BED})
    FD_OUT=${FD_WRK}/coverage/${SAMPLE}
    FN_OUT=${TARGET}_perbase.txt
    
    ### START Message
    echo ++++++++++++++++++++++++++++++++++++++++++++++++
    echo "Input  file: " ${FD_BED}/${FN_BED}
    echo "Output file: " ${FD_OUT}/${FN_OUT}
    echo
    echo "Show the first few lines of the input file"
    echo ${FD_BED}/${FN_BED}
    head -n 5 ${FD_BED}/${FN_BED}
    echo
    echo "Show the last few lines of the input file"
    echo ${FD_BED}/${FN_BED}
    tail -n 5 ${FD_BED}/${FN_BED}
    echo
    
    ### init: create output folder if not exist
    mkdir -p ${FD_OUT}
    
    ### run: Bedtools genomecov -d to get coverage per base
    echo "Get coverage per base"
    bedtools genomecov -i ${FD_BED}/${FN_BED} -g ${FD_GEN}/${FN_GEN} -d > ${FD_OUT}/${FN_OUT}
    echo
    
    ### END Message
    echo "Show the first few lines of the output file"
    echo ${FD_OUT}/${FN_OUT}
    head -n 5 ${FD_OUT}/${FN_OUT}
    echo
    echo "Show the last few lines of the output file"
    echo ${FD_OUT}/${FN_OUT}
    tail -n 5 ${FD_OUT}/${FN_OUT}
    echo
done
echo "Done!"

EOF

You are on Duke Server: DCC
BASE DIRECTORY:     /work/kk319
WORK DIRECTORY:     /work/kk319/out/CombEffect_STARR
LOG  DIRECTORY:     /work/kk319/out/CombEffect_STARR/log
PATH OF SOURCE:     /work/kk319/source
PATH OF EXECUTABLE: /work/kk319/exe
PATH OF ANNOTATION: /work/kk319/annotation

You are on Duke Server: DCC
Bedtools 2.27.1[m
[K[?1l>Submitted batch job 15006846


**CHECK**

In [26]:
readlink -f ${FD_LOG}/coverage_chrom.0.txt

/work/kk319/out/CombEffect_STARR/log/coverage_chrom.0.txt


In [2]:
cat ${FD_LOG}/coverage_perbase_chrom.0.txt

You are on Duke Server: DCC
BASE DIRECTORY:     /work/kk319
WORK DIRECTORY:     /work/kk319/out/CombEffect_STARR
LOG  DIRECTORY:     /work/kk319/out/CombEffect_STARR/log
PATH OF SOURCE:     /work/kk319/source
PATH OF EXECUTABLE: /work/kk319/exe
PATH OF ANNOTATION: /work/kk319/annotation

Slurm Array Index:  0
RUN: loop through samples; count fragment
++++++++++++++++++++++++++++++++++++++++++++++++
Input  file:  /work/kk319/out/CombEffect_STARR/data/Input//chr1.bed
Output file:  /work/kk319/out/CombEffect_STARR/coverage/Input/chr1_perbase.txt

Show the first few lines of the input file
/work/kk319/out/CombEffect_STARR/data/Input//chr1.bed
chr1	13868	14793
chr1	14843	15828
chr1	14868	15889
chr1	14875	15723
chr1	16771	17773

Show the last few lines of the input file
/work/kk319/out/CombEffect_STARR/data/Input//chr1.bed
chr1	248944005	248944992
chr1	248944015	248944963
chr1	248944029	248944962
chr1	248944048	248944948
chr1	248945363	248946213

Get coverage per base

Show the first few lin

In [3]:
cat ${FD_LOG}/coverage_perbase_chrom.16.txt

You are on Duke Server: DCC
BASE DIRECTORY:     /work/kk319
WORK DIRECTORY:     /work/kk319/out/CombEffect_STARR
LOG  DIRECTORY:     /work/kk319/out/CombEffect_STARR/log
PATH OF SOURCE:     /work/kk319/source
PATH OF EXECUTABLE: /work/kk319/exe
PATH OF ANNOTATION: /work/kk319/annotation

Slurm Array Index:  16
RUN: loop through samples; count fragment
++++++++++++++++++++++++++++++++++++++++++++++++
Input  file:  /work/kk319/out/CombEffect_STARR/data/Input//chr17.bed
Output file:  /work/kk319/out/CombEffect_STARR/coverage/Input/chr17_perbase.txt

Show the first few lines of the input file
/work/kk319/out/CombEffect_STARR/data/Input//chr17.bed
chr17	159510	160362
chr17	182115	183108
chr17	197679	198597
chr17	201123	201925
chr17	201133	201985

Show the last few lines of the input file
/work/kk319/out/CombEffect_STARR/data/Input//chr17.bed
chr17	83236101	83237202
chr17	83240987	83242875
chr17	83241073	83242992
chr17	83241856	83242863
chr17	83244716	83245595

Get coverage per base

Show th

In [4]:
tail -n 3 ${FD_LOG}/coverage_perbase_chrom.*.txt

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.0.txt <==
chr1	248956422	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.1.txt <==
chr2	242193529	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.10.txt <==
chr11	135086622	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.11.txt <==
chr12	133275309	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.12.txt <==
chr13	114364328	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.13.txt <==
chr14	107043718	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.14.txt <==
chr15	101991189	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.15.txt <==
chr16	90338345	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.16.txt <==
chr17	83257441	0

Done!

==> /work/kk319/out/CombEffect_STARR/log/coverage_perbase_chrom.17.txt <==
chr18	80373285	0

Done