**Set environment**

In [1]:
### load the project configuration quietly (messages and warnings silenced),
### then print the resolved directory variables
### NOTE(review): show_env() is not defined in this notebook; presumably it
### comes from the sourced config script -- confirm
suppressMessages(
    suppressWarnings(
        source("../run_config_project_sing.R")
    )
)
show_env()

You are working on        Singularity 
BASE DIRECTORY (FD_BASE): /mount 
REPO DIRECTORY (FD_REPO): /mount/repo 
WORK DIRECTORY (FD_WORK): /mount/work 
DATA DIRECTORY (FD_DATA): /mount/data 

You are working with      ENCODE FCC 
PATH OF PROJECT (FD_PRJ): /mount/repo/Proj_ENCODE_FCC 
PROJECT RESULTS (FD_RES): /mount/repo/Proj_ENCODE_FCC/results 
PROJECT SCRIPTS (FD_EXE): /mount/repo/Proj_ENCODE_FCC/scripts 
PROJECT DATA    (FD_DAT): /mount/repo/Proj_ENCODE_FCC/data 
PROJECT NOTE    (FD_NBK): /mount/repo/Proj_ENCODE_FCC/notebooks 
PROJECT DOCS    (FD_DOC): /mount/repo/Proj_ENCODE_FCC/docs 
PROJECT LOG     (FD_LOG): /mount/repo/Proj_ENCODE_FCC/log 
PROJECT APP     (FD_APP): /mount/repo/Proj_ENCODE_FCC/app 
PROJECT REF     (FD_REF): /mount/repo/Proj_ENCODE_FCC/references 



**Set global variables**

In [2]:
### folder name shared by the input directory (FD_DAT/external/<folder>)
### and the output directory (FD_RES/region/<folder>)
TXT_REGION_FOLDER <- "encode_crispri_hcrff"

## Import data

**Check data**

In [3]:
### list the content of the external data folder, one entry per line
txt_folder <- TXT_REGION_FOLDER
txt_fdiry  <- file.path(FD_DAT, "external", txt_folder)
vec <- dir(txt_fdiry)

### cat() separates its arguments with a space, so each line ends in " \n"
invisible(lapply(vec, function(txt_entry){
    cat(txt_entry, "\n")
}))

K562.hg38.ENCSR009KPS.ENCFF514PCW.CRISPRi_HCRFF.signal_R1.HDAC6.bw 
K562.hg38.ENCSR009KPS.ENCFF607OIW.CRISPRi_HCRFF.signal_R2.HDAC6.bw 
K562.hg38.ENCSR009KPS.ENCFF632PQY.CRISPRi_HCRFF.CASA.HDAC6.bed.gz 
K562.hg38.ENCSR157WAN.ENCFF186XBW.CRISPRi_HCRFF.signal_R1.CD164.bw 
K562.hg38.ENCSR157WAN.ENCFF270LYK.CRISPRi_HCRFF.CASA.CD164.bed.gz 
K562.hg38.ENCSR157WAN.ENCFF786CHF.CRISPRi_HCRFF.signal_R2.CD164.bw 
K562.hg38.ENCSR278YTB.ENCFF151MNC.CRISPRi_HCRFF.CASA.FEN1.bed.gz 
K562.hg38.ENCSR278YTB.ENCFF571LUW.CRISPRi_HCRFF.signal_R1.FEN1.bw 
K562.hg38.ENCSR278YTB.ENCFF666DNQ.CRISPRi_HCRFF.signal_R2.FEN1.bw 
K562.hg38.ENCSR321CEH.ENCFF114EMW.CRISPRi_HCRFF.signal_R2.LMO2.bw 
K562.hg38.ENCSR321CEH.ENCFF469FXP.CRISPRi_HCRFF.CASA.LMO2.bed.gz 
K562.hg38.ENCSR321CEH.ENCFF756AUB.CRISPRi_HCRFF.signal_R1.LMO2.bw 
K562.hg38.ENCSR382ZJS.ENCFF090IXH.CRISPRi_HCRFF.signal_R1.FADS1.bw 
K562.hg38.ENCSR382ZJS.ENCFF161WBO.CRISPRi_HCRFF.signal_R2.FADS1.bw 
K562.hg38.ENCSR382ZJS.ENCFF786ZPA.CRISPRi_HCRFF.CASA.FADS1

**Read table**

In [13]:
### set directory
txt_folder = TXT_REGION_FOLDER
txt_fdiry  = file.path(FD_DAT, "external", txt_folder)
txt_fname  = "K562.hg38.*.bed.gz"
txt_fglob  = file.path(txt_fdiry, txt_fname)

### get file paths
vec_txt_fpath = Sys.glob(txt_fglob)

### fail early with a clear message: an empty glob would otherwise produce an
### empty table and only break later, in a cell that expects the columns
if (length(vec_txt_fpath) == 0){
    stop("No files matched: ", txt_fglob)
}

### read table
### the files are read without a header, so readr names the columns X1, X2, ...;
### six of them are kept and given descriptive names
lst = lapply(vec_txt_fpath, function(txt_fpath){
    dat = read_tsv(txt_fpath, col_names = FALSE, show_col_types = FALSE)
    dat = dat %>%
        dplyr::select(
            Chrom        = X1,
            ChromStart   = X2,
            ChromEnd     = X3,
            Score        = X5,
            Gene_Symbol  = X14,
            Gene_Ensembl = X15
        ) %>%
        ### store coordinates as integers: a double such as 100000 is turned
        ### into "1e+05" by paste0()/as.character(), which would corrupt any
        ### region name or BED coordinate derived from it
        dplyr::mutate(
            ChromStart = as.integer(ChromStart),
            ChromEnd   = as.integer(ChromEnd)
        )
    return(dat)
})

### stack the per-file tables into one table
dat = bind_rows(lst)

### show and assign
dat_region_import = dat
fun_display_table(head(dat))

Chrom,ChromStart,ChromEnd,Score,Gene_Symbol,Gene_Ensembl
chrX,48786297,48786997,-1.4253163,HDAC6,ENSG00000094631
chrX,48800297,48801097,1.3966617,HDAC6,ENSG00000094631
chrX,48801697,48802997,2.5875531,HDAC6,ENSG00000094631
chr6,109236645,109237345,0.3466277,CD164,ENSG00000135535
chr6,109301445,109302345,0.2394284,CD164,ENSG00000135535
chr6,109303145,109306545,3.4797733,CD164,ENSG00000135535


In [15]:
### start from the imported regions
dat <- dat_region_import

### add a "chrom:start-end" name, a placeholder strand and the group/label tags
dat <- dplyr::mutate(
    dat,
    Name   = paste0(Chrom, ":", ChromStart, "-", ChromEnd),
    Strand = ".",
    Group  = "CRISPRi-HCRFF",
    Label  = paste0(Group, ":", Gene_Symbol)
)

### fix the column order of the output table
dat <- dplyr::select(
    dat,
    Chrom, ChromStart, ChromEnd, Name, Score, Strand,
    Gene_Symbol, Gene_Ensembl,
    Group, Label
)

### sort by chromosome (character order), then by start and end position
dat <- dplyr::arrange(dat, Chrom, ChromStart, ChromEnd)

### show and assign
dat_region_arrange <- dat
fun_display_table(head(dat))

Chrom,ChromStart,ChromEnd,Name,Score,Strand,Gene_Symbol,Gene_Ensembl,Group,Label
chr11,5248847,5249047,chr11:5248847-5249047,1.068624,.,HBG1,ENST00000330597.5,CRISPRi-HCRFF,CRISPRi-HCRFF:HBG1
chr11,5248847,5249047,chr11:5248847-5249047,0.9357701,.,HBG2,ENST00000336906.6,CRISPRi-HCRFF,CRISPRi-HCRFF:HBG2
chr11,5249847,5250847,chr11:5249847-5250847,1.8908899,.,HBG1,ENST00000330597.5,CRISPRi-HCRFF,CRISPRi-HCRFF:HBG1
chr11,5249847,5250847,chr11:5249847-5250847,1.9229558,.,HBG2,ENST00000336906.6,CRISPRi-HCRFF,CRISPRi-HCRFF:HBG2
chr11,5253147,5253547,chr11:5253147-5253547,1.3303423,.,HBG1,ENST00000330597.5,CRISPRi-HCRFF,CRISPRi-HCRFF:HBG1
chr11,5253147,5253547,chr11:5253147-5253547,1.3232571,.,HBG2,ENST00000336906.6,CRISPRi-HCRFF,CRISPRi-HCRFF:HBG2


In [16]:
### peek at the raw, unrenamed columns of the first matched file
### (read without a header, so the columns appear as X1, X2, ...)
txt_fpath <- vec_txt_fpath[1]
dat <- read_tsv(
    txt_fpath,
    col_names      = FALSE,
    show_col_types = FALSE
)
fun_display_table(head(dat))

X1,X2,X3,X4,X5,X6,X7,X8,X9,X10,X11,X12,X13,X14,X15,X16,X17,X18,X19,X20,X21,X22,X23,X24,X25
chrX,48786297,48786997,chrX:48786297-48786997:.,-1.425316,.,chrX:48786297-48786997:.,chrX,48802033,48802034,+,,,HDAC6,ENSG00000094631,,,True,,,,,,True,
chrX,48800297,48801097,chrX:48800297-48801097:.,1.396662,.,chrX:48800297-48801097:.,chrX,48802033,48802034,+,,,HDAC6,ENSG00000094631,,,True,,,,,,True,
chrX,48801697,48802997,chrX:48801697-48802997:.,2.587553,.,chrX:48801697-48802997:.,chrX,48802033,48802034,+,,,HDAC6,ENSG00000094631,,,True,,,,,,True,


## Save results

**Write tables**

In [13]:
### set directory
txt_folder = TXT_REGION_FOLDER
txt_fdiry  = file.path(FD_RES, "region", txt_folder)

### create the output folder (and any missing parents) without a shell call,
### so the path needs no quoting; an already existing folder is left as is
dir.create(txt_fdiry, recursive = TRUE, showWarnings = FALSE)

### write table: CRISPRi-HCRFF CASA regions
### no header row is written; columns follow the order of dat_region_arrange
### (readr compresses the output because the file name ends in .gz)
txt_fname = "K562.hg38.CRISPRi_HCRFF.CASA.bed.gz"
txt_fpath = file.path(txt_fdiry, txt_fname)

### use the arranged table built earlier in this notebook; the previously
### referenced dat_region_ccres_arrange is never defined here, so the cell
### failed with "object not found" on a fresh kernel
dat = dat_region_arrange
write_tsv(dat, txt_fpath, col_names = FALSE)