**Set environment**

In [1]:
### load the project configuration script; warnings and messages raised
### while sourcing it are silenced
suppressWarnings(suppressMessages(source("../config/config_sing.R")))
### show_env() is not defined in this notebook (presumably it comes from the
### sourced config -- confirm); it prints the environment paths shown below
show_env()

You are in Singularity: singularity_proj_combeffect 
BASE DIRECTORY:     /mount/work 
PATH OF SOURCE:     /mount/work/source 
PATH OF EXECUTABLE: /mount/work/exe 
PATH OF ANNOTATION: /mount/work/annotation 
PATH OF PROJECT:    /mount/project 
PATH OF RESULTS:    /mount/work/out/proj_combeffect_encode_fcc 


**Check data**

In [2]:
### list the entries found under FD_RES
list.files(FD_RES)

In [3]:
### dataset prefix used to build every path in this notebook
prefix = "KS91_K562_ASTARRseq"

### library-size folder for this dataset; list it to see which files exist
fdiry  = file.path(FD_RES, prefix, "coverage", "library_size")
list.files(fdiry)

## Import library size counts

In [4]:
### column names assigned on import (passed to read_csv as col_names)
cnames = c("Fpath", "Count")

### path to the input library-size table
fname = "library_size_input.csv"
fdiry = file.path(FD_RES, prefix, "coverage", "library_size")
fpath = file.path(fdiry, fname)

### read the table and display it
dat_lib_inp = read_csv(file = fpath, col_names = cnames, show_col_types = FALSE)
dat_lib_inp

Fpath,Count
<chr>,<dbl>
KS91_K562_hg38_ASTARRseq_Input_rep1.masked.dedup.fragments.counts.txt.gz,348695063
KS91_K562_hg38_ASTARRseq_Input_rep2.masked.dedup.fragments.counts.txt.gz,451369741
KS91_K562_hg38_ASTARRseq_Input_rep3.masked.dedup.fragments.counts.txt.gz,487579055
KS91_K562_hg38_ASTARRseq_Input_rep4.masked.dedup.fragments.counts.txt.gz,456246254
KS91_K562_hg38_ASTARRseq_Input_rep5.masked.dedup.fragments.counts.txt.gz,444268950
KS91_K562_hg38_ASTARRseq_Input_rep6.masked.dedup.fragments.counts.txt.gz,397333562


In [5]:
### column names assigned on import (passed to read_csv as col_names)
cnames = c("Fpath", "Count")

### path to the output library-size table
fname = "library_size_output.csv"
fdiry = file.path(FD_RES, prefix, "coverage", "library_size")
fpath = file.path(fdiry, fname)

### read the table and display it
dat_lib_out = read_csv(file = fpath, col_names = cnames, show_col_types = FALSE)
dat_lib_out

Fpath,Count
<chr>,<dbl>
KS91_K562_hg38_ASTARRseq_Output_rep1.f3q10.fragments.counts.txt.gz,44103844
KS91_K562_hg38_ASTARRseq_Output_rep2.f3q10.fragments.counts.txt.gz,97471282
KS91_K562_hg38_ASTARRseq_Output_rep3.f3q10.fragments.counts.txt.gz,84103298
KS91_K562_hg38_ASTARRseq_Output_rep4.f3q10.fragments.counts.txt.gz,183115379


## Summarize the information and save the tables

In [6]:
### annotate each input library with Sample / Group / Rep
### The replicate tag is parsed from the file name in Fpath instead of being
### assumed from row position, so labels stay correct if the CSV rows are
### reordered or the number of replicates changes.
dat_inp = dat_lib_inp
dat_inp$Sample = sub("^.*_(rep[0-9]+)\\..*$", "Input_\\1", dat_inp$Fpath)
dat_inp$Group  = "Input"
dat_inp$Rep    = sub("^Input_", "", dat_inp$Sample)

### sub() returns the string unchanged when the pattern does not match,
### so fail loudly if any file name lacks a "_rep<N>." tag
stopifnot(grepl("^rep[0-9]+$", dat_inp$Rep))
dat_inp

Fpath,Count,Sample,Group,Rep
<chr>,<dbl>,<chr>,<chr>,<chr>
KS91_K562_hg38_ASTARRseq_Input_rep1.masked.dedup.fragments.counts.txt.gz,348695063,Input_rep1,Input,rep1
KS91_K562_hg38_ASTARRseq_Input_rep2.masked.dedup.fragments.counts.txt.gz,451369741,Input_rep2,Input,rep2
KS91_K562_hg38_ASTARRseq_Input_rep3.masked.dedup.fragments.counts.txt.gz,487579055,Input_rep3,Input,rep3
KS91_K562_hg38_ASTARRseq_Input_rep4.masked.dedup.fragments.counts.txt.gz,456246254,Input_rep4,Input,rep4
KS91_K562_hg38_ASTARRseq_Input_rep5.masked.dedup.fragments.counts.txt.gz,444268950,Input_rep5,Input,rep5
KS91_K562_hg38_ASTARRseq_Input_rep6.masked.dedup.fragments.counts.txt.gz,397333562,Input_rep6,Input,rep6


In [7]:
### annotate each output library with Sample / Group / Rep
### The replicate tag is parsed from the file name in Fpath instead of being
### assumed from row position, so labels stay correct if the CSV rows are
### reordered or the number of replicates changes.
dat_out = dat_lib_out
dat_out$Sample = sub("^.*_(rep[0-9]+)\\..*$", "Output_\\1", dat_out$Fpath)
dat_out$Group  = "Output"
dat_out$Rep    = sub("^Output_", "", dat_out$Sample)

### sub() returns the string unchanged when the pattern does not match,
### so fail loudly if any file name lacks a "_rep<N>." tag
stopifnot(grepl("^rep[0-9]+$", dat_out$Rep))
dat_out

Fpath,Count,Sample,Group,Rep
<chr>,<dbl>,<chr>,<chr>,<chr>
KS91_K562_hg38_ASTARRseq_Output_rep1.f3q10.fragments.counts.txt.gz,44103844,Output_rep1,Output,rep1
KS91_K562_hg38_ASTARRseq_Output_rep2.f3q10.fragments.counts.txt.gz,97471282,Output_rep2,Output,rep2
KS91_K562_hg38_ASTARRseq_Output_rep3.f3q10.fragments.counts.txt.gz,84103298,Output_rep3,Output,rep3
KS91_K562_hg38_ASTARRseq_Output_rep4.f3q10.fragments.counts.txt.gz,183115379,Output_rep4,Output,rep4


**Combine the results**

In [10]:
### stack the input and output tables, then keep the columns in summary order
dat_lib = dplyr::select(
    bind_rows(dat_inp, dat_out),
    Sample, Group, Rep, Count, Fpath
)
dat_lib

Sample,Group,Rep,Count,Fpath
<chr>,<chr>,<chr>,<dbl>,<chr>
Input_rep1,Input,rep1,348695063,KS91_K562_hg38_ASTARRseq_Input_rep1.masked.dedup.fragments.counts.txt.gz
Input_rep2,Input,rep2,451369741,KS91_K562_hg38_ASTARRseq_Input_rep2.masked.dedup.fragments.counts.txt.gz
Input_rep3,Input,rep3,487579055,KS91_K562_hg38_ASTARRseq_Input_rep3.masked.dedup.fragments.counts.txt.gz
Input_rep4,Input,rep4,456246254,KS91_K562_hg38_ASTARRseq_Input_rep4.masked.dedup.fragments.counts.txt.gz
Input_rep5,Input,rep5,444268950,KS91_K562_hg38_ASTARRseq_Input_rep5.masked.dedup.fragments.counts.txt.gz
Input_rep6,Input,rep6,397333562,KS91_K562_hg38_ASTARRseq_Input_rep6.masked.dedup.fragments.counts.txt.gz
Output_rep1,Output,rep1,44103844,KS91_K562_hg38_ASTARRseq_Output_rep1.f3q10.fragments.counts.txt.gz
Output_rep2,Output,rep2,97471282,KS91_K562_hg38_ASTARRseq_Output_rep2.f3q10.fragments.counts.txt.gz
Output_rep3,Output,rep3,84103298,KS91_K562_hg38_ASTARRseq_Output_rep3.f3q10.fragments.counts.txt.gz
Output_rep4,Output,rep4,183115379,KS91_K562_hg38_ASTARRseq_Output_rep4.f3q10.fragments.counts.txt.gz


**Save the table**

In [11]:
### write the combined table into the same library_size folder it was built from
fname = "library_size_summary.csv"
fdiry = file.path(FD_RES, prefix, "coverage", "library_size")
fpath = file.path(fdiry, fname)

write_csv(dat_lib, fpath)