# Set environment

In [53]:
library(tidyverse)

In [54]:
library(foreach)

# Import data

In [55]:
# Directory the combined .RData file is written to.
OUTDIR <- "/data/clintko/flow_EQAPOL"
# Directory holding the per-sample flow text files and markers.txt.
DATADIR <- "/data/flow/EQAPOL_normal"

In [56]:
# List the per-sample flow data files in DATADIR: names ending in ".txt",
# excluding the marker annotation file (markers.txt), which is read
# separately from the same directory.
# list.files() replaces the previous `ls | grep` shell pipeline so the
# listing always follows DATADIR and does not depend on a Unix shell.
files <- list.files(DATADIR, pattern = "\\.txt$")
files <- files[!grepl("markers", files)]
print(files)

 [1] "AMJ_5L_CMV_pp65.txt"      "AMJ_5L_Costim.txt"       
 [3] "AMJ_5L_SEB.txt"           "B6901GFJ-08_CMV_pp65.txt"
 [5] "B6901GFJ-08_Costim.txt"   "B6901GFJ-08_SEB.txt"     
 [7] "E6901F0T-07_CMV_pp65.txt" "E6901F0T-07_Costim.txt"  
 [9] "E6901F0T-07_SEB.txt"      "E6901FYZ-01_CMV_pp65.txt"
[11] "E6901FYZ-01_Costim.txt"   "E6901FYZ-01_SEB.txt"     
[13] "F69018CN-01_CMV_pp65.txt" "F69018CN-01_Costim.txt"  
[15] "F69018CN-01_SEB.txt"      "F6901DJK-01_CMV_pp65.txt"
[17] "F6901DJK-01_Costim.txt"   "F6901DJK-01_SEB.txt"     
[19] "G6901B3H-01_CMV_pp65.txt" "G6901B3H-01_Costim.txt"  
[21] "G6901B3H-01_SEB.txt"      "J6901CDB-01_CMV_pp65.txt"
[23] "J6901CDB-01_Costim.txt"   "J6901CDB-01_SEB.txt"     
[25] "J6901HJ1-06_CMV_pp65.txt" "J6901HJ1-06_Costim.txt"  
[27] "J6901HJ1-06_SEB.txt"      "K690194C-01_CMV_pp65.txt"
[29] "K690194C-01_Costim.txt"   "K690194C-01_SEB.txt"     
[31] "K6901DKW-01_CMV_pp65.txt" "K6901DKW-01_Costim.txt"  
[33] "K6901DKW-01_SEB.txt"     


In [57]:
# Derive each sample's stimulation condition from its file name.
# A name matching none of the patterns keeps the file name as its label.
tmp <- files
tmp <- replace(tmp, grepl("Costim", tmp), "Costim")  # negative control
tmp <- replace(tmp, grepl("CMV",    tmp), "CMV")     # CMV peptide stimulation
tmp <- replace(tmp, grepl("SEB",    tmp), "SEB")     # positive control

# Phenotype table: one row per file with its treatment label.
dat_pheno <- data.frame(file_name = files, trt = tmp)

In [58]:
# Display the phenotype table (file name and treatment label per sample).
dat_pheno

file_name,trt
AMJ_5L_CMV_pp65.txt,CMV
AMJ_5L_Costim.txt,Costim
AMJ_5L_SEB.txt,SEB
B6901GFJ-08_CMV_pp65.txt,CMV
B6901GFJ-08_Costim.txt,Costim
B6901GFJ-08_SEB.txt,SEB
E6901F0T-07_CMV_pp65.txt,CMV
E6901F0T-07_Costim.txt,Costim
E6901F0T-07_SEB.txt,SEB
E6901FYZ-01_CMV_pp65.txt,CMV


# Markers

In [59]:
# Read the marker annotation table (headerless CSV with two text columns).
# The column spec must be built with cols(): c(col_character(), ...) collapses
# the collector objects into an empty list, so readr would silently fall back
# to guessing the column types.
dat_markers <- read_csv(
    file.path(DATADIR, "markers.txt"),
    col_names = c("type", "marker"),
    col_types = cols(
        type   = col_character(),
        marker = col_character()))

dat_markers

type,marker
Scatter,FSC-H
Scatter,FSC-W
Scatter,FSC-A
Basic,CD14 CD19 vAmine
Basic,CD3 AmCyan
Basic,CD4 PerCP Cy55
Basic,CD8 APC Cy7
Maturational,CD45RO ECD
Maturational,CD27 APC
Maturational,CD57 FITC


# Flow data

In [36]:
# Display the file names that are read in the next cell.
files

In [40]:
### Column specification: every flow file is parsed as 14 double columns.
coltypes <- rep(list(col_double()), 14)

### Read each file in `files` from DATADIR into a list (one element per file,
### in the same order). Files are space-delimited and read without a header.
dat_raw <- foreach(file = files) %do%
    read_delim(
        file.path(DATADIR, file),
        col_types = coltypes,
        col_names = FALSE,
        delim = " ")

In [42]:
# Number of input files; compare with length(dat_raw).
length(files)

In [41]:
# Number of data sets read; compare with length(files).
length(dat_raw)

In [43]:
# Label each element of dat_raw with the file it was read from.
names(dat_raw) <- files

In [60]:
# Save the raw flow data, marker table and phenotype table together in a
# single .RData file under OUTDIR.
outfile <- file.path(OUTDIR, "EQAPOL_normal.RData")
save(list = c("dat_raw", "dat_markers", "dat_pheno"), file = outfile)