<h1>Table of Contents<span class="tocSkip"></span></h1>
<div class="toc"><ul class="toc-item"><li><span><a href="#Dependencies" data-toc-modified-id="Dependencies-1">Dependencies</a></span></li><li><span><a href="#Functions" data-toc-modified-id="Functions-2">Functions</a></span></li><li><span><a href="#Paths" data-toc-modified-id="Paths-3">Paths</a></span></li><li><span><a href="#Main" data-toc-modified-id="Main-4">Main</a></span><ul class="toc-item"><li><span><a href="#Make-list-of-files-for-pbmc-and-cfdna" data-toc-modified-id="Make-list-of-files-for-pbmc-and-cfdna-4.1">Make list of files for pbmc and cfdna</a></span></li><li><span><a href="#PBMCs" data-toc-modified-id="PBMCs-4.2">PBMCs</a></span></li><li><span><a href="#cfDNA" data-toc-modified-id="cfDNA-4.3">cfDNA</a></span></li><li><span><a href="#PBMCs-and-cfDNA" data-toc-modified-id="PBMCs-and-cfDNA-4.4">PBMCs and cfDNA</a></span></li><li><span><a href="#Tumour-and-PBMCs" data-toc-modified-id="Tumour-and-PBMCs-4.5">Tumour and PBMCs</a></span><ul class="toc-item"><li><span><a href="#407-DLBCL" data-toc-modified-id="407-DLBCL-4.5.1">407 DLBCL</a></span></li><li><span><a href="#404-ERMS" data-toc-modified-id="404-ERMS-4.5.2">404 ERMS</a></span></li><li><span><a href="#394-ERMS" data-toc-modified-id="394-ERMS-4.5.3">394 ERMS</a></span></li><li><span><a href="#372-BL" data-toc-modified-id="372-BL-4.5.4">372 BL</a></span></li><li><span><a href="#370-ALCL" data-toc-modified-id="370-ALCL-4.5.5">370 ALCL</a></span></li><li><span><a href="#364-OS" data-toc-modified-id="364-OS-4.5.6">364 OS</a></span></li><li><span><a href="#361-HD" data-toc-modified-id="361-HD-4.5.7">361 HD</a></span></li></ul></li><li><span><a href="#Tumour-and-cfDNA" data-toc-modified-id="Tumour-and-cfDNA-4.6">Tumour and cfDNA</a></span><ul class="toc-item"><li><span><a href="#361-HD" data-toc-modified-id="361-HD-4.6.1">361 HD</a></span></li><li><span><a href="#370-ALCL" data-toc-modified-id="370-ALCL-4.6.2">370 ALCL</a></span></li><li><span><a href="#372" data-toc-modified-id="372-4.6.3">372</a></span></li><li><span><a href="#401" data-toc-modified-id="401-4.6.4">401</a></span></li><li><span><a href="#380" data-toc-modified-id="380-4.6.5">380</a></span></li></ul></li></ul></li></ul></div>

# Dependencies

In [1]:
library(ggalluvial)
library(randomcoloR)

Loading required package: ggplot2
“package ‘randomcoloR’ was built under R version 3.5.2”

# Functions

In [2]:
cdr3_dataframe.fx <- function(datapath, chain, filelist, totalinframe){
  
  if (!(totalinframe %in% c("total", "inframe"))) {
    stop("Error: unknown argument ", totalinframe, ". Please provide either total (for all clonotypes) or inframe (for in-frame clonotypes only)")
  }  
  
  # Ensure only one chain is included
  filelist <- filelist[grepl(chain, filelist)]
  
  #Compile a big file with patient's mixcr files
  i <- 1
  for (f in filelist){
    mixcrfle <- read.table(paste(datapath, f, sep = ""), 
                           header = TRUE, sep = "\t",
                           stringsAsFactors = FALSE,
                           na.strings = c("", "NA"))
    if(i == 1){
# Remove duplicated CDR3s
    message("duplicated sequences:")
     print(mixcrfle$aaSeqCDR3[duplicated(mixcrfle$aaSeqCDR3)]) 
      compldfle <- mixcrfle[!duplicated(mixcrfle$aaSeqCDR3),]
      compldfle <- cbind(cloneno = row.names(compldfle), 
                         filename = f, 
                         compldfle)
      i <- i + 1   
    }
    else{
      compldfle1 <- mixcrfle[!duplicated(mixcrfle$aaSeqCDR3),]
      compldfle1 <- cbind(cloneno = row.names(compldfle1), 
                          filename = f, 
                          compldfle1)
      compldfle <- rbind(compldfle, compldfle1)
      rm(compldfle1)
    }
  }
  myfiles <- unique(as.character(compldfle$filename))
  message("my files:")
  print(myfiles)
  
  message("Total recovered clonotypes:")
  print(length(compldfle$aaSeqCDR3))    
  
  message("Total out-of-frame clonotypes:")    
  print(length(compldfle$aaSeqCDR3[grepl("_", compldfle$aaSeqCDR3)]))     
  message("Total clonotypes with stop codon:")    
  print(length(compldfle$aaSeqCDR3[grepl("[*]", compldfle$aaSeqCDR3) &
                                     !grepl("_", compldfle$aaSeqCDR3)]))     
  
#make samplename column
  compldfle$filename <- as.character(compldfle$filename)
  compldfle$samplename <- gsub(".*.CLONES_","", compldfle$filename) 
  
# remove out-of-frame clonotypes and those with stop codon    
  compldfle_clean <- compldfle[!grepl("_", compldfle$aaSeqCDR3) &
                                 !grepl("[*]", compldfle$aaSeqCDR3),]
  
  message("Total productive clonotypes:")
  print(length(compldfle_clean$aaSeqCDR3))      
  
  if(totalinframe == "inframe"){
    message("Output contains in_frame clonotypes only")
    return(compldfle_clean)}
  if(totalinframe == "total"){
    message("Output contains all clonotypes")
    return(compldfle)}
}


In [12]:
plot_clonetracks.fx <- function(compldfle, plotpath, chain, countfrac, clnefrc){
  
  if (!(countfrac %in% c("cloneFraction", "cloneCount"))) {
    stop("Error: unknown argument ", countfrac, ". Please provide either cloneFraction or cloneCount.")
  }  
  
  message("list of samples to track clones: ")
  mysamples <- unique(compldfle$samplename)
  print(mysamples)
  
  
# Subset df
  CDR3_fraction <- compldfle[, c("samplename","aaSeqCDR3","cloneFraction", "cloneCount")]
# Subset to include only clonotypes with more than specified clonal fraction    
  CDR3_fraction <- CDR3_fraction[CDR3_fraction$cloneFraction > clnefrc,] 
  
#Assign colors to recurring clonotypes
  recurring <- unique(CDR3_fraction$aaSeqCDR3[duplicated(CDR3_fraction$aaSeqCDR3)])
  notrecurring <- CDR3_fraction$aaSeqCDR3[!CDR3_fraction$aaSeqCDR3 %in% recurring]
  
  message("Total number of recurring clonotypes: ")     
  print(length(recurring))
  
  if(length(recurring) == 0){
#Introduce a dummy common cdr3 dataframe for alluvia 
    mydummy_df <- as.data.frame(matrix(ncol = 4, nrow = length(mysamples)))
    colnames(mydummy_df) <- colnames(CDR3_fraction)
    
    mydummy_df$samplename <- mysamples
    mydummy_df$aaSeqCDR3 <-  "XXXXX"
    mydummy_df$cloneFraction <- 0
    mydummy_df$cloneCount <- 0     
    CDR3_fraction <- rbind(CDR3_fraction, mydummy_df)
    
    recurring <- "XXXXX"
    
  }
  if(length(recurring) > 50){
    recurring_df <- CDR3_fraction[CDR3_fraction$aaSeqCDR3 %in% recurring,]
    recurringcdr3_ordered <- unique(recurring_df$aaSeqCDR3[order(recurring_df$cloneCount, decreasing = TRUE)])
    message("Total number of recurring clonotypes > 50 ")   
    message("Tracking top 10 recurring clonotypes ")  
    myColors <- distinctColorPalette(10)
    
    myColors <- c(myColors, rep("white",length(recurring)-10),
                  rep("white",length(notrecurring)))
    names(myColors) <- c(recurringcdr3_ordered, notrecurring)
    
    message("these are what we color: ")  
    print(myColors[myColors != "white"])         
  }
  else{
    myColors <- distinctColorPalette(length(recurring))
    myColors <- c(myColors, rep("white",length(notrecurring)))
    names(myColors) <- c(recurring, notrecurring)
    
    myColors[names(myColors) == "XXXXX"] <- "white"
    
    message("these are what we color: ")  
    print(myColors[myColors != "white"]) 
  }
  
# Generate a row for each sample that doesnot have recurring clonotype
## This ensures alluvia are colored
  
  for(c in recurring){
    tmp <- CDR3_fraction[CDR3_fraction$aaSeqCDR3 == c,]
    nonexsiting <- mysamples[!mysamples %in% tmp$samplename]
    if(length(nonexsiting) > 0){
      newentries <- data.frame("samplename" = nonexsiting, "aaSeqCDR3" = c, 
                               "cloneFraction" = 0, "cloneCount" = 0)
      CDR3_fraction <- rbind(CDR3_fraction, newentries)
    }
  }
  
  
  p <-  ggplot(CDR3_fraction, aes(x = samplename, 
                                  y = eval(as.name(countfrac)),
                                  fill = aaSeqCDR3,
                                  stratum = aaSeqCDR3,
                                  alluvium = aaSeqCDR3,
                                  label = aaSeqCDR3))
  
  myp <- p + geom_alluvium(decreasing = FALSE) + 
    geom_stratum(decreasing = FALSE, stat = "alluvium") + 
    scale_fill_manual(breaks = names(myColors[myColors != "white"]),
                      values = myColors) +
    theme(axis.title.y = element_text(size = 50),
          axis.title.x = element_blank(),
          axis.line = element_line(color = "black"),
          axis.text = element_text(size = 50),
          axis.text.x = element_text(angle = 45, hjust = 1)) +
    theme(panel.grid.major = element_blank(),
          panel.grid.minor = element_blank(),
          panel.background = element_rect(fill = "transparent",colour = NA),
          legend.key = element_rect(fill = "white", colour = "white"),
          legend.position = "none",
          plot.margin = unit(c(0.2,0,0,0),"cm")) + 
    labs(y = countfrac) 
  
  pdf(paste0(plotpath, "clonetrack_cfDNA", mysamples[1],
             chain, countfrac, ".pdf"),
      width = 15, 
      height = 20,
      useDingbats = FALSE,
      onefile = FALSE)       
  print(myp)  
  dev.off()      
  
}

# Paths

In [4]:
datapath <- "/Users/anabbi/OneDrive - UHN/Documents/INTERCEPT/Data/Nextseq/"
plotpath <- "/Users/anabbi/OneDrive - UHN/Documents/INTERCEPT/Plots/"

# Main

In [5]:
master_df <- read.csv("/Users/anabbi/OneDrive - UHN/Documents/INTERCEPT/Data/ATC_Tcells_NCR.csv",
                      stringsAsFactors = F)

In [6]:
master_df[ master_df$Patient == "364",]

Unnamed: 0_level_0,Patient,cycle,FOLD,ATC,Age,Disease_type,TE_fold,Pass,CD3,EM,⋯,TIM3,CTLA4,PD1.,PDL1.,LAG3.,TIM3.,CTLA4.,Any.NCR,PD1...LAG3...TIM3,group
Unnamed: 0_level_1,<int>,<int>,<dbl>,<dbl>,<dbl>,<chr>,<chr>,<lgl>,<int>,<int>,⋯,<int>,<int>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<chr>
171,364,1,2.3,877.68,16,OS,2.3,,2411,33.0,⋯,303.0,,12.5674,,5.060141,12.5674,,,,Solid
172,364,2,1.9,0.0,16,OS,1.9,,2487,18.0,⋯,153.0,,6.15199,,5.589063,6.15199,,,,Solid
173,364,3,0.0,0.0,16,OS,0.0,,0,,⋯,,,,,,,,,,Solid
174,364,4,4.0,0.0,16,OS,4.0,,2454,9.0,⋯,610.0,,24.85738,,19.845151,24.85738,,,,Solid
175,364,5,5.0,0.0,16,OS,5.0,,2119,103.0,⋯,586.0,,27.65455,,4.341671,27.65455,,,,Solid


## Make list of files for pbmc and cfdna

In [21]:
flelst <- list.files(datapath,
                     recursive = TRUE,
                     pattern = paste("CLONES", "TRB", sep = "_"))

# subset to include only downsampled files
ds_flelst <- flelst[grepl("2000000", flelst)]

# remove normals
ds_flelst_normalrm <- ds_flelst[!grepl("batchNormal", ds_flelst)]

ds_flelst_chp_PBMC <- ds_flelst_normalrm[grepl("PBMC", ds_flelst_normalrm)]
ds_flelst_chp_cfDNA <- ds_flelst_normalrm[grepl("cfDNA", ds_flelst_normalrm)]
ds_flelst_chp_ffpe <- ds_flelst_normalrm[grepl("FFPE", ds_flelst_normalrm)]

## PBMCs

In [22]:
manifest_df <- cbind.data.frame(ds_flelst_chp_PBMC, NA,NA,stringsAsFactors = F)

colnames(manifest_df) <- c("filename", "patient", "cycle")

In [23]:
manifest_df$filename <- gsub(".*CLONES", "CLONES", manifest_df$filename)

manifest_df$patient <- gsub("CLONES_TRBCHP_", "", manifest_df$filename)
manifest_df$patient <- gsub("-.*", "", manifest_df$patient)

manifest_df$cycle <- substr(manifest_df$filename, 19,20)
#manifest_df$cycle <- gsub("-PBMC-DNA_2000000.txt", "", manifest_df$cycle)

In [10]:
ptlist <- as.data.frame(table(manifest_df$patient))

In [11]:
for(pt in ptlist$Var1[ptlist$Freq > 2]){
    print(pt)
    tmp <- ds_flelst_chp_PBMC[grepl(pt, ds_flelst_chp_PBMC)]
    cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
    cdr3df$samplename <- gsub("-DNA.*", "", cdr3df$samplename)
    cdr3df$samplename <- gsub("_DNA.*", "", cdr3df$samplename)
    cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)
    plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)
}

[1] "323"


duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_323-03-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_323-04-PBMC-DNA_2000000.txt"
[3] "batch7/ds_batch7/CLONES_TRBCHP_323-05-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 254


Total out-of-frame clonotypes:


[1] 55


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 196


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_323-03-PBMC" "CHP_323-04-PBMC" "CHP_323-05-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "338"


duplicated sequences:


[1] "CASTKSRGQ_HYSNQPQHF" "CAIRPGQGDTGELFF"    


my files:


[1] "batch2/ds_batch2/CLONES_TRBCHP_338-04-PBMC-DNA_2000000.txt"
[2] "batch2/ds_batch2/CLONES_TRBCHP_338-05-PBMC-DNA_2000000.txt"
[3] "batch4/ds_batch4/CLONES_TRBCHP_338-03-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 1012


Total out-of-frame clonotypes:


[1] 202


Total clonotypes with stop codon:


[1] 16


Total productive clonotypes:


[1] 794


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_338-04-PBMC" "CHP_338-05-PBMC" "CHP_338-03-PBMC"


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSFNTEAFF 
  "#BEB3B2" 
[1] "340"


duplicated sequences:


 [1] "CAISRTDNSPLHF"       "CASSKAGE_VALGALHF"   "CASSQEGPLGRSYNSPLHF"
 [4] "CASSGDVRGPKLGEQYF"   "CASSQTGSGRPGELFF"    "CASSGPGTGGSEQYF"    
 [7] "CASSEVLAVYEQYF"      "CASSPATSGREQYF"      "CASNRGLDYGYTF"      
[10] "CAGL_EAFF"          


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_340-05-PBMC-DNA_2000000.txt"  
[2] "batch4/ds_batch4/CLONES_TRBCHP_340-03-PBMC-DNA_2000000.txt"  
[3] "batch6a/ds_batch6a/CLONES_TRBCHP_340-04-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 869


Total out-of-frame clonotypes:


[1] 193


Total clonotypes with stop codon:


[1] 19


Total productive clonotypes:


[1] 657


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_340-05-PBMC" "CHP_340-03-PBMC" "CHP_340-04-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "343"


duplicated sequences:


character(0)


my files:


[1] "batch2/ds_batch2/CLONES_TRBCHP_343-02-PBMC-DNA_2000000.txt"
[2] "batch2/ds_batch2/CLONES_TRBCHP_343-03-PBMC-DNA_2000000.txt"
[3] "batch2/ds_batch2/CLONES_TRBCHP_343-04-PBMC-DNA_2000000.txt"
[4] "batch4/ds_batch4/CLONES_TRBCHP_343-05-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 119


Total out-of-frame clonotypes:


[1] 21


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 97


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_343-02-PBMC" "CHP_343-03-PBMC" "CHP_343-04-PBMC" "CHP_343-05-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "344"


duplicated sequences:


[1] "CASSQDKCSGGVLTDTQYF" "CASSVSPRLAGTSQFF"    "CASSLVPYEQYF"       


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_344-05-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_344-02-PBMC-DNA_2000000.txt"
[3] "batch7/ds_batch7/CLONES_TRBCHP_344-03-PBMC-DNA_2000000.txt"
[4] "batch8/ds_batch8/CLONES_TRBCHP_344-04-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 244


Total out-of-frame clonotypes:


[1] 32


Total clonotypes with stop codon:


[1] 5


Total productive clonotypes:


[1] 207


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_344-05-PBMC" "CHP_344-02-PBMC" "CHP_344-03-PBMC" "CHP_344-04-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "345"


duplicated sequences:


[1] "CASSPGQGALYSNQPQHF" "CASSPGQGALYSNQPQHF"


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_345-04-PBMC-DNA_2000000.txt"
[2] "batch3/ds_batch3/CLONES_TRBCHP_345-05-PBMC-DNA_2000000.txt"
[3] "batch4/ds_batch4/CLONES_TRBCHP_345-02-PBMC-DNA_2000000.txt"
[4] "batch7/ds_batch7/CLONES_TRBCHP_345-03-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 717


Total out-of-frame clonotypes:


[1] 179


Total clonotypes with stop codon:


[1] 11


Total productive clonotypes:


[1] 527


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_345-04-PBMC" "CHP_345-05-PBMC" "CHP_345-02-PBMC" "CHP_345-03-PBMC"


Total number of recurring clonotypes: 


[1] 14


these are what we color: 


                                                                CASSPDGPRGTQYF 
                                                                     "#D9D298" 
                                                                  CASTYNDNEQFF 
                                                                     "#80E8D7" 
                                                               CAISESGGSHNEQFF 
                                                                     "#797CD8" 
                                                               CASSPDRGGRDGYTF 
                                                                     "#DFD553" 
                                                               CASSQGLAGSYEQYF 
                                                                     "#7EB6D8" 
                                                             CASSHISDLPNPYEQYF 
                                                                     "#D2B0E1" 
                                        

duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_347-01-PBMC-DNA_2000000.txt"  
[2] "batch4/ds_batch4/CLONES_TRBCHP_347-02-PBMC-DNA_2000000.txt"  
[3] "batch6a/ds_batch6a/CLONES_TRBCHP_347-04-PBMC-DNA_2000000.txt"
[4] "batch7/ds_batch7/CLONES_TRBCHP_347-03-PBMC-DNA_2000000.txt"  
[5] "batch8/ds_batch8/CLONES_TRBCHP_347-05-PBMC-DNA_2000000.txt"  


Total recovered clonotypes:


[1] 863


Total out-of-frame clonotypes:


[1] 155


Total clonotypes with stop codon:


[1] 13


Total productive clonotypes:


[1] 695


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_347-01-PBMC" "CHP_347-02-PBMC" "CHP_347-04-PBMC" "CHP_347-03-PBMC"
[5] "CHP_347-05-PBMC"


Total number of recurring clonotypes: 


[1] 2


these are what we color: 


CASNFAGGMSTGELFF    CSARTGGVYEQYF 
       "#BF8ACA"        "#B7D39D" 
[1] "348"


duplicated sequences:


[1] "CAWDREREQYF"


my files:


[1] "batch1/ds_batch1/CLONES_TRBCHP_348-03-PBMC-DNA_2000000.txt"
[2] "batch1/ds_batch1/CLONES_TRBCHP_348-04-PBMC-DNA_2000000.txt"
[3] "batch2/ds_batch2/CLONES_TRBCHP_348-01-PBMC-DNA_2000000.txt"
[4] "batch2/ds_batch2/CLONES_TRBCHP_348-02-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 313


Total out-of-frame clonotypes:


[1] 56


Total clonotypes with stop codon:


[1] 7


Total productive clonotypes:


[1] 250


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_348-03-PBMC" "CHP_348-04-PBMC" "CHP_348-01-PBMC" "CHP_348-02-PBMC"


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASRPIAGGGADTQYF 
       "#BEB3B2" 
[1] "350"


duplicated sequences:


[1] "CASSHRQGE_SGANVLTF"


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_350-01-PBMC-DNA_2000000.txt"
[2] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_350-02-PBMC-DNA_2000000.txt"
[3] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_350-03-PBMC-DNA_2000000.txt"
[4] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_350-04-PBMC-DNA_2000000.txt"
[5] "batch3/ds_batch3/CLONES_TRBCHP_350-05-PBMC-DNA_2000000.txt"          


Total recovered clonotypes:


[1] 889


Total out-of-frame clonotypes:


[1] 181


Total clonotypes with stop codon:


[1] 16


Total productive clonotypes:


[1] 692


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_350-01-PBMC" "CHP_350-02-PBMC" "CHP_350-03-PBMC" "CHP_350-04-PBMC"
[5] "CHP_350-05-PBMC"


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSLGGPYEQYF 
    "#BEB3B2" 
[1] "353"


duplicated sequences:


[1] "CASSEAGAGELFF"


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_353-02-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_353-01-PBMC-DNA_2000000.txt"          
[3] "batch7/ds_batch7/CLONES_TRBCHP_353-03-PBMC-DNA_2000000.txt"          
[4] "batch7/ds_batch7/CLONES_TRBCHP_353-05-PBMC-DNA_2000000.txt"          


Total recovered clonotypes:


[1] 864


Total out-of-frame clonotypes:


[1] 148


Total clonotypes with stop codon:


[1] 15


Total productive clonotypes:


[1] 701


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_353-02-PBMC" "CHP_353-01-PBMC" "CHP_353-03-PBMC" "CHP_353-05-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "356"


duplicated sequences:


character(0)


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_356-03-PBMC-DNA_2000000.txt"
[2] "batch1/ds_batch1/CLONES_TRBCHP_356-05-PBMC-DNA_2000000.txt"          
[3] "batch8/ds_batch8/CLONES_TRBCHP_356-02-PBMC-DNA_2000000.txt"          


Total recovered clonotypes:


[1] 111


Total out-of-frame clonotypes:


[1] 19


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 89


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_356-03-PBMC" "CHP_356-05-PBMC" "CHP_356-02-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "357"


duplicated sequences:


[1] "CASSHLTVGGGYEQYF" "CASSARQ_QGSPLHF"  "CSPSQTSGDNEQFF"  


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_357-01-PBMC-DNA_2000000.txt"  
[2] "batch6a/ds_batch6a/CLONES_TRBCHP_357-03-PBMC-DNA_2000000.txt"
[3] "batch7/ds_batch7/CLONES_TRBCHP_357-04-PBMC-DNA_2000000.txt"  
[4] "batch8/ds_batch8/CLONES_TRBCHP_357-02-PBMC-DNA_2000000.txt"  


Total recovered clonotypes:


[1] 1042


Total out-of-frame clonotypes:


[1] 270


Total clonotypes with stop codon:


[1] 31


Total productive clonotypes:


[1] 741


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_357-01-PBMC" "CHP_357-03-PBMC" "CHP_357-04-PBMC" "CHP_357-02-PBMC"


Total number of recurring clonotypes: 


[1] 3


these are what we color: 


                  CASRLGWIV_TGGHEQYF                      CASRKLDREGNTIYF 
                           "#B9D77A"                            "#BD70C8" 
CASSESTVLHSCLLSMPS_CDFHLDPCHCVNTEAFF 
                           "#B7C2C8" 
[1] "358"


duplicated sequences:


character(0)


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_358-02-PBMC-DNA_2000000.txt"
[2] "batch1/ds_batch1/CLONES_TRBCHP_358-01-PBMC-DNA_2000000.txt"          
[3] "batch3/ds_batch3/CLONES_TRBCHP_358-03-PBMC-DNA_2000000.txt"          
[4] "batch3/ds_batch3/CLONES_TRBCHP_358-05-PBMC-DNA_2000000.txt"          


Total recovered clonotypes:


[1] 1501


Total out-of-frame clonotypes:


[1] 288


Total clonotypes with stop codon:


[1] 23


Total productive clonotypes:


[1] 1190


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_358-02-PBMC" "CHP_358-01-PBMC" "CHP_358-03-PBMC" "CHP_358-05-PBMC"


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSHSSYNSPLHF 
     "#BEB3B2" 
[1] "359"


duplicated sequences:


[1] "CASSQEAGGAEAFF"


my files:


[1] "batch6a/ds_batch6a/CLONES_TRBCHP_359-02-PBMC-DNA_2000000.txt"
[2] "batch6a/ds_batch6a/CLONES_TRBCHP_359-04-PBMC-DNA_2000000.txt"
[3] "batch7/ds_batch7/CLONES_TRBCHP_359-01-PBMC-DNA_2000000.txt"  


Total recovered clonotypes:


[1] 828


Total out-of-frame clonotypes:


[1] 143


Total clonotypes with stop codon:


[1] 12


Total productive clonotypes:


[1] 673


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_359-02-PBMC" "CHP_359-04-PBMC" "CHP_359-01-PBMC"


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSEAGGNQPQHF 
     "#BEB3B2" 
[1] "360"


duplicated sequences:


[1] "CASSDYRTS_EGPEAKYF" "CASSFSGQGGYEQYF"   


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_360-03-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_360-02-PBMC-DNA_2000000.txt"
[3] "batch8/ds_batch8/CLONES_TRBCHP_360-05-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 795


Total out-of-frame clonotypes:


[1] 154


Total clonotypes with stop codon:


[1] 14


Total productive clonotypes:


[1] 627


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_360-03-PBMC" "CHP_360-02-PBMC" "CHP_360-05-PBMC"


Total number of recurring clonotypes: 


[1] 4


these are what we color: 


    CASSPLYEQYF CASSLGQGIVAEAFF   CAISESVHNEQFF CASSETSGSTDTQYF 
      "#BBDB73"       "#B570D4"       "#D89FA5"       "#9CD1CF" 
[1] "361"


duplicated sequences:


[1] "CASSDKTANEKLFF"    "CASRPGGALISTDTQYF" "CASSFRLDSNEKLFF"  


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_361-02-PBMC-DNA_2000000.txt"
[2] "batch3/ds_batch3/CLONES_TRBCHP_361-03-PBMC-DNA_2000000.txt"
[3] "batch4/ds_batch4/CLONES_TRBCHP_361-01-PBMC-DNA_2000000.txt"
[4] "batch7/ds_batch7/CLONES_TRBCHP_361-04-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 333


Total out-of-frame clonotypes:


[1] 74


Total clonotypes with stop codon:


[1] 5


Total productive clonotypes:


[1] 254


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_361-02-PBMC" "CHP_361-03-PBMC" "CHP_361-01-PBMC" "CHP_361-04-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "362"


duplicated sequences:


[1] "CASSQDLPGA_NTSNYGYTF" "CASETGGLMNTEAFF"      "CSARVIGAGNQPQHF"     
[4] "CASSFPGQVEKLFF"       "CASGTSQPQHF"         


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_362-02-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_362-01-PBMC-DNA_2000000.txt"          
[3] "batch7/ds_batch7/CLONES_TRBCHP_362-03-PBMC-DNA_2000000.txt"          
[4] "batch7/ds_batch7/CLONES_TRBCHP_362-04-PBMC-DNA_2000000.txt"          


Total recovered clonotypes:


[1] 691


Total out-of-frame clonotypes:


[1] 151


Total clonotypes with stop codon:


[1] 13


Total productive clonotypes:


[1] 527


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_362-02-PBMC" "CHP_362-01-PBMC" "CHP_362-03-PBMC" "CHP_362-04-PBMC"


Total number of recurring clonotypes: 


[1] 3


these are what we color: 


 CASSLGLA_SSYNEQFF CASRQYRLGRGPNQPQHF    CSARDGQAGDTEAFF 
         "#B6C2C8"          "#BD70C8"          "#BAD679" 
[1] "364"


duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_364-01-PBMC-DNA_2000000.txt"
[2] "batch4/ds_batch4/CLONES_TRBCHP_364-02-PBMC-DNA_2000000.txt"
[3] "batch4/ds_batch4/CLONES_TRBCHP_364-04-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 360


Total out-of-frame clonotypes:


[1] 72


Total clonotypes with stop codon:


[1] 8


Total productive clonotypes:


[1] 280


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_364-01-PBMC" "CHP_364-02-PBMC" "CHP_364-04-PBMC"


Total number of recurring clonotypes: 


[1] 2


these are what we color: 


CAISGPGTSGRAQDTQYF     CASSGLAGADTQYF 
         "#B7D39D"          "#BF8ACA" 
[1] "368"


duplicated sequences:


[1] "CASSLQGMGGYTF"   "CASSAANTDTQYF"   "CASSERTALNTEAFF" "CASSLAPGNTEAFF" 
[5] "CSASGSL_TDTQYF"  "CASSPFHTDTQYF"   "CASSLTSDTQYF"   


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_368-05-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_368-01-PBMC-DNA_2000000.txt"
[3] "batch7/ds_batch7/CLONES_TRBCHP_368-04-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 924


Total out-of-frame clonotypes:


[1] 238


Total clonotypes with stop codon:


[1] 20


Total productive clonotypes:


[1] 666


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_368-05-PBMC" "CHP_368-01-PBMC" "CHP_368-04-PBMC"


Total number of recurring clonotypes: 


[1] 15


these are what we color: 


                                              CASSQESSPIGTEAFF 
                                                     "#DAB0E2" 
                                               CASSGSGTVWETQYF 
                                                     "#7978D9" 
                                         CASSQDLGETLLFMNTGELFF 
                                                     "#E46749" 
                                               CASSAGGTANTEAFF 
                                                     "#75E8A8" 
                                              CASSKGAC_TNEKLFF 
                                                     "#7DAB8B" 
                                                CASTLPN_GKKLFF 
                                                     "#E2D151" 
                                                 CASSQSYYLEQFF 
                                                     "#83ABD8" 
     CASSGSGTVWETQYFGPGTRLLVLGERG_AGARARAAWVWFLRGVPGLCSGANVLTF 
                                        

duplicated sequences:


[1] "CASSDSGGQGRKDSNQPQHF" "CASSSPGTRGGGELFF"     "CASSLPGTGSYEQYF"     
[4] "CASSLGWGNTEAFF"       "CASSVGGGSEAFF"       


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_370-02-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_370-01-PBMC-DNA_2000000.txt"
[3] "batch7/ds_batch7/CLONES_TRBCHP_370-05-PBMC-DNA_2000000.txt"
[4] "batch8/ds_batch8/CLONES_TRBCHP_370-03-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 1123


Total out-of-frame clonotypes:


[1] 194


Total clonotypes with stop codon:


[1] 25


Total productive clonotypes:


[1] 904


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_370-02-PBMC" "CHP_370-01-PBMC" "CHP_370-05-PBMC" "CHP_370-03-PBMC"


Total number of recurring clonotypes: 


[1] 4


these are what we color: 


CASSIGGTLWAGGTEAFF    CASSLGTLPNQPQHF   CASRSGGYSYNSPLHF     CASSDSSGANVLTF 
         "#98D7C8"          "#C0D66C"          "#B667D3"          "#CCA4BA" 
[1] "373"


duplicated sequences:


[1] "CASSLGARSSGSYNEQFF" "CASSQEYSTDTQYF"    


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_373-01-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_373-02-PBMC-DNA_2000000.txt"
[3] "batch8/ds_batch8/CLONES_TRBCHP_373-03-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 452


Total out-of-frame clonotypes:


[1] 102


Total clonotypes with stop codon:


[1] 9


Total productive clonotypes:


[1] 341


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_373-01-PBMC" "CHP_373-02-PBMC" "CHP_373-03-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "374"


duplicated sequences:


[1] "CASRNRVTTDTQYF" "CASSLF_AREAFF" 


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_374-03-PBMC-DNA_2000000.txt"
[2] "batch3/ds_batch3/CLONES_TRBCHP_374-04-PBMC-DNA_2000000.txt"
[3] "batch3/ds_batch3/CLONES_TRBCHP_374-05-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 265


Total out-of-frame clonotypes:


[1] 66


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 197


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_374-03-PBMC" "CHP_374-04-PBMC" "CHP_374-05-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "375"


duplicated sequences:


character(0)


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_375-01-PBMC-DNA_2000000.txt"
[2] "batch11/CLONES_TRBCHP_375-05_PBMC_DNA_2000000.txt"                   
[3] "batch7/ds_batch7/CLONES_TRBCHP_375-02-PBMC-DNA_2000000.txt"          


Total recovered clonotypes:


[1] 855


Total out-of-frame clonotypes:


[1] 168


Total clonotypes with stop codon:


[1] 22


Total productive clonotypes:


[1] 665


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_375-01-PBMC" "CHP_375-05_PBMC" "CHP_375-02-PBMC"


Total number of recurring clonotypes: 


[1] 4


these are what we color: 


  CASSELAGGYNEQFF    CASSFAPGVSEQYF CASSPEFQGVSGNTIYF   CASSDSSGGANEQFF 
        "#ADCAD4"         "#B3DE7E"         "#D99277"         "#B971D0" 
[1] "378"


duplicated sequences:


[1] "CASSPGTGDNSPLHF"                                        
[2] "CASRRGPELFFGEGSRLTVLGKEAVGAPESSERAGWAEVSSCPTLRGAVLRGAAG"
[3] "CASSEGVSSYNSPLHF"                                       
[4] "CASSLAGGGGYGYTF"                                        
[5] "CASTQRWGPNTEAFF"                                        
[6] "CASSPFRSYNEQFF"                                         
[7] "CAISEVSTYGYTF"                                          


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_378-01-PBMC-DNA_2000000.txt"
[2] "batch7/ds_batch7/CLONES_TRBCHP_378-02-PBMC-DNA_2000000.txt"
[3] "batch8/ds_batch8/CLONES_TRBCHP_378-04-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 1161


Total out-of-frame clonotypes:


[1] 244


Total clonotypes with stop codon:


[1] 20


Total productive clonotypes:


[1] 897


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_378-01-PBMC" "CHP_378-02-PBMC" "CHP_378-04-PBMC"


Total number of recurring clonotypes: 


[1] 13


these are what we color: 


             CASSQTLA_GNQETQYF                 CASSHSTVNTEAFF 
                     "#72DEBA"                      "#8DE265" 
                   CAWSPNTEAFF             CASS*PLTG_QNDSPLHF 
                     "#824DDF"                      "#DC5CCB" 
              CASSGDRQVYPNEQFF                CASSGIELAKNIQYF 
                     "#D8A2DD"                      "#E0D557" 
                CASSHDWDTNTQYF               CASSQGAGFVNTEAFF 
                     "#D5A882"                      "#B86F88" 
                   CAWSPATEAFF CASSLDTV*QRLGGF_SGPGRLCSGNTIYF 
                     "#7E94DD"                      "#CBDEA8" 
                CASSPGDLNTEAFF               CASSGLPI_PDYEQYF 
                     "#D6CDDB"                      "#7DC7D4" 
               CASSDLGGARETQYF 
                     "#E36842" 
[1] "380"


duplicated sequences:


character(0)


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_380-02-PBMC-DNA_2000000.txt"
[2] "batch8/ds_batch8/CLONES_TRBCHP_380-03-PBMC-DNA_2000000.txt"
[3] "batch8/ds_batch8/CLONES_TRBCHP_380-05-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 196


Total out-of-frame clonotypes:


[1] 36


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 159


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_380-02-PBMC" "CHP_380-03-PBMC" "CHP_380-05-PBMC"


Total number of recurring clonotypes: 


[1] 10


these are what we color: 


     CASRSGSTEAFF CASSFKRGFSGANVLTF CASSEPPGANSYNEQFF   CASSPRSGDQETQYF 
        "#C2CEDA"         "#D0D39E"         "#74D7C6"         "#8395DB" 
      CASGFGGELFF CASSDDLTGGYTDTQYF   CASSHQGNTYNEQFF       CAKDG_REGHF 
        "#DCD855"         "#D3A2C3"         "#D968BF"         "#86E272" 
 CSARDLIR_QSYEQYF     CASSFSLPYEQYF 
        "#9E50E0"         "#DE7B58" 
[1] "382"


duplicated sequences:


[1] "CAWSVFSGYSYNEQFF"


my files:


[1] "batch11/CLONES_TRBCHP_382-03_PBMC_DNA_2000000.txt"         
[2] "batch11/CLONES_TRBCHP_382-04_PBMC_DNA_2000000.txt"         
[3] "batch8/ds_batch8/CLONES_TRBCHP_382-02-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 191


Total out-of-frame clonotypes:


[1] 50


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 139


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_382-03_PBMC" "CHP_382-04_PBMC" "CHP_382-02-PBMC"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "387"


duplicated sequences:


 [1] "CAWSVGGG_NTGELFF"                                                                 
 [2] "CASSKPRR_TGDEKLFF"                                                                
 [3] "CASSYREGQPQHF"                                                                    
 [4] "CASSLTPGAYNEQFFGPGTRLTVLGKKGAPGGREGEQPSL_TTPEPCS*GSGHWAIQGPPRGKRGLRQGPQGCANTGELFF"
 [5] "CASSLLGGARETQYFGPGTRLLVLGERG_AGARARAAWVWFLRGVPGLCSGANVLTF"                        
 [6] "CASSASGPGLAGGDSYNEQFF"                                                            
 [7] "CASSLAGQYFVTNEKLFF"                                                               
 [8] "CASSNGLAGGGSYEQYF"                                                                
 [9] "CASSQDNS_VLPNEQFF"                                                                
[10] "CASSESGTAGSYEQYF"                                                                 
[11] "CASSLGVGYPEDEQFF"                                                                 
[12] "CASSYSSQNTGELFF

my files:


[1] "batch11/CLONES_TRBCHP_387-02_PBMC_DNA_2000000.txt"         
[2] "batch11/CLONES_TRBCHP_387-03_PBMC_DNA_2000000.txt"         
[3] "batch8/ds_batch8/CLONES_TRBCHP_387-01-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 1171


Total out-of-frame clonotypes:


[1] 274


Total clonotypes with stop codon:


[1] 23


Total productive clonotypes:


[1] 874


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_387-02_PBMC" "CHP_387-03_PBMC" "CHP_387-01-PBMC"


Total number of recurring clonotypes: 


[1] 16


these are what we color: 


           CASSRNTQPQVGRSNEQFF                 CASRSSGSYNEQFF 
                     "#D1DFD9"                      "#D88DE3" 
                  CASSLVRGEAFF               CASS*WDR_GPETQYF 
                     "#CCDE9E"                      "#8FE545" 
                   CASSQ_FGYTF                CASSAGGQVNQPQHF 
                     "#DA4CB4"                      "#BB728D" 
               CASF*RG_YQETQYF                 CASSYSSGANVLTF 
                     "#869DDE"                      "#72DFC8" 
                  CASSLGTDTQYF             CASSLIVRDRAMNTEAFF 
                     "#E0D355"                      "#E36D43" 
                CASSPTGVYEKLFF                 CASRQRLAKNIQYF 
                     "#AE3FE8"                      "#85DF85" 
CASSLDTV*QRLGGF_SGPGRLCSGNTIYF        CATSDLTSGGSSSGGWVYNEQFF 
                     "#D0A885"                      "#DCBDDE" 
               CASSSLRGSNQPQHF                 CASSDLTGFKGYTF 
                     "#78BBCC"                      "#7

## cfDNA

In [24]:
manifest_df_cfdna <- cbind.data.frame(ds_flelst_chp_cfDNA, NA,NA,stringsAsFactors = F)

colnames(manifest_df_cfdna) <- c("filename", "patient", "cycle")

In [25]:
manifest_df_cfdna$filename <- gsub(".*CLONES", "CLONES", manifest_df_cfdna$filename)

manifest_df_cfdna$patient <- gsub("CLONES_TRBCHP_", "", manifest_df_cfdna$filename)
manifest_df_cfdna$patient <- gsub("-.*", "", manifest_df_cfdna$patient)

manifest_df_cfdna$cycle <- substr(manifest_df_cfdna$filename, 19,20)

In [26]:
ptlist_cfdna <- as.data.frame(table(manifest_df_cfdna$patient))

In [105]:
for(pt in ptlist_cfdna$Var1[ptlist_cfdna$Freq > 2]){
    print(pt)
    tmp <- ds_flelst_chp_cfDNA[grepl(pt, ds_flelst_chp_cfDNA)]
    cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
    cdr3df$samplename <- gsub("-cfDNA.*", "-cfDNA", cdr3df$samplename)
    cdr3df$samplename <- gsub("_cfDNA.*", "-cfDNA", cdr3df$samplename)
    cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)
    plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)
}

[1] "336"


my files:


[1] "batch10_cfDNA/CLONES_TRBCHP_336-03_cfDNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_336-04_cfDNA_2000000.txt"
[3] "batch10_cfDNA/CLONES_TRBCHP_336-05_cfDNA_2000000.txt"


Total recovered clonotypes:


[1] 34


Total out-of-frame clonotypes:


[1] 10


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 21


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_336-03-cfDNA" "CHP_336-04-cfDNA" "CHP_336-05-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "344"


my files:


[1] "batch3a9_cfDNA/CLONES_TRBCHP_344-02_cfDNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_344-04_cfDNA_2000000.txt"
[3] "batch3a9_cfDNA/CLONES_TRBCHP_344-05_cfDNA_2000000.txt"
[4] "batch5_cfDNA/CLONES_TRBCHP_344-01_cfDNA_2000000.txt"  


Total recovered clonotypes:


[1] 22


Total out-of-frame clonotypes:


[1] 3


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 19


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_344-02-cfDNA" "CHP_344-04-cfDNA" "CHP_344-05-cfDNA" "CHP_344-01-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "347"


my files:


[1] "batch1_cfDNA/CLONES_TRBCHP_347-01-cfDNA_2000000.txt" 
[2] "batch10_cfDNA/CLONES_TRBCHP_347-04_cfDNA_2000000.txt"
[3] "batch5_cfDNA/CLONES_TRBCHP_347-02_cfDNA_2000000.txt" 


Total recovered clonotypes:


[1] 14


Total out-of-frame clonotypes:


[1] 2


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 11


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_347-01-cfDNA" "CHP_347-04-cfDNA" "CHP_347-02-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "351"


my files:


[1] "batch10_cfDNA/CLONES_TRBCHP_351-04_cfDNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_351-05_cfDNA_2000000.txt"
[3] "batch5_cfDNA/CLONES_TRBCHP_351-03_cfDNA_2000000.txt" 


Total recovered clonotypes:


[1] 15


Total out-of-frame clonotypes:


[1] 2


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 13


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_351-04-cfDNA" "CHP_351-05-cfDNA" "CHP_351-03-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "353"


my files:


[1] "batch1_cfDNA/CLONES_TRBCHP_353-01-cfDNA_2000000.txt"  
[2] "batch10_cfDNA/CLONES_TRBCHP_353-05_cfDNA_2000000.txt" 
[3] "batch3a9_cfDNA/CLONES_TRBCHP_353-02_cfDNA_2000000.txt"
[4] "batch3a9_cfDNA/CLONES_TRBCHP_353-04_cfDNA_2000000.txt"


Total recovered clonotypes:


[1] 139


Total out-of-frame clonotypes:


[1] 24


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 114


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_353-01-cfDNA" "CHP_353-05-cfDNA" "CHP_353-02-cfDNA" "CHP_353-04-cfDNA"


Total number of recurring clonotypes: 


[1] 2


these are what we color: 


                                             CASSLRGNEAFF 
                                                "#B8D49F" 
CAWSGNPEAFFGQGTRLTVVGKTFFRFF_QIRHREKWVHSVPFRVAIFLCANYGYTF 
                                                "#BB82C9" 
[1] "357"


my files:


[1] "batch1_cfDNA/CLONES_TRBCHP_357-03-cfDNA_2000000.txt"  
[2] "batch3a9_cfDNA/CLONES_TRBCHP_357-01_cfDNA_2000000.txt"
[3] "batch3a9_cfDNA/CLONES_TRBCHP_357-04_cfDNA_2000000.txt"
[4] "batch5_cfDNA/CLONES_TRBCHP_357-05_cfDNA_2000000.txt"  


Total recovered clonotypes:


[1] 56


Total out-of-frame clonotypes:


[1] 14


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 40


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_357-03-cfDNA" "CHP_357-01-cfDNA" "CHP_357-04-cfDNA" "CHP_357-05-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "358"


my files:


[1] "batch10_cfDNA/CLONES_TRBCHP_358-02_cfDNA_2000000.txt" 
[2] "batch3a9_cfDNA/CLONES_TRBCHP_358-01_cfDNA_2000000.txt"
[3] "batch3a9_cfDNA/CLONES_TRBCHP_358-03_cfDNA_2000000.txt"


Total recovered clonotypes:


[1] 143


Total out-of-frame clonotypes:


[1] 27


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 116


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_358-02-cfDNA" "CHP_358-01-cfDNA" "CHP_358-03-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "359"


my files:


[1] "batch1_cfDNA/CLONES_TRBCHP_359-01-cfDNA_2000000.txt"  
[2] "batch1_cfDNA/CLONES_TRBCHP_359-04-cfDNA_2000000.txt"  
[3] "batch3a9_cfDNA/CLONES_TRBCHP_359-02_cfDNA_2000000.txt"


Total recovered clonotypes:


[1] 76


Total out-of-frame clonotypes:


[1] 13


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 63


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_359-01-cfDNA" "CHP_359-04-cfDNA" "CHP_359-02-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "361"


my files:


[1] "batch10_cfDNA/CLONES_TRBCHP_361-02_cfDNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_361-01_cfDNA_2000000.txt" 
[3] "batch5_cfDNA/CLONES_TRBCHP_361-03_cfDNA_2000000.txt" 
[4] "batch5_cfDNA/CLONES_TRBCHP_361-05_cfDNA_2000000.txt" 


Total recovered clonotypes:


[1] 108


Total out-of-frame clonotypes:


[1] 29


Total clonotypes with stop codon:


[1] 5


Total productive clonotypes:


[1] 74


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_361-02-cfDNA" "CHP_361-01-cfDNA" "CHP_361-03-cfDNA" "CHP_361-05-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "366"


my files:


[1] "batch1_cfDNA/CLONES_TRBCHP_366-02-cfDNA_2000000.txt"  
[2] "batch10_cfDNA/CLONES_TRBCHP_366-04_cfDNA_2000000.txt" 
[3] "batch3a9_cfDNA/CLONES_TRBCHP_366-01_cfDNA_2000000.txt"
[4] "batch5_cfDNA/CLONES_TRBCHP_366-05_cfDNA_2000000.txt"  


Total recovered clonotypes:


[1] 41


Total out-of-frame clonotypes:


[1] 17


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 23


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_366-02-cfDNA" "CHP_366-04-cfDNA" "CHP_366-01-cfDNA" "CHP_366-05-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "368"


my files:


[1] "batch1_cfDNA/CLONES_TRBCHP_368-05-cfDNA_2000000.txt"  
[2] "batch3a9_cfDNA/CLONES_TRBCHP_368-02_cfDNA_2000000.txt"
[3] "batch5_cfDNA/CLONES_TRBCHP_368-01_cfDNA_2000000.txt"  


Total recovered clonotypes:


[1] 37


Total out-of-frame clonotypes:


[1] 7


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 29


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_368-05-cfDNA" "CHP_368-02-cfDNA" "CHP_368-01-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "371"


my files:


[1] "batch1_cfDNA/CLONES_TRBCHP_371-01-cfDNA_2000000.txt"  
[2] "batch1_cfDNA/CLONES_TRBCHP_371-03-cfDNA_2000000.txt"  
[3] "batch3a9_cfDNA/CLONES_TRBCHP_371-04_cfDNA_2000000.txt"


Total recovered clonotypes:


[1] 15


Total out-of-frame clonotypes:


[1] 6


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 9


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_371-01-cfDNA" "CHP_371-03-cfDNA" "CHP_371-04-cfDNA"


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
[1] "385"


my files:


[1] "batch7_cfDNA/CLONES_TRBCHP_385-01_cfDNA_2000000.txt"
[2] "batch7_cfDNA/CLONES_TRBCHP_385-02_cfDNA_2000000.txt"
[3] "batch7_cfDNA/CLONES_TRBCHP_385-03_cfDNA_2000000.txt"


Total recovered clonotypes:


[1] 9


Total out-of-frame clonotypes:


[1] 4


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 5


Output contains all clonotypes
list of samples to track clones: 


[1] "CHP_385-01-cfDNA" "CHP_385-02-cfDNA" "CHP_385-03-cfDNA"


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSLDTV*QRLGGF_SGPGRLCSGNTIYF 
                     "#BDB3B1" 


## PBMCs and cfDNA

In [27]:
manifest_cfdna_pbmc <- merge(manifest_df_cfdna, manifest_df, by = c("patient", "cycle"))

In [28]:
manifest_cfdna_pbmc

patient,cycle,filename.x,filename.y
<chr>,<chr>,<chr>,<chr>
323,3,CLONES_TRBCHP_323-03_cfDNA_2000000.txt,CLONES_TRBCHP_323-03-PBMC-DNA_2000000.txt
338,3,CLONES_TRBCHP_338-03_cfDNA_2000000.txt,CLONES_TRBCHP_338-03-PBMC-DNA_2000000.txt
339,3,CLONES_TRBCHP_339-03_cfDNA_2000000.txt,CLONES_TRBCHP_339-03-PBMC-DNA_2000000.txt
340,3,CLONES_TRBCHP_340-03_cfDNA_2000000.txt,CLONES_TRBCHP_340-03-PBMC-DNA_2000000.txt
344,2,CLONES_TRBCHP_344-02_cfDNA_2000000.txt,CLONES_TRBCHP_344-02-PBMC-DNA_2000000.txt
344,4,CLONES_TRBCHP_344-04_cfDNA_2000000.txt,CLONES_TRBCHP_344-04-PBMC-DNA_2000000.txt
344,5,CLONES_TRBCHP_344-05_cfDNA_2000000.txt,CLONES_TRBCHP_344-05-PBMC-DNA_2000000.txt
345,2,CLONES_TRBCHP_345-02_cfDNA_2000000.txt,CLONES_TRBCHP_345-02-PBMC-DNA_2000000.txt
347,1,CLONES_TRBCHP_347-01-cfDNA_2000000.txt,CLONES_TRBCHP_347-01-PBMC-DNA_2000000.txt
347,2,CLONES_TRBCHP_347-02_cfDNA_2000000.txt,CLONES_TRBCHP_347-02-PBMC-DNA_2000000.txt


In [29]:
for(i in 1:nrow(manifest_cfdna_pbmc)){
    cfdnafile <- ds_flelst_chp_cfDNA[grepl(manifest_cfdna_pbmc$filename.x[i], ds_flelst_chp_cfDNA)]
    pbmcfile <- ds_flelst_chp_PBMC[grepl(manifest_cfdna_pbmc$filename.y[i], ds_flelst_chp_PBMC)]
    tmp <- c(pbmcfile, cfdnafile)
    
    cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
    cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)       
    cdr3df$samplename <- gsub("-cfDNA.*", "-cfDNA", cdr3df$samplename)
    cdr3df$samplename <- gsub("_cfDNA.*", "-cfDNA", cdr3df$samplename)
    cdr3df$samplename <- gsub("-PBMC.*", "-PBMC", cdr3df$samplename)
    cdr3df$samplename <- gsub("_PBMC.*", "-PBMC", cdr3df$samplename)

    cdr3df$samplename <- factor(cdr3df$samplename, levels = c(unique(cdr3df$samplename[grepl("PBMC",cdr3df$samplename)]),
                                                              unique(cdr3df$samplename[grepl("cfDNA",cdr3df$samplename)])))
    
    plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)
}

duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_323-03-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_323-03_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 168


Total out-of-frame clonotypes:


[1] 35


Total clonotypes with stop codon:


[1] 4


Total productive clonotypes:


[1] 129


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_323-03-PBMC  CHP_323-03-cfDNA
Levels: CHP_323-03-PBMC CHP_323-03-cfDNA


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSPQGGPHNEQFF 
      "#BEB3B2" 


duplicated sequences:


 [1] "CSAPGQGGGTEAFFGQGTRLTVVGKTFFRF_LQIRHREKWVHSVPFRVAIFLCANYGYTF"  
 [2] "CASSEQGSVTEAFFGQGTRLTVVGKTFFRF_LQIRHREKWVHSVPFRVAIFLCANYGYTF"  
 [3] "CASSLGLGSGVNTGELFFGEGSRLTVLGKEAVGAPESSERAGWAEVSSCPTLRGAVLRGAAG"
 [4] "CASSVGPSTYNEQFF"                                               
 [5] "CSTQGSRESTEAFF"                                                
 [6] "CAR*WDRSKTFIGFTDTQYF"                                          
 [7] "CAWSPGGFLQPSPLHF"                                              
 [8] "CASTAGGASKNIQYF"                                               
 [9] "CASSPNLGGNTEAFF"                                               
[10] "CATRL*R_INQPQHF"                                               


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_338-03-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_338-03_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 596


Total out-of-frame clonotypes:


[1] 129


Total clonotypes with stop codon:


[1] 12


Total productive clonotypes:


[1] 455


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_338-03-PBMC  CHP_338-03-cfDNA
Levels: CHP_338-03-PBMC CHP_338-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSFPGRNTEAFFGQGTRLTVVGKTFFRF_LQIRHREKWVHSVPFRVAIFLCANYGYTF"


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_339-03-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_339-03_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 35


Total out-of-frame clonotypes:


[1] 6


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 27


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_339-03-PBMC  CHP_339-03-cfDNA
Levels: CHP_339-03-PBMC CHP_339-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASHMNTEAFF"


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_340-03-PBMC-DNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_340-03_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 104


Total out-of-frame clonotypes:


[1] 21


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 82


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_340-03-PBMC  CHP_340-03-cfDNA
Levels: CHP_340-03-PBMC CHP_340-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_344-02-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_344-02_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 16


Total out-of-frame clonotypes:


[1] 2


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 14


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_344-02-PBMC  CHP_344-02-cfDNA
Levels: CHP_344-02-PBMC CHP_344-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch8/ds_batch8/CLONES_TRBCHP_344-04-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_344-04_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 95


Total out-of-frame clonotypes:


[1] 13


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 80


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_344-04-PBMC  CHP_344-04-cfDNA
Levels: CHP_344-04-PBMC CHP_344-04-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSQDKCSGGVLTDTQYF" "CASSVSPRLAGTSQFF"    "CASSLVPYEQYF"       


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_344-05-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_344-05_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 134


Total out-of-frame clonotypes:


[1] 18


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 113


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_344-05-PBMC  CHP_344-05-cfDNA
Levels: CHP_344-05-PBMC CHP_344-05-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSQG_GLQQYF"


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_345-02-PBMC-DNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_345-02_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 184


Total out-of-frame clonotypes:


[1] 48


Total clonotypes with stop codon:


[1] 4


Total productive clonotypes:


[1] 132


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_345-02-PBMC  CHP_345-02-cfDNA
Levels: CHP_345-02-PBMC CHP_345-02-cfDNA


Total number of recurring clonotypes: 


[1] 7


these are what we color: 


          CASRHQPQHF      CASSQGLAGSYEQYF         CASTYNDNEQFF 
           "#B2A6D7"            "#DCD066"            "#8FE275" 
     CASSHLGQGHTEAFF CATSDLLA*L_REAVDTQYF        CASSFF_*GGYTF 
           "#BC5ED1"            "#7BD6CA"            "#D6D2C0" 
 CASFPDFGG_PPPTDTQYF 
           "#D5786B" 


duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_347-01-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_347-01-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 173


Total out-of-frame clonotypes:


[1] 36


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 136


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_347-01-PBMC  CHP_347-01-cfDNA
Levels: CHP_347-01-PBMC CHP_347-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSLPRGPSSYNEQFF"


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_347-02-PBMC-DNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_347-02_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 380


Total out-of-frame clonotypes:


[1] 68


Total clonotypes with stop codon:


[1] 8


Total productive clonotypes:


[1] 304


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_347-02-PBMC  CHP_347-02-cfDNA
Levels: CHP_347-02-PBMC CHP_347-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch6a/ds_batch6a/CLONES_TRBCHP_347-04-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_347-04_cfDNA_2000000.txt"        


Total recovered clonotypes:


[1] 78


Total out-of-frame clonotypes:


[1] 9


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 68


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_347-04-PBMC  CHP_347-04-cfDNA
Levels: CHP_347-04-PBMC CHP_347-04-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASKRWTGGQTEAFF"


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_351-04-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_351-04_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 119


Total out-of-frame clonotypes:


[1] 32


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 84


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_351-04-PBMC  CHP_351-04-cfDNA
Levels: CHP_351-04-PBMC CHP_351-04-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSPAVNTIYF"


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_353-01-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_353-01-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 262


Total out-of-frame clonotypes:


[1] 49


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 211


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_353-01-PBMC  CHP_353-01-cfDNA
Levels: CHP_353-01-PBMC CHP_353-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSEAGAGELFF"


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_353-02-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_353-02_cfDNA_2000000.txt"               


Total recovered clonotypes:


[1] 49


Total out-of-frame clonotypes:


[1] 8


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 38


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_353-02-PBMC  CHP_353-02-cfDNA
Levels: CHP_353-02-PBMC CHP_353-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSVGGNSNQPQHF"  "CASSEWGG_LQETQYF" "CASSSRGQGDNEQFF" 


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_353-05-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_353-05_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 442


Total out-of-frame clonotypes:


[1] 73


Total clonotypes with stop codon:


[1] 6


Total productive clonotypes:


[1] 363


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_353-05-PBMC  CHP_353-05-cfDNA
Levels: CHP_353-05-PBMC CHP_353-05-cfDNA


Total number of recurring clonotypes: 


[1] 2


these are what we color: 


   CASSLRGNEAFF CASSPGGNSNQPQHF 
      "#B7D39D"       "#BF8ACA" 


duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_355-01-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_355-01-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 19


Total out-of-frame clonotypes:


[1] 2


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 15


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_355-01-PBMC  CHP_355-01-cfDNA
Levels: CHP_355-01-PBMC CHP_355-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch8/ds_batch8/CLONES_TRBCHP_356-02-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_356-02-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 115


Total out-of-frame clonotypes:


[1] 21


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 91


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_356-02-PBMC  CHP_356-02-cfDNA
Levels: CHP_356-02-PBMC CHP_356-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSHLTVGGGYEQYF" "CASSARQ_QGSPLHF"  "CSPSQTSGDNEQFF"  


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_357-01-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_357-01_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 337


Total out-of-frame clonotypes:


[1] 86


Total clonotypes with stop codon:


[1] 8


Total productive clonotypes:


[1] 243


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_357-01-PBMC  CHP_357-01-cfDNA
Levels: CHP_357-01-PBMC CHP_357-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch6a/ds_batch6a/CLONES_TRBCHP_357-03-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_357-03-cfDNA_2000000.txt"         


Total recovered clonotypes:


[1] 115


Total out-of-frame clonotypes:


[1] 30


Total clonotypes with stop codon:


[1] 6


Total productive clonotypes:


[1] 79


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_357-03-PBMC  CHP_357-03-cfDNA
Levels: CHP_357-03-PBMC CHP_357-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_357-04-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_357-04_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 85


Total out-of-frame clonotypes:


[1] 20


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 62


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_357-04-PBMC  CHP_357-04-cfDNA
Levels: CHP_357-04-PBMC CHP_357-04-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch1/ds_batch1/CLONES_TRBCHP_358-01-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_358-01_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 95


Total out-of-frame clonotypes:


[1] 21


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 74


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_358-01-PBMC  CHP_358-01-cfDNA
Levels: CHP_358-01-PBMC CHP_358-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_358-02-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_358-02_cfDNA_2000000.txt"                


Total recovered clonotypes:


[1] 95


Total out-of-frame clonotypes:


[1] 17


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 78


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_358-02-PBMC  CHP_358-02-cfDNA
Levels: CHP_358-02-PBMC CHP_358-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSPIGRGGYTF"                                                                    
[2] "CASSLEQRSYNEQFFGPGTRLTVLGKKGAPGGREGEQPSL_TTPEPCS*GSGHWAIQGPPRGKRGLRQGPQGCANTGELFF"
[3] "CAIRGVLLQG_AEGNQPQHF"                                                             
[4] "CASSYELVARWAQDTEAFF"                                                              
[5] "CASSSRGREDTEAFF"                                                                  
[6] "CASSFFLEGTDTQYF"                                                                  
[7] "CASSFGVNTEAFF"                                                                    


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_358-03-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_358-03_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 742


Total out-of-frame clonotypes:


[1] 136


Total clonotypes with stop codon:


[1] 9


Total productive clonotypes:


[1] 597


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_358-03-PBMC  CHP_358-03-cfDNA
Levels: CHP_358-03-PBMC CHP_358-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_359-01-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_359-01-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 38


Total out-of-frame clonotypes:


[1] 8


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 30


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_359-01-PBMC  CHP_359-01-cfDNA
Levels: CHP_359-01-PBMC CHP_359-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSQEAGGAEAFF"


my files:


[1] "batch6a/ds_batch6a/CLONES_TRBCHP_359-02-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_359-02_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 522


Total out-of-frame clonotypes:


[1] 97


Total clonotypes with stop codon:


[1] 6


Total productive clonotypes:


[1] 419


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_359-02-PBMC  CHP_359-02-cfDNA
Levels: CHP_359-02-PBMC CHP_359-02-cfDNA


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASRGENYMNTEAFF 
      "#BEB3B2" 


duplicated sequences:


[1] "CASSWRLAAGELFF"


my files:


[1] "batch6a/ds_batch6a/CLONES_TRBCHP_359-04-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_359-04-cfDNA_2000000.txt"         


Total recovered clonotypes:


[1] 344


Total out-of-frame clonotypes:


[1] 51


Total clonotypes with stop codon:


[1] 6


Total productive clonotypes:


[1] 287


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_359-04-PBMC  CHP_359-04-cfDNA
Levels: CHP_359-04-PBMC CHP_359-04-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASWTGFPNYEQYF"  "CASTQGRDGPGELFF" "CASSLAGQSNQPQHF" "CASSQANTEAFF"   


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_360-02-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_360-02-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 308


Total out-of-frame clonotypes:


[1] 58


Total clonotypes with stop codon:


[1] 7


Total productive clonotypes:


[1] 243


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_360-02-PBMC  CHP_360-02-cfDNA
Levels: CHP_360-02-PBMC CHP_360-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_361-01-PBMC-DNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_361-01_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 198


Total out-of-frame clonotypes:


[1] 46


Total clonotypes with stop codon:


[1] 5


Total productive clonotypes:


[1] 147


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_361-01-PBMC  CHP_361-01-cfDNA
Levels: CHP_361-01-PBMC CHP_361-01-cfDNA


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSLGGQGMGEQYF 
      "#BEB3B2" 


duplicated sequences:


[1] "CASSDKTANEKLFF"    "CASRPGGALISTDTQYF" "CASSFRLDSNEKLFF"  


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_361-02-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_361-02_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 132


Total out-of-frame clonotypes:


[1] 34


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 96


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_361-02-PBMC  CHP_361-02-cfDNA
Levels: CHP_361-02-PBMC CHP_361-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_361-03-PBMC-DNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_361-03_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 66


Total out-of-frame clonotypes:


[1] 14


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 49


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_361-03-PBMC  CHP_361-03-cfDNA
Levels: CHP_361-03-PBMC CHP_361-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_362-03-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_362-03_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 125


Total out-of-frame clonotypes:


[1] 27


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 97


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_362-03-PBMC  CHP_362-03-cfDNA
Levels: CHP_362-03-PBMC CHP_362-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_362-04-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_362-04_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 32


Total out-of-frame clonotypes:


[1] 11


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 21


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_362-04-PBMC  CHP_362-04-cfDNA
Levels: CHP_362-04-PBMC CHP_362-04-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSQDPSGGAGELFF" "CASSLARNTGELFF"  


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_363-02-PBMC-DNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_363-02_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 275


Total out-of-frame clonotypes:


[1] 60


Total clonotypes with stop codon:


[1] 6


Total productive clonotypes:


[1] 209


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_363-02-PBMC  CHP_363-02-cfDNA
Levels: CHP_363-02-PBMC CHP_363-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch4/ds_batch4/CLONES_TRBCHP_364-02-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_364-02_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 101


Total out-of-frame clonotypes:


[1] 25


Total clonotypes with stop codon:


[1] 1


Total productive clonotypes:


[1] 75


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_364-02-PBMC  CHP_364-02-cfDNA
Levels: CHP_364-02-PBMC CHP_364-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSPPSGRGPYNEQFF" "CATSIDRGPYEQYF"   


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_366-01-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_366-01_cfDNA_2000000.txt"               


Total recovered clonotypes:


[1] 171


Total out-of-frame clonotypes:


[1] 37


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 132


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_366-01-PBMC  CHP_366-01-cfDNA
Levels: CHP_366-01-PBMC CHP_366-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSQGQVGHEKLFF" "CASSKRTGSYEQYF" 


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_368-01-PBMC-DNA_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_368-01_cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 301


Total out-of-frame clonotypes:


[1] 65


Total clonotypes with stop codon:


[1] 9


Total productive clonotypes:


[1] 227


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_368-01-PBMC  CHP_368-01-cfDNA
Levels: CHP_368-01-PBMC CHP_368-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSLQGMGGYTF"   "CASSAANTDTQYF"   "CASSERTALNTEAFF" "CASSLAPGNTEAFF" 
[5] "CSASGSL_TDTQYF"  "CASSPFHTDTQYF"   "CASSLTSDTQYF"   


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_368-05-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_368-05-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 552


Total out-of-frame clonotypes:


[1] 150


Total clonotypes with stop codon:


[1] 10


Total productive clonotypes:


[1] 392


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_368-05-PBMC  CHP_368-05-cfDNA
Levels: CHP_368-05-PBMC CHP_368-05-cfDNA


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSGSGTVWETQYF 
      "#BEB3B2" 


duplicated sequences:


[1] "CASSSMDRAGNTIYF" "CASSLSSSYEQFF"  


my files:


[1] "batch8/ds_batch8/CLONES_TRBCHP_369-02-PBMC-DNA_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_369-02_cfDNA_2000000.txt"      


Total recovered clonotypes:


[1] 315


Total out-of-frame clonotypes:


[1] 86


Total clonotypes with stop codon:


[1] 10


Total productive clonotypes:


[1] 219


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_369-02-PBMC  CHP_369-02-cfDNA
Levels: CHP_369-02-PBMC CHP_369-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_370-01-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_370-01-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 89


Total out-of-frame clonotypes:


[1] 14


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 73


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_370-01-PBMC  CHP_370-01-cfDNA
Levels: CHP_370-01-PBMC CHP_370-01-cfDNA


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASRGLSGNIQYF 
    "#BEB3B2" 


duplicated sequences:


character(0)


my files:


[1] "batch8/ds_batch8/CLONES_TRBCHP_370-03-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_370-03_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 337


Total out-of-frame clonotypes:


[1] 67


Total clonotypes with stop codon:


[1] 8


Total productive clonotypes:


[1] 262


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_370-03-PBMC  CHP_370-03-cfDNA
Levels: CHP_370-03-PBMC CHP_370-03-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


character(0)


my files:


[1] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_372-01-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_372-01-cfDNA_2000000.txt"                 


Total recovered clonotypes:


[1] 8


Total out-of-frame clonotypes:


[1] 1


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 7


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_372-01-PBMC  CHP_372-01-cfDNA
Levels: CHP_372-01-PBMC CHP_372-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSLGARSSGSYNEQFF" "CASSQEYSTDTQYF"    


my files:


[1] "batch3/ds_batch3/CLONES_TRBCHP_373-01-PBMC-DNA_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_373-01-cfDNA_2000000.txt"       


Total recovered clonotypes:


[1] 258


Total out-of-frame clonotypes:


[1] 54


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 202


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_373-01-PBMC  CHP_373-01-cfDNA
Levels: CHP_373-01-PBMC CHP_373-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CSARTGGRVTQYF"     "CASSQGVV_RGSYEQYF" "CASSSRTSEYTGELFF" 


my files:


[1] "batch7/ds_batch7/CLONES_TRBCHP_373-02-PBMC-DNA_2000000.txt"
[2] "batch3a9_cfDNA/CLONES_TRBCHP_373-02_cfDNA_2000000.txt"     


Total recovered clonotypes:


[1] 134


Total out-of-frame clonotypes:


[1] 35


Total clonotypes with stop codon:


[1] 3


Total productive clonotypes:


[1] 96


Output contains all clonotypes
list of samples to track clones: 


[1] CHP_373-02-PBMC  CHP_373-02-cfDNA
Levels: CHP_373-02-PBMC CHP_373-02-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


duplicated sequences:


[1] "CASSSRGAPGAVRYNEQFF" "CASSLSRLAGFLSYEQYF"  "CASSMTAASTDTQYF"    


ERROR: Error in data.frame(..., check.names = FALSE): arguments imply differing number of rows: 0, 1


## Tumour and PBMCs

In [155]:
manifest_df_ffpe <- cbind.data.frame(ds_flelst_chp_ffpe, NA,stringsAsFactors = F)

colnames(manifest_df_ffpe) <- c("filename", "patient")

In [156]:
manifest_df_ffpe$filename <- gsub(".*CLONES", "CLONES", manifest_df_ffpe$filename)

manifest_df_ffpe$patient <- gsub("CLONES_TRBCHP_", "", manifest_df_ffpe$filename)
manifest_df_ffpe$patient <- gsub("-.*", "", manifest_df_ffpe$patient)
manifest_df_ffpe$patient <- gsub("_.*", "", manifest_df_ffpe$patient)

In [157]:
manifest_df_ffpe$patient

I have to do all separately to make sure levels are correct

344, 380, 400, 401, doesnt have baseline pbmc
348 doesnt have ffpe
389, 390 412 418 419 no pbmc

In [158]:
master_df[ master_df$Patient == "387",]

Unnamed: 0_level_0,Patient,cycle,FOLD,ATC,Age,Disease_type,TE_fold,Pass,CD3,EM,⋯,TIM3,CTLA4,PD1.,PDL1.,LAG3.,TIM3.,CTLA4.,Any.NCR,PD1...LAG3...TIM3,group
Unnamed: 0_level_1,<int>,<int>,<dbl>,<dbl>,<dbl>,<chr>,<chr>,<lgl>,<int>,<int>,⋯,<int>,<int>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<chr>
286,387,1,0.8,288.99,13,T-ALL,0.8,,2414,209.0,⋯,100.0,,4.142502,,9.444905,4.142502,,,,Leukemia
287,387,2,4.9,254.8,13,T-ALL,4.9,,1387,0.0,⋯,254.0,,18.312906,,20.475847,18.312906,,,,Leukemia
288,387,3,,483.72,13,T-ALL,x,,2356,60.0,⋯,160.0,,60.836502,,109.125475,60.836502,,,,Leukemia
289,387,4,0.0,0.0,13,T-ALL,0,,0,,⋯,,,,,,,,,,Leukemia
290,387,5,0.0,0.0,13,T-ALL,0,,0,,⋯,,,,,,,,,,Leukemia


### 407 DLBCL

In [159]:
ffpefile <- ds_flelst_chp_ffpe[grepl("407", ds_flelst_chp_ffpe)]
pbmcfiles <- ds_flelst_chp_PBMC[grepl("407", ds_flelst_chp_PBMC)]
tmp <- c(ffpefile, pbmcfiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("_DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S7_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


character(0)


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_407-FFPE-DNA_S7_2000000.txt"
[2] "batch11/CLONES_TRBCHP_407-01_PBMC_DNA_2000000.txt"               
[3] "batch11/CLONES_TRBCHP_407-02_PBMC_DNA_2000000.txt"               


Total recovered clonotypes:


[1] 584


Total out-of-frame clonotypes:


[1] 147


Total clonotypes with stop codon:


[1] 15


Total productive clonotypes:


[1] 422


Output contains all clonotypes


In [160]:
unique(cdr3df$samplename)

In [161]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_407-FFPE", "CHP_407-01_PBMC", "CHP_407-02_PBMC"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_407-FFPE    CHP_407-01_PBMC CHP_407-02_PBMC
Levels: CHP_407-FFPE CHP_407-01_PBMC CHP_407-02_PBMC


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSYSIDQEFNEKLFF 
        "#BDB3B1" 


### 404 ERMS

In [162]:
ffpefile <- ds_flelst_chp_ffpe[grepl("404_B", ds_flelst_chp_ffpe)]
pbmcfiles <- ds_flelst_chp_PBMC[grepl("404", ds_flelst_chp_PBMC)]
tmp <- c(ffpefile, pbmcfiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("_DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


character(0)


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_404_B-FFPE-DNA_2000000.txt"
[2] "batch11/CLONES_TRBCHP_404-01_PBMC_DNA_2000000.txt"              
[3] "batch11/CLONES_TRBCHP_404-02_PBMC_DNA_2000000.txt"              


Total recovered clonotypes:


[1] 529


Total out-of-frame clonotypes:


[1] 93


Total clonotypes with stop codon:


[1] 13


Total productive clonotypes:


[1] 423


Output contains all clonotypes


In [163]:
unique(cdr3df$samplename)

In [164]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_404_B-FFPE", "CHP_404-01_PBMC", "CHP_404-02_PBMC"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_404_B-FFPE  CHP_404-01_PBMC CHP_404-02_PBMC
Levels: CHP_404_B-FFPE CHP_404-01_PBMC CHP_404-02_PBMC


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSFIGAEYVRETQYF 
        "#BDB3B1" 


### 394 ERMS

In [165]:
ffpefile <- ds_flelst_chp_ffpe[grepl("394", ds_flelst_chp_ffpe)]
pbmcfiles <- ds_flelst_chp_PBMC[grepl("394", ds_flelst_chp_PBMC)]
tmp <- c(ffpefile, pbmcfiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("-DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S4_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


character(0)


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_394-FFPE-DNA_S4_2000000.txt"
[2] "batch8/ds_batch8/CLONES_TRBCHP_394-01-PBMC-DNA_2000000.txt"      
[3] "batch8/ds_batch8/CLONES_TRBCHP_394-04-PBMC-DNA_2000000.txt"      


Total recovered clonotypes:


[1] 93


Total out-of-frame clonotypes:


[1] 13


Total clonotypes with stop codon:


[1] 2


Total productive clonotypes:


[1] 78


Output contains all clonotypes


In [166]:
unique(cdr3df$samplename)

In [167]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_394-FFPE", "CHP_394-01-PBMC", "CHP_394-04-PBMC"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_394-FFPE    CHP_394-01-PBMC CHP_394-04-PBMC
Levels: CHP_394-FFPE CHP_394-01-PBMC CHP_394-04-PBMC


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSPGTSANEQFF 
     "#BDB3B1" 


### 372 BL

In [168]:
ffpefile <- ds_flelst_chp_ffpe[grepl("372", ds_flelst_chp_ffpe)]
pbmcfiles <- ds_flelst_chp_PBMC[grepl("372", ds_flelst_chp_PBMC)]
tmp <- c(ffpefile, pbmcfiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("-DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S1_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


character(0)


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_372-FFPE-DNA_S1_2000000.txt"    
[2] "batch_reseq/ds_batch_reseq/CLONES_TRBCHP_372-01-PBMC-DNA_2000000.txt"


Total recovered clonotypes:


[1] 11


Total out-of-frame clonotypes:


[1] 1


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 10


Output contains all clonotypes


In [169]:
unique(cdr3df$samplename)

In [170]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_372-FFPE", "CHP_372-01-PBMC"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_372-FFPE    CHP_372-01-PBMC
Levels: CHP_372-FFPE CHP_372-01-PBMC


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


### 370 ALCL

In [171]:
ffpefile <- ds_flelst_chp_ffpe[grepl("370", ds_flelst_chp_ffpe)]
pbmcfiles <- ds_flelst_chp_PBMC[grepl("370", ds_flelst_chp_PBMC)]
tmp <- c(ffpefile, pbmcfiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("-DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S5_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


[1] "CASRGLSGNIQYF"


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_370-FFPE-DNA_S5_2000000.txt"
[2] "batch3/ds_batch3/CLONES_TRBCHP_370-02-PBMC-DNA_2000000.txt"      
[3] "batch7/ds_batch7/CLONES_TRBCHP_370-01-PBMC-DNA_2000000.txt"      
[4] "batch7/ds_batch7/CLONES_TRBCHP_370-05-PBMC-DNA_2000000.txt"      
[5] "batch8/ds_batch8/CLONES_TRBCHP_370-03-PBMC-DNA_2000000.txt"      


Total recovered clonotypes:


[1] 1127


Total out-of-frame clonotypes:


[1] 194


Total clonotypes with stop codon:


[1] 25


Total productive clonotypes:


[1] 908


Output contains all clonotypes


In [172]:
unique(cdr3df$samplename)

In [173]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_370-FFPE", "CHP_370-01-PBMC", 
                                                          "CHP_370-02-PBMC", "CHP_370-03-PBMC", 
                                                          "CHP_370-05-PBMC"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneFraction", 0)

list of samples to track clones: 


[1] CHP_370-FFPE    CHP_370-02-PBMC CHP_370-01-PBMC CHP_370-05-PBMC
[5] CHP_370-03-PBMC
5 Levels: CHP_370-FFPE CHP_370-01-PBMC CHP_370-02-PBMC ... CHP_370-05-PBMC


Total number of recurring clonotypes: 


[1] 5


these are what we color: 


     CASRGLSGNIQYF CASSIGGTLWAGGTEAFF    CASSLGTLPNQPQHF   CASRSGGYSYNSPLHF 
         "#A2DAC7"          "#BA5ED4"          "#B1A6D3"          "#DE9D7A" 
    CASSDSSGANVLTF 
         "#AFE36F" 


### 364 OS

In [174]:
ffpefile <- ds_flelst_chp_ffpe[grepl("364", ds_flelst_chp_ffpe)]
pbmcfiles <- ds_flelst_chp_PBMC[grepl("364", ds_flelst_chp_PBMC)]
tmp <- c(ffpefile, pbmcfiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("-DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S1_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


character(0)


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_364-FFPE-DNA_S1_2000000.txt"
[2] "batch4/ds_batch4/CLONES_TRBCHP_364-01-PBMC-DNA_2000000.txt"      
[3] "batch4/ds_batch4/CLONES_TRBCHP_364-02-PBMC-DNA_2000000.txt"      
[4] "batch4/ds_batch4/CLONES_TRBCHP_364-04-PBMC-DNA_2000000.txt"      


Total recovered clonotypes:


[1] 372


Total out-of-frame clonotypes:


[1] 75


Total clonotypes with stop codon:


[1] 9


Total productive clonotypes:


[1] 288


Output contains all clonotypes


In [175]:
unique(cdr3df$samplename)

In [176]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_364-FFPE", "CHP_364-01-PBMC", 
                                                          "CHP_364-02-PBMC", "CHP_364-04-PBMC"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_364-FFPE    CHP_364-01-PBMC CHP_364-02-PBMC CHP_364-04-PBMC
Levels: CHP_364-FFPE CHP_364-01-PBMC CHP_364-02-PBMC CHP_364-04-PBMC


Total number of recurring clonotypes: 


[1] 4


these are what we color: 


      CASSLLEQPQHF CAISGPGTSGRAQDTQYF      CASSAGNTGELFF     CASSGLAGADTQYF 
         "#B76DD2"          "#ADE37C"          "#A6CBD1"          "#DE9D81" 


### 361 HD

In [177]:
ffpefile <- ds_flelst_chp_ffpe[grepl("361", ds_flelst_chp_ffpe)]
pbmcfiles <- ds_flelst_chp_PBMC[grepl("361", ds_flelst_chp_PBMC)]
tmp <- c(ffpefile, pbmcfiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")

cdr3df$samplename <- gsub("-DNA_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S1_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)


duplicated sequences:


[1] "CASSYGQGANGYTF"


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_361-FFPE-DNA_S1_2000000.txt"
[2] "batch3/ds_batch3/CLONES_TRBCHP_361-02-PBMC-DNA_2000000.txt"      
[3] "batch3/ds_batch3/CLONES_TRBCHP_361-03-PBMC-DNA_2000000.txt"      
[4] "batch4/ds_batch4/CLONES_TRBCHP_361-01-PBMC-DNA_2000000.txt"      
[5] "batch7/ds_batch7/CLONES_TRBCHP_361-04-PBMC-DNA_2000000.txt"      


Total recovered clonotypes:


[1] 502


Total out-of-frame clonotypes:


[1] 98


Total clonotypes with stop codon:


[1] 6


Total productive clonotypes:


[1] 398


Output contains all clonotypes


In [178]:
unique(cdr3df$samplename)

In [179]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_361-FFPE", "CHP_361-01-PBMC", "CHP_361-02-PBMC",
                                                         "CHP_361-03-PBMC", "CHP_361-04-PBMC"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_361-FFPE    CHP_361-02-PBMC CHP_361-03-PBMC CHP_361-01-PBMC
[5] CHP_361-04-PBMC
5 Levels: CHP_361-FFPE CHP_361-01-PBMC CHP_361-02-PBMC ... CHP_361-04-PBMC


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


## Tumour and cfDNA

In [180]:
manifest_df_ffpe$patient

I have to do all separately to make sure levels are correct

364 no baseline cfdna

### 361 HD

In [189]:
ffpefile <- ds_flelst_chp_ffpe[grepl("361", ds_flelst_chp_ffpe)]
cfdnafiles <- ds_flelst_chp_cfDNA[grepl("361", ds_flelst_chp_cfDNA)]
tmp <- c(ffpefile, cfdnafiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S1", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


[1] "CASSYGQGANGYTF"


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_361-FFPE-DNA_S1_2000000.txt"
[2] "batch10_cfDNA/CLONES_TRBCHP_361-02_cfDNA_2000000.txt"            
[3] "batch5_cfDNA/CLONES_TRBCHP_361-01_cfDNA_2000000.txt"             
[4] "batch5_cfDNA/CLONES_TRBCHP_361-03_cfDNA_2000000.txt"             
[5] "batch5_cfDNA/CLONES_TRBCHP_361-05_cfDNA_2000000.txt"             


Total recovered clonotypes:


[1] 277


Total out-of-frame clonotypes:


[1] 53


Total clonotypes with stop codon:


[1] 6


Total productive clonotypes:


[1] 218


Output contains all clonotypes


In [190]:
unique(cdr3df$samplename)

In [191]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_361-FFPE", "CHP_361-01_cfDNA", 
                                                          "CHP_361-02_cfDNA", "CHP_361-03_cfDNA", "CHP_361-05_cfDNA"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_361-FFPE     CHP_361-02_cfDNA CHP_361-01_cfDNA CHP_361-03_cfDNA
[5] CHP_361-05_cfDNA
5 Levels: CHP_361-FFPE CHP_361-01_cfDNA CHP_361-02_cfDNA ... CHP_361-05_cfDNA


Total number of recurring clonotypes: 


[1] 1


these are what we color: 


CASSVGDSPYEQYF 
     "#BDB3B1" 


### 370 ALCL

In [200]:
ffpefile <- ds_flelst_chp_ffpe[grepl("370", ds_flelst_chp_ffpe)]
cfdnafiles <- ds_flelst_chp_cfDNA[grepl("370", ds_flelst_chp_cfDNA)]
tmp <- c(ffpefile, cfdnafiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S5", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


[1] "CASRGLSGNIQYF"


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_370-FFPE-DNA_S5_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_370-01-cfDNA_2000000.txt"             
[3] "batch3a9_cfDNA/CLONES_TRBCHP_370-03_cfDNA_2000000.txt"           


Total recovered clonotypes:


[1] 90


Total out-of-frame clonotypes:


[1] 18


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 72


Output contains all clonotypes


In [201]:
unique(cdr3df$samplename)

In [202]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_370-FFPE", "CHP_370-01-cfDNA", "CHP_370-03_cfDNA"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_370-FFPE     CHP_370-01-cfDNA CHP_370-03_cfDNA
Levels: CHP_370-FFPE CHP_370-01-cfDNA CHP_370-03_cfDNA


Total number of recurring clonotypes: 


[1] 2


these are what we color: 


   CASRGLSGNIQYF CASRKLAGMRTDTQYF 
       "#BB82C9"        "#B8D49F" 


### 372

In [238]:
ffpefile <- ds_flelst_chp_ffpe[grepl("372", ds_flelst_chp_ffpe)]
cfdnafiles <- ds_flelst_chp_cfDNA[grepl("372", ds_flelst_chp_cfDNA)]
tmp <- c(ffpefile, cfdnafiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S1", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


character(0)


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_372-FFPE-DNA_S1_2000000.txt"
[2] "batch1_cfDNA/CLONES_TRBCHP_372-01-cfDNA_2000000.txt"             


Total recovered clonotypes:


[1] 13


Total out-of-frame clonotypes:


[1] 2


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 11


Output contains all clonotypes


In [239]:
unique(cdr3df$samplename)

In [240]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_372-FFPE", "CHP_372-01-cfDNA"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_372-FFPE     CHP_372-01-cfDNA
Levels: CHP_372-FFPE CHP_372-01-cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


### 401

In [232]:
ffpefile <- ds_flelst_chp_ffpe[grepl("401", ds_flelst_chp_ffpe)]
cfdnafiles <- ds_flelst_chp_cfDNA[grepl("401", ds_flelst_chp_cfDNA)]
tmp <- c(ffpefile, cfdnafiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S1", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


character(0)


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_401-FFPE-DNA_S1_2000000.txt"
[2] "batch7_cfDNA/CLONES_TRBCHP_401-01_cfDNA_2000000.txt"             


Total recovered clonotypes:


[1] 10


Total out-of-frame clonotypes:


[1] 0


Total clonotypes with stop codon:


[1] 0


Total productive clonotypes:


[1] 10


Output contains all clonotypes


In [233]:
unique(cdr3df$samplename)

In [234]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_401-FFPE", "CHP_401-01_cfDNA"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_401-FFPE     CHP_401-01_cfDNA
Levels: CHP_401-FFPE CHP_401-01_cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)


### 380

In [235]:
ffpefile <- ds_flelst_chp_ffpe[grepl("380", ds_flelst_chp_ffpe)]
cfdnafiles <- ds_flelst_chp_cfDNA[grepl("380", ds_flelst_chp_cfDNA)]
tmp <- c(ffpefile, cfdnafiles)
    
cdr3df <- cdr3_dataframe.fx(datapath, "TRB", tmp, "total")
cdr3df$samplename <- gsub("_2000000.txt", "", cdr3df$samplename)
cdr3df$samplename <- gsub("-DNA_S1", "", cdr3df$samplename)
cdr3df$samplename <- gsub("TRB", "", cdr3df$samplename)

duplicated sequences:


[1] "CASSPSFTDTQYF"


my files:


[1] "batchFFPE/ds_batchFFPE/CLONES_TRBCHP_380-FFPE-DNA_S1_2000000.txt"
[2] "batch5_cfDNA/CLONES_TRBCHP_380-01_cfDNA_2000000.txt"             


Total recovered clonotypes:


[1] 207


Total out-of-frame clonotypes:


[1] 41


Total clonotypes with stop codon:


[1] 5


Total productive clonotypes:


[1] 161


Output contains all clonotypes


In [236]:
unique(cdr3df$samplename)

In [237]:
cdr3df$samplename <- factor(cdr3df$samplename, levels = c("CHP_380-FFPE", "CHP_380-01_cfDNA"))

plot_clonetracks.fx(cdr3df, plotpath, "TRB", "cloneCount", 0)

list of samples to track clones: 


[1] CHP_380-FFPE     CHP_380-01_cfDNA
Levels: CHP_380-FFPE CHP_380-01_cfDNA


Total number of recurring clonotypes: 


[1] 0


these are what we color: 


named character(0)
