In [None]:
library("ggplot2")
library("data.table")
library("cowplot")

# Read the distance table from the working directory into a data.table and
# display it as the cell output.
results <- fread(input = "./distances.csv")
results

In [None]:
# Set the size used for plots rendered by the notebook from here on.
options(
    repr.plot.width = 21,
    repr.plot.height = 13
)

In [None]:
# Expected node distance (e_nd) against nick frequency (nf), one facet row
# per aligner with an independent y scale per facet.
# Trend line: linear model on a natural cubic spline basis (splines::ns,
# df = 3), drawn with its standard-error band.
p.nf <- ggplot(results, aes(x = nf, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y") +
    geom_smooth(method = "lm", se = TRUE, formula = y ~ splines::ns(x, 3)) +
    theme(text = element_text(size = 15)) +
    labs(x = "Nick Frequency", y = "Expected Node Distance")
p.nf

In [None]:
# Expected node distance (e_nd) against overhang (ov), one facet row per
# aligner with an independent y scale per facet.
# Trend line: linear model on a natural cubic spline basis (splines::ns,
# df = 3), drawn with its standard-error band.
p.ov <- ggplot(results, aes(x = ov, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y", shrink = TRUE) +
    geom_smooth(method = "lm", se = TRUE, formula = y ~ splines::ns(x, 3)) +
    theme(text = element_text(size = 15)) +
    labs(x = "Overhang", y = "Expected Node Distance")

p.ov

In [None]:
# Expected node distance (e_nd) against the single-strand variable (ss), one
# facet row per aligner with an independent y scale per facet.
# Trend line: linear model on a natural spline basis with df = 1, drawn with
# its standard-error band.
p.ss <- ggplot(results, aes(x = ss, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y", shrink = TRUE) +
    geom_smooth(method = "lm", se = TRUE, formula = y ~ splines::ns(x, 1)) +
    theme(text = element_text(size = 15)) +
    labs(x = "Single Strand", y = "Expected Node Distance")

p.ss

In [None]:
# Expected node distance (e_nd) against the double-strand variable (ds), one
# facet row per aligner with an independent y scale per facet.
# Trend line: linear model on a natural spline basis with df = 2, drawn with
# its standard-error band.
p.ds <- ggplot(results, aes(x = ds, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y", shrink = TRUE) +
    geom_smooth(method = "lm", se = TRUE, formula = y ~ splines::ns(x, 2)) +
    theme(text = element_text(size = 15)) +
    labs(x = "Double Strand", y = "Expected Node Distance")

p.ds

In [None]:
# Resize the notebook plot area, then arrange the four plot objects into a
# single cowplot grid with automatically generated panel labels.
options(
    repr.plot.width = 18,
    repr.plot.height = 14
)
plot_grid(
    plotlist = list(p.nf, p.ov, p.ss, p.ds),
    labels = "AUTO"
)

In [None]:
# Straight-line fit of expected node distance (e_nd) on nick frequency (nf),
# one facet row per aligner with an independent y scale per facet.
# Stored as `p.nf.lm` so it does not overwrite the spline plot `p.nf` that
# the plot_grid() cell uses; re-running that cell after this one would
# otherwise pick up the wrong plot.
p.nf.lm <- ggplot(results, aes(x = nf, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y") +
    # y ~ x is what geom_smooth() falls back to for method = "lm"; stating it
    # avoids the "using formula" message on every render.
    geom_smooth(method = "lm", formula = y ~ x) +
    theme(text = element_text(size = 15)) +
    labs(x = "Nick Frequency", y = "Expected Node Distance")
p.nf.lm

In [None]:
# Straight-line fit of expected node distance (e_nd) on overhang (ov), one
# facet row per aligner with an independent y scale per facet.
# Stored as `p.ov.lm`: the previous name `p.nf` was a copy-paste leftover
# that mislabelled this overhang plot and clobbered the nick-frequency plot
# object of the same name.
p.ov.lm <- ggplot(results, aes(x = ov, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y") +
    # y ~ x is what geom_smooth() falls back to for method = "lm"; stating it
    # avoids the "using formula" message on every render.
    geom_smooth(method = "lm", formula = y ~ x) +
    theme(text = element_text(size = 15)) +
    labs(x = "Overhang", y = "Expected Node Distance")
p.ov.lm

In [None]:
# Straight-line fit of expected node distance (e_nd) on the double-strand
# variable (ds), one facet row per aligner with an independent y scale per
# facet.
# Stored as `p.ds.lm`: the previous name `p.nf` was a copy-paste leftover
# that mislabelled this plot and clobbered the nick-frequency plot object of
# the same name.
p.ds.lm <- ggplot(results, aes(x = ds, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y") +
    # y ~ x is what geom_smooth() falls back to for method = "lm"; stating it
    # avoids the "using formula" message on every render.
    geom_smooth(method = "lm", formula = y ~ x) +
    theme(text = element_text(size = 15)) +
    labs(x = "Double Strand", y = "Expected Node Distance")
p.ds.lm

In [None]:
# Straight-line fit of expected node distance (e_nd) on the single-strand
# variable (ss), one facet row per aligner with an independent y scale per
# facet.
# Stored as `p.ss.lm`: the previous name `p.nf` was a copy-paste leftover
# that mislabelled this plot and clobbered the nick-frequency plot object of
# the same name.
p.ss.lm <- ggplot(results, aes(x = ss, y = e_nd)) +
    # `scales` is spelled out in full; `scale=` only worked through partial
    # argument matching.
    facet_grid(rows = "aligner", scales = "free_y") +
    # y ~ x is what geom_smooth() falls back to for method = "lm"; stating it
    # avoids the "using formula" message on every render.
    geom_smooth(method = "lm", formula = y ~ x) +
    theme(text = element_text(size = 15)) +
    labs(x = "Single Strand", y = "Expected Node Distance")
p.ss.lm

In [None]:
# Histogram of the nick-frequency column (nf) over all rows of `results`.
ggplot(data = results, mapping = aes(x = nf)) +
    geom_histogram()

In [None]:
# Histogram of the overhang column (ov) over all rows of `results`.
ggplot(data = results, mapping = aes(x = ov)) +
    geom_histogram()

In [None]:
# Histogram of the double-strand column (ds) over all rows of `results`.
ggplot(data = results, mapping = aes(x = ds)) +
    geom_histogram()

In [None]:
# Histogram of the single-strand column (ss) over all rows of `results`.
ggplot(data = results, mapping = aes(x = ss)) +
    geom_histogram()

In [None]:
# Fit one linear model per aligner: e_nd regressed on a natural cubic spline
# basis of nick frequency (splines::ns, df = 3), then show each summary.
#
# Keep only the distinct aligner values. Iterating over
# factor(results$aligner) itself visits every row of `results`, which refits
# the same per-aligner model once per row and prints that many summaries.
aligners <- levels(factor(results$aligner))
# setNames(nm = ...) names each list element after its aligner so the
# summaries below are labelled.
models <- lapply(setNames(nm = aligners), function(aligner_name) {
    lm(e_nd ~ splines::ns(nf, 3), data = results[aligner == aligner_name])
})
lapply(models, summary)

In [None]:
# Fit one linear model per aligner: e_nd regressed on a natural cubic spline
# basis of overhang (splines::ns, df = 3), then show each summary.
#
# `aligners` comes from an earlier cell. It is reduced to its distinct values
# here so each aligner is fitted exactly once, however many entries it holds;
# the list is named by aligner so the summaries are labelled.
models <- lapply(
    setNames(nm = levels(factor(aligners))),
    function(aligner_name) {
        lm(e_nd ~ splines::ns(ov, 3), data = results[aligner == aligner_name])
    }
)
lapply(models, summary)

In [None]:
# Fit one linear model per aligner: e_nd regressed on a natural spline basis
# of the single-strand variable (splines::ns, df = 1), then show each summary.
#
# `aligners` comes from an earlier cell. It is reduced to its distinct values
# here so each aligner is fitted exactly once, however many entries it holds;
# the list is named by aligner so the summaries are labelled.
models <- lapply(
    setNames(nm = levels(factor(aligners))),
    function(aligner_name) {
        lm(e_nd ~ splines::ns(ss, 1), data = results[aligner == aligner_name])
    }
)
lapply(models, summary)

In [None]:
# Fit one linear model per aligner: e_nd regressed on a natural spline basis
# of the double-strand variable (splines::ns, df = 2), then show each summary.
#
# `aligners` comes from an earlier cell. It is reduced to its distinct values
# here so each aligner is fitted exactly once, however many entries it holds;
# the list is named by aligner so the summaries are labelled.
models <- lapply(
    setNames(nm = levels(factor(aligners))),
    function(aligner_name) {
        lm(e_nd ~ splines::ns(ds, 2), data = results[aligner == aligner_name])
    }
)
lapply(models, summary)

In [None]:
# Fit one simple linear model per aligner: e_nd regressed on nick frequency
# (nf), then show each summary.
#
# `aligners` comes from an earlier cell. It is reduced to its distinct values
# here so each aligner is fitted exactly once, however many entries it holds;
# the list is named by aligner so the summaries are labelled.
models <- lapply(
    setNames(nm = levels(factor(aligners))),
    function(aligner_name) {
        lm(e_nd ~ nf, data = results[aligner == aligner_name])
    }
)
lapply(models, summary)

In [None]:
# Fit one simple linear model per aligner: e_nd regressed on overhang (ov),
# then show each summary.
#
# `aligners` comes from an earlier cell. It is reduced to its distinct values
# here so each aligner is fitted exactly once, however many entries it holds;
# the list is named by aligner so the summaries are labelled.
models <- lapply(
    setNames(nm = levels(factor(aligners))),
    function(aligner_name) {
        lm(e_nd ~ ov, data = results[aligner == aligner_name])
    }
)
lapply(models, summary)

In [None]:
# Fit one simple linear model per aligner: e_nd regressed on the
# single-strand variable (ss), then show each summary.
#
# `aligners` comes from an earlier cell. It is reduced to its distinct values
# here so each aligner is fitted exactly once, however many entries it holds;
# the list is named by aligner so the summaries are labelled.
models <- lapply(
    setNames(nm = levels(factor(aligners))),
    function(aligner_name) {
        lm(e_nd ~ ss, data = results[aligner == aligner_name])
    }
)
lapply(models, summary)

In [None]:
# Fit one simple linear model per aligner: e_nd regressed on the
# double-strand variable (ds), then show each summary.
#
# `aligners` comes from an earlier cell. It is reduced to its distinct values
# here so each aligner is fitted exactly once, however many entries it holds;
# the list is named by aligner so the summaries are labelled.
models <- lapply(
    setNames(nm = levels(factor(aligners))),
    function(aligner_name) {
        lm(e_nd ~ ds, data = results[aligner == aligner_name])
    }
)
lapply(models, summary)