In [None]:
library(tidyr)
library(dplyr)
library(ggplot2)
library(RColorBrewer)
library(gridExtra)
library(magrittr)
library(stringr)
library(tools)
library(patchwork)

In [None]:
# Default width and height used by the notebook's `repr` plot output.
options(
    repr.plot.height = 9,
    repr.plot.width = 14
)

In [None]:
#' Box plot of `bias`, one box per `estimator`.
#'
#' @param data A data frame with a `bias` column (mapped to y) and an
#'   `estimator` column (mapped to the fill colour).
#' @return A ggplot object: box plots, a dashed black reference line at
#'   y = 0, and a legend placed on the right.
plot_biases <- function(data) {
    # Dashed horizontal reference line at zero.
    zero_line <- geom_hline(
        yintercept = 0,
        linetype = "dashed",
        color = "black",
        size = 1
    )

    # Legend placement and text styling.
    legend_style <- theme(
        legend.position = "right",
        legend.box.just = "right",
        legend.margin = margin(6, 6, 6, 6),
        legend.title = element_text(size = 13, face = "bold"),
        legend.text = element_text(size = 12)
    )

    ggplot(data, aes(y = bias, fill = estimator)) +
        geom_boxplot() +
        zero_line +
        legend_style
}

In [None]:
# Column names used when the wide comparison tables are reshaped to long
# format: `keycol` receives the original column name, `valuecol` the value.
valuecol <- "bias"
keycol <- "estimator"

# Value written to the `n` column of every long-format table.
# NOTE(review): presumably the sample size / number of runs -- confirm.
n_sim <- 500

In [None]:
# Side-by-side box plots: the SDE column of comparisons/gcomp_500.csv (left)
# next to every column of sl_comparisons/gcomp_sde_500.csv (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/gcomp_500.csv")
# Keep only the SDE column, still as a one-column data frame.
data_1 <- data_1[, "SDE", drop = FALSE]

data_2 <- read.csv("./sl_comparisons/gcomp_sde_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SDE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SDE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1) +
    theme(legend.position = "bottom")

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/gcomp_sde_500.png", p3)

In [None]:
# Side-by-side box plots: the SIE column of comparisons/gcomp_500.csv (left)
# next to every column of sl_comparisons/gcomp_sie_500.csv (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/gcomp_500.csv")
# Keep only the SIE column, still as a one-column data frame.
data_1 <- data_1[, "SIE", drop = FALSE]

data_2 <- read.csv("./sl_comparisons/gcomp_sie_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SIE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SIE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1)

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/gcomp_sie_500.png", p3)

In [None]:
# Side-by-side box plots: the SDE column of comparisons/gcomp_posit_500.csv
# (left) next to every column of sl_comparisons/gcomp_sde_posit_500.csv
# (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/gcomp_posit_500.csv")
# Keep only the SDE column, still as a one-column data frame.
data_1 <- data_1[, "SDE", drop = FALSE]

data_2 <- read.csv("./sl_comparisons/gcomp_sde_posit_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SDE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SDE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1)

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/gcomp_sde_posit_500.png", p3)

In [None]:
# Side-by-side box plots: the SIE column of comparisons/gcomp_posit_500.csv
# (left) next to every column of sl_comparisons/gcomp_sie_posit_500.csv
# (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/gcomp_posit_500.csv")
# Keep only the SIE column, still as a one-column data frame.
data_1 <- data_1[, "SIE", drop = FALSE]

data_2 <- read.csv("./sl_comparisons/gcomp_sie_posit_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SIE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SIE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1)

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/gcomp_sie_posit_500.png", p3)

In [None]:
# Side-by-side box plots: the SDE column of comparisons/iptw_posit_500.csv
# (left) next to every column of sl_comparisons/iptw_sde_posit_500.csv
# (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/iptw_posit_500.csv")
# Keep only the SDE column, still as a one-column data frame.
data_1 <- data_1[, "SDE", drop = FALSE]

data_2 <- read.csv("./sl_comparisons/iptw_sde_posit_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SDE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SDE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1)

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/iptw_sde_posit_500.png", p3)

In [None]:
# Side-by-side box plots: the SIE column of comparisons/iptw_posit_500.csv
# (left) next to every column of sl_comparisons/iptw_sie_posit_500.csv
# (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/iptw_posit_500.csv")
# Keep only the SIE column, still as a one-column data frame.
data_1 <- data_1[, "SIE", drop = FALSE]

data_2 <- read.csv("./sl_comparisons/iptw_sie_posit_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SIE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SIE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1)

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/iptw_sie_posit_500.png", p3)

In [None]:
# Reference values subtracted from the SDE and SIE columns of
# comparisons/tmle_rud_500.csv before plotting.
# NOTE(review): presumably the true effect values for the "rud" scenario --
# confirm their origin.
true_sie_rud <- 0.03026875
true_sde_rud <- 0.124793

In [None]:
# Side-by-side box plots: the SDE column of comparisons/tmle_rud_500.csv,
# shifted by true_sde_rud (left), next to every column of
# sl_comparisons/tmle_sde_rud_500.csv (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/tmle_rud_500.csv")
# Keep only the SDE column, still as a one-column data frame.
data_1 <- data_1[, "SDE", drop = FALSE]
# Express the column as a deviation from the reference value.
data_1$SDE <- data_1$SDE - true_sde_rud

data_2 <- read.csv("./sl_comparisons/tmle_sde_rud_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SDE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SDE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1)

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/tmle_sde_rud_500.png", p3)

In [None]:
# Side-by-side box plots: the SIE column of comparisons/tmle_rud_500.csv,
# shifted by true_sie_rud (left), next to every column of
# sl_comparisons/tmle_sie_rud_500.csv (right).
# NOTE(review): input paths are relative to the working directory and the
# output path is an absolute, user-specific folder -- confirm before reuse.
data_1 <- read.csv("./comparisons/tmle_rud_500.csv")
# Keep only the SIE column, still as a one-column data frame.
data_1 <- data_1[, "SIE", drop = FALSE]
# Express the column as a deviation from the reference value.
data_1$SIE <- data_1$SIE - true_sie_rud

data_2 <- read.csv("./sl_comparisons/tmle_sie_rud_500.csv")
gathercols <- colnames(data_2)
# Wide -> long: one row per (source column, value) pair.
data_2 <- as.data.frame(
    pivot_longer(data_2, cols = all_of(gathercols),
                 names_to = keycol, values_to = valuecol)
)
# A scalar is recycled to every row, whatever the number of rows read.
data_2$n <- n_sim

# Shared y-range over BOTH data sets. Values outside a scale's limits are
# dropped before the box-plot statistics are computed, so limits taken from
# data_2 alone could silently distort the left-hand box.
y_range <- range(c(data_1$SIE, data_2$bias), na.rm = TRUE)

p1 <- plot_biases(data_2) +
    lims(y = y_range)
p2 <- ggplot(data_1, aes(y = SIE)) +
    geom_boxplot(width = .1, fill = "#FFD92F") +
    lims(x = c(-.1, .1), y = y_range) +
    geom_hline(yintercept = 0, linetype = "dashed", color = "black", size = 1)

# grid.arrange() draws the combined figure and returns it for saving.
p3 <- grid.arrange(p2, p1, nrow = 1)
ggsave("C:/Users/luis_/Downloads/tmle_sie_rud_500.png", p3)