In [1]:
library(ggplot2)
library(ggalluvial)

In [25]:
# Load the base-call table for sample CRC-P67-T at chr12:25245350 (C>A).
data <- read.csv(file = "./CRC-P67-T_chr12_25245350:C>A.csv")

# Pin the cluster order to Tumor, Adjacent, Normal; any label outside these
# three levels becomes NA under factor().
data$cluster <- factor(
  data$cluster,
  levels = c("Tumor", "Adjacent", "Normal")
)

# One row per observed (base, cluster) pair; `count` is the number of input
# rows carrying that pair.
data_agg <- aggregate(
  cbind(count = base) ~ base + cluster,
  data = data,
  FUN = length
)

In [26]:
# Two-axis alluvial (Sankey-style) plot: base on the first axis, cluster on
# the second, with band thickness given by `count`. Fill colour follows the
# cluster.
sankey_plot <- ggplot(
  data = data_agg,
  mapping = aes(axis1 = base, axis2 = cluster, y = count)
) +
  geom_alluvium(mapping = aes(fill = cluster)) +
  geom_stratum(mapping = aes(fill = cluster), width = 1 / 12) +
  # Label every stratum box with its own name.
  geom_text(stat = "stratum", mapping = aes(label = after_stat(stratum))) +
  scale_fill_manual(
    values = c(
      "Tumor" = "#D75755",
      "Adjacent" = "#F1C548",
      "Normal" = "#83BC5B"
    )
  ) +
  theme_minimal() +
  theme(
    panel.grid.major = element_blank(),
    panel.grid.minor = element_blank()
  ) +
  labs(
    title = "Sankey Diagram with ggalluvial",
    x = "Base to Cluster",
    y = "Count"
  )

# ggsave() does not reliably create a missing output directory (depending on
# the ggplot2 version it errors or prompts), so make sure it exists first.
# dir.create() is a silent no-op when the directory is already there.
dir.create("./SupFigure", showWarnings = FALSE, recursive = TRUE)
ggsave(
  "./SupFigure/CRC-P67-T_kras.pdf",
  plot = sankey_plot,
  width = 5,
  height = 4
)

In [27]:
# Load the base-call table for sample CRC-P59-T_2 at chr12:25245350 (C>T).
data <- read.csv(file = "./CRC-P59-T_2_chr12_25245350:C>T.csv")

# Pin the cluster order to Tumor, Adjacent, Normal; any label outside these
# three levels becomes NA under factor().
data$cluster <- factor(
  data$cluster,
  levels = c("Tumor", "Adjacent", "Normal")
)

# One row per observed (base, cluster) pair; `count` is the number of input
# rows carrying that pair.
data_agg <- aggregate(
  cbind(count = base) ~ base + cluster,
  data = data,
  FUN = length
)

In [28]:
# Two-axis alluvial (Sankey-style) plot: base on the first axis, cluster on
# the second, with band thickness given by `count`. Fill colour follows the
# cluster.
sankey_plot <- ggplot(
  data = data_agg,
  mapping = aes(axis1 = base, axis2 = cluster, y = count)
) +
  geom_alluvium(mapping = aes(fill = cluster)) +
  geom_stratum(mapping = aes(fill = cluster), width = 1 / 12) +
  # Label every stratum box with its own name.
  geom_text(stat = "stratum", mapping = aes(label = after_stat(stratum))) +
  scale_fill_manual(
    values = c(
      "Tumor" = "#D75755",
      "Adjacent" = "#F1C548",
      "Normal" = "#83BC5B"
    )
  ) +
  theme_minimal() +
  theme(
    panel.grid.major = element_blank(),
    panel.grid.minor = element_blank()
  ) +
  labs(
    title = "Sankey Diagram with ggalluvial",
    x = "Base to Cluster",
    y = "Count"
  )

# ggsave() does not reliably create a missing output directory (depending on
# the ggplot2 version it errors or prompts), so make sure it exists first.
# dir.create() is a silent no-op when the directory is already there.
dir.create("./SupFigure", showWarnings = FALSE, recursive = TRUE)
ggsave(
  "./SupFigure/CRC-P59-T_2_kras.pdf",
  plot = sankey_plot,
  width = 5,
  height = 4
)

In [31]:
# Load the base-call table for sample CRC-P59-T_2 at chr1:152033685 (A>G).
data <- read.csv(file = "./CRC-P59-T_2_chr1_152033685:A>G.csv")

# Pin the cluster order to Tumor, Adjacent, Normal; any label outside these
# three levels becomes NA under factor().
data$cluster <- factor(
  data$cluster,
  levels = c("Tumor", "Adjacent", "Normal")
)

# One row per observed (base, cluster) pair; `count` is the number of input
# rows carrying that pair.
data_agg <- aggregate(
  cbind(count = base) ~ base + cluster,
  data = data,
  FUN = length
)

In [32]:
# Two-axis alluvial (Sankey-style) plot: base on the first axis, cluster on
# the second, with band thickness given by `count`. Fill colour follows the
# cluster.
sankey_plot <- ggplot(
  data = data_agg,
  mapping = aes(axis1 = base, axis2 = cluster, y = count)
) +
  geom_alluvium(mapping = aes(fill = cluster)) +
  geom_stratum(mapping = aes(fill = cluster), width = 1 / 12) +
  # Label every stratum box with its own name.
  geom_text(stat = "stratum", mapping = aes(label = after_stat(stratum))) +
  scale_fill_manual(
    values = c(
      "Tumor" = "#D75755",
      "Adjacent" = "#F1C548",
      "Normal" = "#83BC5B"
    )
  ) +
  theme_minimal() +
  theme(
    panel.grid.major = element_blank(),
    panel.grid.minor = element_blank()
  ) +
  labs(
    title = "Sankey Diagram with ggalluvial",
    x = "Base to Cluster",
    y = "Count"
  )

# ggsave() does not reliably create a missing output directory (depending on
# the ggplot2 version it errors or prompts), so make sure it exists first.
# dir.create() is a silent no-op when the directory is already there.
dir.create("./SupFigure", showWarnings = FALSE, recursive = TRUE)
ggsave(
  "./SupFigure/CRC-P59-T_2_s100a11.pdf",
  plot = sankey_plot,
  width = 5,
  height = 4
)