In [1]:
library(ggtree)
library(treeio)
library(ggplot2)
library(ggnewscale)
library(ggtreeExtra)
library(dplyr)

ggtree v3.2.1  For help: https://yulab-smu.top/treedata-book/

If you use ggtree in published research, please cite the most appropriate paper(s):

1. Guangchuang Yu. Using ggtree to visualize data on tree-like structures. Current Protocols in Bioinformatics. 2020, 69:e96. doi:10.1002/cpbi.96
2. Guangchuang Yu, Tommy Tsan-Yuk Lam, Huachen Zhu, Yi Guan. Two methods for mapping and visualizing associated data on phylogeny using ggtree. Molecular Biology and Evolution. 2018, 35(12):3041-3043. doi:10.1093/molbev/msy194
3. Guangchuang Yu, David Smith, Huachen Zhu, Yi Guan, Tommy Tsan-Yuk Lam. ggtree: an R package for visualization and annotation of phylogenetic trees with their covariates and other associated data. Methods in Ecology and Evolution. 2017, 8(1):28-36. doi:10.1111/2041-210X.12628



treeio v1.18.1  For help: https://yulab-smu.top/treedata-book/

If you use treeio in published research, please cite:

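LG Wang, TTY Lam, S Xu, Z Dai, L Zhou, T Feng, P Guo, CW Dunn, BR Jones, T Bradley, H Zhu, Y Guan, Y Jiang, G Yu. treeio: an R package for phylogenetic tree input and output with richly annotated and associated data. Molecular Biology and Evolution 2020, 37(2):599-603. doi: 10.1093/molbev/msz240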

In [2]:
# Load the species tree and the taxonomy table that annotates its leaves.
tree <- read.tree('/Users/harihara/Mount/CMSC829A/Data/Core_Species_Trees.tree')
ddf_taxa <- read.csv('/Users/harihara/Mount/CMSC829A/Data/Taxonomy_Core_Genomes.txt')

# Keep only taxonomy rows whose Tree_Leaves value is a tip label of the tree.
ddf_taxa <- ddf_taxa[ddf_taxa$Tree_Leaves %in% tree$tip.label, ]

# Rows with an empty class are labelled "cyanobacteria".
# NOTE(review): presumably these genomes have no class rank in the taxonomy
# source -- confirm against the input file.
# `%in%` is used instead of `==` because `==` yields NA for NA entries, and
# NA row indices make data-frame subscripted assignment fail.
ddf_taxa[ddf_taxa$class %in% "", "class"] <- "cyanobacteria"


In [3]:
# Build the annotated circular species tree as a single layered expression.
# Layers, in the order they are added:
#   1. circular ggtree of `tree`, with `ddf_taxa` attached via %<+%;
#   2. tip points coloured by `order` (legend for the points is hidden);
#   3. a geom_fruit bar layer filled by `order` with pwidth = 0 -- presumably
#      present only so the "Order" fill legend is drawn (confirm);
#   4. new_scale_fill() so a second, independent fill scale can be used;
#   5. a geom_fruit bar ring filled by `phylum` with a fixed manual palette;
#   6. legend title/text sizes for the whole plot.
tree_layout <- ggtree(tree, layout = "circular", size = 0.5) %<+%
  ddf_taxa +
  geom_tippoint(
    mapping = aes(color = order),
    size = 10,
    show.legend = FALSE
  ) +
  geom_fruit(
    geom = geom_bar,
    mapping = aes(x = 0, fill = order),
    pwidth = 0.0,
    orientation = "y",
    stat = "identity"
  ) +
  scale_fill_discrete(
    name = "Order",
    guide = guide_legend(keywidth = 5, keyheight = 5, ncol = 1)
  ) +
  new_scale_fill() +
  geom_fruit(
    geom = geom_bar,
    mapping = aes(x = 1, y = Tree_Leaves, fill = phylum),
    pwidth = 0.05,
    orientation = "y",
    stat = "identity"
  ) +
  scale_fill_manual(
    name = "Phylum",
    values = c("red", "blue", "green", "orange", "yellow", "black", "gray"),
    guide = guide_legend(keywidth = 5, keyheight = 5, ncol = 1)
  ) +
  # Legend fonts are oversized to stay readable on the very large output page.
  theme(
    legend.title = element_text(size = 75),
    legend.text = element_text(size = 60)
  )

“'edge.length' contains NA values...
## setting 'edge.length' to NULL automatically when plotting the tree...”


In [5]:
# Write the finished tree to a PDF. The 75 x 60 page exceeds ggsave()'s
# default size guard, hence limitsize = FALSE.
ggsave(
  plot = tree_layout,
  filename = "/Users/harihara/UMD_Coursework/Fall_2021/CMSC829A/Project/Plots/Species_Tree.pdf",
  width = 75,
  height = 60,
  limitsize = FALSE
)