Nothing
##' read beast/mrbayes/mega Nexus output
##'
##'
##' @rdname beast-parser
##' @title read.beast
##' @param file beast file
##' @return treedata object
##' @importFrom ape read.nexus
##' @export
##' @author Guangchuang Yu \url{https://guangchuangyu.github.io}
##' @examples
##' file <- system.file("extdata/BEAST", "beast_mcc.tree", package="treeio")
##' read.beast(file)
read.beast <- function(file) {
treetext <- read.treetext_beast(file)
stats <- read.stats_beast(file)
phylo <- read.nexus(file)
if (length(treetext) == 1) {
obj <- BEAST(file, treetext, stats, phylo)
} else {
obj <- lapply(seq_along(treetext), function(i) {
BEAST(file, treetext[i], stats[[i]], phylo[[i]])
})
class(obj) <- "treedataList"
}
return(obj)
}
##' @rdname beast-parser
##' @export
read.mrbayes <- read.beast
BEAST <- function(file, treetext, stats, phylo) {
stats$node <- gsub("\"*'*", "", stats$node)
phylo <- remove_quote_in_tree_label(phylo)
obj <- new("treedata",
## fields = fields,
treetext = treetext,
phylo = phylo,
data = stats,
file = filename(file)
)
return(obj)
}
remove_quote_in_tree_label <- function(phylo) {
if (!is.null(phylo$node.label)) {
phylo$node.label <- gsub("\"*'*", "", phylo$node.label)
}
if ( !is.null(phylo$tip.label)) {
phylo$tip.label <- gsub("\"*'*", "", phylo$tip.label)
}
return(phylo)
}
read.treetext_beast <- function(file) {
beast <- readLines(file)
ii <- grep("begin trees;", beast, ignore.case = TRUE)
jj <- grep("end;", beast, ignore.case = TRUE)
jj <- jj[jj > max(ii)][1]
jj <- c(ii[-1], jj)
trees <- lapply(seq_along(ii), function(i) {
tree <- beast[(ii[i]+1):(jj[i]-1)]
tree <- tree[grep("^\\s*tree", tree, ignore.case = TRUE)]
sub("[^(]*", "", tree)
}) %>% unlist
return(trees)
}
read.trans_beast <- function(file) {
beast <- readLines(file)
i <- grep("TRANSLATE", beast, ignore.case = TRUE)
if (length(i) == 0) {
return(matrix())
}
end <- grep(";", beast)
j <- end[which(end > i)[1]]
trans <- beast[(i+1):j] %>%
gsub("^\\s+", "", .) %>%
gsub(",|;", "", .)
trans <- trans[nzchar(trans)]
## remove quote if strings were quoted
trans <- gsub("'|\"", "", trans)
trans <- strsplit(trans, split="\\s+") %>%
do.call(rbind, .)
## trans is a matrix
return(trans)
}
read.stats_beast <- function(file) {
beast <- readLines(file)
trees <- read.treetext_beast(file)
if (length(trees) == 1) {
return(read.stats_beast_internal(beast, trees))
}
lapply(trees, read.stats_beast_internal, beast=beast)
}
read.stats_beast_internal <- function(beast, tree) {
##tree <- gsub(" ", "", tree)
## tree2 <- gsub("\\[[^\\[]*\\]", "", tree)
## phylo <- read.tree(text = tree2)
## tree2 <- add_pseudo_nodelabel(phylo, tree2)
phylo <- read.tree(text = tree)
tree2 <- add_pseudo_nodelabel(phylo)
## node name corresponding to stats
nn <- strsplit(tree2, split=",") %>% unlist %>%
strsplit(., split="\\)") %>% unlist %>%
gsub("\\(*", "", .) %>%
gsub("[:;].*", "", .) %>%
gsub(" ", "", .) %>%
gsub("'", "", .) %>%
gsub('"', "", .)
phylo <- read.tree(text = tree2)
root <- rootnode(phylo)
nnode <- phylo$Nnode
tree_label <- c(phylo$tip.label, phylo$node.label)
ii <- match(nn, tree_label)
if (any(grepl("TRANSLATE", beast, ignore.case = TRUE))) {
label2 <- c(phylo$tip.label,
root:getNodeNum(phylo))
## label2 <- c(treeinfo[treeinfo$isTip, "label"],
## root:(root+nnode-1))
} else {
## node <- as.character(treeinfo$node[match(nn, treeinfo$label)])
label2 <- as.character(1:getNodeNum(phylo))
}
node <- label2[match(nn, tree_label)]
## stats <- unlist(strsplit(tree, "\\["))[-1]
## stats <- sub(":.+$", "", stats
## BEAST1 edge stat fix
tree <- gsub("\\]:\\[&(.+?\\])", ",\\1:", tree)
tree <- gsub(":(\\[.+?\\])", "\\1:", tree)
if (grepl("\\]:[0-9\\.eE+\\-]*\\[", tree) || grepl("\\]\\[", tree)) {
## MrBayes output
stats <- strsplit(tree, "\\]:[0-9\\.eE+\\-]*\\[") %>% unlist
lstats <- lapply(stats, function(x) {
unlist(strsplit(x, split="\\][,\\)]"))
})
for (i in seq_along(stats)) {
n <- length(lstats[[i]])
if (i == length(stats)) {
stats[i] <- lstats[[i]][n]
} else {
stats[i] <- paste0(lstats[[i]][n],
sub("&", ",", lstats[[i+1]][1])
)
}
}
stats <- gsub("\\]\\[&", ",", stats)
} else {
## BEAST output
stats <- strsplit(tree, ":") %>% unlist
}
names(stats) <- node
stats <- stats[grep("\\[", stats)]
stats <- sub("[^\\[]*\\[", "", stats)
stats <- sub("^&", "", stats)
stats <- sub("];*$", "", stats)
stats <- gsub("\"", "", stats)
stats2 <- lapply(seq_along(stats), function(i) {
x <- stats[[i]]
y <- unlist(strsplit(x, ","))
sidx <- grep("=\\{", y)
eidx <- grep("\\}$", y)
flag <- FALSE
if (length(sidx) > 0) {
flag <- TRUE
SETS <- lapply(seq_along(sidx), function(k) {
p <- y[sidx[k]:eidx[k]]
gsub(".*=\\{", "", p) %>% gsub("\\}$", "", .)
})
names(SETS) <- gsub("=.*", "", y[sidx])
kk <- lapply(seq_along(sidx), function(k) {
sidx[k]:eidx[k]
}) %>%
unlist
y <- y[-kk]
}
if (length(y) == 0)
return(SETS)
name <- gsub("=.*", "", y)
val <- gsub(".*=", "", y) %>%
gsub("^\\{", "", .) %>%
gsub("\\}$", "", .)
if (flag) {
nn <- c(name, names(SETS))
} else {
nn <- name
}
res <- rep(NA, length(nn))
names(res) <- nn
for (i in seq_along(name)) {
res[i] <- if(is_numeric(val[i])) as.numeric(val[i]) else val[i]
}
if (flag) {
j <- i
for (i in seq_along(SETS)) {
if(is_numeric(SETS[[i]])) {
res[i+j] <- list(as.numeric(SETS[[i]]))
} else {
res[i+j] <- SETS[i]
}
}
}
return(res)
})
nn <- lapply(stats2, names) %>% unlist %>%
unique %>% sort
stats2 <- lapply(stats2, function(x) {
y <- x[nn]
names(y) <- nn
y[vapply(y, is.null, logical(1))] <- NA
y
})
stats3 <- do.call(rbind, stats2)
stats3 <- as_tibble(stats3)
## no need to extract sd from prob+-sd
## as the sd is stored in prob_stddev
##
## "prob_stddev" "prob(percent)" "prob+-sd"
##
##
##
## idx <- grep("\\+-", colnames(stats3))
## if (length(idx)) {
## for (i in idx) {
## stats3[,i] <- as.numeric(gsub("\\d+\\+-", "", stats3[,i]))
## }
## }
cn <- gsub("(\\d+)%", "0.\\1", colnames(stats3))
cn <- gsub("\\(([^\\)]+)\\)", "_\\1", cn)
## cn <- gsub("\\+-", "_", cn)
colnames(stats3) <- cn
stats3$node <- names(stats)
i <- vapply(stats3,
function(x) max(vapply(x, length, numeric(1))),
numeric(1))
for (j in which(i==1)) {
stats3[,j] <- unlist(stats3[,j])
}
stats3$node <- as.integer(stats3$node)
return(stats3)
}
add_pseudo_nodelabel <- function(phylo) {
if(is.null(phylo$node.label)) {
nnode <- phylo$Nnode
phylo$node.label <- paste("X", 1:nnode, sep="")
## for (i in 1:nnode) {
## treetext <- sub("\\)([:;])",
## paste0("\\)", nlab[i], "\\1"),
## treetext)
## }
}
## if tip.label contains () which will broken node name extraction
phylo$tip.label <- gsub("[\\(\\)]", "_", phylo$tip.label)
treetext <- write.tree(phylo)
return(treetext)
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.