R/MAboxplot7.R

#####MABoxPlot6#####
#MABoxPlot4
#Bug fix to not plot NA statistical values as significant
#New feature to allow input of statistical cutoff
#150809 Fixed bug that prevented boxplot of only two groups.
#MABoxPlot5
#New feature to plot sample names on plot
#MABoxPlot6
#Allow for further manipulation of color

# #Dummy Data
# gene<-AURKA.PROBES[2]
# sampleNames<-paste(finaleset$sampleNames, finaleset$Batch, sep="-")
# array<-data
# limma.obj<-limma.out
# classvec<-classvec
# stat.test="pairwiset"
# p.value=0.05
#display.brewer.all(n=NULL, type="all", select=NULL, exact.n=TRUE, colorblindFriendly=FALSE)


# setClass("ColPal", representation(pal="character"))
# new("ColPal", )

# CreateColObj<-function(n, factor=60, times = (1 + ceiling((start+(n-1))/17)), pie=TRUE, start=1,
#                          pal=rep(c(RColorBrewer::brewer.pal(9, "Set1"),  RColorBrewer::brewer.pal(8, "Set2")),times))
#   {
#   sel<-end<-start:(start+(n-1))
#   col2<-as.character(sapply(pal, function(x) LightenDarkenColor(x, factor)))
#   col3<-as.character(sapply(col2, function(x) LightenDarkenColor(x, factor+100)))
#    if(pie==TRUE){
#       par(mfrow=c(1,3))
#       pie(rep(1,length(pal[sel])), col=pal[sel], labels=pal[sel])
#       pie(rep(1,length(pal[sel])), col=col2[sel], labels=col2[sel])
#       pie(rep(1,length(pal[sel])), col=col3[sel], labels=col3[sel])
#    }
#   return(list(line=pal[sel], fill=col2[sel], dot=col3[sel]))
# }


#debug(MAboxplot6)

MAboxplot7<-function(gene, array, limma.obj=NULL, classvec, ColObj=NULL,
                     alpha=0.8, dot.size=6, box.size=1, box.width=1,
                     reorder=NULL, stat.test="pairwiset", annotate=TRUE, p.value=0.05, sampleNames=NULL){
  classvec<-as.factor(classvec)
  if(is.null(ColObj)==TRUE){stop("Need ColObj")}
  line.cols<-ColObj@match$line
  dot.fill.cols<-ColObj@match$fill
  box.fill.cols<-ColObj@match$fill
  if(is.null(reorder)==FALSE){classvec<-factor(classvec,levels(classvec)[reorder])
  line.cols<-line.cols[reorder]
  dot.fill.cols<-dot.fill.cols[reorder]
  box.fill.cols<-box.fill.cols[reorder]
  }
  if(is.null(ColObj)==TRUE){classvec<-factor(classvec,levels(classvec)[reorder])
                              line.cols<-line.cols[reorder]
                              dot.fill.cols<-dot.fill.cols[reorder]
                              box.fill.cols<-box.fill.cols[reorder]
  }
  obj<-array[gene,]
  df<-data.frame(gp=classvec, y=obj)
  maxh <- max(df$y)
  minh<-min(df$y)
  spread<-(maxh-minh)/14
  maxh<-maxh+spread
  df$maxh<-maxh
  df$spread<-spread
  ds <- plyr::ddply(df, plyr::as.quoted("gp"), plyr::summarise, mean = mean(y), sd = sd(y))
  if(stat.test=="pairwiset"){
    stats<-pairwise.t.test(df$y, classvec, p.adjust="fdr")
  }
  if(stat.test=="limma"){
    stat.df<-data.frame(Comp1=as.factor(limma.obj[[5]]$Comp1), Comp2=as.factor(limma.obj[[5]]$Comp2), p.value=ExtractLIMMA(limma.obj, gene)$adj.P.Val, stringsAsFactors=FALSE)
    stat.df<-stats.table(stat.df)
    if(length(levels(classvec))==2){
      if(is.null(reorder)==FALSE){
        stat.df<-t(data.frame(stat.df[reorder,]))
        colnames(stat.df)<-levels(classvec)[reorder]
      }
      else{
        stat.df<-t(data.frame(stat.df))
      }
      rownames(stat.df)<-levels(classvec)[2]
    }
    else{
      if(is.null(reorder)==FALSE){stat.df<-stat.df[,reorder]
      }
      rownames(stat.df)<-levels(classvec)[order(levels(classvec))][2:length(levels(classvec))]
    }

    #stat.df[is.na(stat.df)]<-1
    stats<-list(p.value=stat.df)
    array.ind<-as.data.frame(which(stats$p.value < p.value, arr.ind=T))
    if(length(levels(classvec))==2){
      if(is.null(reorder)==TRUE){
        array.ind$row<-match(rownames(stat.df)[array.ind$row], levels(classvec))
      }
    }
    else{array.ind$row<-match(rownames(stat.df)[array.ind$row], levels(classvec))}
    rownames(array.ind)<-NULL
    colnames(array.ind)<-c("start","end")
    array.ind$y<-seq(from=maxh+0.5*(spread), by=spread/2, length.out=nrow(array.ind))
  }
  if(stat.test=="pairwiset"){
    array.ind<-as.data.frame(which(stats$p.value < p.value, arr.ind=T))
    rownames(array.ind)<-NULL
    array.ind$row<-array.ind$row+1
    colnames(array.ind)<-c("start","end")
    array.ind$y<-seq(from=maxh+0.5*(spread), by=spread/2, length.out=nrow(array.ind))
  }
  #add sampleNames to df
  if(length(sampleNames)!=0){
    df$sampleNames<-sampleNames
    g<-ggplot2::ggplot(df, ggplot2::aes(x = gp, y = y)) +
      ggplot2::geom_boxplot(size=box.size, alpha=0.6, fill=box.fill.cols, colour=line.cols, outlier.size=NULL, width=box.width) +
      ggplot2::geom_point(size=dot.size, shape=21, colour=line.cols[classvec], width=box.width, fill=dot.fill.cols[classvec], alpha=alpha, position = ggplot2::position_jitter(width = .1)) +
      ggplot2::geom_text(data=df, ggplot2::aes(x = gp, y = y, label=sampleNames), size = 3, hjust=-1) +
      ggplot2::labs(list(x = NULL, y = "Log2 Transformed Data", title=gene)) +
      #ylab(expression(paste("Log", [2], " Transformed Data", sep="")))+
      ggplot2::theme_bw() +
      ggplot2::theme(axis.text=ggplot2::element_text(size=16),
          axis.title.x=ggplot2::element_text(size=20, vjust=1),
          axis.text.x = ggplot2::element_text(angle = 45, hjust=1),
          axis.title.y=ggplot2::element_text(size=16, vjust=0.5), plot.title = ggplot2::element_text(vjust = 0, size=20),
          axis.line = ggpolt2::element_line(colour = "black"),
          #text=ggplot2::element_text(family="Myriad Pro"),
          panel.grid.major = ggpolt2::element_blank(),
          panel.grid.minor = ggpolt2::element_blank(),
          panel.border = ggpolt2::element_blank(),
          panel.background = ggpolt2::element_blank())
    if(nrow(array.ind)==0){
      print(g)
    }
    else
    {
      for(i in 1:nrow(array.ind)){
        g<-g+ggplot2::geom_segment(ggplot2::aes_string(x = array.ind$start[i], y = array.ind$y[i], xend = array.ind$end[i], yend=array.ind$y[i]), lwd=0.5,arrow = arrow(angle=90, ends="both", length = grid::unit(0.1, "cm")))
      }
    }
    print(g)
    footie1<-ifelse(stat.test=="limma", paste("Mod. Bayesian T statistic corrected using ", limma.obj[[6]]$p.adjust, sep=""), "Pairwise T Test, FDR-corrected")
    Footnote.txt<-paste("Horizontal bars indicate p <0.05 using ", footie1, sep="")
    makeFootnote(Footnote.txt,  color = "black")
  }
  else
  {
      g<-ggplot2::ggplot(df, ggplot2::aes(x = gp, y = y)) +
        ggplot2::geom_boxplot(size=box.size, alpha=0.6, fill=box.fill.cols, width=box.width, colour=line.cols, outlier.size=NULL) +
        ggplot2::geom_point(size=dot.size, shape=21, colour=line.cols[classvec], fill=dot.fill.cols[classvec], alpha=alpha, position = ggplot2::position_jitter(width = .1)) +
        ggplot2::labs(list(x = NULL, y = "Log2 Transformed Data", title=gene)) +
        #ylab(expression(paste("Log", [2], " Transformed Data", sep="")))+
        ggplot2::theme_bw() +
        ggplot2::theme(axis.text=ggplot2::element_text(size=16),
              axis.title.x=ggplot2::element_text(size=20, vjust=1),
              axis.text.x = ggplot2::element_text(angle = 45, hjust=1),
              axis.title.y=ggplot2::element_text(size=16, vjust=0.5), plot.title = ggplot2::element_text(vjust = 0, size=20),
              axis.line = ggplot2::element_line(colour = "black"),
              #text=ggplot2::element_text(family="Myriad Pro"),
              panel.grid.major = ggplot2::element_blank(),
              panel.grid.minor = ggplot2::element_blank(),
              panel.border = ggplot2::element_blank(),
              panel.background = ggplot2::element_blank())
      if(nrow(array.ind)==0){
      }
      else
      {
        for(i in 1:nrow(array.ind)){
          g<-g+ggplot2::geom_segment(ggplot2::aes_string(x = array.ind$start[i], y = array.ind$y[i], xend = array.ind$end[i], yend=array.ind$y[i]), lwd=0.5,arrow = ggplot2::arrow(angle=90, ends="both", length = grid::unit(0.1, "cm")))
        }
      }
      print(g)
      footie1<-ifelse(stat.test=="limma", paste("Mod. Bayesian T statistic corrected using ", limma.obj[[6]]$p.adjust, sep=""), "Pairwise T Test, FDR-corrected")
      Footnote.txt<-paste("Horizontal bars indicate p <0.05 using ", footie1, sep="")
      makeFootnote(Footnote.txt,  color = "black")
    }
}

# write a simple function to add footnote
makeFootnote <- function(footnoteText =
                           format(Sys.time(), "%d %b %Y"),
                         size = .7, color = grey(.5))
{
  grid::pushViewport(grid::viewport())
  grid::grid.text(label = footnoteText ,
            x = grid::unit(1,"npc") - grid::unit(2, "mm"),
            y = grid::unit(2, "mm"),
            just = c("right", "bottom"),
            gp = grid::gpar(cex = size, col = color))
  grid::popViewport()
}


# extractColor<-function(classvec.sel, cols.list, show="fill"){
#   selected<-levels(classvec.sel)
#   colmatch<-data.frame(names = cols.list$group[match(selected,cols.list$group)],
#                        line = cols.list$cols[match(selected,cols.list$group)],
#                        fill = cols.list$fill[match(selected,cols.list$group)], stringsAsFactors=FALSE)
#   colmatch.ord<-colmatch[order(colmatch$names),]
#   if(show=="fill"){
#   pie(rep(1,nrow(colmatch.ord)), col=colmatch.ord$fill, labels=colmatch.ord$names)}
#   else
#   {pie(rep(1,nrow(colmatch.ord)), col=colmatch.ord$line, labels=colmatch.ord$names)}
#   return(colmatch)
# }

SigLevel<-function(vector){
  return(sapply(vector, function(x) ifelse(x>0.001 && x<0.05, "*", ifelse(x<0.001, "**", "NS"))))
}

FindContrasts<-function(object){
  return(print(names(object[[3]])))
}
scfurl/probedeeper documentation built on May 29, 2019, 3:25 p.m.