R/bedgraph.R

#' Get bedgraph from methylRaw, methylRawList and methylDiff objects
#'
#' The function converts \code{\link{methylRaw}}, \code{\link{methylRawDB}}, 
#' \code{\link{methylRawList}}, 
#' \code{\link{methylRawListDB}}, \code{\link{methylDiff}} or 
#' \code{\link{methylDiffDB}} object 
#' into a bedgraph format. It either writes as a file or returns a \code{data.frame}
#' @param methylObj a \code{\link{methylRaw}}, \code{\link{methylRawDB}}, 
#' \code{\link{methylRawList}}, 
#'                  \code{\link{methylRawListDB}}, \code{\link{methylDiff}} 
#'                  or \code{\link{methylDiffDB}} object
#' @param file.name  Default: NULL. if a string is given a bedgraph file will
#'  be written, if NULL a data.frame or a list of data frames will be returned
#' @param col.name   name of the column in \code{\link{methylRaw}}, 
#' \code{\link{methylRawDB}}, \code{\link{methylRawList}}, 
#'                  \code{\link{methylRawListDB}}, \code{\link{methylDiff}} 
#'                  or \code{\link{methylDiffDB}} objects to be used as a score
#'                   for the bedgraph.
#'                   For \code{methylDiff} or \code{methylDiffDB}, \code{col.name}
#'                    must be one of the following 'pvalue','qvalue', 
#'                    'meth.diff'. For \code{methylRaw}, 
#'                   \code{methylRawDB}, \code{methylRawList} and 
#'                   \code{methylRawListDB} it must be one of the following 
#'                   'coverage', 'numCs','numTs', 'perc.meth'
#' @param unmeth     when working with \code{methylRaw}, \code{methylRawDB}, 
#' \code{methylRawList} and \code{methylRawListDB} objects should you output 
#' unmethylated C percentage
#'                   this makes it easier to see the unmethylated bases because 
#'                   their methylation percentage values will be zero. Only 
#'                   invoked when file.name is not NULL.
#' @param log.transform Default FALSE, If TRUE the score column of the bedgraph 
#' wil be in log10 scale. Ignored when col.name='perc.meth'
#' @param negative Default FALSE, If TRUE, the score column of the bedgraph will
#'  be multiplied by -1. Ignored when col.name='perc.meth'
#' @param add.on additional string to be add on the track line of bedgraph. 
#' can be viewlimits,priority etc. Check bedgraph track line options at UCSC browser
#' @param chunk.size Number of rows to be taken as a chunk for processing the 
#' \code{methylRawDB}, \code{methylRawListDB} or \code{methylDiffDB} objects, 
#' default: 1e6
#'
#' @return Returns a \code{data.frame} or list of data.frames if
#'  \code{file.name=NULL}, if a file.name given appropriate bed file 
#'  will be written to that file
#' @examples
#' data(methylKit)
#' 
#' # getting a bedgraph file from a methylDiff object containing differential 
#' # methylation percentages
#' bedgraph(methylDiff.obj, file.name="test.bed", col.name="meth.diff", 
#'          unmeth=FALSE,log.transform=FALSE,negative=FALSE,add.on="")
#' 
#' # remove the file
#' unlink("test.bed")
#' 
#' # getting a bedgraph file from a methylBase object containing percent 
#' #methylation values
#' bedgraph(methylRawList.obj[[1]], file.name="test2.bed", col.name="perc.meth", 
#'          unmeth=FALSE,log.transform=FALSE,negative=FALSE,add.on="")
#' 
#' unlink("test2.bed") # remove the file
#' 
#' @section Details:
#' The parameter \code{chunk.size} is only used when working with 
#' \code{methylRawDB}, \code{methylRawListDB} or \code{methylDiffDB} objects, 
#' as they are read in chunk by chunk to enable processing large-sized objects
#'  which are stored as flat file database.
#' Per default the chunk.size is set to 1M rows, which should work for
#'  most systems. If you encounter memory problems or 
#' have a high amount of memory available feel free to adjust the 
#' \code{chunk.size}.
#' 
#' @export
#' @docType methods
#' @rdname bedgraph-methods
setGeneric("bedgraph", function(methylObj,file.name=NULL,col.name,unmeth=FALSE,
                                log.transform=FALSE,
                                negative=FALSE,add.on="",chunk.size=1e6) 
  standardGeneric("bedgraph") )


#' @rdname bedgraph-methods
#' @aliases bedgraph,methylDiff-method
setMethod("bedgraph", signature(methylObj="methylDiff"),
                    function(methylObj,file.name,col.name,unmeth,
                             log.transform,negative,add.on){

  if(! col.name %in% c('pvalue','qvalue', 'meth.diff') )
  {
    stop("col.name argument is not one of 'pvalue','qvalue', 'meth.diff'")
  }
  mdata=getData(methylObj)
  df=data.frame(chr=mdata$chr,
                start=mdata$start-1,
                end=mdata$end )
  df=cbind(df, score=mdata[col.name] )
  if(log.transform){
    df[,4]=log10(df[,4])
  }
  if(negative){
    df[,4]=-1*(df[,4])
  }
  
  if(is.null(file.name)){
    return(df)
  }else{
    track.line=paste(
    "track type=bedGraph name='",file.name,"' description='",col.name,
    "' visibility=full color=255,0,255 altColor=102,205,170 maxHeightPixels=80:80:11 ",
    add.on,sep="")
    
    cat(track.line,"\n",file=file.name)
    defsci=options()$scipen
    options(scipen = 999)
    write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                row.names=FALSE,sep="\t",append=TRUE)
    options(scipen = defsci)
  }
  
}
)

#' @rdname bedgraph-methods
#' @aliases bedgraph,methylRaw-method
setMethod("bedgraph", signature(methylObj="methylRaw"),
                    function(methylObj,file.name,col.name,unmeth,log.transform,
                             negative,add.on){
  if(!col.name %in%  c('coverage', 'numCs','numTs','perc.meth') ){
    stop("col.name argument is not one of 'coverage', 'numCs','numTs','perc.meth'")
  }
  mdata=getData(methylObj)
  df=data.frame(chr=mdata$chr,
                start=(mdata$start)-1,
                end=(mdata$end),stringsAsFactors=FALSE )
  if(col.name=="perc.meth"){
    df=cbind(df, score=100*mdata$numCs/mdata$coverage )
  }else{
    df=cbind(df, score=mdata[col.name] )
    if(log.transform){
      df[,4]=log10(df[,4])
    }
    if(negative){
      df[,4]=-1*(df[,4])
    }
  }
  
  if(is.null(file.name)){
    return(df)
  }else{
    defsci=options()$scipen
    options(scipen = 999)
    if(unmeth & col.name=="perc.meth")
    {
      track.line=paste(
          "track type=bedGraph name='",methylObj@sample.id,
          " METH Cs","' description='",methylObj@sample.id," METH Cs",
          "' visibility=full color=255,0,0 maxHeightPixels=80:80:11 ",
          add.on,sep="")                        
      cat(track.line,"\n",file=file.name)
      write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                  row.names=FALSE,sep="\t",append=TRUE)
      track.line2=paste(
          "track type=bedGraph name='",methylObj@sample.id,
          " UNMETH Cs","' description='",methylObj@sample.id," UNMETH Cs",
          "' visibility=full color=0,0,255 maxHeightPixels=80:80:11 ",
          add.on,sep="")
      cat(track.line2,"\n",file=file.name,append=TRUE)
      df[,4]=100-df[,4]
      write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                  row.names=FALSE,sep="\t",append=TRUE)
      
    }else{
      
    
      track.line=paste(
          "track type=bedGraph name='",methylObj@sample.id,col.name,
          "' description='",methylObj@sample.id,col.name,
          "' visibility=full color=255,0,0 maxHeightPixels=80:80:11 ",add.on,sep="")                        
      cat(track.line,"\n",file=file.name)
      
      
      write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                  row.names=FALSE,sep="\t",append=TRUE)
      
    }
    options(scipen = defsci)
  }
   
                        
}

)


#' @rdname bedgraph-methods
#' @aliases bedgraph,methylRawList-method
setMethod("bedgraph", signature(methylObj="methylRawList"),
                    function(methylObj,file.name,col.name,unmeth,
                             log.transform,negative,add.on){
      if(!col.name %in%  c('coverage', 'numCs','numTs','perc.meth') ){
        stop("col.name argument is not one of 'coverage', 'numCs','numTs',
             'perc.meth' options")
      }
      
      if( is.null(file.name) ){
        
        result=list()
        for(i in 1:length(methylObj))
        {
          result[[ methylObj[[i]]@sample.id ]]=bedgraph(methylObj[[i]],
                                                        file.name=NULL,
                                                   col.name=col.name,
                                                   unmeth=FALSE,
                                                   log.transform=log.transform,
                                                   negative=negative)
        }
        
        return(result)
      }else{
        defsci=options()$scipen
        options(scipen = 999)
        if(unmeth & col.name=="perc.meth")
        {
          
          df=bedgraph(methylObj[[1]],file.name=NULL,col.name=col.name,
                      unmeth=FALSE,log.transform=log.transform,
                                                   negative=negative)
          track.line=paste(
              "track type=bedGraph name='",methylObj[[1]]@sample.id,
              " METH Cs","' description='",methylObj[[1]]@sample.id," METH Cs",
              "' visibility=full color=255,0,0 maxHeightPixels=80:80:11 ",
              add.on,sep="")                        
          cat(track.line,"\n",file=file.name)
          write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                      row.names=FALSE,sep="\t",append=TRUE)
          track.line2=paste(
              "track type=bedGraph name='",methylObj[[1]]@sample.id,
              " UNMETH Cs","' description='",methylObj[[1]]@sample.id,
              " UNMETH Cs",
              "' visibility=full color=0,0,255 maxHeightPixels=80:80:11 ",
              add.on,sep="")
          cat(track.line2,"\n",file=file.name,append=TRUE)
          df[,4]=100-df[,4]
          write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                      row.names=FALSE,sep="\t",append=TRUE)

          
          for(i in 2:length(methylObj))
          {
            df=bedgraph(methylObj[[i]],file.name=NULL,col.name=col.name,
                        unmeth=FALSE,log.transform=log.transform,
                                                   negative=negative)
            track.line=paste(
              "track type=bedGraph name='",methylObj[[i]]@sample.id,
              " METH Cs","' description='",methylObj[[i]]@sample.id," METH Cs",
              "' visibility=full color=255,0,0 maxHeightPixels=80:80:11 ",
              add.on,sep="")                        
            cat(track.line,"\n",file=file.name,append=TRUE)
            write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                        row.names=FALSE,sep="\t",append=TRUE)
            track.line2=paste(
              "track type=bedGraph name='",methylObj[[i]]@sample.id,
              " UNMETH Cs","' description='",methylObj[[i]]@sample.id," UNMETH Cs",
              "' visibility=full color=0,0,255 maxHeightPixels=80:80:11 ",
              add.on,sep="")
            cat(track.line2,"\n",file=file.name,append=TRUE)
            df[,4]=100-df[,4]
            write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                        row.names=FALSE,sep="\t",append=TRUE)

          }
        }else{
          df=bedgraph(methylObj[[1]],file.name=NULL,col.name=col.name,
                      unmeth=FALSE,log.transform=log.transform,
                      negative=negative)
          track.line=paste(
              "track type=bedGraph name='",methylObj[[1]]@sample.id,col.name,
              "' description='",methylObj[[1]]@sample.id,col.name,
              "' visibility=full color=255,0,0 maxHeightPixels=80:80:11 ",
              add.on,sep="")                        
          cat(track.line,"\n",file=file.name)
          write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                      row.names=FALSE,sep="\t",append=TRUE)
          for(i in 2:length(methylObj))
          {
            df=bedgraph(methylObj[[i]],file.name=NULL,
                                                   col.name=col.name,
                        unmeth=FALSE,log.transform=log.transform,
                                                   negative=negative)
            track.line=paste(
              "track type=bedGraph name='",methylObj[[i]]@sample.id,col.name,
              "' description='",methylObj[[i]]@sample.id,col.name,
              "' visibility=full color=255,0,0 maxHeightPixels=80:80:11 ",
              add.on,sep="")                        
            cat(track.line,"\n",file=file.name,append=TRUE)
            write.table(df,file=file.name,quote=FALSE,col.names=FALSE,
                        row.names=FALSE,sep="\t",append=TRUE)
          
          
        }

        
        
      }
      
      options(scipen = defsci)
  }
})
 
qizhengyang2017/methylKit_1.8.1 documentation built on May 5, 2019, 7:58 p.m.