R/probe2gene.R

Defines functions probe2gene

Documented in probe2gene

#' Transform Probe Set to Gene Level Data
#' 
#' Function to transform expression values from probe set to gene level data. If
#' genes are represented by several probe sets then their mean intensities are used.
#' Probe sets not matching any gene ids are removed.
#' @param expr_df data.frame with probe set level expression data
#' @param annot data.frame containing probe set id (in row name slot) to
#' gene entrez id (in first column) mapping information
#' @return data.frame with gene level expression values
#' @examples
#' expr_df <- data.frame(t1=runif(3), t2=runif(3), row.names=paste0("p", 1:3))
#' annot <- data.frame(ENTREZID=c("123","123","124"), 
#'                     SYMBOL=c("g1","g1","g2"),
#'                     row.names=paste0("p", 1:3))
#' gdf <- probe2gene(expr_df, annot)
#' @export
probe2gene <- function(expr_df, annot){
    myAnnot <- annot[as.character(annot[,"ENTREZID"]) != "NA",]
    expr_df <- expr_df[rownames(myAnnot),]
    idlist <- tapply(row.names(myAnnot), as.character(myAnnot$ENTREZID), c)
    gexpr_df <- t(sapply(names(idlist), function(x) colMeans(expr_df[idlist[[x]], ])))
    return(gexpr_df)
}
yduan004/signatureSearch_data documentation built on April 7, 2023, 5:02 a.m.