R/TCGA_id_conversion.R

Defines functions id_conversion

Documented in id_conversion

#' Convert  ENSEMBL gene id to gene Symbol in TCGA
#'
#' @param profiles a data.frame
#' @param toType one of 'keytypes(org.Hs.eg.db)'
#'
#' @return a data.frame, gene symbols and their expression value
#' @export
#'
#' @examples
#' \dontrun{
#' library(org.Hs.eg.db)
#' profile <- GeoTcgaData::profile
#' result <- id_conversion(profile)
#' }
id_conversion <- function(profiles, toType = "SYMBOL"){  
    # rownames(profiles) <- unlist(lapply(rownames(profiles), function(x) unlist(strsplit(x,"\\."))[1]))
    # file3 <- hgnc
    # rownames(file3)<-file3[,5]
    # genes <- intersect(rownames(profiles), file3[,5])
    # mat <- file3[genes, c(1,5)]
    # profiles_new <- profiles[mat[,2],]
    # rownames(profiles_new) <- mat[,1]
    # profiles_new
    ## use clusterProfiler::bitr to convert gene id
    # rownames(profiles) <- unlist(lapply(rownames(profiles), function(x) unlist(strsplit(x,"\\."))[1]))
    rownames(profiles) <- gsub("\\..*", "", rownames(profiles))
    genes <- clusterProfiler::bitr(rownames(profiles), fromType = "ENSEMBL", 
        toType = toType, OrgDb = org.Hs.eg.db::org.Hs.eg.db, drop = FALSE)
    	
    genes <- genes[!duplicated(genes[, 1]), ]
    rownames(genes) <- genes[, 1]
    profiles2 <- as.matrix(profiles)
    rownames(profiles2) <- genes[rownames(profiles), 2]
    return(profiles2)
}

Try the GeoTcgaData package in your browser

Any scripts or data that you put into this service are public.

GeoTcgaData documentation built on Sept. 23, 2022, 9:05 a.m.