R/data.R

#' a data.frame of gene expression data
#'
#' It is a randomly generated expression data 
#' used as an example of functions in this package.
#' the rowname is gene symbols
#' the columns are gene expression values
#'
#' @format A data.frame with 10779 rows and 2 column
#'
"geneExpress"

# ' a matrix for Converting gene symbol to entrez_id or ensembl_gene_id
# '
# ' the hgnc data comes from HGNC website
# ' the columns represent "symbol", "locus_group", "locus_type", 
# ' "entrez_id" and "ensembl_gene_id"
# '
# ' @format A matrix with 37647 rows and 5 column
# '
"hgnc"

#' a matrix of gene expression data in TCGA
#'
#' It is a randomly generated expression data 
#' used as an example of functions in this package.
#' the first column represents the gene symbol
#'
#' the other columns represent the expression(FPKM) of genes
#'
#' @format A matrix with 10 rows and 10 column
#'
"profile"

#' a matrix of gene expression data in GEO
#'
#' It is a randomly generated expression data 
#' used as an example of functions in this package.
#' the first column represents the gene symbol
#'
#' the other columns represent the expression of genes
#'
#' @format A matrix with 32 rows and 20 column
#'
"ventricle"

#' a matrix of gene expression data in TCGA
#'
#' It is a randomly generated expression data 
#' used as an example of functions in this package.
#' the first column represents the gene symbol
#'
#' the other columns represent the expression(count) of genes
#'
#' @format A matrix with 100 rows and 150 column
#'
"kegg_liver"

#' a matrix of gene expression data in GEO
#'
#' the first column represents the gene symbol
#'
#' the other columns represent the expression of genes
#'
#' @format A matrix with 999 rows and 3 column
#'
"GSE66705_sample2"

#' a matrix of module name, gene symbols, and the number of gene symbols
#'
#' It is a randomly generated expression data 
#' used as an example of functions in this package.
#' @format A matrix with 176 rows and 3 column
#'
"module"


# ' a matrix for Converting gene symbol.
# ' 
# ' the hgnc data comes from HGNC website
# '
# ' @format A matrix with 43547 rows and 52 column
# '
"hgnc_file"


#' a data.frame of gene length and GC content
#'
#' the gene length and GC content data comes from 
#' TxDb.Hsapiens.UCSC.hg38.knownGene and
#' BSgenome.Hsapiens.UCSC.hg38
#'
#' @format A data.frame with 27341 rows and 2 column
#'
"gene_cov"
huerqiang/GeoTcgaData documentation built on March 21, 2024, 1:42 a.m.