RNAs and Their Interactions

Documented in extrProtCTDD

#' CTD Descriptors - Distribution
#'
#' CTD Descriptors - Distribution
#' 
#' This function calculates the Distribution descriptor of the 
#' CTD descriptors (Dim: 105).
#' 
#' @param x A character vector, as the input protein sequence. 
#'
#' @return A length 105 named vector
#' 
#' @keywords extract CTD CTDD extrProtCTDD Composition
#'
#' @aliases extrProtCTDD
#' 
#' @author Min-feng Zhu <\email{wind2zhu@@163.com}>, 
#'         Nan Xiao <\url{http://r2s.name}>
#' 
#' @seealso See \code{\link{extrProtCTDC}} and \code{\link{extrProtCTDT}} 
#'          for Composition and Transition of the CTD descriptors.
#' 
#' @export extrProtCTDD
#' 
#' @references
#' Inna Dubchak, Ilya Muchink, Stephen R. Holbrook and Sung-Hou Kim. 
#' Prediction of protein folding class using global description of 
#' amino acid sequence. \emph{Proceedings of the National Academy of Sciences}. 
#' USA, 1995, 92, 8700-8704.
#' 
#' Inna Dubchak, Ilya Muchink, Christopher Mayor, Igor Dralyuk and Sung-Hou Kim.
#' Recognition of a Protein Fold in the Context of the SCOP classification. 
#' \emph{Proteins: Structure, Function and Genetics}, 1999, 35, 401-407.
#' 
#' @examples
#' x = readFASTA(system.file('protseq/P00750.fasta', package = 'BioMedR'))[[1]]
#' extrProtCTDD(x)
#' 

extrProtCTDD = function (x) {

    if (checkProt(x) == FALSE) stop('x has unrecognized amino acid type')

    group1 = list(hydrophobicity  = c('R', 'K', 'E', 'D', 'Q', 'N'),
                  normwaalsvolume = c('G', 'A', 'S', 'T', 'P', 'D', 'C'),
                  polarity        = c('L', 'I', 'F', 'W', 'C', 'M', 'V', 'Y'),
                  polarizability  = c('G', 'A', 'S', 'D', 'T'),
                  charge          = c('K', 'R'),
                  secondarystruct = c('E', 'A', 'L', 'M', 'Q', 'K', 'R', 'H'),
                  solventaccess   = c('A', 'L', 'F', 'C', 'G', 'I', 'V', 'W'))

    group2 = list(hydrophobicity  = c('G', 'A', 'S', 'T', 'P', 'H', 'Y'),
                  normwaalsvolume = c('N', 'V', 'E', 'Q', 'I', 'L'),
                  polarity        = c('P', 'A', 'T', 'G', 'S'),
                  polarizability  = c('C', 'P', 'N', 'V', 'E', 'Q', 'I', 'L'),
                  charge          = c('A', 'N', 'C', 'Q', 'G', 'H', 'I', 'L', 
                                      'M', 'F', 'P', 'S', 'T', 'W', 'Y', 'V'),
                  secondarystruct = c('V', 'I', 'Y', 'C', 'W', 'F', 'T'),
                  solventaccess   = c('R', 'K', 'Q', 'E', 'N', 'D'))

    group3 = list(hydrophobicity  = c('C', 'L', 'V', 'I', 'M', 'F', 'W'),
                  normwaalsvolume = c('M', 'H', 'K', 'F', 'R', 'Y', 'W'),
                  polarity        = c('H', 'Q', 'R', 'K', 'N', 'E', 'D'),
                  polarizability  = c('K', 'M', 'H', 'F', 'R', 'Y', 'W'),
                  charge          = c('D', 'E'),
                  secondarystruct = c('G', 'N', 'P', 'S', 'D'),
                  solventaccess   = c('M', 'S', 'P', 'T', 'H', 'Y'))

    xSplitted = strsplit(x, split = '')[[1]]
    n  = nchar(x)

    G = vector('list', 7)
    for (i in 1:7) G[[i]] = rep(NA, n)

    # Get groups for each property & each amino acid

    for (i in 1:7) {
        try(G[[i]][which(xSplitted %in% group1[[i]])] <- 'G1')
        try(G[[i]][which(xSplitted %in% group2[[i]])] <- 'G2')
        try(G[[i]][which(xSplitted %in% group3[[i]])] <- 'G3')
    }

    # Compute Distribution

    D = vector('list', 7)
    for (i in 1:7) D[[i]] = matrix(ncol = 5, nrow = 3)

    for (i in 1:7) {
        inds = which(G[[i]] == 'G1')
        D[[i]][1, ] = (inds[c(1, floor(length(inds) * c(0.25, 0.5, 0.75)), length(inds))])*100/n
        inds = which(G[[i]] == 'G2')
        D[[i]][2, ] = (inds[c(1, floor(length(inds) * c(0.25, 0.5, 0.75)), length(inds))])*100/n
        inds = which(G[[i]] == 'G3')
        D[[i]][3, ] = (inds[c(1, floor(length(inds) * c(0.25, 0.5, 0.75)), length(inds))])*100/n
    }

    D = do.call(rbind, D)
    D = as.vector(t(D))

    names(D) = paste(rep(paste('prop', 1:7, sep = ''), each = 15),
                     rep(rep(c('.G1', '.G2', '.G3'), each = 5), times = 7),
                     rep(paste('.residue', c('0', '25', '50', '75', '100'), 
                               sep = ''), times = 21), sep = '')

    return(D)

}

Any scripts or data that you put into this service are public.

BioMedR documentation built on Nov. 17, 2017, 10:08 a.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

BioMedR
Generating Various Molecular Representations for Chemicals, Proteins, DNAs/RNAs and Their Interactions

R/509-extractProtCTDD.R
In BioMedR: Generating Various Molecular Representations for Chemicals, Proteins, DNAs/RNAs and Their Interactions

Defines functions extrProtCTDD

Documented in extrProtCTDD

Try the BioMedR package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

BioMedR Generating Various Molecular Representations for Chemicals, Proteins, DNAs/RNAs and Their Interactions

R/509-extractProtCTDD.R In BioMedR: Generating Various Molecular Representations for Chemicals, Proteins, DNAs/RNAs and Their Interactions

Defines functions extrProtCTDD

Documented in extrProtCTDD

Try the BioMedR package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

BioMedR
Generating Various Molecular Representations for Chemicals, Proteins, DNAs/RNAs and Their Interactions

R/509-extractProtCTDD.R
In BioMedR: Generating Various Molecular Representations for Chemicals, Proteins, DNAs/RNAs and Their Interactions