R/readXStringColumns.R

Defines functions readXStringColumns

Documented in readXStringColumns

readXStringColumns <-
    function(dirPath, pattern=character(0), 
             colClasses=list(NULL), nrows=-1L, skip=0L,
             sep="\t", header=FALSE, comment.char="#")
{
    if (!is.list(colClasses))
        .arg_mismatch_type_err("colClasses", "list()")
    colIndex <- which(!sapply(colClasses, is.null))
    colClasses <- sub("Set$", "", colClasses[colIndex])
    okClasses <- names(slot(getClass("XString"), "subclasses"))
    if (!all(colClasses %in% okClasses)) {
        bad <- colClasses[!colClasses %in% okClasses]
        .throw(SRError("UserArgumentMismatch",
                       "'colClasses' contains invalid class%s '%s';\n  must be one of '%s'",
                       if (length(colClasses)>1) "es" else "",
                       paste(bad, collapse="' '"),
                       paste(okClasses, collapse="', '")))
    }
    files <- .file_names(dirPath, pattern)
    res <- tryCatch({

        .Call(.read_XStringSet_columns, files, header, sep, colIndex,
              colClasses, as.integer(nrows), as.integer(skip),
              comment.char)

    }, error=function(err) {
        .throw(SRError("Input/Output",
                       "while reading files '%s':\n    %s",
                       paste(basename(files), collapse=", "),
                       conditionMessage(err)))
    })
    if (header) {
        gz <- gzfile(files[[1]]); open(gz)
        tryCatch({
            ln <- readLines(gz, skip+1)[skip+1]
        }, finally=close(gz))
        nms <- strsplit(ln, sep)[[1]]
        names(res) <- nms[colIndex]
    } else {
        names(res) <- names(colIndex)
    }
    res
}
Bioconductor/ShortRead documentation built on May 5, 2024, 4:14 a.m.