R/string.R

Defines functions .String_from_string `*.String` `+.String` `[.String` print.String is.String as.String.default as.String String

Documented in as.String is.String String

## A simple string class.

String <-
function(x)
{
    .String_from_string(as.character(x)[[1L]])
}

## Note subscripting by [[: this insists on the first element, and
## hence gives an error instead of NA_character_ if there is none.

as.String <-
function(x)
    UseMethod("as.String")

as.String.String <- identity

as.String.default <-
function(x)
    String(paste(x, collapse = "\n"))

is.String <-
function(x)
    inherits(x, "String")

print.String <-
function(x, ...)
    writeLines(x)

## Provide a '[' method performing slicing (as we cannot provide S3
## methods for substr, and clearly substrings of strings should be
## strings.

## Note that we have no distinction between spans and span arrays (same
## issue as having no distinction between strings and string arrays in
## base R).  Hence, we take spans to always operate in an array context
## (for now: we could add a drop = FALSE argument to have subscripting
## turn character vectors of length one back to strings again).

`[.String` <-
function(x, i, j)
{
    mysubstring <- function(x, i, j) {
        ## substring() recycles to max length of args only when this is
        ## positive.
        if(!length(i))
            character()
        else
            substring(x, i, j)
    }

    if(missing(j)) {
        if(is.Span(i))
            return(mysubstring(x, i$start, i$end))
        if(is.list(i)) {
            if(!length(i))
                return(list())
            else if(all(vapply(i, is.Span, NA))) 
                return(lapply(i,
                              function(e)
                                  mysubstring(x, e$start, e$end)))
        }
    }
    ## Regular slicing operators in a scalar context.
    String(substr(x, i, j))
}

## More methods?
##
## A popular mailing list discussion item is to use a Java style '+'
## operator for concatenating strings (not uniformly liked as the
## corresponding operation is not commutative):

`+.String` <-
function(e1, e2)
    .String_from_string(paste0(as.String(e1), as.String(e2)))

## Also provide Python-style string repetition.

`*.String` <-
function(e1, e2)
{
    if(is.numeric(e1) && (length(e1) == 1L))
        .String_from_string(paste(rep.int(e2, e1), collapse = ""))
    else if(is.numeric(e2) && (length(e2) == 1L))
        .String_from_string(paste(rep.int(e1, e2), collapse = ""))
    else
        stop("Invalid operands.")
}

## What about c.String?

.String_from_string <-
function(x)
{
    y <- enc2utf8(x)
    class(y) <- "String"
    y
}

Try the NLP package in your browser

Any scripts or data that you put into this service are public.

NLP documentation built on Oct. 23, 2020, 6:18 p.m.