## Nothing
### ceeboo 2008
library("tau")
## Tabulate a named count vector for display.
##
## x: a named vector of counts.
## Returns a data.frame with one row per element of x and the columns
##   counts   - the values of x,
##   bytes    - the length in bytes of each name (allowNA = TRUE, so a name
##              that cannot be measured yields NA instead of an error),
##   encoding - the declared encoding mark of each name.
.format.count <- function(x) {
    keys <- names(x)
    data.frame(
        counts = x,
        bytes = nchar(keys, type = "bytes", allowNA = TRUE),
        encoding = Encoding(keys),
        stringsAsFactors = FALSE
    )
}
## Test fixture: a plain ASCII string, a string holding a non-ASCII Latin-1
## byte, the empty string, and a missing value.
## "\xc4" is LATIN CAPITAL LETTER A WITH DIAERESIS in Latin-1.
t1 <- c("abc", "a\xc4", "", NA)
## Declare the encodings explicitly: only the second element is marked
## "latin1"; the remaining elements carry no declared encoding ("unknown").
Encoding(t1) <- c("unknown", "latin1", "unknown", "unknown")
t1
## Wrap the two non-empty strings in "_" markers. The empty string and NA are
## appended as they are; pasting NA would turn it into the string "NA".
t2 <- c(paste0("_", t1[1:2], "_"), t1[3:4])
t2
## count n-grams
## Calls tau's internal native n-gram routine directly (via `:::`) on the
## marker-wrapped strings in t2, then tabulates the returned counts.
## NOTE(review): the values after the input list presumably correspond to
## (n, lower, verbose, persistent, useBytes) as in tau::textcnt -- confirm
## against the package source.
r <- .Call(tau:::tau_utf8CountNgram, list(t2), 3L, 0L, TRUE, FALSE, FALSE)
.format.count(r)
## incremental
## Same input, but split into two calls: the first has the fifth value after
## the routine set to TRUE and its result is not stored; the second has it
## FALSE again and its result is tabulated.
## NOTE(review): presumably the first call keeps its counts in native state
## and the second call adds to them and returns the total -- confirm. The
## order of these two calls must not be changed.
.Call(tau:::tau_utf8CountNgram, list(t2), 3L, 0L, TRUE, TRUE, FALSE)
r <- .Call(tau:::tau_utf8CountNgram, list(t2), 3L, 0L, TRUE, FALSE, FALSE)
.format.count(r)
## count strings
## Calls tau's internal native string-counting routine directly (via `:::`)
## on the raw strings in t1 and tabulates the result. The sections below
## differ only in the fourth value after the routine (0L, 1L, 2L, 3L).
## NOTE(review): the values after the input list presumably correspond to
## (n, lower, type, verbose, persistent, useBytes) -- confirm against the
## package source.
r <- .Call(tau:::tau_utf8CountString, list(t1), 3L, 0L, 0L, TRUE, FALSE, FALSE)
.format.count(r)
## count prefixes (fourth value 1L)
r <- .Call(tau:::tau_utf8CountString, list(t1), 3L, 0L, 1L, TRUE, FALSE, FALSE)
.format.count(r)
## count suffixes (fourth value 2L)
r <- .Call(tau:::tau_utf8CountString, list(t1), 3L, 0L, 2L, TRUE, FALSE, FALSE)
.format.count(r)
## FIXME add to interface
## Fourth value 3L: what this mode counts is not evident from this script.
r <- .Call(tau:::tau_utf8CountString, list(t1), 3L, 0L, 3L, TRUE, FALSE, FALSE)
.format.count(r)
## incremental
## Same as "count strings" (fourth value 0L), but split into two calls: the
## first has the sixth value after the routine set to TRUE and its result is
## not stored; the second has it FALSE again and its result is tabulated.
## NOTE(review): presumably the first call keeps its counts in native state
## and the second call adds to them and returns the total -- confirm. The
## order of these two calls must not be changed.
.Call(tau:::tau_utf8CountString, list(t1), 3L, 0L, 0L, TRUE, TRUE, FALSE)
r <- .Call(tau:::tau_utf8CountString, list(t1), 3L, 0L, 0L, TRUE, FALSE, FALSE)
.format.count(r)
###
## Any scripts or data that you put into this service are public.
## Add the following code to your website.
## For more information on customizing the embed code, read Embedding Snippets.