Nothing
## Chinese Word Segmentation
.onLoad <- function(libname, pkgname) {
rJava:::.jpackage(pkgname, lib.loc=libname)
## must use full access of :::
}
mmseg4j <- function (text, method = c("complex", "maxword", "simple"), dicDir = NULL)
{
## the plugins are from http://code.google.com/p/mmseg4j/
## this segmentation softeware seems most useful
## .jinit(system.file("java","Rmmseg4j.jar",package="rmmseg4j"), force.init = TRUE)
method = match.arg(method)
oriClass <- class(text)
if ( !inherits(text, "character") ) stop ("text should be character vector")
N <- length(text)
Rval <- vector(mode = "character", length = N)
if (method == "complex") mmseg <- .jnew("Rmmseg4j/RmmsegComplex")
if (method=="maxword") mmseg <- .jnew("Rmmseg4j/RmmsegMaxWord")
if (method=="simple") mmseg <- .jnew("Rmmseg4j/RmmsegSimple")
if (!is.null(dicDir)) {
mmseg$resetDefaultDicPath(dicDir)
} else {
mmseg$resetDefaultDicPath(file.path(system.file(package = "rmmseg4j"), "userDic"))
}
if (isTRUE(mmseg$needReload())) {
succeeded <- mmseg$reloadDic()
if (!succeeded) warning("Fail to reload the changed dictionary")
}
## automatically examine the status of dic, reload if changed
for (i in seq_len(N)) {
Val <- mmseg$segWords(text[i], " ")
Encoding(Val) <- "UTF-8"
Rval[i] <- Val
}
class(Rval) <- oriClass
Rval
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.