inst/doc/tm.plugin.koRpus_vignette.R

## ----setup, include=FALSE-------------------------------------------------------------------------
header_con <- file("vignette_header.html")
writeLines('<meta name="flattr:id" content="4zdzgd" />', header_con)
close(header_con)

## ---- include=FALSE, cache=FALSE------------------------------------------------------------------
# load knitr for better graphics support
library(knitr)

## ---- eval=FALSE----------------------------------------------------------------------------------
#  library(tm.plugin.koRpus)
#  library(koRpus.lang.de)
#  # set the root path to the sample files
#  sampleRoot <- file.path(path.package("tm.plugin.koRpus"), "tests", "testthat", "samples")
#  # the next call uses "hierarchy" to describe the directory structure
#  # and its meaning; see below
#  sampleTexts <- readCorpus(
#    dir=sampleRoot,
#    hierarchy=list(
#      Topic=c(
#        C3S="C3S SCE",
#        GEMA="GEMA e.V."
#      ),
#      Source=c(
#        Wikipedia_alt="Wikipedia (alt)",
#        Wikipedia_neu="Wikipedia (neu)"
#      )
#    ),
#    tagger="tokenize",
#    lang="de"
#  )

## ---- eval=FALSE----------------------------------------------------------------------------------
#  sampleTexts <- lex.div(sampleTexts)
#  corpusSummary(sampleTexts)

## ---- eval=FALSE----------------------------------------------------------------------------------
#  library(sciplot)
#  lineplot.CI(
#    x.factor=corpusSummary(sampleTexts)[["Source"]],
#    response=corpusSummary(sampleTexts)[["MTLD"]],
#    group=corpusSummary(sampleTexts)[["Topic"]],
#    type="l",
#    main="MTLD",
#    xlab="Media source",
#    ylab="Lexical diversity score",
#    col=c("grey", "black"),
#    lwd=2
#  )

## ---- eval=FALSE----------------------------------------------------------------------------------
#  sampleTexts <- read.corp.custom(sampleTexts, case.sens=FALSE)
#  sampleTextsWordFreq <- query(
#    corpusCorpFreq(sampleTexts),
#    var="wclass",
#    query=kRp.POS.tags(lang="de", list.classes=TRUE, tags="words")
#  )
#  head(sampleTextsWordFreq, 10)

## ---- eval=FALSE----------------------------------------------------------------------------------
#  require(wordcloud)
#  colors <- brewer.pal(8, "RdGy")
#  wordcloud(
#    head(sampleTextsWordFreq[["word"]], 200),
#    head(sampleTextsWordFreq[["freq"]], 200),
#    random.color=TRUE,
#    colors=colors
#  )
unDocUMeantIt/tm.plugin.koRpus documentation built on May 21, 2021, 9:27 p.m.