# audubon: Japanese Text Processing Tools

# Load the fixture bundle from the installed audubon package. Note that the
# file carries an `.rda` extension but is read with readRDS().
testdata <-
  system.file("testdata/testdata.rda", package = "audubon") |>
  readRDS()

# The "raw_counts" element is the input passed to bind_tf_idf2() in the tests.
tbl <- testdata[["raw_counts"]]

### tf*idf ----
test_that("tf*idf works", {
  weighted <- bind_tf_idf2(tbl, tf = "tf", idf = "idf")
  # tf_idf is set to n * idf here, replacing whatever bind_tf_idf2() produced.
  # NOTE(review): presumably the stored fixture is based on raw counts --
  # confirm against how testdata[["tf*idf"]] was generated.
  weighted <- dplyr::mutate(weighted, tf_idf = n * idf)

  # Keep only the compared columns and put rows in a deterministic order.
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )
  expected <- dplyr::arrange(testdata[["tf*idf"]], doc_id, token, tf_idf)

  expect_equal(actual, expected)
})

### tf2*idf ----
test_that("tf2*idf works", {
  weighted <- bind_tf_idf2(tbl, tf = "tf2", idf = "idf")

  # Keep only the compared columns and put rows in a deterministic order.
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )
  expected <- dplyr::arrange(testdata[["tf2*idf"]], doc_id, token, tf_idf)

  expect_equal(actual, expected)
})

### tf2*idf2 ----
test_that("tf2*idf2 works", {
  weighted <- bind_tf_idf2(tbl, tf = "tf2", idf = "idf2")

  # Keep only the compared columns and put rows in a deterministic order.
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )
  expected <- dplyr::arrange(testdata[["tf2*idf2"]], doc_id, token, tf_idf)

  expect_equal(actual, expected)
})

### tf3*idf ----
test_that("tf3*idf works", {
  weighted <- bind_tf_idf2(tbl, tf = "tf3", idf = "idf")

  # Keep only the compared columns and put rows in a deterministic order.
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )
  expected <- dplyr::arrange(testdata[["tf3*idf"]], doc_id, token, tf_idf)

  expect_equal(actual, expected)
})

### tf2*idf3 ----
test_that("tf2*idf3 works", {
  weighted <- bind_tf_idf2(tbl, tf = "tf2", idf = "idf3")

  # Keep only the compared columns and put rows in a deterministic order.
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )
  expected <- dplyr::arrange(testdata[["tf2*idf3"]], doc_id, token, tf_idf)

  expect_equal(actual, expected)
})

### tf2*idf4 ----
test_that("tf2*idf4 works", {
  weighted <- bind_tf_idf2(tbl, tf = "tf2", idf = "idf4")

  # Keep only the compared columns and put rows in a deterministic order.
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )
  expected <- dplyr::arrange(testdata[["tf2*idf4"]], doc_id, token, tf_idf)

  expect_equal(actual, expected)
})

### tf*idf*norm ----
test_that("tf*idf*norm works", {
  # Same tf/idf choice as the plain "tf*idf" case, but with norm = TRUE.
  weighted <- bind_tf_idf2(tbl, tf = "tf", idf = "idf", norm = TRUE)

  # Keep only the compared columns and put rows in a deterministic order.
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )
  expected <- dplyr::arrange(testdata[["tf*idf*norm"]], doc_id, token, tf_idf)

  expect_equal(actual, expected)
})

paithiov909/audubon documentation built on June 2, 2025, 1:15 a.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

paithiov909/audubon
Japanese Text Processing Tools

tests/testthat/test-bind_tf_idf2.R
In paithiov909/audubon: Japanese Text Processing Tools

R Package Documentation

Browse R Packages

We want your feedback!

paithiov909/audubon Japanese Text Processing Tools

tests/testthat/test-bind_tf_idf2.R In paithiov909/audubon: Japanese Text Processing Tools

R Package Documentation

Browse R Packages

We want your feedback!

paithiov909/audubon
Japanese Text Processing Tools

tests/testthat/test-bind_tf_idf2.R
In paithiov909/audubon: Japanese Text Processing Tools