# Shared fixture for every test in this file: a list read from the RDS file
# shipped under testdata/ in the gibasa package.
testdata <-
  system.file("testdata/testdata.rda", package = "gibasa") |>
  readRDS()

# Input table passed to bind_tf_idf2() in each test below.
df <- testdata[["raw_counts"]]
### tf*idf ----
test_that("tf*idf works", {
  weighted <- bind_tf_idf2(df, tf = "tf", idf = "idf")
  # tf_idf is overwritten with n * idf before comparing.
  # NOTE(review): presumably the fixture stores count-based weights; confirm.
  weighted <- dplyr::mutate(weighted, tf_idf = n * idf)
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )

  # Both sides are sorted by the same keys before the comparison.
  expected <- dplyr::arrange(testdata[["tf*idf"]], doc_id, token, tf_idf)
  expect_equal(actual, expected)
})
### tf2*idf ----
test_that("tf2*idf works", {
  weighted <- bind_tf_idf2(df, tf = "tf2", idf = "idf")
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )

  # Both sides are sorted by the same keys before the comparison.
  expected <- dplyr::arrange(testdata[["tf2*idf"]], doc_id, token, tf_idf)
  expect_equal(actual, expected)
})
### tf2*idf2 ----
test_that("tf2*idf2 works", {
  weighted <- bind_tf_idf2(df, tf = "tf2", idf = "idf2")
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )

  # Both sides are sorted by the same keys before the comparison.
  expected <- dplyr::arrange(testdata[["tf2*idf2"]], doc_id, token, tf_idf)
  expect_equal(actual, expected)
})
### tf3*idf ----
test_that("tf3*idf works", {
  weighted <- bind_tf_idf2(df, tf = "tf3", idf = "idf")
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )

  # Both sides are sorted by the same keys before the comparison.
  expected <- dplyr::arrange(testdata[["tf3*idf"]], doc_id, token, tf_idf)
  expect_equal(actual, expected)
})
### tf2*idf3 ----
test_that("tf2*idf3 works", {
  weighted <- bind_tf_idf2(df, tf = "tf2", idf = "idf3")
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )

  # Both sides are sorted by the same keys before the comparison.
  expected <- dplyr::arrange(testdata[["tf2*idf3"]], doc_id, token, tf_idf)
  expect_equal(actual, expected)
})
### tf2*idf4 ----
test_that("tf2*idf4 works", {
  weighted <- bind_tf_idf2(df, tf = "tf2", idf = "idf4")
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )

  # Both sides are sorted by the same keys before the comparison.
  expected <- dplyr::arrange(testdata[["tf2*idf4"]], doc_id, token, tf_idf)
  expect_equal(actual, expected)
})
### tf*idf*norm ----
test_that("tf*idf*norm works", {
  # Same tf/idf choice as the plain "tf*idf" case, but with norm = TRUE.
  weighted <- bind_tf_idf2(df, tf = "tf", idf = "idf", norm = TRUE)
  actual <- dplyr::arrange(
    dplyr::select(weighted, doc_id, token, tf_idf),
    doc_id, token, tf_idf
  )

  # Both sides are sorted by the same keys before the comparison.
  expected <- dplyr::arrange(
    testdata[["tf*idf*norm"]],
    doc_id, token, tf_idf
  )
  expect_equal(actual, expected)
})
### itf*df ----
test_that("itf*df works", {
  scored <- bind_tf_idf2(df, tf = "itf", idf = "df")

  # Keep only doc_id and tf_idf, sort, then restrict to rows whose doc_id
  # converts to an integer below 5 before snapshotting.
  sorted_scores <- dplyr::arrange(
    dplyr::select(scored, doc_id, tf_idf),
    doc_id, tf_idf
  )
  snapshot_input <- dplyr::filter(sorted_scores, as.integer(doc_id) < 5)

  # This case is checked against a stored snapshot, not a fixture entry.
  expect_snapshot_value(snapshot_input, style = "json2", cran = FALSE)
})
# Add the following code to your website.
# For more information on customizing the embed code, read Embedding Snippets.