# tests/testthat/test_readWikinews.R

# Reporter label for this test file. The tests in this file exercise
# readWikinews(), so the label names Wikinews rather than Wikipedia.
context("read Wikinews Pages")

test_that("readWikinews", {
  # One read without a `file` argument, then one read per XML fixture file.
  all_files <- readWikinews(path = "data/Wikinews")
  first_file <- readWikinews(path = "data/Wikinews", file = "Wikinews1.xml")
  second_file <- readWikinews(path = "data/Wikinews", file = "Wikinews2.xml")

  # Expected ids and dates per fixture file; the combined corpus is expected
  # to list the entries of Wikinews1.xml followed by those of Wikinews2.xml.
  first_ids <- c("ID2838764", "ID2839675", "ID2839732")
  second_ids <- "ID2839233"
  first_dates <- as.Date(c("2018-03-30", "2018-04-04", "2018-04-07"))
  second_dates <- as.Date("2018-03-31")

  # Every result must be a textmeta object, and merging the two single-file
  # results must reproduce the result of the read without `file`.
  expect_true(is.textmeta(all_files))
  expect_true(is.textmeta(first_file))
  expect_true(is.textmeta(second_file))
  expect_equal(mergeTextmeta(list(first_file, second_file)), all_files)

  # Combined corpus: text and meta agree in size, ids name the texts.
  expect_equal(length(all_files$text), nrow(all_files$meta))
  expect_equal(length(all_files$text), 4)
  expect_equal(all_files$meta$date, c(first_dates, second_dates))
  expect_equal(all_files$meta$id, names(all_files$text))
  expect_equal(all_files$meta$id, c(first_ids, second_ids))

  # Wikinews1.xml: three articles.
  expect_equal(length(first_file$text), nrow(first_file$meta))
  expect_equal(length(first_file$text), 3)
  expect_equal(first_file$meta$date, first_dates)
  expect_equal(first_file$meta$id, names(first_file$text))
  expect_equal(first_file$meta$id, first_ids)

  # Wikinews2.xml: a single article.
  expect_equal(length(second_file$text), nrow(second_file$meta))
  expect_equal(length(second_file$text), 1)
  expect_equal(second_file$meta$date, second_dates)
  expect_equal(second_file$meta$id, names(second_file$text))
  expect_equal(second_file$meta$id, second_ids)
})
# Docma-TU/tosca documentation built on June 2, 2025, 3:11 a.m.