# tests/testthat/test_readWikinews.R

# Reporter label for this file. The expectations in this file exercise
# readWikinews(), so the label names Wikinews rather than Wikipedia.
context("read Wikinews Pages")

test_that("readWikinews", {
  # Fixture directory; the path is passed to readWikinews() unchanged.
  wikinews_dir <- "data/Wikinews"

  # Read the directory as a whole, then each fixture file on its own.
  all_docs <- readWikinews(path = wikinews_dir)
  first_file <- readWikinews(path = wikinews_dir, file = "Wikinews1.xml")
  second_file <- readWikinews(path = wikinews_dir, file = "Wikinews2.xml")

  # Shared checks for one corpus: it is a textmeta object, text and meta
  # have matching sizes, and the dates and ids equal the expected values.
  check_corpus <- function(corpus, n_docs, dates, ids) {
    expect_true(is.textmeta(corpus))
    expect_equal(length(corpus$text), nrow(corpus$meta))
    expect_equal(length(corpus$text), n_docs)
    expect_equal(corpus$meta$date, dates)
    expect_equal(corpus$meta$id, names(corpus$text))
    expect_equal(corpus$meta$id, ids)
  }

  check_corpus(
    all_docs,
    n_docs = 4,
    dates = as.Date(c("2018-03-30", "2018-04-04", "2018-04-07", "2018-03-31")),
    ids = c("ID2838764", "ID2839675", "ID2839732", "ID2839233")
  )
  check_corpus(
    first_file,
    n_docs = 3,
    dates = as.Date(c("2018-03-30", "2018-04-04", "2018-04-07")),
    ids = c("ID2838764", "ID2839675", "ID2839732")
  )
  check_corpus(
    second_file,
    n_docs = 1,
    dates = as.Date("2018-03-31"),
    ids = "ID2839233"
  )

  # Merging the two per-file corpora must reproduce the directory-wide read.
  expect_equal(mergeTextmeta(list(first_file, second_file)), all_docs)
})

# Try the tosca package in your browser
#
# Any scripts or data that you put into this service are public.
#
# tosca documentation built on Oct. 28, 2021, 5:07 p.m.