data-raw/get_data.R

library(tidyverse)

## TEMPORARY FOR NOW
references_tibble <- tibble(
  reference = read_lines("data-raw/newstest2018-deen-ref-ts.en")
) %>%
  mutate(candidate_id = row_number(), reference_id = row_number())

cands <- list.files("data-raw/", pattern = "*.de-en", full.names = T)

wmt18example <- map_dfr(cands, function(x) {
  return(tibble(candidate = read_lines(x) %>% set_names(.)))
}, .id = "system") %>%
  group_by(system) %>%
  mutate(candidate_id = row_number()) %>%
  inner_join(references_tibble) %>%
  ungroup() %>%
  filter(reference != "NO REFERENCE AVAILABLE") %>%
  select(system, candidate_id, reference_id, candidate, reference)

usethis::use_data(wmt18example, overwrite = TRUE)
sinew::makeOxygen(wmt18example)
kanishkamisra/footrulr documentation built on May 23, 2019, 5:07 p.m.