# inst/doc/epubr.R

## ----setup, include=FALSE-----------------------------------------------------
# Chunk-wide knitr options for this document, listed one per line.
knitr::opts_chunk$set(
  collapse = TRUE,
  comment = "#>",
  message = FALSE,
  warning = FALSE,
  error = FALSE,
  tidy = TRUE
)

# dplyr is attached up front; later chunks use `%>%` and sample_frac().
library(dplyr)

## ----read---------------------------------------------------------------------
library(epubr)

# Locate the example EPUB shipped inside the installed epubr package.
# `mustWork = TRUE` makes system.file() raise an error when the file cannot be
# found, instead of returning "" and deferring the failure to epub() below.
file <- system.file("dracula.epub", package = "epubr", mustWork = TRUE)

# Read the book, keep the result in `x`, and print it.
x <- epub(file)
x

# Print the first element of `x$data`.
x$data[[1]]

## ----metadata-----------------------------------------------------------------
# Call epub_meta() on the same file path; the returned value is auto-printed.
# Presumably this yields the book's metadata without the text -- confirm
# against the epubr documentation.
epub_meta(file)

## ----fields-------------------------------------------------------------------
# Read the book again, passing `fields` a character vector of three names.
# Presumably this limits which metadata fields appear in the result -- verify
# against the epub() documentation.
epub(file, fields = c("title", "creator", "file"))

## ----drop_sections------------------------------------------------------------
# Read with drop_sections = "cov" and print the first element of `data`.
# NOTE(review): "cov" looks like a pattern for cover-page sections to
# exclude -- confirm how epub() matches it.
epub(file, drop_sections = "cov")$data[[1]]

## ----chapters-----------------------------------------------------------------
# Re-read the book (overwriting `x`), still passing drop_sections = "cov" and
# additionally a regular expression as `chapter_pattern`. The pattern matches
# text starting with "item" followed by two digits; presumably it is applied
# to section identifiers to flag chapters -- confirm in the epub() docs.
x <- epub(file, drop_sections = "cov", chapter_pattern = "^item\\d\\d")
x

# Print the first element of `x$data` for the re-read book.
x$data[[1]]

## ----recombine1---------------------------------------------------------------
# Regular expression: the literal text "CHAPTER " followed by one or more of
# the letters I, V, X.
pat <- "CHAPTER [IVX]+"

# Pass the book and the pattern to epub_recombine() and store the result.
# Presumably the text is re-split into sections at each match -- confirm in
# the epub_recombine() documentation.
x2 <- epub_recombine(x, pat)
x2

# Print the first element of `x2$data`.
x2$data[[1]]

## ----recombine2---------------------------------------------------------------
library(dplyr)

# Recombine on `pat`, then hand that result straight to epub_sift() with
# n = 200 (written as a direct call rather than a pipe).
x2 <- epub_sift(epub_recombine(x, pat), n = 200)
x2

# Print the first element of `x2$data`.
x2$data[[1]]

## ----recombine3---------------------------------------------------------------
# The next line is a long-hand pipeline kept for reference (not run).
# Presumably it is what the `sift` argument below achieves in a single call --
# confirm in the epub_recombine() documentation.
#epub_recombine(x, pat) %>% epub_sift(n = 200) %>% epub_recombine(pat)
x2 <- epub_recombine(x, pat, sift = list(n = 200))
x2

# Print the first element of `x2$data`.
x2$data[[1]]

## ----reorder1-----------------------------------------------------------------
# Fix the RNG seed so the shuffle below is reproducible.
set.seed(1)
# sample_frac() is called without a size argument and its result replaces the
# first element of `x2$data` in place.
# NOTE(review): dplyr documents sample_frac() as superseded by
# slice_sample(prop = 1); left unchanged so the seeded row order is not
# altered -- confirm before switching.
x2$data[[1]] <- sample_frac(x2$data[[1]]) # randomize rows for example
x2$data[[1]]

## ----reorder2-----------------------------------------------------------------
# Convert strings containing a Roman numeral into numbers.
#   x:       character vector to convert.
#   pattern: regular expression with one capture group around the numeral;
#            each match is replaced by that group ("\\1") before conversion.
# Returns the numerals' values as a numeric vector.
f <- function(x, pattern) {
  numerals <- gsub(pattern, "\\1", x)
  as.numeric(as.roman(numerals))
}

## ----reorder3-----------------------------------------------------------------
# Pass the helper `f` and a pattern to epub_reorder(). The pattern's single
# capture group is the run of I/V/X letters after "CHAPTER "; `f` turns that
# numeral into a number.
# Presumably epub_reorder() sorts the rows by the values `f` returns --
# confirm in the epub_reorder() documentation.
x2 <- epub_reorder(x2, f, "^CHAPTER ([IVX]+).*")
x2$data[[1]]

## ----unzip--------------------------------------------------------------------
# Target path: a "dracula" folder inside this R session's temporary directory.
bookdir <- file.path(tempdir(), "dracula")
# Call epub_unzip() with that folder as `exdir`; presumably this extracts the
# EPUB archive's contents there -- confirm in the epub_unzip() documentation.
epub_unzip(file, exdir = bookdir)
# List every file under the folder, descending into subdirectories.
list.files(bookdir, recursive = TRUE)

## ----count_words--------------------------------------------------------------
# Sample string with a leading space, repeated spaces and two newlines.
# Note: this overwrites `x`, which earlier held the result of epub().
x <- " This   sentence will be counted to have:\n\n10 (ten) words."
# Pass the string to count_words(); the result is auto-printed.
count_words(x)

# Try the epubr package in your browser

# Any scripts or data that you put into this service are public.

# epubr documentation built on Sept. 12, 2024, 6:23 a.m.