#' Get screenshots and place them in relevant subfolder
#'
#' @param domain A character vector of one or more domains (e.g. "example.com").
#' @param shuffle Logical, defaults to TRUE. If TRUE, order in which domains are processed is randomised.
#' @return Nothing, used for its side effects.
#' @examples
#'
#' @export
get_screenshot <- function(domain, width = 1280, height = 1280, language = NULL, shuffle = TRUE) {
if (is.null(language)==TRUE) {
language <- list.dirs(file.path("data", "domains", "homepage"), recursive = FALSE, full.names = FALSE)
}
fs::dir_create(path = fs::path("data", "domains", "screenshots", language), recurse = TRUE)
fs::dir_create(path = fs::path("data", "domains", "screenshots_failed", language), recurse = TRUE)
today_path <- file.path("data", "domains", "screenshots", language, Sys.Date())
today_path_screenshots_failed <- file.path("data", "domains", "screenshots_failed", language, Sys.Date())
dir.create(path = today_path, showWarnings = FALSE)
dir.create(path = today_path_screenshots_failed, showWarnings = FALSE)
if (shuffle == TRUE) {
domain <- sample(domain)
}
pb <- dplyr::progress_estimated(length(domain))
purrr::walk(.x = domain,
.f = function(x) {pb$tick()$print()
if (networkedwebsitesdetector::check_if_exists(domain = x, type = "screenshots")==FALSE) {
tryCatch({webshot::webshot(url = paste0("http://", x),
file = file.path(today_path, paste0(x, ".png")),
vwidth = width,
vheight = height,
cliprect = "viewport")},
error=function(e){
readr::write_file(x = paste0("Could not download ", x),
path = file.path(today_path_screenshots_failed, paste0(stringr::str_remove(string = x, pattern = stringr::fixed("http://")), ".txt")))
message(paste0("Could not download ", x, ": "),
conditionMessage(e), "\n")})
}
}
)
}
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.