# data-raw/friends_emotions.R

## Code to prepare the `friends_emotions` dataset: downloads the per-season
## JSON files and keeps the emotion label attached to each utterance.
library(tidyverse)
library(jsonlite)

# Return the first element of an utterance's `emotion` field.
#
# x: the `emotion` entry of one utterance (may be `NULL` or empty).
# Returns `NA` when `x` has no elements, otherwise `x[[1]]`.
extract_emotion <- function(x) {
  # Guard clause: anything with at least one element yields its first entry.
  if (length(x) > 0) {
    return(x[[1]])
  }
  NA
}

# Reduce one utterance record to the two fields used downstream.
#
# x: a single utterance (a list with `utterance_id` and, optionally,
#    `emotion`).
# Returns a named list with `id` (the utterance id) and `emotion` (the result
# of `extract_emotion()` on the utterance's `emotion` field).
read_utterances <- function(x) {
  list(
    id = x$utterance_id,
    emotion = extract_emotion(x$emotion)
  )
}

# Row-bind the `read_utterances()` result of every entry in `x$utterances`.
#
# x: a single scene (a list with an `utterances` element).
read_scene <- function(x) {
  x$utterances %>%
    map_dfr(read_utterances)
}

# Row-bind the `read_scene()` result of every entry in `x$scenes`.
#
# x: a single episode (a list with a `scenes` element).
read_episode <- function(x) {
  scenes <- x$scenes
  map_dfr(scenes, read_scene)
}

# Row-bind the `read_episode()` result of every entry in `x$episodes`.
#
# x: a single season (a list with an `episodes` element), as produced by
#    `read_json()` in `read_friends()`.
read_season <- function(x) {
  map_dfr(.x = x$episodes, .f = read_episode)
}

# Download the JSON file of seasons 01 through 10 from the
# emorynlp/character-mining GitHub repository and flatten them into one data
# frame of utterance ids and emotions.
#
# Takes no arguments; requires network access.
read_friends <- function() {
  # Zero-padded season labels "01", ..., "10". The name `season_numbers` is
  # referenced inside the glue template below, so it must not be renamed.
  season_numbers <- sprintf("%02d", 1:10)
  urls <- glue::glue("https://raw.githubusercontent.com/emorynlp/character-mining/master/json/friends_season_{season_numbers}.json")
  map_dfr(urls, function(url) read_season(read_json(url)))
}

# Fetch and flatten every season (hits the network).
friends_raw <- read_friends()

# Keep only utterances that carry an emotion, split `id` into its four
# components, and store each component as an integer.
friends_emotions <- friends_raw %>%
  filter(!is.na(emotion)) %>%
  separate(id, into = c("season", "episode", "scene", "utterance")) %>%
  mutate(
    across(
      season:utterance,
      # Extract the number from each piece, then convert it to integer.
      function(col) as.integer(parse_number(col))
    )
  )

# Save the result as package data, replacing any existing copy.
usethis::use_data(friends_emotions, overwrite = TRUE)
# EmilHvitfeldt/friends documentation built on Dec. 24, 2021, 11:56 a.m.