# R/gpt2samples.R

#' GPT-2 Samples
#'
#' This package contains all of the sample data generated by OpenAI's GPT-2
#' language model. The data come in two groups: conditional texts, which pair
#' sample prompts (contexts) with their completions, and unconditional texts,
#' which are samples of generated text.
#'
#' @seealso Conditional data sets: \code{\link{conditional}},
#'   \code{\link{conditional_t07}}, \code{\link{conditional_topk40}}.
#'   Unconditional data sets: \code{\link{unconditional}},
#'   \code{\link{unconditional_t07}}, \code{\link{unconditional_topk40}}.
#' @docType package
#' @name gpt2samples
#' @aliases gpt2samples gpt2samples-package
NULL

#' @title Conditional samples with temperature 0.7
#' @description Conditionally generated texts with contexts from WebText's
#'   test set. Each row holds either a sample context or a completion, as
#'   indicated by the \code{type} column.
#' @format A tidy data frame with 24081 rows and 4 variables:
#' \describe{
#'   \item{\code{file}}{character - file reference}
#'   \item{\code{id}}{integer - sample and completion id number as referenced in the OpenAI GPT-2 sample file}
#'   \item{\code{type}}{character - indicator of whether the text is a sample context or a completion}
#'   \item{\code{text}}{character - the text, either a sample context or a completion}
#' }
#' @source \url{https://github.com/openai/gpt-2/tree/master/gpt-2-samples}
"conditional_t07"

#' @title Conditional samples with truncation 1 and top_k 40
#' @description Conditionally generated texts with contexts from WebText's
#'   test set. Each row holds either a sample context or a completion, as
#'   indicated by the \code{type} column.
#' @format A tidy data frame with 20405 rows and 4 variables:
#' \describe{
#'   \item{\code{file}}{character - file reference}
#'   \item{\code{id}}{integer - sample and completion id number as referenced in the OpenAI GPT-2 sample file}
#'   \item{\code{type}}{character - indicator of whether the text is a sample context or a completion}
#'   \item{\code{text}}{character - the text, either a sample context or a completion}
#' }
#' @source \url{https://github.com/openai/gpt-2/tree/master/gpt-2-samples}
"conditional_topk40"

#' @title Conditional samples with default settings
#' @description Conditionally generated texts with contexts from WebText's
#'   test set. Each row holds either a sample context or a completion, as
#'   indicated by the \code{type} column.
#' @format A tidy data frame with 18067 rows and 4 variables:
#' \describe{
#'   \item{\code{file}}{character - file identifier}
#'   \item{\code{id}}{integer - sample and completion number as referenced in the OpenAI GPT-2 sample file}
#'   \item{\code{type}}{character - indicator of whether the text is a sample context or a completion}
#'   \item{\code{text}}{character - the text, either a sample context or a completion}
#' }
#' @source \url{https://github.com/openai/gpt-2/tree/master/gpt-2-samples}
"conditional"

#' @title Unconditional samples with temperature 0.7
#' @description Unconditionally generated texts from OpenAI's GPT-2
#' @format A tidy data frame with 28841 rows and 3 variables:
#' \describe{
#'   \item{\code{file}}{character - file identifier}
#'   \item{\code{id}}{integer - sample id number as referenced in the OpenAI GPT-2 sample file}
#'   \item{\code{text}}{character - the text}
#' }
#' @source \url{https://github.com/openai/gpt-2/tree/master/gpt-2-samples}
"unconditional_t07"

#' @title Unconditional samples with truncation 1 and top_k 40
#' @description Unconditionally generated texts from OpenAI's GPT-2
#' @format A data frame with 21188 rows and 3 variables:
#' \describe{
#'   \item{\code{file}}{character - file identifier}
#'   \item{\code{id}}{integer - sample id number as referenced in the OpenAI GPT-2 sample file}
#'   \item{\code{text}}{character - the text}
#' }
#' @source \url{https://github.com/openai/gpt-2/tree/master/gpt-2-samples}
"unconditional_topk40"

#' @title Unconditional samples with default settings
#' @description Unconditionally generated texts from OpenAI's GPT-2
#' @format A data frame with 19468 rows and 3 variables:
#' \describe{
#'   \item{\code{file}}{character - file identifier}
#'   \item{\code{id}}{integer - sample id number as referenced in the OpenAI GPT-2 sample file}
#'   \item{\code{text}}{character - the text}
#' }
#' @source \url{https://github.com/openai/gpt-2/tree/master/gpt-2-samples}
"unconditional"
# kanishkamisra/gpt2samples documentation built on May 31, 2019, 10:34 a.m.