Nothing
test_that("translate_to_messages works with example turns", {
ellmer_messages <- translate_to_messages(example_ellmer_solver()$set_system_prompt(
NULL
))
inspect_messages <- example_inspect_log()[["samples"]][[1]][["messages"]]
zap_id <- function(l) {
l[["id"]] <- NULL
l
}
expect_equal(
purrr::map(ellmer_messages, zap_id),
purrr::map(inspect_messages, zap_id)
)
})
test_that("logs including system prompts are compatible with inspect", {
skip_if(identical(Sys.getenv("OPENAI_API_KEY"), ""))
tmp_dir <- withr::local_tempdir()
withr::local_envvar(list(VITALS_LOG_DIR = tmp_dir))
withr::local_options(cli.default_handler = function(...) {
})
local_mocked_bindings(interactive = function(...) FALSE)
library(ellmer)
simple_addition <- tibble::tibble(
input = c("What's 2+2?", "What's 2+3?"),
target = c("4", "5")
)
tsk <- Task$new(
dataset = simple_addition,
solver = generate(chat_openai(
system_prompt = "Be terse.",
model = "gpt-4.1-nano"
)),
scorer = model_graded_qa()
)
tsk$eval()
expect_valid_log(tsk$log())
expect_true(any(grepl("Be terse", readLines(tsk$log()))))
})
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.