Nothing
## ----include = FALSE----------------------------------------------------------
knitr::opts_chunk$set(
collapse = TRUE,
comment = "#>"
)
## ----setup, eval=FALSE--------------------------------------------------------
# library(starburst)
# library(httr)
# library(jsonlite)
## ----api-function, eval=FALSE-------------------------------------------------
# fetch_company_data <- function(ticker) {
# # Add small delay to respect rate limits
# Sys.sleep(runif(1, 0.1, 0.3))
#
# # For demo purposes, we'll use a public API
# # In practice, replace with your actual API endpoint
# base_url <- "https://api.example.com/company"
#
# tryCatch({
# # Fetch company info
# response <- httr::GET(
# paste0(base_url, "/", ticker),
# httr::timeout(10),
# httr::add_headers(
# "User-Agent" = "staRburst-example/1.0"
# )
# )
#
# # Check for success
# if (httr::status_code(response) == 200) {
# data <- httr::content(response, "parsed")
#
# # Extract relevant fields
# list(
# ticker = ticker,
# success = TRUE,
# company_name = data$name %||% NA,
# market_cap = data$marketCap %||% NA,
# pe_ratio = data$peRatio %||% NA,
# revenue = data$revenue %||% NA,
# employees = data$employees %||% NA,
# sector = data$sector %||% NA,
# timestamp = Sys.time()
# )
# } else {
# # Handle API errors
# list(
# ticker = ticker,
# success = FALSE,
# error = paste("HTTP", httr::status_code(response)),
# timestamp = Sys.time()
# )
# }
# }, error = function(e) {
# # Handle network errors
# list(
# ticker = ticker,
# success = FALSE,
# error = as.character(e),
# timestamp = Sys.time()
# )
# })
# }
#
# # Helper: null-coalescing operator
# `%||%` <- function(x, y) if (is.null(x)) y else x
## ----mock-api, eval=FALSE-----------------------------------------------------
# # Mock function that simulates API with realistic delays
# fetch_company_data_mock <- function(ticker) {
# # Simulate network latency
# Sys.sleep(runif(1, 0.2, 0.8))
#
# # Simulate occasional failures (5% rate)
# if (runif(1) < 0.05) {
# return(list(
# ticker = ticker,
# success = FALSE,
# error = "API timeout",
# timestamp = Sys.time()
# ))
# }
#
# # Generate mock data
# list(
# ticker = ticker,
# success = TRUE,
# company_name = paste("Company", ticker),
# market_cap = round(rnorm(1, 50e9, 20e9), 0),
# pe_ratio = round(rnorm(1, 25, 10), 2),
# revenue = round(rnorm(1, 10e9, 5e9), 0),
# employees = round(rnorm(1, 50000, 20000), 0),
# sector = sample(c("Technology", "Healthcare", "Finance", "Energy"), 1),
# timestamp = Sys.time()
# )
# }
## ----sample-data, eval=FALSE--------------------------------------------------
# # Generate mock ticker symbols
# set.seed(123)
# n_companies <- 1000
# tickers <- paste0(
# sample(LETTERS, n_companies, replace = TRUE),
# sample(LETTERS, n_companies, replace = TRUE),
# sample(LETTERS, n_companies, replace = TRUE)
# )
#
# head(tickers)
# # [1] "NAL" "RPL" "OQM" "TYW" "AIT" "UMD"
## ----local, eval=FALSE--------------------------------------------------------
# cat(sprintf("Fetching data for %d companies locally...\n", length(tickers)))
#
# local_start <- Sys.time()
# local_results <- lapply(head(tickers, 50), fetch_company_data_mock)
# local_time <- as.numeric(difftime(Sys.time(), local_start, units = "secs"))
#
# cat(sprintf("✓ Completed 50 calls in %.1f seconds\n", local_time))
# cat(sprintf(" Estimated time for %d: %.1f minutes\n",
# n_companies, local_time * n_companies / 50 / 60))
## ----cloud, eval=FALSE--------------------------------------------------------
# cat(sprintf("Fetching data for %d companies on AWS...\n", n_companies))
#
# results <- starburst_map(
# tickers,
# fetch_company_data_mock,
# workers = 25,
# cpu = 1,
# memory = "2GB"
# )
## ----analysis, eval=FALSE-----------------------------------------------------
# # Convert results to data frame
# results_df <- do.call(rbind, lapply(results, function(x) {
# if (x$success) {
# data.frame(
# ticker = x$ticker,
# company_name = x$company_name,
# market_cap = x$market_cap,
# pe_ratio = x$pe_ratio,
# revenue = x$revenue,
# employees = x$employees,
# sector = x$sector,
# success = TRUE,
# error = NA,
# stringsAsFactors = FALSE
# )
# } else {
# data.frame(
# ticker = x$ticker,
# company_name = NA,
# market_cap = NA,
# pe_ratio = NA,
# revenue = NA,
# employees = NA,
# sector = NA,
# success = FALSE,
# error = x$error,
# stringsAsFactors = FALSE
# )
# }
# }))
#
# # Summary
# success_rate <- mean(results_df$success) * 100
# cat(sprintf("\n=== Results Summary ===\n"))
# cat(sprintf("Total companies: %d\n", nrow(results_df)))
# cat(sprintf("Successful fetches: %d (%.1f%%)\n",
# sum(results_df$success), success_rate))
# cat(sprintf("Failed fetches: %d\n", sum(!results_df$success)))
#
# # Show sample of results
# cat("\n=== Sample Results ===\n")
# print(head(results_df[results_df$success, ], 10))
#
# # Sector distribution
# cat("\n=== Sector Distribution ===\n")
# print(table(results_df$sector))
#
# # Market cap summary
# cat("\n=== Market Cap Summary ===\n")
# cat(sprintf("Mean: $%.2fB\n",
# mean(results_df$market_cap, na.rm = TRUE) / 1e9))
# cat(sprintf("Median: $%.2fB\n",
# median(results_df$market_cap, na.rm = TRUE) / 1e9))
# cat(sprintf("Range: $%.2fB - $%.2fB\n",
# min(results_df$market_cap, na.rm = TRUE) / 1e9,
# max(results_df$market_cap, na.rm = TRUE) / 1e9))
## ----rate-limiting, eval=FALSE------------------------------------------------
# # Add jitter to respect rate limits
# fetch_with_rate_limit <- function(ticker, rate_limit = 100) {
# # Add delay based on rate limit (calls per minute)
# delay <- 60 / rate_limit + runif(1, 0, 0.1)
# Sys.sleep(delay)
#
# fetch_company_data(ticker)
# }
#
# # Use with staRburst
# results <- starburst_map(
# tickers,
# function(x) fetch_with_rate_limit(x, rate_limit = 100),
# workers = 10 # Adjust workers based on API rate limit
# )
## ----error-handling, eval=FALSE-----------------------------------------------
# fetch_with_retry <- function(ticker, max_retries = 3) {
# for (attempt in 1:max_retries) {
# result <- fetch_company_data(ticker)
#
# if (result$success) {
# return(result)
# }
#
# # Exponential backoff
# if (attempt < max_retries) {
# Sys.sleep(2^attempt + runif(1, 0, 1))
# }
# }
#
# # Return failure after all retries
# result$error <- paste("Failed after", max_retries, "retries:", result$error)
# return(result)
# }
## ----eval=FALSE---------------------------------------------------------------
# system.file("examples/api-calls.R", package = "starburst")
## ----eval=FALSE---------------------------------------------------------------
# source(system.file("examples/api-calls.R", package = "starburst"))
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.