# data-raw/createDatasets.R

source("R/externalConstants.R")
# Analysts table: load the raw CSV (both "NA" and "NULL" are read as missing),
# rename the id columns, and drop the analystCode column when the CSV has one.
analysts <- data.table::data.table(
  read.csv(
    "data-raw/analysts.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
data.table::setnames(
  analysts,
  old = c("analystQryId", "siteID"),
  new = c("sourceId", "siteId")
)
if ("analystCode" %in% names(analysts)) {
  analysts[, analystCode := NULL]
}

# Analyst/position table: load the raw CSV (both "NA" and "NULL" are read as
# missing), translate the numeric positionId into a position name, then drop
# the numeric id column.
# `position.Id` is not defined in this script; presumably it is a named vector
# of position ids provided by R/externalConstants.R -- verify.
analystPositions <- data.table::data.table(
  read.csv(
    "data-raw/analystPositions.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
# Vectorised lookup: match() finds, for every row at once, the index of its
# positionId within position.Id, so no per-row grouping is required and the
# result no longer depends on analystPosId being unique per row. Ids that are
# absent from position.Id produce NA.
analystPositions[
  ,
  position := names(position.Id)[match(positionId, position.Id)]
]
analystPositions[, positionId := NULL]

# Sites table: load the raw CSV (both "NA" and "NULL" are read as missing),
# rename the id columns, blank out playerId where it equals "fftId", and drop
# the siteCode column when the CSV has one.
sites <- data.table::data.table(
  read.csv(
    "data-raw/sites.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
data.table::setnames(
  sites,
  old = c("siteID", "playerIdCol"),
  new = c("siteId", "playerId")
)
sites[playerId == "fftId", playerId := NA]
if ("siteCode" %in% names(sites)) {
  sites[, siteCode := NULL]
}

# Site tables: load the raw CSV (both "NA" and "NULL" are read as missing),
# rename the id/alias columns, translate the numeric positionId into a
# position name, then drop the numeric id column.
# `position.Id` is not defined in this script; presumably it is a named vector
# of position ids provided by R/externalConstants.R -- verify.
siteTables <- data.table::data.table(
  read.csv(
    "data-raw/siteTables.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
data.table::setnames(
  siteTables,
  old = c("siteTableId", "positionQryId"),
  new = c("tableId", "positionAlias")
)
# Vectorised lookup: match() finds, for every row at once, the index of its
# positionId within position.Id, so no per-row grouping is required and the
# result no longer depends on tableId being unique per row. Ids that are
# absent from position.Id produce NA.
siteTables[
  ,
  position := names(position.Id)[match(positionId, position.Id)]
]
siteTables[, positionId := NULL]

# Site URLs: load the raw CSV (both "NA" and "NULL" are read as missing),
# rename columns, and drop the urlID column.
siteUrls <- data.table::data.table(
  read.csv(
    "data-raw/siteUrls.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
data.table::setnames(
  siteUrls,
  old = c("urlData", "whichTable", "playerLinkString", "siteID"),
  new = c("urlType", "urlTable", "playerLink", "siteId")
)
siteUrls[, urlID := NULL]

# Replace the literal placeholder {$PosID} with {$Pos} in every URL template
# (fixed = TRUE: the pattern is matched as plain text, not as a regex).
siteUrls[, siteUrl := gsub("{$PosID}", "{$Pos}", siteUrl, fixed = TRUE)]
# Override: weekly URLs of site 8 get urlTable set to 1.
siteUrls[siteId == 8 & urlPeriod == "week", urlTable := 1]
# Column metadata: tableColumns is joined to dataColumns on dataColId, reduced
# to the columns listed below, and removeColumn is set to 0 for the "team" and
# "games" columns.
dataColumns <- data.table::data.table(
  read.csv(
    "data-raw/dataColumns.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
tableColumns <- data.table::data.table(
  read.csv(
    "data-raw/tableColumns.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
data.table::setnames(
  tableColumns,
  old = c("dataColID", "siteTableID"),
  new = c("dataColId", "tableId")
)
tableColumns <- merge(tableColumns, dataColumns, by = "dataColId")
tableColumns <- tableColumns[, c(
  "tableId", "columnName", "columnType",
  "columnOrder", "columnPeriod", "removeColumn"
), with = FALSE]
tableColumns[columnName %in% c("team", "games"), removeColumn := 0]

# Row-removal table: load the raw CSV (both "NA" and "NULL" are read as
# missing), rename siteTableId to tableId, and drop the rowRemoveId column.
tableRowRemove <- data.table::data.table(
  read.csv(
    "data-raw/tableRowRemove.csv",
    stringsAsFactors = FALSE,
    na.strings = c("NA", "NULL")
  )
)
data.table::setnames(tableRowRemove, old = "siteTableId", new = "tableId")
tableRowRemove[, rowRemoveId := NULL]

# Load the missing-NFL-id table (default NA handling for this file), then save
# every dataset built above, overwriting any previously saved copies.
nfl_missing <- data.table::data.table(
  read.csv("data-raw/missing_nflID.csv", stringsAsFactors = FALSE)
)

# NOTE(review): newer devtools releases are understood to have moved
# use_data() to the usethis package -- confirm against the installed version.
devtools::use_data(
  analysts,
  analystPositions,
  sites,
  siteTables,
  nfl_missing,
  siteUrls,
  tableColumns,
  tableRowRemove,
  overwrite = TRUE
)

# Internal package data: the NFL and Yahoo stat tables plus the httr objects
# for Yahoo OAuth, saved with internal = TRUE.
nflstats <- data.table::data.table(
  read.csv("data-raw/nflstats.csv", stringsAsFactors = FALSE)
)
yahooStats <- data.table::data.table(
  read.csv("data-raw/yahooStats.csv", stringsAsFactors = FALSE)
)

# NOTE(review): the consumer key and secret are committed in plain text and
# are passed into yahoo_app, which is saved below. Consider rotating them and
# reading them from the environment instead.
yahooCred <- list(
  key = "dj0yJmk9T09TRjdkWWR3TUpLJmQ9WVdrOVRuZFVURVF6TXpJbWNHbzlNQS0tJnM9Y29uc3VtZXJzZWNyZXQmeD1jOQ--",
  secret = "418b1e7115f1b15557fe4c773f79ba1ab51e3b63"
)

yahoo_endpoint <- httr::oauth_endpoints("yahoo")
yahoo_app <- httr::oauth_app(
  "yahoo",
  key = yahooCred[["key"]],
  secret = yahooCred[["secret"]]
)
# The httr::oauth1.0_token function itself is stored here (it is not called),
# so this script does not create a token.
yahoo_token <- httr::oauth1.0_token

devtools::use_data(
  nflstats,
  yahooStats,
  yahoo_app,
  yahoo_endpoint,
  yahoo_token,
  overwrite = TRUE,
  internal = TRUE
)
# dadrivr/ffanalytics documentation built on May 14, 2019, 3:12 p.m.