In RETURN-project/BenchmarkRecovery: Benchmark recovery indicators derived from remote sensing time series

knitr::opts_chunk$set(echo = TRUE, 
                      eval = T,
                      fig.width=18,
                      fig.height=10)

# Load libraries
library(devtools)
library(BenchmarkRecovery)
library(zoo)
library(plyr)
library(reshape2)
library(ggplot2)
library(profvis)
library(parallel)
library(pbapply)
library(bfast)
library(strucchange)
library(colorspace)

# Calculate the number of cores
no_cores <- detectCores()

Extract time series characteristics from sampled time series

The following characteristics are derived from the decomposed time series:

fraction of missing values
seasonal amplitude (one value for input each time series)
average seasonal pattern
offset
standard deviation of the remainder component (one value per input time series)
fitted ARMA model in the remainder component (one model per input time series)

# inputs
ifolder <- '../data/'
ofolder <- '../data/' # Folder where outputs will be written
basenames <- c('toyset', 'otherset') # Name of the input dataset (contains sampled satellite time series)
nyr <- 18 # Number of years in observation period
nobsYr <- 365 # Number of observations per year
caseList <- c('seasAmp','remSd','distMag','distT','distRec','missVal')# parameters to be evaluated

# NOTE: consider refactoring this chunk
# For instance, moving extract_settings to ./R and/or creating a settings generator
# and working through load/save sttngs into/from a file

# TODO: document this function
extract_settings <- function(basename, ifolder, nyr, nobsYr, ofolder = '') {
  ifileVI <- paste0(basename, '.rda') # For instance, toyset.rda
  dfVi <- loadRData(file = file.path(ifolder, ifileVI)) # For instance /data/toyset.rda 

  # First decompose time series into seasonality, trend and remainder:
  tmp <- decompTSbfast(dfVi, nyr, nobsYr)
  dataVISeasbf <-  tmp[[1]] # Sesonality (fitted harmonic function)
  dataVIRembf <- tmp[[2]] # Remainder
  dataVITrbf <- tmp[[3]] # Trend (linear trend without break)
  dataVISeasCoef <- tmp[[4]] # Coefficients of fitted harmonic functions 

  # Derive characteristics
  tsVIMissVal <- rowSums(is.na(dfVi))/(dim(dfVi)[2]-2) # Fraction missing values

  seasVImax <- apply(dataVISeasbf[,-c(1,2)], 1, max) # Seasonal amplitude for each pixel
  seasS <- dataVISeasbf[dataVISeasbf[,1]<0,] # Average seasonal pattern, only southern hemisphere to avoid interference of seasonal cycles
  seasVImean <- colMeans(as.matrix(seasS[,-c(1,2)]))

  TrVImean <- mean(rowMeans(as.matrix(dataVITrbf[,-c(1,2)])), na.rm=T) # Offset 

  Rem_VIsd <- apply(dataVIRembf[,-c(1,2)], 1, sd, na.rm=T) # SD of remainder per pixel

    # Settings  simulation
  STnobsYr <- 365
  Vqntl <- c( .05, .25, .4, .6, .75, .95)#c( .05, .25, .5, .75, .95)#c( .5)# c( .05, .25, .5, .75)# set of quantiles used to derive realistic values (for number of 

  sttngs <- list()
  sttngs$'seasAmp' <- list(type = 'dist', vals = c(0,0,quantile(seasVImax, Vqntl)), obs = seasVImax, fix = quantile(seasVImax, c(.4, .6)))
  sttngs$'missVal' <- list(type = 'dist',  vals = c(1-1/16,1-1/16,quantile(tsVIMissVal, Vqntl)), obs = tsVIMissVal, fix = quantile(tsVIMissVal, c(.4, .6)))
  sttngs$'remSd' <- list(type = 'dist',  vals = c(0,0,quantile(Rem_VIsd, Vqntl)), obs = Rem_VIsd, fix = quantile(Rem_VIsd, c(.4, .6)))
  sttngs$'nyr' <- list(type = 'range', vals = c(25), fix = 25)#seq(6,36, by = 6)
  sttngs$'distMag' <- list(type = 'range', vals = -c(0.1,0.2,0.25,0.35,0.4,0.5), fix = -c(0.25,0.35))
  sttngs$'distT' <- list(type = 'range', vals = c(3,6,9,12,15,18), fix = c(9,12))#seq(3,33, by = 6)
  sttngs$'distRec' <- list(type = 'range', vals = c(0.5,2,2.25,3.75,4,6.5)*STnobsYr, fix = c(2.25,3.75)*STnobsYr) #seq(0.5,6.5,by=0.5)
  sttngs$'nDr' <- list(type = 'range',  vals = c(0), fix = 0)
  sttngs$'distType' <- list(type = 'cat',  vals = c('piecewise'), fix = 'piecewise')#piecewise exponential diffEq
  sttngs$'DistMissVal' <- list(type = 'cat', vals = 'random', fix = 'random')
  sttngs$'trAv' <- list(type = 'range', vals = TrVImean, fix = TrVImean)
  sttngs$'general' <- list(
    eval = caseList,#parameters to be evaluated, can be  'distT','distRec', 'missVal' 'distMag', 'seasAmp', 'remSd'
    nTS = 100,
    nobsYr = STnobsYr,
    seasAv = seasVImean,
    # remcoef = Rem_VIcoef,
    parSetUp = 'int') # Parameter set-up: can be avg dist, comb, or int

  # remove redundant variables
  rm(list=setdiff(ls(), c("sttngs",'ifolder', 'ofolder', 'basename', 'ncores', 'pars')))

  # Save if desired
  save_results = (ofolder != '')
  if(save_results) {
      save(sttngs, file = file.path(ofolder, paste0(basename,  '_simTS_settings.rda')))
  }

  return(sttngs)
}

# Start clock
start_time <- Sys.time()

# Extract settings from data
sttngs_list <- mclapply(basenames, FUN = extract_settings, ifolder = ifolder, nyr = nyr, nobsYr = nobsYr, ofolder = ofolder, mc.cores = no_cores - 1)

# Stop clock
end_time <- Sys.time()
print(end_time - start_time)

Simulate time series, measure recovery and evaluate performance

Based on the characteristics of the measured time series, time series are simulated.

Define simulation settings

First, the simulation settings are defined in a settings list:

seasAmp: seasonal amplitude
missVal: fraction of missing values in time series
remSd: standard deviation of the remainder
nyr: time series length (number of years)
distMag: disturbance magnitude, should be a negative value to simulate a drop
distT: timing disturbance (disturbance year)
distRec: recovery half time after disturbance (number of observations)
nDr: number of simulated droughts
distType: Type of recovery (piecewise, exponential or realistic)
DistMissVal: defines how the introduced missing values should be distributed: random or at an equal interval
trAv: offset
eval: the parameters that should be evaluated
nTS: number of time series simulated per value of the evaluated parameter
nobsYr: number of observations simulated per year (this should equal the frequency of the sampled time series)
seasAv: represents the seasonal pattern
parSetUp: the parameter values selection approach (avg, dist, comb, or int)

For each of these parameters, the type is defined. There are three main parameter types: dist, range, and cat. For the dist parameters, parameter values that are observed from sampled time series are available. For range parameters no observed values are available, but an expected range of their values can be set. Finally, the cat parameters are categoric.

Next to the type of the parameter, a set of parameter values (vals) need to be defined. If the sensitivity of the recovery indicators to the parameter is being evaluated, the performance of the recovery indicators is evaluated with respect to each of these parameter values. For dist parameters, the observed parameter values (obs) need to be additionally provided. If the parameter set-up follows the int approach (see next section for more details), the values for the evaluated dist parameter are not set to predefined fixed values, but are randomly sampled over an interval. These intervals are defined in the vals setting: the first two values refer to the first interval, the next two values to the second interval, and so on.

While evaluating the sensitivity to one specific parameter, the values of all other parameters also need to be set. Four approaches can be used to achieve this. First, the avg and int approaches set the parameters to their average value. This equals the mean value of the distribution of observed values of dist parameters, the mean value of the range of values (given by vals) for range parameters and a randomly selected value (selected from the values give by vals) for cat parameters. Second, the dist approach selects values for the parameters given by the likelihood of their occurrence. The likelihood is defined by the histogram of observed values for dist parameters and a random selection of values is made for range and cat parameters. Third, the comb approach defines all combinations of evaluated values for each parameter (as defined in vals).

The following inputs are needed to calculate the recovery indicators:

funSet: list of settings for the computation of the recovery indicators. More than one value for each setting is allowed (yet an equal number of values for each parameter is required). The recovery indicators are then derived for each set of values of the setting parameters.

freq: 'dense', 'annual', or 'quarterly'. Defines the observation frequency. For 'dense' the original frequency is used. For 'annual' and 'quarterly', the time series are converted to annual or quarterly frequency, respectively.
input: 'smoothed', 'raw', 'segmented'. Defines the type of time series that is used for the recovery indicators. For 'raw', the simulated time series are directly used to calculate recovery, for 'smooth' a time series smoothing algorithm (rolling mean) is used before recovery calculation, for 'segmented' the trend component of the piecewise regression (BFAST0n) is used.
nPre: the number of years before the disturbance used to derive the pre-disturbance values
nDist: the number of years after the disturbance used to derive the value during the disturbance
nPostMin and nPostMax: the post-disturbance values are derived between nPostMin and nPostMax years after the disturbance
h: in case input equals 'segmented', the h value is used in the segmentation algorithm to define the minimal segment size either given as fraction relative to the sample size or as an integer giving the minimal number of observations in each segment
breaks: in case input equals 'segmented', the criterium given by breaks is used in the segmentation algorithm to define the optimal number of segments. Can be set to 'BIC' or 'LWZ' (but has been deactivated)
seas: in case input equals 'segmented', seas denotes whether a seasonal term needs to be used in the segmentation algorithm

# recovery settings
funSet <- list('freq' = c(rep('annual', 6),  rep('dense',6), rep('quarterly',6)),
               'input' = rep(c('raw', 'smoothed','segmented'),6),# settings for the recovery indicators
               'nPre' = rep(2,18),
               'nDist' = c(rep(0,6),rep(1,12)),
               'nPostMin' = rep(c(4,4,4,1,1,1), 3),
               'nPostMax' = c(rep(5,3), rep(1,3), rep(6,3), rep(2,3), rep(6,3), rep(2,3)),
               'h' = rep(0.15,18),
               'seas' = c(rep(F,6),rep(T,12)))

# Save all configurations (one per basename)
# although all of them are now identical
# NOTE: decide if we need this
mclapply(basenames, FUN = function(basename) { save(funSet, file = file.path(ofolder, paste0(basename, '_recSettings.rda')))  })

The specified settings are then used to simulate time series, calculate recovery indicators and evaluate their performance:

# Create all the tests to be performed and store them on a table
# This is the 'homework' list for the HPC
sttngs$general$eval
testsTable <- expand.grid(basename = basenames, case = caseList, stringsAsFactors = FALSE) # All combinations of cases and filenames

# Assign a column with the settings
# NOTE: in the future, perhaps use only basename (as sttngs is redundant)
testsTable$settings <- rep(NA, nrow(testsTable)) # Initialize settings column
testsTable$settings <- sttngs_list
testsTable <- tibble::tibble(testsTable) # Tibblify for increased readability

# Print for inspection
print(testsTable)

# Start clock
start_time <- Sys.time()
set_fast_options()

# Run the sensitivity analysis
results_list <- mcmapply(FUN = evalParam, evr = testsTable$case, basename = testsTable$basename, sttngs = testsTable$settings, # Iterate along these parameters
                         MoreArgs = list(funSet = funSet, ofolder = ofolder), # These parameters remain constant
                         mc.cores = no_cores - 1)

# stop clock
end_time <- Sys.time()
print(end_time - start_time)

Plot the performance indicators

# general settings
# characteristics for which a plot needs to be made


simFullName  <- list('Disturbance magnitude',
                     'Number of droughts',
                     'Time series length',
                     'Seasonal amplitude',
                     'SD remainder',
                     'Disturbance timing',
                     'Recovery period [years]',
                     'Missing values')
names(simFullName) <- c('distMag',
                        'nDr', 
                        'len',
                        'seasAmp',
                        'remSd',
                        'distT',
                        'distRec',
                        'missVal')

Compare the performance of each recovery indicator

for(vr in 1:length(caseList)){
  evr <- caseList[vr]# name of parameter that will be evaluated in the simulation
  # setvr <- sttngs[[evr]]# settings of simulation

  # NOTE: retrieve data from results_list instead of from saved files
  RRI_rsq <- loadRData(file.path(ofolder, paste0(basename, '_RRI_R2_' , evr, '.rda')))
  R80p_rsq <- loadRData(file.path(ofolder, paste0(basename, '_R80p_R2_' , evr, '.rda')))
  YrYr_rsq <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_R2_' , evr, '.rda')))

  RRI_mape <- loadRData(file.path(ofolder, paste0(basename, '_RRI_MAPE_' , evr, '.rda')))
  R80p_mape <- loadRData(file.path(ofolder, paste0(basename, '_R80p_MAPE_' , evr, '.rda')))
  YrYr_mape <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_MAPE_' , evr, '.rda')))

  RRI_nTS <- loadRData(file.path(ofolder, paste0(basename, '_RRI_nTS_' , evr, '.rda')))
  R80p_nTS <- loadRData(file.path(ofolder, paste0(basename, '_R80p_nTS_' , evr, '.rda')))
  YrYr_nTS <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_nTS_' , evr, '.rda')))

  tot_rsq <- melt(rbind(RRI_rsq, R80p_rsq, YrYr_rsq))
  tot_mape <- melt(rbind(RRI_mape, R80p_mape, YrYr_mape))
  tot_nTS <- melt(rbind(RRI_nTS, R80p_nTS, YrYr_nTS))


  tot_rsq$Period <- revalue(factor(tot_rsq$nPostMin), c("1"="Short", "4"="Long"))
  tot_mape$Period <- revalue(factor(tot_mape$nPostMin), c("1"="Short", "4"="Long"))
  tot_nTS$Period <- revalue(factor(tot_nTS$nPostMin), c("1"="Short", "4"="Long"))

   if((evr == 'remSd') || (evr == 'seasAmp') || (evr == 'missVal')) {
    tot_rsq$variable <- mapvalues(tot_rsq$variable, from = levels(tot_rsq$variable), to = c("no", "low", 'medium', 'high'))
    tot_mape$variable <-mapvalues(tot_mape$variable, from = levels(tot_mape$variable), to = c("no", "low", 'medium', 'high'))
    tot_nTS$variable <-mapvalues(tot_nTS$variable, from = levels(tot_nTS$variable), to = c("no", "low", 'medium', 'high'))
  }  else{
    tot_rsq$variable <-mapvalues(tot_rsq$variable, levels(tot_rsq$variable), to = c("low", 'medium', 'high'))
    tot_mape$variable <-mapvalues(tot_mape$variable, levels(tot_mape$variable), to = c("low", 'medium', 'high'))
    tot_nTS$variable <-mapvalues(tot_nTS$variable, levels(tot_nTS$variable), to = c("low", 'medium', 'high'))
  }
  # tot_rsq <- tot_rsq[(tot_rsq$Dense == 'dense' & tot_rsq$Smooth == 'raw' & tot_rsq$Period == 'Long'),]
  tot_rsq$param = simFullName[[caseList[[vr]]]]
  if(vr == 1){totp_rsq <- tot_rsq}else{totp_rsq <- rbind(totp_rsq,tot_rsq)}

  # tot_mape <- tot_mape[(tot_mape$Dense == 'dense' & tot_mape$Smooth == 'raw' & tot_mape$Period == 'Long'),]
  tot_mape$param = simFullName[[caseList[[vr]]]]
  if(vr == 1){totp_mape <- tot_mape}else{totp_mape <- rbind(totp_mape,tot_mape)}

  # tot_nTS <- tot_nTS[(tot_nTS$Dense == 'dense' & tot_nTS$Smooth == 'raw' & tot_nTS$Period == 'Long'),]
  tot_nTS$param = simFullName[[caseList[[vr]]]]
  if(vr == 1){totp_nTS <- tot_nTS}else{totp_nTS <- rbind(totp_nTS,tot_nTS)}
}

xlbl <- 'Metric'

  # plot R2
  data <- totp_rsq
  ylbl <- 'R²'
  pltR2 <- plotMet(data, xlbl, ylbl)
  png(file.path(ofolder, paste0(basename, '_RsqMet.png')),width = 1311,height =628 )
  print(pltR2)
  dev.off()

  # plot MAPE
  data <- totp_mape
  ylbl <- 'MAPE'
  pltMAPE <- plotMet(data,  xlbl, ylbl)
  png(file.path(ofolder, paste0(basename, '_MAPEMet.png')),width = 1311,height =628 )
  print(pltMAPE)
  dev.off()
   # plot fraction of time series processed
  data <- totp_nTS
  ylbl <- 'Fraction'
  pltnTS <- plotMet(data,  xlbl, ylbl)
  png(file.path(ofolder, paste0(basename, '_nTSMet.png')),width = 1311,height =628 )
  print(pltnTS)
  dev.off()

  print(pltR2)
  print(pltMAPE)
  print(pltnTS)

Which characteristics influence the performance the most?

# compare effect of each parameter on the 
caseList <- c( 'seasAmp', 'remSd', 'missVal','distRec','distT','distMag')# evaluated time series characteristics for which a plot needs to be made

simFullName  <- list('Disturbance magnitude',
                     'Disturbance timing',
                     'Recovery period',
                     'Number of droughts',
                     'Time series length',
                     'Seasonal amplitude',
                     'SD remainder',
                     'Missing values')
names(simFullName) <- c('distMag',
                        'distT',
                        'distRec',
                        'nDr', 
                        'len',
                        'seasAmp',
                        'remSd',
                        'missVal')

for(vr in 1:length(caseList)){
  evr <- caseList[vr]# name of parameter that will be evaluated in the simulation
  # setvr <- sttngs[[evr]]# settings of simulation

  RRI_rsq <- loadRData(file.path(ofolder, paste0(basename, '_RRI_R2_' , evr, '.rda')))
  R80p_rsq <- loadRData(file.path(ofolder, paste0(basename, '_R80p_R2_' , evr, '.rda')))
  YrYr_rsq <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_R2_' , evr, '.rda')))

  RRI_mape <- loadRData(file.path(ofolder, paste0(basename, '_RRI_MAPE_' , evr, '.rda')))
  R80p_mape <- loadRData(file.path(ofolder, paste0(basename, '_R80p_MAPE_' , evr, '.rda')))
  YrYr_mape <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_MAPE_' , evr, '.rda')))

  RRI_nTS <- loadRData(file.path(ofolder, paste0(basename, '_RRI_nTS_' , evr, '.rda')))
  R80p_nTS <- loadRData(file.path(ofolder, paste0(basename, '_R80p_nTS_' , evr, '.rda')))
  YrYr_nTS <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_nTS_' , evr, '.rda')))

  tot_rsq <- melt(rbind(RRI_rsq, R80p_rsq, YrYr_rsq))
  tot_mape <- melt(rbind(RRI_mape, R80p_mape, YrYr_mape))
  tot_nTS <- melt(rbind(RRI_nTS, R80p_nTS, YrYr_nTS))

  tot_rsq$Period <- revalue(factor(tot_rsq$nPostMin), c("1"="Short", "4"="Long"))
  tot_mape$Period <- revalue(factor(tot_mape$nPostMin), c("1"="Short", "4"="Long"))
  tot_nTS$Period <- revalue(factor(tot_nTS$nPostMin), c("1"="Short", "4"="Long"))

   if((evr == 'remSd') || (evr == 'seasAmp') || (evr == 'missVal')) {
    tot_rsq$variable <- mapvalues(tot_rsq$variable, from = levels(tot_rsq$variable), to = c("no", "low", 'medium', 'high'))
    tot_mape$variable <-mapvalues(tot_mape$variable, from = levels(tot_mape$variable), to = c("no", "low", 'medium', 'high'))
    tot_nTS$variable <-mapvalues(tot_nTS$variable, from = levels(tot_nTS$variable), to = c("no", "low", 'medium', 'high'))
  }  else{
    tot_rsq$variable <-mapvalues(tot_rsq$variable, levels(tot_rsq$variable), to = c("low", 'medium', 'high'))
    tot_mape$variable <-mapvalues(tot_mape$variable, levels(tot_mape$variable), to = c("low", 'medium', 'high'))
    tot_nTS$variable <-mapvalues(tot_nTS$variable, levels(tot_nTS$variable), to = c("low", 'medium', 'high'))
  }
  tot_rsq <- tot_rsq[(tot_rsq$Dense == 'dense' & tot_rsq$Smooth == 'raw' & tot_rsq$Period == 'Long'),]
  tot_rsq$param = simFullName[[caseList[[vr]]]]
  if(vr == 1){totp_rsq <- tot_rsq}else{totp_rsq <- rbind(totp_rsq,tot_rsq)}

  tot_mape <- tot_mape[(tot_mape$Dense == 'dense' & tot_mape$Smooth == 'raw' & tot_mape$Period == 'Long'),]
  tot_mape$param = simFullName[[caseList[[vr]]]]
  if(vr == 1){totp_mape <- tot_mape}else{totp_mape <- rbind(totp_mape,tot_mape)}

  tot_nTS <- tot_nTS[(tot_nTS$Dense == 'dense' & tot_nTS$Smooth == 'raw' & tot_nTS$Period == 'Long'),]
  tot_nTS$param = simFullName[[caseList[[vr]]]]
  if(vr == 1){totp_nTS <- tot_nTS}else{totp_nTS <- rbind(totp_nTS,tot_nTS)}
}


  totp_rsq$paramType <- 'Environmental parameter'
  totp_rsq[(totp_rsq$param == 'Disturbance magnitude' | totp_rsq$param == 'Recovery period' | totp_rsq$param == 'Disturbance timing'), ]$paramType <- 'Disturbance parameter'
  totp_mape$paramType <- 'Environmental parameter'
  totp_mape[(totp_mape$param == 'Disturbance magnitude' | totp_mape$param == 'Recovery period' | totp_mape$param == 'Disturbance timing' ),]$paramType  <- 'Disturbance parameter'
  totp_nTS$paramType <- 'Environmental parameter'
  totp_nTS[(totp_rsq$param == 'Disturbance magnitude' | totp_nTS$param == 'Recovery period' | totp_nTS$param == 'Disturbance timing' ),]$paramType  <- 'Disturbance parameter'

data <- totp_rsq
  data$param <- factor(data$param, levels = rev(unlist(simFullName[caseList])))
  xlbl <- 'Parameter value'
  ylbl <- 'R²'
  pltR2 <- plotEnv(data, xlbl, ylbl, scales = 'free_y')
  png(file.path(ofolder, paste0(basename, '_Rsq_Env.png')),width = 1311,height =628 )
  print(pltR2)
  dev.off()

  data <- totp_mape
  data$param <- factor(data$param, levels = rev(unlist(simFullName[caseList])))
  data$value[is.infinite(data$value)] <- NA
  xlbl <- 'Parameter value'
  ylbl <- 'MAPE'
  pltMAPE <- plotEnv(data, xlbl, ylbl, scales = 'free_y')
  png(file.path(ofolder, paste0(basename, '_MAPE_Env.png')),width = 1311,height =628 )
  print(pltMAPE)
  dev.off()

  data <- totp_nTS
  data$param <- factor(data$param, levels = rev(unlist(simFullName[caseList])))
  xlbl <- 'Parameter value'
  ylbl <- 'Fraction'
  pltnTS <- plotEnv(data, xlbl, ylbl, scales = 'free_y')
  png(file.path(ofolder, paste0(basename, '_nTS_Env.png')),width = 1311,height =628 )
  print(pltnTS)
  dev.off()

  print(pltR2)
  print(pltMAPE)
  print(pltnTS)

How can we improve the performance?

for(vr in 1:length(caseList)){
  evr <- caseList[vr]# name of parameter that will be evaluated in the simulation
  # setvr <- sttngs[[evr]]# settings of simulation

  RRI_rsq <- loadRData(file.path(ofolder, paste0(basename, '_RRI_R2_' , evr, '.rda')))
  R80p_rsq <- loadRData(file.path(ofolder, paste0(basename, '_R80p_R2_' , evr, '.rda')))
  YrYr_rsq <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_R2_' , evr, '.rda')))

  RRI_rmse <- loadRData(file.path(ofolder, paste0(basename, '_RRI_RMSE_' , evr, '.rda')))
  R80p_rmse <- loadRData(file.path(ofolder, paste0(basename, '_R80p_RMSE_' , evr, '.rda')))
  YrYr_rmse <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_RMSE_' , evr, '.rda')))

  RRI_mape <- loadRData(file.path(ofolder, paste0(basename, '_RRI_MAPE_' , evr, '.rda')))
  R80p_mape <- loadRData(file.path(ofolder, paste0(basename, '_R80p_MAPE_' , evr, '.rda')))
  YrYr_mape <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_MAPE_' , evr, '.rda')))

  RRI_nTS <- loadRData(file.path(ofolder, paste0(basename, '_RRI_nTS_' , evr, '.rda')))
  R80p_nTS <- loadRData(file.path(ofolder, paste0(basename, '_R80p_nTS_' , evr, '.rda')))
  YrYr_nTS <- loadRData(file.path(ofolder, paste0(basename, '_YrYr_nTS_' , evr, '.rda')))

  tot_rsq <- melt(rbind(RRI_rsq, R80p_rsq, YrYr_rsq))
  tot_rmse <- melt(rbind(RRI_rmse, R80p_rmse, YrYr_rmse))
  tot_mape <- melt(rbind(RRI_mape, R80p_mape, YrYr_mape))
  tot_nTS <- melt(rbind(RRI_nTS, R80p_nTS, YrYr_nTS))

  tot_rsq$Period <- revalue(factor(tot_rsq$nPostMin), c("1"="Short", "4"="Long"))
  tot_rmse$Period <- revalue(factor(tot_rmse$nPostMin), c("1"="Short", "4"="Long"))
  tot_mape$Period <- revalue(factor(tot_mape$nPostMin), c("1"="Short", "4"="Long"))
  tot_nTS$Period <- revalue(factor(tot_nTS$nPostMin), c("1"="Short", "4"="Long"))

   if((evr == 'remSd') || (evr == 'seasAmp') || (evr == 'missVal')) {
    tot_rsq$variable <- mapvalues(tot_rsq$variable, from = levels(tot_rsq$variable), to = c("no", "low", 'medium', 'high'))
    tot_rmse$variable <-mapvalues(tot_rmse$variable, from = levels(tot_rmse$variable), to = c("no", "low", 'medium', 'high'))
    tot_mape$variable <-mapvalues(tot_mape$variable, from = levels(tot_mape$variable), to = c("no", "low", 'medium', 'high'))
    tot_nTS$variable <-mapvalues(tot_nTS$variable, from = levels(tot_nTS$variable), to = c("no", "low", 'medium', 'high'))
  } else{ 
    tot_rsq$variable <- mapvalues(tot_rsq$variable, from = levels(tot_rsq$variable), to = c( "low", 'medium', 'high'))
    tot_rmse$variable <-mapvalues(tot_rmse$variable, from = levels(tot_rmse$variable), to = c( "low", 'medium', 'high'))
    tot_mape$variable <-mapvalues(tot_mape$variable, from = levels(tot_mape$variable), to = c( "low", 'medium', 'high'))
    tot_nTS$variable <-mapvalues(tot_nTS$variable, from = levels(tot_nTS$variable), to = c( "low", 'medium', 'high'))
    }

  lbls <- c("raw, BAP", 'piecewise, BAP', 'smoothed, BAP', "raw, dense", 'piecewise, dense', 'smoothed, dense', "raw, quarterly", 'piecewise, quarterly', 'smoothed, quarterly')
  sname <- caseList[[vr]]
  xlbl <- simFullName[[sname]]

  # plot R2
  data <- tot_rsq
  ylbl <- 'R²'
  pltR2 <- plotSens(data, lbls, xlbl, ylbl, scales = 'fixed')
  png(file.path(ofolder, paste0(basename, '_Rsq_',evr,'.png')),width = 1311,height =628 )
  print(pltR2)
  dev.off()

  # plot RMSE
  data <- tot_rmse
  ylbl <- 'RMSE'
  pltRMSE <- plotSens(data, lbls, xlbl, ylbl, scales = 'free_y')
  png(file.path(ofolder, paste0(basename, '_RMSE_',evr,'.png')),width = 1311,height =628 )
  print(pltRMSE)
  dev.off()
   # plot MAPE
  data <- tot_mape
  ylbl <- 'MAPE'
  pltMAPE <- plotSens(data, lbls, xlbl, ylbl, scales = 'free_y')
  png(file.path(ofolder, paste0(basename, '_MAPE_',evr,'.png')),width = 1311,height =628 )
  print(pltMAPE)
  dev.off()
   # plot fraction of time series processed
  data <- tot_nTS
  ylbl <- 'Fraction'
  pltnTS <- plotSens(data, lbls, xlbl, ylbl, scales = 'free_y')
  png(file.path(ofolder, paste0(basename, '_nTS_',evr,'.png')),width = 1311,height =628 )
  print(pltnTS)
  dev.off()

  print(pltR2)
  print(pltRMSE)
  print(pltMAPE)
  print(pltnTS)
}

RETURN-project/BenchmarkRecovery documentation built on July 13, 2021, 5:47 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

RETURN-project/BenchmarkRecovery
Benchmark recovery indicators derived from remote sensing time series

In RETURN-project/BenchmarkRecovery: Benchmark recovery indicators derived from remote sensing time series

Extract time series characteristics from sampled time series

Simulate time series, measure recovery and evaluate performance

Define simulation settings

Plot the performance indicators

R Package Documentation

Browse R Packages

We want your feedback!

RETURN-project/BenchmarkRecovery Benchmark recovery indicators derived from remote sensing time series

In RETURN-project/BenchmarkRecovery: Benchmark recovery indicators derived from remote sensing time series

Extract time series characteristics from sampled time series

Simulate time series, measure recovery and evaluate performance

Define simulation settings

Plot the performance indicators

R Package Documentation

Browse R Packages

We want your feedback!

RETURN-project/BenchmarkRecovery
Benchmark recovery indicators derived from remote sensing time series