# paRticulates: Import and visualize fine dust sensor data

# Documented in read.madavi()

# Copyright 2020 Meik Michalke <meik.michalke@hhu.de>
#
# This file is part of the R package paRticulates.
#
# paRticulates is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# paRticulates is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with paRticulates.  If not, see <http://www.gnu.org/licenses/>.

#' Import CSV data as provided by madavi.de
#'
#' Reads a single CSV file, or all CSV files found in a directory, and combines
#' the rows into one data frame. The raw \code{Time} column is parsed as UTC and
#' an additional column \code{TimeLocal} is added that holds the same points in
#' time, expressed in the time zone given by \code{tz}.
#'
#' Each file is expected to have 24 semicolon-separated columns: one time stamp
#' column followed by 23 numeric columns, with \code{.} as decimal separator.
#'
#' @param path Either a path to a single CSV file, or to a directory which is then being scanned for CSV files
#'    (file names ending in \code{.csv}, case insensitive).
#' @param dropEmptyCols Logical, whether to drop all columns without any data.
#'    The \code{Time} column is always kept.
#' @param tz Time zone, used to calculate local time from the UTC raw data.
#' @return An object of class \code{\link[paRticulates:airData-class]{airData}}.
#' @export
#' @examples
#' \dontrun{
#' # import single CSV file ~/fine_dust_data/data-esp8266-1234567-2019-12-10.csv
#' x <- read.madavi(file.path("~","fine_dust_data","data-esp8266-1234567-2019-12-10.csv"))
#'
#' # import all CSV files from directory ~/fine_dust_data
#' x <- read.madavi(file.path("~","fine_dust_data"))
#' }
read.madavi <- function(
  path,
  dropEmptyCols=TRUE,
  tz="Europe/Berlin"
){
  if(!is.character(path) || length(path) != 1L || is.na(path)){
    stop(simpleError("'path' must be a single character string!"))
  } else {}

  if(file_test("-d", path)){
    # 'pattern' is a regular expression, not a glob: escape the dot and anchor
    # the extension so that only names really ending in ".csv" are matched
    CSV_files <- list.files(path, pattern="\\.csv$", ignore.case=TRUE, full.names=TRUE)
    if(length(CSV_files) < 1L){
      stop(simpleError(paste0("No CSV files found in directory:\n  ", path)))
    } else {}
    # read each file without dropping columns, so that all data frames share
    # the same columns and can be combined in a single rbind() call
    file_data_list <- lapply(
      CSV_files,
      function(this_file){
        return(
          slot(
            read.madavi(
              path=this_file,
              dropEmptyCols=FALSE,
              tz=tz
            ),
            "data"
          )[["madavi"]]
        )
      }
    )
    file_data <- do.call(rbind, file_data_list)
  } else if(file_test("-f", path)) {
    file_data <- read.csv2(
      file=path,
      dec='.',
      row.names=NULL,
      colClasses = c(
        "character",
        rep("numeric", 23)
      ),
      strip.white = TRUE,
      stringsAsFactors=FALSE
    )
    file_data[["Time"]] <- as.POSIXct(file_data[["Time"]], tz="UTC")
  } else {
    stop(simpleError(paste0("Data can't be found:\n  ", path)))
  }

  if(isTRUE(dropEmptyCols)){
    # check column by column instead of coercing the data frame to a matrix
    no_data <- vapply(
      file_data,
      function(this_col){
        all(is.na(this_col))
      },
      FUN.VALUE=logical(1)
    )
    # "Time" is needed below to compute "TimeLocal", never drop it
    no_data[names(file_data) %in% "Time"] <- FALSE
    # drop=FALSE keeps a data frame even if only a single column remains
    file_data <- file_data[, !no_data, drop=FALSE]
  } else {}

  # convert UTC to local time: a POSIXct value stores the point in time itself,
  # so only the time zone used for display has to be changed; this avoids a
  # round trip through character strings, which can't distinguish the repeated
  # hour at the end of daylight saving time
  time_local <- file_data[["Time"]]
  attr(time_local, "tzone") <- tz
  file_data[["TimeLocal"]] <- time_local

  result <- airData(
    data=list(
      madavi=file_data
    ),
    layout=data.frame(
      obj=rep("madavi", 4),
      data=c("SDS_P1", "SDS_P2", "Humidity", "Temp"),
      time=rep("TimeLocal", 4),
      row.names=c("PM10", "PM2_5", "humidity", "temperature"),
      stringsAsFactors=FALSE
    )
  )

  return(result)
}