avutils: various utilities for DiViMe tools and audio processing

Documented in rttm2elan

#' convert .rttm to .eaf (ELAN)
#'
#' A very crude translator from rttm files to ELAN format
#' @param rttmfile path to SAD file (must exist)
#' @param audiofile path to audio file (does not need to exist, see details)
#' @param targetloc path to target location, \code{NULL} by default, see
#'   details
#'
#' @details the output file is named as the audio file, except for the file
#' extension and a prefix \code{out_}, e.g. if the audio file is 34_Ab.wav then
#' the output from this function will be out_34_Ab.eaf. By default the location
#' for writing this new file is the same as the audio file. If the folder in
#' which the audio file supposedly resides does not exist, the output will be
#' written to the location of the rttm file. You can also specify a folder to
#' where you want to write the output in the \code{targetloc=} argument (this
#' folder must exist).
#'
#' Also note that you need to specify an audio file, even if it does not exist
#' (or is not available on your machine at this time). There are two reasons
#' for this: first it is needed for establishing the output file name. Second,
#' the ELAN file needs the location of the audio. When opening the .eaf file
#' created with this function in ELAN and if the audio file does not exist in
#' the location provided, ELAN will ask you to locate it.
#'
#' In terms of tiers: the output will always contain an empty 'default' tier.
#' Any additional annotations will go in different tiers, depending on the kind
#' of rttm file that was supplied.
#'
#' Further, the function assumes that the first column in the rttm file
#' corresponds to the tier, the 4th and 5th columns contain onset and duration
#' (in seconds), and the 8th column contains the content for the annotation.
#'
#' @return writes a file and returns the path to this file (\code{NULL} if the
#'   file could not be found after writing)
#' @export
#' @importFrom utils read.table
#' @importFrom xml2 as_xml_document write_xml
#'
rttm2elan <- function(rttmfile, audiofile, targetloc = NULL) {

  # media link ---------------------------------------------------------------
  audiofile <- normalizePath(audiofile, winslash = "/", mustWork = FALSE)
  if (!file.exists(audiofile)) {
    warning(audiofile, " not found. \n.eaf file was created anyway, but you you will be prompted to locate the file when opening ELAN", call. = FALSE)
  }
  media_url <- paste0("file://", audiofile)
  relative_media_url <- paste0("./", basename(audiofile))

  # rttm ---------------------------------------------------------------------
  rttmfile <- normalizePath(rttmfile, winslash = "/", mustWork = TRUE)
  rttm <- utils::read.table(rttmfile, header = FALSE, sep = " ")
  if (ncol(rttm) < 8) {
    stop(rttmfile, " has fewer than 8 columns, cannot locate tier, onset, ",
         "duration and annotation value", call. = FALSE)
  }
  colnames(rttm)[c(1, 4, 5, 8)] <- c("tier", "start", "dur", "anno_val")
  if (!is.numeric(rttm$start) || !is.numeric(rttm$dur)) {
    stop("columns 4 (onset) and 5 (duration) of ", rttmfile,
         " must be numeric", call. = FALSE)
  }
  n_anno <- nrow(rttm)

  # output file name ---------------------------------------------------------
  # Based on the audio file name (regardless of whether this file actually
  # exists). The extension is stripped whatever it is (.wav, .WAV, .mp3, ...)
  # so the result always ends in .eaf.
  stem <- sub("([^.]+)\\.[[:alnum:]]+$", "\\1", basename(audiofile))
  outname <- paste0("out_", stem, ".eaf")

  # output location ----------------------------------------------------------
  if (is.null(targetloc)) {
    if (dir.exists(dirname(audiofile))) {
      outloc <- dirname(audiofile)
    } else {
      outloc <- dirname(rttmfile)
    }
  } else {
    outloc <- normalizePath(targetloc, winslash = "/", mustWork = TRUE)
  }

  # time order ---------------------------------------------------------------
  # Two time slots per annotation, interleaved as onset1, offset1, onset2, ...
  # so that annotation i refers to slots ts(2i-1) and ts(2i).
  onset_ms <- round(rttm$start * 1000)
  offset_ms <- round((rttm$start + rttm$dur) * 1000)
  # Format explicitly: implicit as.character() turns e.g. 100000 into "1e+05",
  # which is not a valid millisecond value in the .eaf file.
  slot_values <- sprintf("%.0f", as.vector(rbind(onset_ms, offset_ms)))
  time_order <- lapply(seq_along(slot_values), function(k) {
    structure(list(),
              TIME_SLOT_ID = paste0("ts", k),
              TIME_VALUE = slot_values[k])
  })
  names(time_order) <- rep("TIME_SLOT", length(time_order))

  # tiers --------------------------------------------------------------------
  # NOTE(review): locale codes look swapped ("us" as language, "EN" as country
  # further below); kept as-is because they are internally consistent.
  new_tier <- function(id, annotations = list()) {
    names(annotations) <- rep("ANNOTATION", length(annotations))
    structure(annotations,
              DEFAULT_LOCALE = "us",
              LINGUISTIC_TYPE_REF = "default-lt",
              TIER_ID = id)
  }

  tier_of_row <- as.character(rttm$tier)
  anno_values <- as.character(rttm$anno_val)
  tier_ids <- unique(tier_of_row)

  # one tier per distinct value in column 1, annotations kept in file order
  tiers <- lapply(tier_ids, function(id) {
    rows <- which(tier_of_row == id)
    annotations <- lapply(rows, function(i) {
      list(ALIGNABLE_ANNOTATION = structure(
        list(ANNOTATION_VALUE = list(anno_values[i])),
        ANNOTATION_ID = paste0("a", i),
        TIME_SLOT_REF1 = paste0("ts", 2 * i - 1),
        TIME_SLOT_REF2 = paste0("ts", 2 * i)
      ))
    })
    new_tier(id, annotations)
  })
  names(tiers) <- rep("TIER", length(tiers))

  # header: audio locations and meta data ------------------------------------
  media_descriptor <- structure(list(),
                                MEDIA_URL = media_url,
                                MIME_TYPE = "audio/x-wav",
                                RELATIVE_MEDIA_URL = relative_media_url)
  property_urn <- structure(
    list("urn:nl-mpi-tools-elan-eaf:28eb9227-5451-4c09-8cab-f0a959d09e20"),
    NAME = "URN"
  )
  # the property *name* is "lastUsedAnnotationId", its *content* is the highest
  # annotation id handed out (annotations are numbered a1 ... a<n_anno>)
  property_last_id <- structure(list(as.character(n_anno)),
                                NAME = "lastUsedAnnotationId")

  header <- structure(list(MEDIA_DESCRIPTOR = media_descriptor,
                           PROPERTY = property_urn,
                           PROPERTY = property_last_id),
                      MEDIA_FILE = "",
                      TIME_UNITS = "milliseconds")

  linguistic_type <- structure(list(),
                               GRAPHIC_REFERENCES = "false",
                               LINGUISTIC_TYPE_ID = "default-lt",
                               TIME_ALIGNABLE = "true")
  locale <- structure(list(), COUNTRY_CODE = "EN", LANGUAGE_CODE = "us")

  # document -----------------------------------------------------------------
  # the empty default tier comes first, followed by the tiers from the rttm
  doc_children <- c(list(HEADER = header,
                         TIME_ORDER = time_order,
                         LINGUISTIC_TYPE = linguistic_type,
                         LOCALE = locale,
                         TIER = new_tier("default")),
                    tiers)
  # NOTE(review): DATE is a fixed timestamp, not the time of creation.
  annotation_document <- structure(
    doc_children,
    "AUTHOR" = "",
    DATE = "2019-09-19T20:17:07+01:00",
    FORMAT = "3.0",
    VERSION = "3.0",
    "xmlns:xsi" = "http://www.w3.org/2001/XMLSchema-instance",
    "xsi:noNamespaceSchemaLocation" = "http://www.mpi.nl/tools/elan/EAFv3.0.xsd"
  )

  res <- xml2::as_xml_document(list(ANNOTATION_DOCUMENT = annotation_document))

  # write and report ---------------------------------------------------------
  out <- file.path(outloc, outname)
  xml2::write_xml(res, file = out, options = "format")
  if (file.exists(out)) {
    out
  } else {
    NULL
  }
}