#' run a DiViMe SAD module
#'
#' @param audio_loc character, path to the audio files
#' @param divime_loc character, path to the DiViMe directory with a VM
#' @param module character, which module to execute (default is \code{"noisemes"}), see details
#' @param splitaudio numeric, should audio files be split into smaller chunks before processing by SAD tool, default is \code{NULL}, see details
#' @param vmstart logical, perform a check whether the VM is running and if not start it up (by default \code{TRUE}). Turning this off will speed up the function a little bit, but requires that you are sure that the VM is indeed running in \code{divime_loc}.
#' @param vmshutdown logical, should the VM shut down after the operations are done (by default \code{TRUE})
#' @param messages logical, should the file names of each processed file be printed
#' @param overwrite logical, should output files be overwritten if they already exist (default is \code{FALSE})
#' @details \code{module=} sets the SAD module to be used: can be either \code{"noisemes"}, \code{"opensmile"} or \code{"tocombo"}
#'
#' It appears that some of the modules have difficulties with larger audio files (opensmile and noisemes). Hence, setting \code{splitaudio=} to a numeric value will temporarily split the source audio into chunks of that duration (\code{\link{split_audio}}). In my experience, a chunk duration of about two minutes solves these issues (e.g. via \code{splitaudio=120}). Note that this step requires the \code{sox} utility to be available (see \code{\link{set_binaries}} and \code{\link{split_audio}}).
#' @return a data.frame with the locations of the created rttm files and some diagnostics
#' @export
#' @importFrom utils write.table
#'
divime_sad <- function(audio_loc,
                       divime_loc,
                       module = "noisemes",
                       splitaudio = NULL,
                       vmstart = TRUE,
                       vmshutdown = TRUE,
                       messages = TRUE,
                       overwrite = FALSE) {
  # Runs one DiViMe SAD module on every audio file found via
  # handle_filenames(), copies the resulting rttm files next to the source
  # audio and returns a per-file log (one row per audio file).

  # validate the module up front; an unknown module would otherwise only
  # surface inside the loop as "object 'cm' not found", after the VM has
  # already been started
  module <- match.arg(module, c("noisemes", "opensmile", "tocombo"))

  # splitting is requested only by a positive chunk duration; NULL, 0,
  # negative values and FALSE all disable it, and in that case sox is not
  # needed at all
  do_split <- !is.null(splitaudio) && splitaudio > 0
  if (do_split) {
    sox_found <- !is.null(getOption("avutils_sox")) || nzchar(Sys.which("sox"))
    if (!sox_found) {
      stop("sox not found for splitting audio files")
    }
    splitdur <- splitaudio
  }

  audio_loc <- normalizePath(audio_loc)
  divime_loc <- normalizePath(divime_loc)
  vagrant <- Sys.which("vagrant")

  # check VM state and start it if necessary
  if (vmstart) {
    vm_state <- divime_vagrant_state(divime_loc = divime_loc,
                                     what = "status",
                                     silent = TRUE)
    if (!any(vm_state %in% "running (virtualbox)")) {
      divime_vagrant_state(divime_loc = divime_loc,
                           what = "start",
                           silent = TRUE)
    }
  }

  paths <- avutils:::handle_filenames(audio_loc = audio_loc,
                                      divime_loc = divime_loc)

  # build the log with explicit lengths so that an empty file list yields an
  # empty log instead of a "differing number of rows" error
  n_files <- length(paths$filestoprocess)
  logres <- data.frame(audio = paths$filestoprocess,
                       size = paths$size,
                       processed = rep(FALSE, n_files),
                       ptime = rep(NA, n_files),
                       outlines = rep(NA, n_files),
                       output = rep(NA, n_files),
                       audiocopy = rep(NA, n_files),
                       audioremove = rep(NA, n_files),
                       resultscopy = rep(NA, n_files),
                       resultsremove = rep(NA, n_files),
                       yuniproblem = rep(NA, n_files))

  # command passed to vagrant; all three modules follow the same naming
  # scheme (<module>Sad.sh)
  cm <- paste0("ssh -c '", module, "Sad.sh data/'")
  # marker that the process was killed inside the VM
  kill_pattern <- "[[:digit:]]{1,10} Killed"

  for (i in seq_len(nrow(logres))) {
    t1 <- Sys.time()

    # names and locations for the output rttm: 'clean' names are used inside
    # the VM's data folder, original names at the source location
    output_file <- paste0(module, "Sad_", paths$root_clean[i], ".rttm")
    output_file_ori <- paste0(module, "Sad_", paths$root[i], ".rttm")
    output_file_to <- normalizePath(
      paste0(audio_loc, "/", paths$folder[i], output_file_ori),
      winslash = "/",
      mustWork = FALSE
    )
    output_file_from <- normalizePath(
      paste0(divime_loc, "/data/", output_file),
      winslash = "/",
      mustWork = FALSE
    )

    # skip the processing in the VM if the target already exists and must
    # not be overwritten
    if (overwrite || !file.exists(output_file_to)) {
      # copy audio file into the VM data folder (either entirely or split)
      if (do_split) {
        splitfiles <- split_audio(filein = paths$audiosource[i],
                                  split = splitdur,
                                  pathout = dirname(paths$audiotarget_clean[i]))
        logres$audiocopy[i] <- all(file.exists(splitfiles))
      } else {
        logres$audiocopy[i] <- file.copy(from = paths$audiosource[i],
                                         to = paths$audiotarget_clean[i])
      }

      # vagrant has to be called from within the DiViMe directory; the
      # previous working directory is restored even if the call fails
      old_wd <- setwd(divime_loc)
      xres <- tryCatch(
        system2(command = vagrant,
                args = cm,
                stdout = TRUE,
                stderr = TRUE),
        finally = setwd(old_wd)
      )

      # remove audio file(s) from the DiViMe location
      if (do_split) {
        logres$audioremove[i] <- all(file.remove(splitfiles))
        # rttm files of the chunks (merged into a single rttm below); the
        # pattern is anchored because these files are deleted after merging
        rttm_files <- list.files(dirname(splitfiles[1]),
                                 pattern = "\\.rttm$",
                                 full.names = TRUE)
      } else {
        logres$audioremove[i] <- file.remove(paths$audiotarget_clean[i])
      }

      # check for success
      killed <- any(grepl(kill_pattern, xres))
      success <- TRUE
      if (module == "tocombo") {
        # NOTE(review): this only matches an output line that is exactly
        # "MATLAB:nomem" - confirm that this is how the VM reports it
        if ("MATLAB:nomem" %in% xres) {
          success <- FALSE
          message("'tocombo' produced MatLab memory error. Split audio file?")
        }
        if (killed) {
          success <- FALSE
          message("'tocombo' produced error './get_TOcomboSAD_output_v3'. (process killed). Split audio file?")
        }
      }

      # merge the rttm files of the chunks into one file if necessary
      if (success && do_split) {
        r <- combine_rttm(rttm_files = rttm_files,
                          split_dur = splitdur,
                          basename = as.character(paths$root[i]))
        write.table(x = r, file = output_file_from, sep = " ",
                    quote = FALSE, row.names = FALSE, col.names = FALSE)
        file.remove(rttm_files)
      }

      # a missing output file means the tool failed for this file; log it
      # as unprocessed and carry on instead of aborting the whole batch
      if (success && !file.exists(output_file_from)) {
        success <- FALSE
        warning("no output produced for ", paths$filestoprocess[i],
                " (expected ", output_file_from, ")",
                call. = FALSE)
      }

      if (success) {
        # log number of lines in output
        logres$outlines[i] <- length(readLines(output_file_from))
        # copy output back to source location and remove it from the VM
        logres$resultscopy[i] <- file.copy(from = output_file_from,
                                           to = output_file_to,
                                           overwrite = overwrite)
        logres$resultsremove[i] <- file.remove(output_file_from)
        logres$output[i] <- output_file_ori
        logres$processed[i] <- TRUE

        # log whether the process was reported as killed
        logres$yuniproblem[i] <- killed
        if (killed) {
          if (messages) {
            message("[POTENTIAL PROBLEM] :",
                    paths$filestoprocess[i],
                    " --> ",
                    output_file)
          }
          # this notice is emitted regardless of 'messages'
          message("possibly yunitator problem with file: ",
                  paths$filestoprocess[i])
        } else if (messages) {
          message(paths$filestoprocess[i],
                  " --> ",
                  output_file_ori)
        }

        # opensmile leaves an additional txt file behind
        if (module == "opensmile") {
          fn <- paste0(divime_loc, "/data/", paths$root_clean[i], ".txt")
          if (file.exists(fn)) {
            file.remove(fn)
          }
        }
      }
    }

    # processing time for this file in minutes (also logged for skipped files)
    t2 <- Sys.time()
    logres$ptime[i] <- as.numeric(round(difftime(t2, t1, units = "mins"), 3))

    # predict the time left from a linear fit of time on file size, once at
    # least two files are done and some are still pending
    done <- na.omit(logres[, c("ptime", "size")])
    pending_sizes <- logres$size[is.na(logres$ptime)]
    if (nrow(done) > 1 && length(pending_sizes) > 0) {
      fit <- lm(ptime ~ size, done)
      timeleft <- round(
        sum(predict(fit, newdata = data.frame(size = pending_sizes))),
        1
      )
      cat("expected time until finish: ", timeleft, " minutes\n")
    }
  }

  # shut down if requested
  if (vmshutdown) {
    divime_vagrant_state(divime_loc = divime_loc,
                         what = "halt",
                         silent = TRUE)
  }

  logres
}
# Add the following code to your website.
# For more information on customizing the embed code, read Embedding Snippets.