tests/testthat/test_saveload.R

library(uwot)
context("load/save model")

test_that("can save and load simple model", {
  set.seed(1337)
  model <- umap(iris10,
    n_neighbors = 4, n_epochs = 2, init = "spca",
    metric = "euclidean", verbose = FALSE, n_threads = 0,
    ret_model = TRUE
  )

  mod_fname <- tempfile(tmpdir = tempdir())
  model <- save_uwot(model, file = mod_fname)
  expect_true(file.exists(mod_fname))

  # Can use model after saving
  set.seed(1337)
  res_trans <- umap_transform(iris10, model)
  expect_ok_matrix(res_trans)

  # Clean up temp dir from saving
  expect_true(file.exists(model$mod_dir))
  unload_uwot(model)
  expect_false(file.exists(model$mod_dir))
  # Can't use transform now model is unloaded
  expect_error(umap_transform(iris10, model), "is unloaded")

  modelload <- load_uwot(file = mod_fname)
  set.seed(1337)
  resload_trans <- umap_transform(iris10, modelload)
  expect_ok_matrix(resload_trans)

  expect_equal(resload_trans, res_trans)
  if (file.exists(mod_fname)) {
    unlink(mod_fname)
  }

  # Clean up temp dir from loading
  expect_true(file.exists(modelload$mod_dir))
  unload_uwot(modelload)
  expect_false(file.exists(modelload$mod_dir))
})


test_that("can save and load mixed distance model", {
  set.seed(1337)
  jiris10 <- jitter(iris10)
  metric2 <- list(
    "euclidean" = c(1, 2),
    "cosine" = c("Petal.Length", "Petal.Width")
  )
  model <- umap(jiris10,
    n_neighbors = 4, n_epochs = 2, init = "spca",
    metric = metric2,
    verbose = FALSE, n_threads = 0,
    ret_nn = TRUE, ret_model = TRUE
  )

  mod_fname <- tempfile(tmpdir = tempdir())
  model <- save_uwot(model, file = mod_fname)
  expect_true(file.exists(mod_fname))

  # Can use model after saving
  set.seed(1337)
  res_trans <- umap_transform(jiris10, model)
  expect_ok_matrix(res_trans)

  # Clean up temp dir from saving
  expect_true(file.exists(model$mod_dir))
  unload_uwot(model)
  expect_false(file.exists(model$mod_dir))
  # Can't use transform now model is unloaded
  expect_error(umap_transform(iris10, model), "is unloaded")

  modelload <- load_uwot(file = mod_fname)
  set.seed(1337)
  resload_trans <- umap_transform(jiris10, modelload)
  expect_ok_matrix(resload_trans)

  expect_equal(resload_trans, res_trans)
  if (file.exists(mod_fname)) {
    unlink(mod_fname)
  }

  # Clean up temp dir from loading
  expect_true(file.exists(modelload$mod_dir))
  unload_uwot(modelload)
  expect_false(file.exists(modelload$mod_dir))
})

test_that("unloading a model on save", {
  set.seed(1337)
  model <- umap(iris10,
    n_neighbors = 4, n_epochs = 2, init = "spca",
    metric = "euclidean", verbose = FALSE, n_threads = 0,
    ret_model = TRUE
  )

  mod_fname <- tempfile(tmpdir = tempdir())
  model <- save_uwot(model, file = mod_fname, unload = TRUE)
  expect_false(file.exists(model$mod_dir))

  # Trying to transform with a model that got unloaded won't work
  expect_error(umap_transform(iris10, model), "is unloaded")

  modelload <- load_uwot(file = mod_fname)
  # Clean up temp dir from loading
  expect_true(file.exists(modelload$mod_dir))
  # Can avoid cleaning up if you really want that
  unload_uwot(modelload, cleanup = FALSE)
  expect_true(file.exists(modelload$mod_dir))
  # Can unload multiple times
  unload_uwot(modelload, cleanup = TRUE)
  expect_false(file.exists(modelload$mod_dir))
})

# #88
test_that("save-load-save", {
  set.seed(1337)
  X <- matrix(rnorm(100), 10, 10)

  model <- uwot::umap(X, n_neighbors = 4, ret_model = TRUE)
  model_file <- tempfile(tmpdir = tempdir())
  model <- uwot::save_uwot(model, file = model_file)
  model2 <- uwot::load_uwot(file = model_file)
  new_file <- tempfile(tmpdir = tempdir())
  uwot::save_uwot(model2, file = new_file)
  expect_true(file.exists(new_file))

  modelm <- uwot::umap(X, n_neighbors = 4, metric = list("euclidean" = 1:5, "euclidean" = 6:10), ret_model = TRUE)
  modelm_file <- tempfile(tmpdir = tempdir())
  modelm <- uwot::save_uwot(modelm, file = modelm_file)
  modelm2 <- uwot::load_uwot(file = modelm_file)
  new_filem <- tempfile(tmpdir = tempdir())
  uwot::save_uwot(modelm2, file = new_filem)
  expect_true(file.exists(new_filem))
})

# #117 correlation metric not correctly restored
test_that("reload-correlation", {
  set.seed(1337)
  model <- umap(iris10,
                n_neighbors = 4, n_epochs = 2, init = "spca",
                metric = "correlation", verbose = FALSE, n_threads = 0,
                ret_model = TRUE, ret_extra = c("nn")
  )
  expect_equal(names(model$metric), "correlation")
  expect_equal(model$nn_index$metric, "correlation")

  set.seed(1337)
  transformed_before_reload <-
    umap_transform(iris10,
                   model,
                   n_epochs = 2,
                   ret_extra = c("nn"))

  expect_equal(
    transformed_before_reload$nn$correlation$dist,
    model$nn$correlation$dist,
    check.attributes = FALSE,
    tol = 1e-7
  )

  mod_fname <- tempfile(tmpdir = tempdir())
  model <- save_uwot(model, file = mod_fname, unload = TRUE)

  modelload <- load_uwot(file = mod_fname)

  expect_equal(names(model$metric), "correlation")
  expect_equal(model$nn_index$metric, "correlation")

  set.seed(1337)
  transformed_after_reload <-
    umap_transform(iris10,
                   modelload,
                   n_epochs = 2,
                   ret_extra = c("nn"))
  expect_equal(
    transformed_after_reload$nn$correlation$dist,
    model$nn$correlation$dist,
    check.attributes = FALSE,
    tol = 1e-7
  )

  if (file.exists(mod_fname)) {
    unlink(mod_fname)
  }
  expect_true(file.exists(modelload$mod_dir))
  unload_uwot(modelload)
  expect_false(file.exists(modelload$mod_dir))
})

test_that("save-load hnsw", {
  testthat::skip_if_not_installed("RcppHNSW")
  set.seed(1337)
  model <- umap(iris10,
    n_neighbors = 4, n_epochs = 2, init = "spca",
    metric = "euclidean", verbose = FALSE, n_threads = 0,
    ret_model = TRUE, ret_extra = c("nn"), nn_method = "hnsw"
  )
  expect_equal(model$nn_method, "hnsw")

  set.seed(1337)
  transformed_before_reload <-
    umap_transform(iris10,
      model,
      n_epochs = 2,
      ret_extra = c("nn")
    )

  mod_fname <- tempfile(tmpdir = tempdir())
  model <- save_uwot(model, file = mod_fname, unload = TRUE)

  modelload <- load_uwot(file = mod_fname)

  expect_equal(modelload$nn_method, "hnsw")

  set.seed(1337)
  transformed_after_reload <-
    umap_transform(iris10,
      modelload,
      n_epochs = 2,
      ret_extra = c("nn")
    )

  if (file.exists(mod_fname)) {
    unlink(mod_fname)
  }
  expect_true(file.exists(modelload$mod_dir))
  unload_uwot(modelload)
  expect_false(file.exists(modelload$mod_dir))

  expect_equal(model$nn$euclidean$idx, modelload$nn$euclidean$idx)
  expect_equal(model$nn$euclidean$dist, modelload$nn$euclidean$dist)

  expect_equal(
    transformed_before_reload$nn$euclidean$idx,
    transformed_after_reload$nn$euclidean$idx,
  )
  expect_equal(
    transformed_before_reload$nn$euclidean$dist,
    transformed_after_reload$nn$euclidean$dist,
    check.attributes = FALSE,
    tol = 1e-7
  )

  expect_equal(
    transformed_before_reload$embedding,
    transformed_after_reload$embedding
  )
})

test_that("save-load nndescent", {
  testthat::skip_if_not_installed("rnndescent")
  set.seed(1337)
  model <- umap(iris10,
                n_neighbors = 4, n_epochs = 2, init = "spca",
                metric = "euclidean", verbose = FALSE, n_threads = 0,
                ret_model = TRUE, ret_extra = c("nn"), nn_method = "nndescent"
  )
  expect_equal(model$nn_method, "nndescent")

  set.seed(1337)
  transformed_before_reload <-
    umap_transform(iris10,
                   model,
                   n_epochs = 2,
                   ret_extra = c("nn")
    )

  mod_fname <- tempfile(tmpdir = tempdir())
  model <- save_uwot(model, file = mod_fname, unload = TRUE)

  modelload <- load_uwot(file = mod_fname)

  expect_equal(modelload$nn_method, "nndescent")

  set.seed(1337)
  transformed_after_reload <-
    umap_transform(iris10,
                   modelload,
                   n_epochs = 2,
                   ret_extra = c("nn")
    )

  if (file.exists(mod_fname)) {
    unlink(mod_fname)
  }
  expect_true(file.exists(modelload$mod_dir))
  unload_uwot(modelload)
  expect_false(file.exists(modelload$mod_dir))

  expect_equal(model$nn$euclidean$idx, modelload$nn$euclidean$idx)
  expect_equal(model$nn$euclidean$dist, modelload$nn$euclidean$dist)

  expect_equal(
    transformed_before_reload$nn$euclidean$idx,
    transformed_after_reload$nn$euclidean$idx,
  )
  expect_equal(
    transformed_before_reload$nn$euclidean$dist,
    transformed_after_reload$nn$euclidean$dist,
    check.attributes = FALSE,
    tol = 1e-7
  )

  expect_equal(
    transformed_before_reload$embedding,
    transformed_after_reload$embedding
  )

  mod_fname2 <- tempfile(tmpdir = tempdir())
  saveRDS(modelload, mod_fname2)
  modelload2 <- readRDS(mod_fname2)
  expect_equal(modelload2$nn_method, "nndescent")
  set.seed(1337)
  transformed_after_reload2 <-
    umap_transform(iris10,
                   modelload2,
                   n_epochs = 2,
                   ret_extra = c("nn")
    )
  expect_equal(
    transformed_after_reload$nn$euclidean$idx,
    transformed_after_reload2$nn$euclidean$idx,
  )
  expect_equal(
    transformed_after_reload$nn$euclidean$dist,
    transformed_after_reload2$nn$euclidean$dist,
    check.attributes = FALSE,
    tol = 1e-7
  )
  expect_equal(
    transformed_after_reload$embedding,
    transformed_after_reload2$embedding
  )
  if (file.exists(mod_fname2)) {
    unlink(mod_fname2)
  }
})
jlmelville/uwot documentation built on April 19, 2024, 9:31 p.m.