R/projects.R

Defines functions loadProject saveProject enableDataSourceFunctions newProject on_save_button_clicked on_open_button_clicked on_save_as_activate on_save_menu_activate on_open_activate on_close_activate on_new_button_clicked on_new_activate

Documented in on_close_activate on_new_activate on_new_button_clicked on_open_activate on_open_button_clicked on_save_as_activate on_save_button_clicked on_save_menu_activate

# Gnome R Data Miner: GNOME interface to R for Data Mining
#
# Time-stamp: <2019-03-31 14:09:45 Graham Williams>
#
# Project functionality.
#
# Copyright (c) 2009 Togaware Pty Ltd
#
# This files is part of Rattle.
#
# Rattle is free software: you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 2 of the License, or
# (at your option) any later version.
#
# Rattle is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with Rattle. If not, see <https://www.gnu.org/licenses/>.

########################################################################
# CALLBACKS

on_new_activate <- function(action, window)     { newProject()  }
on_new_button_clicked <- function(action, window)  { newProject() }
on_close_activate <- function(action, window)     { closeProject()  }

on_open_activate <- function(action, window)
{
  # Wrap the actual call with a "try" so that the watch cursor turns
  # off even on error.
  
  setStatusBar()
  set.cursor("watch")
  try(loadProject())
  set.cursor()
}

on_save_menu_activate <- function(action, window)
{
  setStatusBar()
  set.cursor("watch")
  on.exit(set.cursor())
  saveProject()
}

on_save_as_activate <- function(action, window)
{
  setStatusBar()
  set.cursor("watch")
  on.exit(set.cursor())
  saveProject()
}

on_open_button_clicked <- function(action, window)
{
  setStatusBar()
  set.cursor("watch")
  on.exit(set.cursor())
  loadProject()
}

on_save_button_clicked <- function(action, window)
{
  setStatusBar()
  set.cursor("watch")
  on.exit(set.cursor())
  saveProject()
}

########################################################################
# NEW PROJECT

newProject <- function(ask.overwrite=TRUE)
{
  if (not.null(listBuiltModels()) && ask.overwrite)
  {
    if (! questionDialog(Rtxt("You have requested to start a new project.\n\n",
                              "This will clear the current project (dataset",
                              "and models).\n\n",
                              "If you choose not to continue you can save",
                              "the project, and then start a new project.\n\n",
                              "Do you wish to continue, and overwrite the",
                              "current project?")))
      return()
  }

  resetRattle()

  # Clear out the log and re-initialise it.

  setTextviewContents("log_textview", "")
  initiateLog()
  
  # Ensure data sources are enabled again.
  
  enableDataSourceFunctions()

  # Reset things that can't be done in resetRattle()

  # 090314 I was finding that the filechooserbutton was being set to a
  # folder with the setFilename, so try using unselectFilename instead.
  
  #theWidget("data_filechooserbutton")$setFilename("")
  filename <- theWidget("data_filechooserbutton")$getFilename()
  if (not.null(filename)) theWidget("data_filechooserbutton")$unselectFilename(filename)
  
  theWidget("data_name_combobox")$setActive(-1)

  # TODO Plenty of other things that should be reset as well.

  crv$NOTEBOOK$setCurrentPage(getNotebookPage(crv$NOTEBOOK,
                                              crv$NOTEBOOK.DATA.NAME))
  switchToPage(crv$NOTEBOOK.DATA.NAME)
  
}

enableDataSourceFunctions <- function(enable=TRUE)
{
  # 080707 Turn the data source options on/off. This is used when
  # loading a project to avoid datasets being loaded. Logically we
  # don't load a new dataset if we have loaded a project. We can
  # always click New to then load a new dataset.
  
  widgets <- c("data_type_label", "data_csv_radiobutton", "data_arff_radiobutton",
                "data_rdata_radiobutton", "data_rdataset_radiobutton",
                "data_library_radiobutton", "data_odbc_radiobutton",
                "data_corpus_radiobutton")
  for (w in widgets) theWidget(w)$setSensitive(enable)
}

########################################################################
# Close Project
#
# For now, Close is just like New.

closeProject <- newProject

########################################################################
# Save Project

saveProject <- function()
{

  # Check pre-conditions.
  
  if (noDatasetLoaded()) return()
  if (variablesHaveChanged("saving the project")) return()

  # Obtain a filename to save to.
  
  dialog <- RGtk2::gtkFileChooserDialog(Rtxt("Save Project"), NULL, "save",
                                 "gtk-cancel", RGtk2::GtkResponseType["cancel"],
                                 "gtk-save", RGtk2::GtkResponseType["accept"])
  dialog$setDoOverwriteConfirmation(TRUE)

  # 090707 Add the crs$projext extension by default to be consistent
  # throughout Rattle. It is also needed for OverwriteConfirmation.

  if (is.null(crs$projname))
    default.name <- crs$dataname
  else
    default.name <- crs$projname
    
  dialog$setCurrentName(paste(get.stem(default.name), crv$projext, sep=""))

  if (! is.null(crs$pwd)) dialog$setCurrentFolder(crs$pwd)

  if (length(crv$project.extensions))
  {
    ff <- RGtk2::gtkFileFilterNew()
    ff$setName(Rtxt("Projects"))
    lapply(paste("*.", crv$project.extensions, sep=""), ff$addPattern)
    dialog$addFilter(ff)
  }
 
  ff <- RGtk2::gtkFileFilterNew()
  ff$setName(Rtxt("RData Files"))
  ff$addPattern("*.Rdata")
  dialog$addFilter(ff)

  ff <- RGtk2::gtkFileFilterNew()
  ff$setName(Rtxt("All Files"))
  ff$addPattern("*")
  dialog$addFilter(ff)
  
  if (dialog$run() == RGtk2::GtkResponseType["accept"])
  {
    save.name <- dialog$getFilename()
    save.ext <- get.extension(save.name)
    filter.name <- dialog$getFilter()$getName()
    crs$projname <- save.name
    dialog$destroy()
  }
  else
  {
    dialog$destroy()
    return()
  }

  # 081111 Deal with the filename extension. We add an extension of
  # either rattle or Rdata (or other extensions that might be listed
  # in crv$project.extensions) if the save.name does not have one
  # already. The logic of which to add depends on whether one of the
  # filters is active, or else the first extension in the list
  # crv$project.extensions.

  if (tolower(save.ext) %notin% c(crv$project.extensions, "rdata"))
  {
    if (filter.name == Rtxt("Projects"))
    {
      if (save.ext != crv$project.extensions[1])
        save.name <- sprintf("%s.%s", save.name, crv$project.extensions[1])
    }
    else if (filter.name == Rtxt("RData Files"))
    {
      if (save.ext != "Rdata")
        save.name <- sprintf("%s.Rdata", save.name)
    }
    else
    {
      if (save.ext != crv$project.extensions[1])
        save.name <- sprintf("%s.%s", save.name, crv$project.extensions[1])
    }
  }
  
  # Save the filename to restore on reloading.

  crs$filename <- theWidget("data_filechooserbutton")$getUri()

  # 100609 Save the partition sizes for restoration.

  crs$partition <- theWidget("data_sample_entry")$getText()
  
  # Save all of the text views to be restored on a load.
  # Put the following into a function and call for each textview.

  crs$text$summary <- getTextviewContent("summary_textview")
  crs$text$correlation <- getTextviewContent("correlation_textview")
  crs$text$prcomp <- getTextviewContent("prcomp_textview")
  crs$text$kmeans <- getTextviewContent("kmeans_textview")
  crs$text$hclust <- getTextviewContent("hclust_textview")
  crs$text$rpart <-  getTextviewContent("rpart_textview")
  crs$text$rf <-  getTextviewContent("rf_textview")
  crs$text$esvm <-  getTextviewContent("esvm_textview")
  crs$text$ksvm <-  getTextviewContent("ksvm_textview")
  crs$text$glm <-  getTextviewContent("glm_textview")
  crs$text$ada <-  getTextviewContent("ada_textview")
  crs$text$nnet <-  getTextviewContent("nnet_textview")
  crs$text$survival <-  getTextviewContent("model_survival_textview")
  #crs$text$gbm <-  getTextviewContent("gbm_textview")
  crs$text$risk <- getTextviewContent("risk_textview")
  crs$text$roc <- getTextviewContent("roc_textview")
  crs$text$log <- getTextviewContent("log_textview")

  # Save Transform variables selections - not sure it is really
  # needed, but follow the template!

  crs$zero <- getSelectedVariables("zero")
  
  # Save Distribution variable selections

  crs$boxplot <- getSelectedVariables("boxplot")
  crs$hisplot <- getSelectedVariables("hisplot")
  crs$cumplot <- getSelectedVariables("cumplot")
  crs$benplot <- getSelectedVariables("benplot")
  crs$barplot <- getSelectedVariables("barplot")
  crs$dotplot <- getSelectedVariables("dotplot")

  # Save seed information

  crs$train.on <- theWidget("data_sample_checkbutton")$getActive()
  crs$train.seed <- theWidget("sample_seed_spinbutton")$getValue()
  crs$kmeans.seed <- theWidget("kmeans_seed_spinbutton")$getValue()
  
  # Save Model options

  if (not.null(crs$rpart))
  {
    crs$rpart.opt$priors <- theWidget("model_tree_priors_entry")$getText()
    crs$rpart.opt$loss   <- theWidget("model_tree_loss_entry")$getText()
    crs$rpart.opt$split  <- theWidget("rpart_minsplit_spinbutton")$getValue()
    crs$rpart.opt$depth  <- theWidget("rpart_maxdepth_spinbutton")$getValue()
    crs$rpart.opt$cp     <- theWidget("model_tree_cp_spinbutton")$getValue()
    crs$rpart.opt$bucket <- theWidget("rpart_minbucket_spinbutton")$getValue()
    crs$rpart.opt$miss   <- theWidget("model_tree_include_missing_checkbutton")$getActive()
  }

  if (not.null(crs$rf))
  {
    crs$rf.opt$trees     <- theWidget("rf_ntree_spinbutton")$getValue()
    crs$rf.opt$vars      <- theWidget("rf_mtry_spinbutton")$getValue()
    crs$rf.opt$sample    <- theWidget("model_rf_sample_entry")$getText()
    crs$rf.opt$proximity <- theWidget("rf_proximity_checkbutton")$getActive()
  }
    
  crs$svm.opt$kernel <- theWidget("svm_kernel_combobox")$getActive()

  set.cursor("watch")
  on.exit(set.cursor())
  startLog()
  appendLog(Rtxt("Save the project data (variable crs) to file."),
            sprintf('save(crs, file="%s", compress=TRUE)', save.name))
  save(crs, file=save.name, compress=TRUE)

  # Record the cwd for projects.
  
  crs$pwd <- dirname(save.name)
  
  setMainTitle(basename(save.name))
  setStatusBar(sprintf(Rtxt("The current project has been saved to '%s'"), save.name))
}

loadProject <- function()
{
  # Check if models exist and if so warn about losing the current project.

  if (not.null(listBuiltModels()))
  {
    if (! questionDialog(Rtxt("You have chosen to load a project.\n\n",
                              "This will clear the old project (dataset and",
                              "models) which may not have been saved.",
                              "If you choose not to continue you can save",
                              "the project, and then load the new project.",
                              "\n\n",
                              "Do you wish to continue, and overwrite the",
                              "current project?")))
      return()
  }

  # Request the rattle filename to be loaded

  dialog <- RGtk2::gtkFileChooserDialog(Rtxt("Open Project"), NULL, "open",
                                 "gtk-cancel", RGtk2::GtkResponseType["cancel"],
                                 "gtk-open", RGtk2::GtkResponseType["accept"])

  if (! is.null(crs$pwd)) dialog$setCurrentFolder(crs$pwd)

  if (length(crv$project.extensions))
  {
    ff <- RGtk2::gtkFileFilterNew()
    ff$setName(Rtxt("Projects"))
    lapply(paste("*.", crv$project.extensions, sep=""), ff$addPattern)
    dialog$addFilter(ff)
  }
  
  ff <- RGtk2::gtkFileFilterNew()
  ff$setName(Rtxt("RData Files"))
  ff$addPattern("*.RData")
  dialog$addFilter(ff)

  ff <- RGtk2::gtkFileFilterNew()
  ff$setName(Rtxt("All Files"))
  ff$addPattern("*")
  dialog$addFilter(ff)
  
  if (dialog$run() == RGtk2::GtkResponseType["accept"])
  {
    load.name <- dialog$getFilename()
    dialog$destroy()
  }
  else
  {
    dialog$destroy()
    return()
  }

  if (!file.exists(load.name))
    if (!questionDialog(sprintf(Rtxt("The project file '%s' does not exist?"),
                                load.name)))
      return()
  
  # Load the file.

  set.cursor("watch")
  on.exit(set.cursor())

  resetRattle()  # Seems appropriate to clear out the crs

  crv$NOTEBOOK$setCurrentPage(0)

  # 090317 Trying to figure out how to place the saved environment
  # into the crs environment. This seems to do the trick.

  ocrs <- crs
  load(load.name)
  for (o in objects(crs))
    assign(o, get(o, envir=crs), envir=ocrs)
  rm(crs)

  # Record the cwd for projects.
  
  crs$pwd <- dirname(load.name)

  # 101115 Record a project name if there is none.

  if (is.null(crs$projname)) crs$projname <- load.name
  
  # Now update all appropriate textviews and associated data.

  setMainTitle(basename(load.name))
  crv$DATA.DISPLAY.NOTEBOOK$setCurrentPage(crv$DATA.DISPLAY.TREEVIEW.TAB)
  
  # DATA

  # Reset the file chooser button. 090211 What should happen if the
  # file does not exist? This is most likely when the project comes
  # from another user or another system. Leaving it set as empty seems
  # to work in that we can make changes to the roles and they get
  # effected without trying to load the default dataset. 090317 Is
  # that still true? Also, I don't recall why I go for the basename if
  # it does not exist. Seems to make some sense. 120520 Take account
  # of the case where there is no filename stored as when an R Dataset
  # was loaded.
  
  if (! is.null(crs$filename))
  {
    if (file.exists(uri2file(crs$filename)))
      theWidget("data_filechooserbutton")$setUri(crs$filename)
    else
      crs$filename <- basename(crs$filename)
  }
  
  if (! is.null(crs$dwd) && ! file.exists(uri2file(crs$dwd)))
    crs$dwd <- ""

  # 100609 Restore partition sizes before we resetVariableRoles since
  # sampling is redone there. Do I also need to restore the seed to
  # the GUI here?

  if (is.null(crs$partition))
    theWidget("data_sample_entry")$setText("70/30")
  else
    theWidget("data_sample_entry")$setText(crs$partition)

  # 090402 Are these needed any more now we assign crs above? I don't
  # think so. Comment out all the following assignments as well.
  
#  crs$train      <- crs$train
#  crs$train.seed <- crs$train.seed

  # 100609 Check if crs$partition is null, and if so we assume an old
  # rattle project, so restore the sample size in the old
  # way. Eventually should be able to reomve this.
  
  if (is.null(crs$partition))
    if(crs$train.on)
    {
      nrows <- nrow(crs$dataset)
      srows <- length(crs$train)
      per <- 100*srows/nrows
      theWidget("data_sample_checkbutton")$setActive(TRUE)
      theWidget("sample_count_spinbutton")$setRange(1,nrows)
      theWidget("sample_count_spinbutton")$setValue(srows)
      if (not.null(crs$train.seed))
        theWidget("sample_seed_spinbutton")$setValue(crs$train.seed)
      else
        theWidget("sample_seed_spinbutton")$setValue(crv$seed)
      theWidget("sample_percentage_spinbutton")$setValue(per)
    }
    else
    {
      theWidget("data_sample_checkbutton")$setActive(FALSE)
    }
  else
  {
    theWidget("data_sample_checkbutton")$setActive(crs$train.on)
  }

  # Make sure we don't attempt to reload the file on executing the
  # Data tab, and thereby overwriting the current data, losing all of
  # the work already done on it. Set the modified time for the dataset
  # to be apparently now.

  crs$mtime <- Sys.time()

  # VARIABLES

  # Deal with the weights. This is either crs$dataset$VARIABLE or some
  # arbitrary formula. Need to distinguish and in the former to pass
  # the variable through to resetVariableRoles, and if the latter then
  # set the widget.

  if (not.null(crs$weights))
  {
    wname <- gsub("crs\\$dataset\\$", "", crs$weights)
    if (wname %in% colnames(crs$dataset))
    {
      theWidget("weight_entry")$setSensitive(FALSE)
    }
    else
    {
      theWidget("weight_entry")$setText(wname)
      #    the.weight <- sprintf("Weights: %s",weights.display)
      #    theWidget("model_tree_rpart_weights_label")$setText(the.weight)
      crs$weights <- crs$weights
      wname <- NULL
    }
  }
  else
    wname <- NULL

  resetVariableRoles(colnames(crs$dataset), nrow(crs$dataset),
                     crs$input, crs$target, crs$risk, crs$ident, crs$ignore,
                     wname,
                     crs$zero,
                     crs$boxplot, crs$hisplot, crs$cumplot, crs$benplot,
                     crs$barplot, crs$dotplot, resample=FALSE, autoroles=FALSE)
  executeSelectTab()
  resetTestTab()
  
  if (not.null(crs$risk))
    theWidget("evaluate_risk_label")$setText(crs$risk)

  # 080707 Ensure data sources are disabled so that we can not,
  # logically, load a dataset after we have loaded a project. This
  # also helps to ensure when we press the Execute button, a data set
  # is not thought to be needed to be loaded.

  enableDataSourceFunctions(FALSE)
  
  # Explore
  
  setTextviewContents("summary_textview", crs$text$summary)
  setTextviewContents("correlation_textview", crs$text$correlation)
  setTextviewContents("prcomp_textview", crs$text$prcomp)

  # TRANSFORM

#  crs$transforms <- crs$transforms
  
  # CLUSTER
  
#  crs$kmeans      <- crs$kmeans
#  crs$kmeans.seed <- crs$kmeans.seed
  if (not.null(crs$kmeans.seed))
    theWidget("kmeans_seed_spinbutton")$setValue(crs$kmeans.seed)
  else
    theWidget("kmeans_seed_spinbutton")$setValue(crv$seed)
  setTextviewContents("kmeans_textview", crs$text$kmeans)

  showModelKMeansExists()
  
#  crs$hclust   <- crs$hclust
  setTextviewContents("hclust_textview", crs$text$hclust)

  showModelHClustExists() # 100424 Enable appropriate widgets if hclust exists.
  
  # TODO - Heading toward using namespace rather than loading
  # libraries and interfering with user's environment - Bit by
  # bit. The current eval parse stuff was for display of the libray
  # command on Log but no longer should be used.

#  crs$page     <- crs$page
#  crs$smodel   <- crs$smodel

#  crs$rpart    <- crs$rpart
  setTextviewContents("rpart_textview", crs$text$rpart)
  if (not.null(crs$rpart)) eval(parse(text="library(rpart, quietly=TRUE)"))
  
#  crs$rf       <- crs$rf
  setTextviewContents("rf_textview", crs$text$rf)
  if (not.null(crs$rf)) eval(parse(text="library(randomForest, quietly=TRUE)"))

#  crs$svm      <- crs$svm
  setTextviewContents("esvm_textview", crs$text$esvm)
  if (not.null(crs$svm)) eval(parse(text="library(e1071, quietly=TRUE)"))

#  crs$ksvm     <- crs$ksvm
  setTextviewContents("ksvm_textview", crs$text$ksvm)
  if (not.null(crs$ksvm)) eval(parse(text="library(kernlab, quietly=TRUE)"))

#  crs$glm      <- crs$glm
  setTextviewContents("glm_textview", crs$text$glm)

  setTextviewContents("ada_textview", crs$text$ada)

  setTextviewContents("nnet_textview", crs$text$nnet)
  if (not.null(crs$nnet)) eval(parse(text="library(nnet, quietly=TRUE)"))

  setTextviewContents("model_survival_textview", crs$text$survival)
  if (not.null(crs$survival)) eval(parse(text="library(survival, quietly=TRUE)"))

  if (not.null(crs$rpart.opt$priors))
    theWidget("model_tree_priors_entry")$setText(crs$rpart.opt$priors)
  if (not.null(crs$rpart.opt$loss))
    theWidget("model_tree_loss_entry")$setText(crs$rpart.opt$loss)
  if (not.null(crs$rpart.opt$split))
    theWidget("rpart_minsplit_spinbutton")$setValue(crs$rpart.opt$split)
  if (not.null(crs$rpart.opt$depth))
    theWidget("rpart_maxdepth_spinbutton")$setValue(crs$rpart.opt$depth)
  if (not.null(crs$rpart.opt$cp))
    theWidget("model_tree_cp_spinbutton")$setValue(crs$rpart.opt$cp)
  if (not.null(crs$rpart.opt$bucket))
    theWidget("rpart_minbucket_spinbutton")$setValue(crs$rpart.opt$bucket)
  if (not.null(crs$rpart.opt$miss))
    theWidget("model_tree_include_missing_checkbutton")$setActive(crs$rpart.opt$miss)

  
  # Make buttons sensitive for MODEL:RPART if there is an RPART model
  
  showModelRPartExists()

  ## Make buttons sensitive for MODEL:ADA if there is an ADA model
  
  showModelAdaExists()

  if (not.null(crs$rf.opt$trees))
    theWidget("rf_ntree_spinbutton")$setValue(crs$rf.opt$trees)
  if (not.null(crs$rf.opt$vars))
    theWidget("rf_mtry_spinbutton")$setValue(crs$rf.opt$vars)
  if (not.null(crs$rf.opt$sample))
    theWidget("model_rf_sample_entry")$setText(crs$rf.opt$sample)
  if (not.null(crs$rf.opt$proximity))
    theWidget("rf_proximity_checkbutton")$setActive(crs$rf.opt$proximity)

  # Make buttons sensitive for MODEL:RF if there is an RF model

  showModelRFExists()
  
  if (not.null(crs$svm))
    theWidget("e1071_radiobutton")$setActive(TRUE)

  if (not.null(crs$svm.opt$kernel))
    theWidget("svm_kernel_combobox")$setActive(crs$svm.opt$kernel)

  # EVALUATE

  setTextviewContents("risk_textview", crs$text$risk)
  setTextviewContents("roc_textview", crs$text$roc )

  if (not.null(crs$testname))
  {
    theWidget("evaluate_filechooserbutton")$setFilename(crs$testname)
    theWidget("evaluate_csv_radiobutton")$setActive(TRUE)
  }
  
  
#  crs$perf     <- crs$perf
#  crs$eval     <- crs$eval
#  crs$testset  <- crs$testset
#  crs$testname <- crs$testname

  # Ensure the Evaluate options are reset appropriately. 091217 Why is
  # rattle::: being called directly?
  
  # rattle:::configureEvaluateTab()

  configureEvaluateTab()
  
  # LOG
  
  setTextviewContents("log_textview", crs$text$log)
  startLog()
  appendLog(Rtxt("Reload the project data (variable crs) from file."),
            sprintf('load("%s")', load.name))
  setStatusBar(sprintf(Rtxt("Project loaded from '%s'"), load.name))
}

Try the rattle package in your browser

Any scripts or data that you put into this service are public.

rattle documentation built on March 21, 2022, 5:06 p.m.