# R/smtl.R
# In sMTL: Sparse Multi-Task Learning

# Documented in smtl

#' smtl: make model-fitting function
#'
#' @param y A numeric outcome vector (for multi-task/domain generalization problems) or a numeric outcome matrix (for multi-label problems)
#' @param X A matrix of covariates
#' @param study A vector of integers specifying task (or study/domain) ID. This should be set to NA for Multi-Label problems, but is required for Multi-Task and Domain Generalization problems.
#' @param s An integer specifying the sparsity level
#' @param commonSupp A boolean specifying whether to constrain solutions to have a common support
#' @param warmStart A boolean specifying whether a warm start model is fit internally before the final model. Warm starts improve solution quality but will be slower.
#' @param lambda_1 A numeric vector of ridge penalty hyperparameter values
#' @param lambda_2 A numeric vector of betaBar (to borrow strength across coefficient values) penalty hyperparameter values
#' @param lambda_z A numeric vector of zBar (to borrow strength across coefficient supports) penalty hyperparameter values
#' @param scale A boolean specifying whether to center and scale covariates before model fitting (either way coefficient estimates are returned on original scale before centering/scaling)
#' @param maxIter An integer specifying the maximum number of coordinate descent iterations
#' @param LocSrch_maxIter An integer specifying the number of maximum local search iterations
#' @param independent.regs A boolean specifying whether to fit independent regressions (instead of multi-task). This ensures there is NO information sharing via active sets or penalties
#' @param model A boolean indicating whether to return design matrix and outcome vector
#' @param messageInd A boolean specifying whether to include messages (verbose)
#' @return A list (object of S3 class). \item{beta}{ Matrix with coefficient estimates where column j are estimates from task j.}
#' \item{reg_type}{ String specifying whether model is \code{"multiStudy"} denoting that there is a separate design matrix for each task, \code{"multiLabel"} where the design matrix is the same 
#' across tasks and \code{"L0"} indicating a single-task regression.} \item{K}{ Integer that indicates number of tasks.} \item{s}{ An integer that indicates sparsity level.} \item{commonSupp}{ Boolean 
#' indicating if supports are common across tasks.} \item{warmStart}{ A Boolean indicating whether to fit a MTL model as a warm start.} \item{grid}{ A dataframe including grid of hyperparameters that model
#' is fit on.} \item{maxIter}{ An integer specifying the maximum number of iterations of block CD.} \item{LocSrch_maxIter}{ An integer specifying the maximum number of iterations of local search.}
#' \item{independent.regs}{ A boolean indicating whether to make each task independent of each other (no shared active sets).} \item{AS_multiplier}{ An integer specifying the active set multiplier.} 
#' \item{X_train}{ A Matrix: the design matrix (row concatenated across tasks).} \item{y_train}{ The outcome vector or matrix.}
#' @examples
#' 
#' \dontrun{
#' 
#' if (identical(Sys.getenv("AUTO_JULIA_INSTALL"), "true")) { ## The examples are quite time consuming
#' ## Do initialization and automatic installation if necessary
#'
#' # load package
#' library(sMTL)
#' smtl_setup()
#' 
#' #####################################################################################
#' ##### simulate data
#' #####################################################################################
#' set.seed(1) # fix the seed to get a reproducible result
#' K <- 4 # number of datasets 
#' p <- 100 # covariate dimension
#' s <- 5 # support size
#' q <- 7 # size of subset of covariates that can be non-zero for any task
#' n_k <- 50 # task sample size
#' N <- n_k * K # full dataset sample size
#' X <- matrix( rnorm(N * p), nrow = N, ncol=p) # full design matrix
#' B <- matrix(1 + rnorm(K * (p+1) ), nrow = p + 1, ncol = K) # betas before making sparse
#' Z <- matrix(0, nrow = p, ncol = K) # matrix of supports
#' y <- vector(length = N) # outcome vector
#' 
#' # randomly sample support to make betas sparse
#' for(j in 1:K)     Z[1:q, j] <- sample( c( rep(1,s), rep(0, q - s) ), q, replace = FALSE )
#' B[-1,] <- B[-1,] * Z # make betas sparse and ensure all models have an intercept
#' 
#' task <- rep(1:K, each = n_k) # vector of task labels (indices)
#' 
#' # iterate through and make each task specific dataset
#' for(j in 1:K){
#'     indx <- which(task == j) # indices of task
#'     e <- rnorm(n_k)
#'     y[indx] <- B[1, j] + X[indx,] %*% B[-1,j] + e
#'     }
#'     colnames(B) <- paste0("beta_", 1:K)
#'     rownames(B) <- paste0("X_", 1:(p+1))
#'     
#'     print("Betas")
#'     print(round(B[1:8,],2))
#'     
#' #####################################################################################
#' ##### fit Multi-Task Learning Model for Heterogeneous Support
#' #####################################################################################
#'   
#'     mod <- sMTL::smtl(y = y, 
#'                       X = X, 
#'                       study = task, 
#'                       s = 5, 
#'                       commonSupp = FALSE,
#'                       lambda_1 = 0.001,
#'                       lambda_2 = 0,
#'                       lambda_z = 0.25)
#'     
#'     print(round(mod$beta[1:8,],2))
#'     
#'     # make predictions
#'     preds <- sMTL::predict(model = mod, X = X[1:5,])
#'     
#' #####################################################################################
#' ##### fit Multi-Task Learning Model for Common Support
#' #####################################################################################
#'     library(sMTL)
#'     sMTL::smtl_setup(path = "/Applications/Julia-1.5.app/Contents/Resources/julia/bin")
#'     mod <- sMTL::smtl(y = y, 
#'                       X = X, 
#'                       study = task, 
#'                       s = 5, 
#'                       commonSupp = TRUE,
#'                       lambda_1 = 0.001,
#'                       lambda_2 = 0.5)
#'     
#'     print(round(mod$beta[1:8,],2))
#'     }
#'     }
#'     
#' @import JuliaConnectoR
#' @export

smtl <- function(y,
                 X,
                 study = NA,
                 s,
                 commonSupp = FALSE,
                 warmStart = TRUE,
                 lambda_1 = 0,
                 lambda_2 = 0,
                 lambda_z = 0,
                 scale = TRUE,
                 maxIter = 10000,
                 LocSrch_maxIter = 50,
                 messageInd = TRUE,
                 model = TRUE,
                 independent.regs = FALSE # shared active sets
                 ) {

    # Fit a sparsity-constrained regression by calling one of the package's
    # Julia solvers through JuliaConnectoR.
    #
    # The problem type is derived from the inputs:
    #   * y is a matrix with > 1 column         -> "multiLabel" (K = ncol(y))
    #   * y is a vector and `study` has no NA   -> "multiStudy" (K = number of distinct labels)
    #   * y is a vector and `study` contains NA -> "L0"         (K = 1)
    #
    # `warmStart` is either TRUE/FALSE (TRUE: fit a preliminary model with a
    # larger support, min(AS_multiplier * s, p), and use its coefficients as
    # the starting point) or a numeric matrix with ncol(X) + 1 rows and K
    # columns that is used directly as the starting point.
    #
    # Returns a list holding the fitted coefficients (`beta`, rows named
    # "Intercept", "V1", ... and columns "beta_1", ...), the settings used, and,
    # when `model` is TRUE, the training data (`X_train`, `y_train`).

    ###################
    # sanity checks
    ###################
    np <- dim(X)

    # `||` short-circuits, so an X without two dimensions (e.g. a plain vector)
    # reaches this stop() instead of failing on a zero-length `if` condition
    if (length(np) < 2L || np[2] <= 1) {
        stop("X should be a matrix with 2 or more columns")
    }
    nobs <- as.integer(np[1])
    p <- as.integer(np[2])

    dimy <- dim(y)
    nrowy <- if (is.null(dimy)) length(y) else dimy[1]
    if (nrowy != nobs) {
        stop(paste0("number of observations in y (", nrowy,
                    ") not equal to the number of rows of x (", nobs, ")"))
    }

    if (!is.numeric(s) || length(s) == 0L || anyNA(s)) {
        stop("s must be a non-missing integer sparsity level")
    }

    convex_flag <- FALSE # indicator of whether s >= p

    if (any(s >= p)) {

        message(paste0("s (", s, ") (support size), is >= number of covaraites (", p, "). s is set to p. commonSupp set to TRUE. Solving non-sparse convex problem."))
        s <- p # set to p
        commonSupp <- TRUE
        lambda_z <- 0 # cannot have convex version and lambda_z > 0
        convex_flag <- TRUE
        LocSrch_maxIter <- 0 # no local search
        independent.regs <- FALSE # cannot be independent
    }

    maxIter <- round(maxIter)

    # Only the first value is ever used (it is recycled over the tuning grid
    # below), so reduce to a scalar first to keep the checks scalar-safe.
    LocSrch_maxIter <- if (length(LocSrch_maxIter) > 0L) LocSrch_maxIter[1] else NA
    if (is.numeric(LocSrch_maxIter)) LocSrch_maxIter <- as.integer(round(LocSrch_maxIter))
    if (is.na(LocSrch_maxIter)) LocSrch_maxIter <- 0L

    if (!is.integer(LocSrch_maxIter) || LocSrch_maxIter < 0) {
        message("LocSrch_maxIter must be an integer >= 0. We set it to default")
        LocSrch_maxIter <- 50L
    }

    AS_multiplier <- 3 # warm start multiplier for number of non-zeros

    ###################
    # problem type
    ###################
    reg_type <- NULL
    K <- NULL

    if (is.matrix(y)) {

        if (any(apply(y, 2, stats::var) == 0)) stop("At least one task's y is constant")

        if (ncol(y) > 1) {
            reg_type <- "multiLabel"
            K <- ncol(y)
        } else {
            # a single column is treated as a plain outcome vector
            y <- as.numeric(y)
        }
    }

    if (is.vector(y)) {

        if (stats::var(y) == 0) stop("y is constant")

        if (anyNA(study)) {
            # no task labels: single-task L0 problem
            reg_type <- "L0"
            K <- 1
        } else {
            if (length(study) != nobs) {
                stop("study must have one entry for each row of X")
            }
            reg_type <- "multiStudy"
            study <- as.integer(as.factor(study))
            K <- length(unique(study))
        }
    }

    # without this, an unsupported y only failed later with
    # "object 'reg_type' not found"
    if (is.null(reg_type)) {
        stop("y must be a numeric vector or a numeric matrix")
    }

    #####################
    # order tuning values
    #####################
    # treat missing penalties as "no penalty"
    lambda_1[is.na(lambda_1)] <- 0
    lambda_2[is.na(lambda_2)] <- 0
    lambda_z[is.na(lambda_z)] <- 0

    gridLen <- max(length(lambda_1), length(lambda_2), length(lambda_z))

    # a single value is repeated over the whole grid
    if (length(lambda_1) == 1) lambda_1 <- rep(lambda_1, gridLen)
    if (length(lambda_2) == 1) lambda_2 <- rep(lambda_2, gridLen)
    if (length(lambda_z) == 1) lambda_z <- rep(lambda_z, gridLen)

    lambda_lengths <- c(length(lambda_1), length(lambda_2), length(lambda_z))
    if (length(unique(lambda_lengths)) != 1L) {
        stop("Lengths of vectors lambda_1, lambda_2 and lambda_z must be of the same length")
    }

    grid <- data.frame(lambda_1 = lambda_1,
                       lambda_2 = lambda_2,
                       lambda_z = lambda_z)

    # lambda_1 descending; lambda_2 and lambda_z ascending within ties
    grid <- grid[order(grid$lambda_1,
                       -grid$lambda_2,
                       -grid$lambda_z,
                       decreasing = TRUE), ]

    # Add a small ridge penalty to EVERY row that has neither a ridge nor a
    # betaBar penalty, to ensure a unique solution. (The previous condition
    # `length(sp_index) > 1` skipped the case of exactly one such row, which
    # includes the default call.)
    unpenalised <- grid$lambda_1 == 0 & grid$lambda_2 == 0
    grid$lambda_1[unpenalised] <- 1e-7

    lambda_1 <- grid$lambda_1
    lambda_2 <- grid$lambda_2
    lambda_z <- grid$lambda_z

    # one local-search setting per grid row
    LocSrch_maxIter <- rep(LocSrch_maxIter, nrow(grid))

    #####################
    # return object
    #####################
    fit_list <- list(beta = NA,
                     reg_type = reg_type,
                     K = K,
                     s = s,
                     commonSupp = commonSupp,
                     warmStart = warmStart,
                     grid = grid,
                     scale = scale,
                     maxIter = maxIter,
                     LocSrch_maxIter = LocSrch_maxIter,
                     independent.regs = independent.regs,
                     AS_multiplier = AS_multiplier)

    if (model) {
        fit_list$X_train <- X
        fit_list$y_train <- y
    }

    #####################
    # starting coefficients
    #####################
    n_coef <- p + 1L # intercept + one coefficient per column of X

    if (is.numeric(warmStart) && length(warmStart) > 1L) {
        # user-supplied starting coefficients: use them as-is, no internal warm start
        b <- as.matrix(warmStart)
        if (!identical(dim(b), c(n_coef, as.integer(K)))) {
            stop("warmStart must be TRUE, FALSE, or a numeric matrix of starting coefficients with ncol(X) + 1 rows and one column per task")
        }
        run_warm <- FALSE
    } else {
        # TRUE, FALSE and NA all start from zeros; only TRUE triggers the
        # internal warm-start fit (FALSE used to leave `b` undefined)
        b <- matrix(0, nrow = n_coef, ncol = K)
        run_warm <- isTRUE(as.logical(warmStart))
    }

    # the warm start uses a larger support, which is meaningless once s == p
    run_warm <- run_warm && !convex_flag

    #####################
    # pick and load the Julia solver
    #####################
    spec <- .smtl_solver_spec(
        reg_type = reg_type,
        commonSupp = isTRUE(as.logical(commonSupp)),
        sparse_no_bar = !any(lambda_2 > 0) && !convex_flag,
        separate_AS = isTRUE(as.logical(independent.regs)) &&
            all(lambda_2 == 0) && all(lambda_z == 0)
    )

    solver <- if (exists(spec$cache, mode = "function")) {
        # keep honouring a solver that is already visible under its
        # conventional name (as the original `exists()` checks did)
        get(spec$cache, mode = "function")
    } else {
        # system.file() only queries the installed package. The previous
        # `.libPaths("sMTL")` call *reset* the library search path as a side
        # effect and could return several paths.
        julia_dir <- system.file("julia", package = "sMTL")
        if (!nzchar(julia_dir)) {
            stop("Could not locate the Julia source files of the sMTL package")
        }
        JuliaConnectoR::juliaCall("include", file.path(julia_dir, spec$file))
    }

    X_jl <- as.matrix(X)
    y_jl <- if (reg_type == "multiLabel") as.matrix(y) else as.numeric(y)

    # Assemble the named arguments for the selected solver and call it.
    call_solver <- function(beta0, rho, l1, l2, lz, n_iter, n_local) {
        args <- list(X = X_jl, y = y_jl, rho = as.integer(rho))
        if (reg_type == "multiStudy") args$study <- as.integer(study)
        if (reg_type == "multiLabel") args$study <- NA # tasks are the columns of y
        args$beta <- as.matrix(beta0)
        if (spec$penalties == "lambda") {
            args$lambda <- as.numeric(l1)
        } else {
            args$lambda1 <- as.numeric(l1)
            args$lambda2 <- as.numeric(l2)
            if (spec$penalties == "lambda12z") args$lambda_z <- as.numeric(lz)
        }
        args$scale <- scale
        args$maxIter <- as.integer(n_iter)
        args$localIter <- as.integer(n_local)
        do.call(solver, args)
    }

    #####################
    # fit
    #####################
    if (run_warm) {

        if (messageInd) message("Warm Start Model Running")

        # larger support, strongest ridge penalty, no sharing penalties,
        # no local search
        b <- call_solver(beta0 = b,
                         rho = min(AS_multiplier * s, p),
                         l1 = max(lambda_1),
                         l2 = 0,
                         lz = 0,
                         n_iter = 500,
                         n_local = 0)
    }

    if (messageInd) message(spec$label)

    beta <- call_solver(beta0 = b,
                        rho = s,
                        l1 = lambda_1,
                        l2 = lambda_2,
                        lz = lambda_z,
                        n_iter = maxIter,
                        n_local = LocSrch_maxIter)

    dimnames(beta)[[2]] <- paste0("beta_", seq_len(dim(beta)[[2]])) # rename columns
    dimnames(beta)[[1]] <- c("Intercept", paste0("V", seq_len(dim(beta)[[1]] - 1))) # rename rows

    fit_list$beta <- beta
    fit_list
}

# Describe the Julia solver to use for a given problem configuration.
#
# reg_type      "L0", "multiStudy" or "multiLabel"
# commonSupp    TRUE when all tasks are constrained to share one support
# sparse_no_bar TRUE when no betaBar penalty is requested and s < p
# separate_AS   TRUE when independent regressions without sharing penalties
#               were requested
#
# Returns a list with the Julia source file (`file`), the name under which an
# already-loaded solver is looked up (`cache`), the penalty arguments the
# solver takes (`penalties`: "lambda", "lambda12" or "lambda12z") and the
# progress message (`label`).
.smtl_solver_spec <- function(reg_type, commonSupp, sparse_no_bar, separate_AS) {

    if (reg_type == "L0") {
        return(list(file = "l0_IHT_tune.jl",
                    cache = "L0_reg",
                    penalties = "lambda",
                    label = "Single L0 Regression"))
    }

    multi_label <- reg_type == "multiLabel"
    pick <- function(multi_study_value, multi_label_value) {
        if (multi_label) multi_label_value else multi_study_value
    }

    if (commonSupp) {
        if (sparse_no_bar) {
            # none have betaBar penalty
            list(file = pick("BlockIHT_tune.jl", "BlockIHT_tune_MT.jl"),
                 cache = pick("L0_MS", "L0_MS_MT"),
                 penalties = "lambda",
                 label = pick("Common Support Multi-Study",
                              "Common Support Multi-Label"))
        } else {
            # some have betaBar penalty or s == p
            list(file = pick("BlockComIHT_tune.jl", "BlockComIHT_tune_MT.jl"),
                 cache = pick("L0_MS2", "L0_MS2_MT"),
                 penalties = "lambda12",
                 label = pick("Common Support Multi-Study with Beta-Bar Penalty",
                              "Common Support Multi-Label with Beta-Bar Penalty"))
        }
    } else if (separate_AS) {
        # separate active sets for each task
        list(file = pick("BlockComIHT_inexact_diffAS_tuneTest.jl",
                         "BlockComIHT_inexact_diffAS_tuneTest_MT.jl"),
             cache = pick("L0_MS_z3", "L0_MS_z3_MT"),
             penalties = "lambda12z",
             label = pick("Heterogeneous Support Multi-Study with Separate Active Sets",
                          "Heterogeneous Support Multi-Label with Separate Active Sets"))
    } else {
        # shared active sets OR sharing penalties
        list(file = pick("BlockComIHT_inexactAS_tune_old.jl",
                         "BlockComIHT_inexactAS_tune_old_MT.jl"),
             cache = pick("L0_MS_z", "L0_MS_z_MT"),
             penalties = "lambda12z",
             label = pick("Heterogeneous Support Multi-Study",
                          "Heterogeneous Support Multi-Label"))
    }
}