R/fmcsBatch.R

Defines functions fmcsBatch

Documented in fmcsBatch

########################
## fmcsBatch Function ##
########################
.packageName <- 'fmcsR'

fmcsBatch <-
function(querySdf, sdfset, al = 0, au = 0, bl = 0, bu = 0, 
			matching.mode = "static",timeout=60000,numParallel=1) {

    if(class(querySdf)=="SDFset") querySdf <- querySdf[[1]]
    al = as.integer(al) 
    au = as.integer(au) 
    bl = as.integer(bl) 
    bu = as.integer(bu) 
    
    if (matching.mode == "static") {
        matching.int = 0
    } else if (matching.mode == "aromatic") {
        matching.int = 1
    } else if (matching.mode == "ring") {
        matching.int = 2
    } else {
        stop("matching.mode needs to be static, aromatic, or ring.")
    }
    
    matching.int = as.integer(matching.int)
    
    s1 <- as(querySdf, "character") 
    s1 <- paste(s1, collapse="\n")
    
    targetSize <- numeric(length(sdfset))
    mcsSize <- numeric(length(sdfset))

	 score = function(targetSdf){
		  library(ChemmineR)
		  library(fmcsR)
		  #print(sdfid(targetSdf))
        s2 <- as(targetSdf, "character")
        s2 <- paste(s2, collapse="\n")
		  warningCount <- 0
        
		  suppressWarnings(
			  withCallingHandlers(
				  result_data <- 
				  .C('fmcs_R_wrap', s1, s2, al, au, bl, bu, 
						matching.int, as.integer(0), as.integer(timeout), 
						sdfOne="", sdfTwo="",
						sdf1Size = "", sdf2Size = "", mcsSize = "", PACKAGE = 'fmcsR')
				  , warning = function(w) warningCount <<- warningCount + 1))
     
		  data.frame(querySize  = as.integer(result_data$sdf1Size),
				 targetSize = as.integer(result_data$sdf2Size),
				 mcsSize    = as.integer(result_data$mcsSize),
				 warningCount = warningCount) 
	 }
	 environment(score) =  new.env(parent=globalenv())

	 cl = makeCluster(numParallel,outfile="")
	 clusterExport(cl,c("matching.int","timeout","s1","al","au","bl","bu"),
						envir=environment())

	 results = Reduce(rbind,clusterApplyLB(cl,sdfset,score))
	 stopCluster(cl)

	 querySize = results$querySize[1]
	 targetSize = results$targetSize
	 mcsSize = results$mcsSize
	 warningCount = sum(results$warningCount)

    
    minsize <- ifelse(querySize < targetSize, querySize, targetSize)
    tanimoto <- mcsSize/(querySize + targetSize - mcsSize)
    overlap <- mcsSize/minsize
    searchMA <- cbind(Query_Size = querySize, Target_Size = targetSize, MCS_Size = mcsSize, Tanimoto_Coefficient = tanimoto, Overlap_Coefficient = overlap) 
    rownames(searchMA) <- cid(sdfset)

	 if(warningCount != 0)
		 warning(warningCount," comparisons exeeded the timeout of ",
					timeout,"ms and did not complete")
    return(searchMA)
}
girke-lab/fmcsR documentation built on May 17, 2019, 5:27 a.m.