geneSummary: Summarize GEOquery data

Documented in filterTbl

#'Filter Data Tables
#'
#'@description Returns the row indice of the corresponding values to the input.
#'
#'@usage filterTbl(tbl, type, long = FALSE, var, input)
#'
#'@author Nicholas Hutson
#'
#'@examples data <- getGEO("GSE443452")
#'geneSymbol <- "TP53"
#'long <- TRUE
#'tbl <- extExp(data, geneSymbol, long)
#'filterTbl(tbl, "Gene Expression", geneSymbol, long)
#'
#'@export

filterTbl <- function(tbl, type, long = FALSE, var, input){ #OUTPUT ROW INDICES OR 0

  y <- match(var,colnames(tbl))
  y <- y[!is.na(y)]
  w <- colnames(tbl)[y]

  #browser()

  x <- which(input!="",arr.ind = TRUE)
  y <- data.frame(tbl[,y])
  #get rid of all empty inputs
  y <- data.frame(y[,x])
  colnames(y) <- w[x]
  z <- input[x]

    if(type == "Gene Expression" & long == FALSE){
      #check if y input is not the first 2 column names of tbl
      #if so, search for rows where the sample gene expression fits the inputted logical expression
      #going to have to compare row indexes or logical vector with z vector
      if(identical(z,character(0))){
        z <- 0
      }else{

        browser()

        a <- which(colnames(y) %in% colnames(tbl)[1:2], arr.ind = TRUE)#finds symbol and id inputs where there are inputs3

        if(!identical(a, integer(0))){
          y1 <- data.frame(y[,a])
          z1 <- z[a]

          z1 <- unlist(strsplit(z1,", ",fixed = TRUE)) #split up comma deliminated inputs

          i <- 1:length(z1)
          if(length(i)>1){
            z1 <- unlist(lapply(i, function(a){
              row.match(z1[a], y1)
            }))
          }else{
            z1 <- row.match(z1, y1)
          }

          #browser()

          y2 <- as.character(y[,-a])
          len <- dim(data.frame(y[,-a]))[2] #different way to find the number of elements
          z2 <- z[-a] #remove ID and Symbol rows
        }else{ #runs when none of the filters are ID or Symbol filters
          y2 <- y
          len <- dim(y)[2]
          z2 <- z
        }

        #browser()

        #ifelse statements to determine the correct rows to output
        if(!exists("z1")){
          if(len > 1 | len == 0){
            b <- list()
            for(i in 1:len){
              b[i] <- paste(as.character(y2[i]), z2[i])
              b[i] <- parse(text = b[i])
            }
            z <- which(apply(data.frame(b),1,all)==TRUE, arr.ind = TRUE) #false when there's any false
          }else{
            b <- paste(y2, z2) #should be like "y >4"
            b <- parse(text = b)
            #need to have row indice output
            z <- which(unlist(lapply(b,eval))==TRUE, arr.ind = TRUE)
          }
        }else{
          if(identical(z2,character(0))){
            z <- z1
          }else if(len > 1){
            b <- list()
            for(i in 1:len){
              b[i] <- paste(as.character(y2[i]), z2[i])
              b[i] <- parse(text = b[i])
            }
            z2 <- which(apply(data.frame(b),1,all)==TRUE, arr.ind = TRUE) #false when there's any false
            #now compare row indices
            if(z1 %in% z2){
              z <- z1
            }else{
              z <- 0
            }
          }else{
            b <- paste(y2, z2)
            b <- parse(text = b)
            #need to have row indice output
            z2 <- which(unlist(lapply(b,eval))==TRUE, arr.ind = TRUE)
            #now compare row indices
            if(z1 %in% z2){
              z <- z1
            }else{
              z <- 0
            }
          }
        }
      } #should output the row indices for matching "Symbol" and "ID" inputs
    }else if(type == "Gene Expression" & long==TRUE){
      #browser()
      if(identical(z,character(0))){
        z <- 0
      }else{

        zprime <- z

        i <- 1:length(z)
        z1 <- list()

        z <- lapply(i, function(a){ #try to get list of split character vectors
          unlist(strsplit(zprime[a],", ",fixed = TRUE))
          })
        z <- lapply(i, function(a){
          j <- length(z[a])
          z1[a] <- lapply(j, function(b){ #create list of true row indices
            which(z[a][[b]]==y[,a], arr.ind = TRUE)
          })
          reduce(z1[a], intersect)
        })

        #have to do an intersect for each element of the list, and then the list overall
        z <- reduce(z, intersect)
      }
    }else{
      if(identical(z,character(0))){
        z <- 0
      }else{
        z <- data.frame(strsplit(z,", ",fixed = TRUE)[[1]])
        z <- row.match(z, y) #find the matching row indices
      }
    }
  return(z)
}