R/protein_bind.F.R

Defines functions protein_bind.F

protein_bind.F <-
function(Feat, SQuali, SQualiN){
  Item <- c("/allele=", "/bound_moiety=", "/citation=", "/db_xref=", "/experiment=", "/function=", "/gene=", "/gene_synonym=", "/inference=", "/locus_tag=", "/map=", "/note=", "/old_locus_tag=", "/operon=", "/standard_name=")
  ItemN <- c("allele", "bound_moiety", "citation", "db_xref", "experiment", "function", "gene", "gene_synonym", "inference", "locus_tag", "map", "note", "old_locus_tag", "operon", "standard_name")
  Feat[length(Feat)] <- gsub("\\\",$", "", Feat[length(Feat)])
  protein_bind <- data.frame("Location" = "protein_bind", "Qualifier" = gsub(".*protein_bind +([^.]+)\"*", "\\1", Feat[1], perl = T), stringsAsFactors = F)
  for(i in 2:length(Feat)){
    for(j in 1:length(Item)){
      if(length(grep(Item[j], Feat[i], perl = T)) == 1){
        protein_bind <- rbind(protein_bind, c(ItemN[j],  gsub(".*=([^.]+)\"*", "\\1", Feat[i])))
        if((length(grep("\\\\\"$|\"\\\", $|\\d$", Feat[i])) == 0 & i != length(Feat)) == T){
          t <- i+1
          while(length(grep("\\\\\"$|\"\\\", $|\\d$", Feat[t])) == 0 && t <= length(Feat)){
            protein_bind[dim(protein_bind)[1],2] <- paste(protein_bind[dim(protein_bind)[1],2], gsub("\\s", " ", Feat[t]), sep = " ")
            t <- t+1
          }
          if(length(grep("\\\\\"$|\"\\\", $|\\d$", Feat[t])) == 1){
            protein_bind[dim(protein_bind)[1],2] <- paste(protein_bind[dim(protein_bind)[1],2], gsub("\\s", " ", Feat[t]), sep = " ")
          }
        }
      }
    }
    for(k in 1:length(SQuali)){
      if(length(grep(SQuali[k], Feat[i], perl = T)) == 1){
        protein_bind <- rbind(protein_bind, c(SQuali[k], SQualiN[k]))
      }
    }
  }
  protein_bind <- apply(protein_bind, 2, function(x){gsub(" {2,}", " ", x, perl = TRUE)})
  protein_bind <- apply(protein_bind, 2, function(x){gsub("\"", "", x, fixed = T)})
  protein_bind <- apply(protein_bind, 2, function(x){gsub("\\", "", x, fixed = T)})
  protein_bind <- apply(protein_bind, 2, function(x){gsub("[^[:alnum:][:space:][]'.,:_<>()-]", "", x, perl = TRUE)})
  return(protein_bind)
}

Try the read.gb package in your browser

Any scripts or data that you put into this service are public.

read.gb documentation built on Sept. 6, 2021, 5:08 p.m.