R/HierAr_updated.R
In HierDpart: Partitioning Hierarchical Diversity and Differentiation Across Metrics and Scales, from Genes to Ecosystems

Documented in HierAr

HierAr=function(x, nreg, r, ncode) {
  read.genepop1 <- function(file, ncode, quiet = FALSE) {
    #require(adegenet)
    adegenet::.readExt
    adegenet::.genlab
    adegenet::df2genind
    adegenet::is.genind
    adegenet::pop
    adegenet::repool
    adegenet::Hs
    adegenet::seppop
    adegenet::popNames
    if (toupper(.readExt(file)) != "GEN")
      stop("File extension .gen expected")
    if (!quiet)
      cat("\n Converting data from a Genepop .gen file to a genind object... \n\n")
    prevcall <- match.call()
    txt <- scan(file, sep = "\n", what = "character", quiet = TRUE)
    if (!quiet)
      cat("\nFile description: ", txt[1], "\n")
    txt <- txt[-1]
    txt <- gsub("\t", " ", txt)
    NA.char <- paste(rep("0", ncode), collapse = "")
    locinfo.idx <- 1:(min(grep("POP", toupper(txt))) - 1)
    locinfo <- txt[locinfo.idx]
    locinfo <- paste(locinfo, collapse = ",")
    loc.names <- unlist(strsplit(locinfo, "([,]|[\n])+"))
    loc.names <- trimws(loc.names)
    nloc <- length(loc.names)
    txt <- txt[-locinfo.idx]
    pop.idx <- grep("^([[:space:]]*)POP([[:space:]]*)$", toupper(txt))
    npop <- length(pop.idx)
    nocomma <- which(!(1:length(txt)) %in% grep(",", txt))
    splited <- nocomma[which(!nocomma %in% pop.idx)]
    if (length(splited) > 0) {
      for (i in sort(splited, decreasing = TRUE)) {
        txt[i - 1] <- paste(txt[i - 1], txt[i], sep = " ")
      }
      txt <- txt[-splited]
    }
    pop.idx <- grep("^([[:space:]]*)POP([[:space:]]*)$", toupper(txt))
    txt[length(txt) + 1] <- "POP"
    nind.bypop <- diff(grep("^([[:space:]]*)POP([[:space:]]*)$", toupper(txt))) - 1
    pop <- factor(rep(1:npop, nind.bypop))
    txt <- txt[-c(pop.idx, length(txt))]
    temp <- sapply(1:length(txt), function(i) strsplit(txt[i], ","))
    ind.names <- vapply(temp, function(e) e[1], character(1))
    ind.names <- trimws(ind.names)
    vec.genot <- vapply(temp, function(e) e[2], character(1))
    vec.genot <- trimws(vec.genot)
    X <- matrix(unlist(strsplit(vec.genot, "[[:space:]]+")), ncol = nloc, byrow = TRUE)
    if (any(duplicated(ind.names))) {
      rownames(X) <- .genlab("", nrow(X))
    } else {
      rownames(X) <- ind.names
    }
    colnames(X) <- loc.names
    pop.names.idx <- cumsum(table(pop))
    pop.names <- ind.names[pop.names.idx]
    levels(pop) <- pop.names
    if (!all(unique(nchar(X)) == (ncode * 2)))
      stop(paste("some alleles are not encoded with", ncode, "characters\nCheck 'ncode' argument"))
    res <- df2genind(X = X, pop = as.character(pop), ploidy = 2, ncode = ncode, NA.char = NA.char)
    res@call <- prevcall
    if (!quiet)
      cat("\n...done.\n\n")
    return(res)
  }

  genfiles = read.genepop1(x, ncode, quiet = TRUE)  # covert the genepop #files to genind files, we can also use read.genpop from adegent package
  hierfstat::genind2hierfstat
  hfiles <- genind2hierfstat(genfiles)  # convert into hieformat
  sampsize = summary(genfiles$pop)
  ## Here we add our hierchical information (regions-pops) to the data
 # requireNamespace("dplyr")
  npops = length(levels(genfiles$pop))
  # sampsize=length(genfiles@pop)/length(levels(genfiles$pop)) ## sample size for identical pop size
  if (length(r) != nreg)
    stop("Number of regions should be equal to the number defined in the level")  ## number of pops per region
  if (sum(r) != npops)
    stop("Number of pops should be equal to the number defined in level")
  ## modifying the strata information
  popr = list()
  rsample = list()
  for (i in 1:nreg) {
    popr[[i]] = list()
    popr[[i]] = as.factor(rep(paste("pop", i), times = sum(sampsize[(sum(head(r, i - 1)) + 1):(sum(head(r, i)))])))  ### be aware that times depend on the sample size and str on your data
    rsample[[i]] = sum(sampsize[(sum(head(r, i - 1)) + 1):(sum(head(r, i)))])
  }
  popeco = as.factor(rep("ecosystem", times = length(genfiles$pop)))  ### here sample size * total numbe of pops
  rsample = as.data.frame(rsample)
  rsample = as.numeric(unlist(rsample))
  region = list()
  for (i in seq_along(r)) {
    region[[i]] = list()
    region[[i]] = hfiles[(sum(head(rsample, i - 1)) + 1):(sum(head(rsample, i))), ]
    region[[i]]$pop = factor(region[[i]]$pop)
  }
  ### we have already delimited the region in above section (hie He), we just change the pop factors in the regions
  ### and ecosystems create lists to copy the above files into new files, so that avoid confusion and error

  arregion = list()  # these lists are used yto store the original data
  hierar = list()  # these lists are used yto store the Ar: allelic richness
  hierarav = list()
  ## we enter a loop to pool pops ##
  arecosystem = hfiles
  arecosystem$pop = factor(popeco)
  hierfstat::allelic.richness
  for (i in seq_along(r)) {
    arregion[[i]] = region[[i]]
    arregion[[i]]$pop = factor(popr[[i]])  ### This way is to drop the levels from 16 pops to the current levels, like nowlevelr1=c('pop1','pop2','pop3','pop4')

    hierar[[i]] = list()
    hierarav[[i]] = list()
    ## geting allelic richness per loci and per pops/region
    hierar[[i]] = allelic.richness(arregion[[i]], min.n = NULL, diploid = TRUE)$Ar
    ### average allele richness over loci
    hierarav[[i]] = colMeans(hierar[[i]])
  }
  hierar_reg=do.call(cbind, lapply(hierar, data.frame))
  colnames(hierar_reg) = c(paste("Ar_region", 1:nreg))
  hierAr_R = do.call(cbind, lapply(hierarav, data.frame))
  hierAr_Rav = rowMeans(hierAr_R)
  hierarpop = allelic.richness(hfiles, min.n = NULL, diploid = TRUE)$Ar
  hierarpopav = colMeans(hierarpop)
  Arpopav = mean(hierarpopav)
  hierareco = allelic.richness(arecosystem, min.n = NULL, diploid = TRUE)$Ar
  hierarecoav = colMeans(hierareco)
  hierAr = cbind(hierarecoav, hierAr_Rav, Arpopav)
  colnames(hierAr) = c("Art", "Arr", "Arp")
  colnames(hierarpop) = c(paste("Arpop", 1:npops))
  colnames(hierAr_R) = c(paste("Ar_region", 1:nreg))
  return(list(Ar_pop = hierarpop,Hierareco=hierareco, Ar_reg = hierAr_R,Hierar_loc=hierar_reg, Ar_ovell = hierAr))
}

Any scripts or data that you put into this service are public.

HierDpart documentation built on March 31, 2021, 5:09 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

HierDpart
Partitioning Hierarchical Diversity and Differentiation Across Metrics and Scales, from Genes to Ecosystems

R/HierAr_updated.R
In HierDpart: Partitioning Hierarchical Diversity and Differentiation Across Metrics and Scales, from Genes to Ecosystems

Defines functions HierAr

Documented in HierAr

Try the HierDpart package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

HierDpart Partitioning Hierarchical Diversity and Differentiation Across Metrics and Scales, from Genes to Ecosystems

R/HierAr_updated.R In HierDpart: Partitioning Hierarchical Diversity and Differentiation Across Metrics and Scales, from Genes to Ecosystems

Defines functions HierAr

Documented in HierAr

Try the HierDpart package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

HierDpart
Partitioning Hierarchical Diversity and Differentiation Across Metrics and Scales, from Genes to Ecosystems

R/HierAr_updated.R
In HierDpart: Partitioning Hierarchical Diversity and Differentiation Across Metrics and Scales, from Genes to Ecosystems