R/utils.outflank.fst.r
In dartR.popgen: Analysing 'SNP' and 'Silicodart' Data Generated by Genome-Wide Restriction Fragment Analysis

WC_FST_FiniteSample_Haploids_2AllelesB_MCW <- function(AllCounts) {
  # Input a matrix of the counts of each allele (columns) in each population
  # (rows) returns vector instead of list of Fst values,
  # according to Weir

  n_pops <- dim(AllCounts)[1]
  r <- n_pops
  counts1 <- AllCounts[, 1]
  sample_sizes <- rowSums(AllCounts)
  n_ave <- mean(as.numeric(sample_sizes))
  n_c <- (n_pops * n_ave - sum(sample_sizes^2) / (n_pops * n_ave)) /
    (n_pops - 1)
  p_freqs <- counts1 / sample_sizes
  p_ave <- sum(sample_sizes * p_freqs) / (n_ave * n_pops)

  He <- 2 * p_ave * (1 - p_ave)

  s2 <- sum(sample_sizes * (p_freqs - p_ave)^2) / ((n_pops - 1) * n_ave)


  T1 <-
    s2 - 1 / (n_ave - 1) * (p_ave * (1 - p_ave) - (s2 * (r - 1) / r))
  T2 <-
    (n_c - 1) * (p_ave * (1 - p_ave)) / (n_ave - 1) + (1 + (r - 1) * (n_ave - n_c) /
      (n_ave - 1)) * s2 / r

  FST <- T1 / T2

  return(c(He, p_ave, FST, T1, T2))
}

WC_FST_FiniteSample_Haploids_2AllelesB_NoSamplingCorrection <-
  function(AllCounts) {
    # Input a matrix of the counts of each allele (columns) in each
    # population (rows)

    n_pops <- dim(AllCounts)[1]
    r <- n_pops
    counts1 <- AllCounts[, 1]
    sample_sizes <- rowSums(AllCounts)
    n_ave <- mean(as.numeric(sample_sizes))
    n_c <- (n_pops * n_ave - sum(sample_sizes^2) / (n_pops * n_ave)) /
      (n_pops - 1)
    p_freqs <- counts1 / sample_sizes
    p_ave <- sum(sample_sizes * p_freqs) / (n_ave * n_pops)

    He <- 2 * p_ave * (1 - p_ave)

    s2 <- sum(sample_sizes * (p_freqs - p_ave)^2) / ((n_pops - 1) * n_ave)


    T1NoCorr <- s2
    T2NoCorr <- s2 / r + (p_ave * (1 - p_ave))

    FSTNoCorr <- T1NoCorr / T2NoCorr

    return(
      c(
        HeNoCorr = He,
        p_aveNoCorr = p_ave,
        FSTNoCorr = FSTNoCorr,
        T1NoCorr = T1NoCorr,
        T2NoCorr = T2NoCorr
      )
    )
  }

fstBarCalculatorNoCorr <- function(DataList) {
  # Calculates mean FstNoCorr from the dataframe, using sum(T1NoCorr) /
  # sum(T2NoCorr) as the estimate of mean Fst. Uses only data for
  # which qvalues > qthreshold (i.e. $OutlierFlag==FALSE) Does not internally
  # screen for low MAF or low He values (but that can be added
  # by only sending the high MAF rows to this function)
  sum(DataList$T1NoCorr[which(!DataList$OutlierFlag)]) / sum(DataList$T2NoCorr[which(!DataList$OutlierFlag)])
}

fstBarCalculator <- function(DataList) {
  # Calculates mean Fst from the dataframe, using sum(T1) / sum(T2) as the
  # estimate of mean Fst. Uses only data for which qvalues >
  # qthreshold (i.e. $OutlierFlag==FALSE) Does not internally screen for low
  # MAF or low He values (but that can be added by only sending
  # the high MAF rows to this function)
  sum(DataList$T1[which(!DataList$OutlierFlag)]) / sum(DataList$T2[which(!DataList$OutlierFlag)])
}

WC_FST_FiniteSample_Diploids_2Alleles_NoCorr <-
  function(Sample_Mat) {
    # Sample Mat has three columns (homo_p,m heterozygotes, and homo_q) and
    # a row for each population

    sample_sizes <- rowSums(Sample_Mat)
    n_ave <- mean(sample_sizes)
    n_pops <- nrow(Sample_Mat) # r
    r <- n_pops
    n_c <- (n_pops * n_ave - sum(sample_sizes^2) / (n_pops * n_ave)) /
      (n_pops - 1)
    p_freqs <- (Sample_Mat[, 1] + Sample_Mat[, 2] / 2) / sample_sizes
    p_ave <- sum(sample_sizes * p_freqs) / (n_ave * n_pops)
    s2 <- sum(sample_sizes * (p_freqs - p_ave)^2) / ((n_pops - 1) * n_ave)

    if (s2 == 0) {
      return(1)
    }

    h_freqs <- Sample_Mat[, 2] / sample_sizes
    h_ave <- sum(sample_sizes * h_freqs) / (n_ave * n_pops)

    a <- n_ave / n_c * (s2)

    b <-
      (p_ave * (1 - p_ave) - (r - 1) / r * s2 - (2 * n_ave) / (4 * n_ave) * h_ave)

    c <- 1 / 2 * h_ave

    He <- 1 - sum(p_ave^2, (1 - p_ave)^2)

    FST <- a / (a + b + c)
    return(list(
      He = He,
      FSTNoCorr = FST,
      T1NoCorr = a,
      T2NoCorr = (a + b + c)
    ))
  }


WC_FST_FiniteSample_Diploids_2Alleles <- function(Sample_Mat) {
  # Sample Mat has three columns (homo_p,m heterozygotes, and homo_q) and a
  # row for each population

  sample_sizes <- rowSums(Sample_Mat)
  n_ave <- mean(sample_sizes)
  n_pops <- nrow(Sample_Mat) # r
  r <- n_pops
  n_c <- (n_pops * n_ave - sum(sample_sizes^2) / (n_pops * n_ave)) /
    (n_pops - 1)
  p_freqs <- (Sample_Mat[, 1] + Sample_Mat[, 2] / 2) / sample_sizes
  p_ave <- sum(sample_sizes * p_freqs) / (n_ave * n_pops)

  s2 <- sum(sample_sizes * (p_freqs - p_ave)^2) / ((n_pops - 1) * n_ave)
  if (s2 == 0) {
    return(1)
  }

  h_freqs <- Sample_Mat[, 2] / sample_sizes
  h_ave <- sum(sample_sizes * h_freqs) / (n_ave * n_pops)

  a <-
    n_ave / n_c * (s2 - 1 / (n_ave - 1) * (p_ave * (1 - p_ave) - ((r - 1) /
      r) * s2 - (1 / 4) * h_ave))

  b <-
    n_ave / (n_ave - 1) * (p_ave * (1 - p_ave) - (r - 1) / r * s2 - (2 * n_ave - 1) /
      (4 * n_ave) * h_ave)

  c <- 1 / 2 * h_ave

  He <- 1 - sum(p_ave^2, (1 - p_ave)^2)

  FST <- a / (a + b + c)
  return(list(
    He = He,
    FST = FST,
    T1 = a,
    T2 = (a + b + c)
  ))
}

Any scripts or data that you put into this service are public.

dartR.popgen documentation built on June 28, 2024, 1:06 a.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

dartR.popgen
Analysing 'SNP' and 'Silicodart' Data Generated by Genome-Wide Restriction Fragment Analysis

R/utils.outflank.fst.r
In dartR.popgen: Analysing 'SNP' and 'Silicodart' Data Generated by Genome-Wide Restriction Fragment Analysis

Defines functions WC_FST_FiniteSample_Diploids_2Alleles WC_FST_FiniteSample_Diploids_2Alleles_NoCorr fstBarCalculator fstBarCalculatorNoCorr WC_FST_FiniteSample_Haploids_2AllelesB_NoSamplingCorrection WC_FST_FiniteSample_Haploids_2AllelesB_MCW

Try the dartR.popgen package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

dartR.popgen Analysing 'SNP' and 'Silicodart' Data Generated by Genome-Wide Restriction Fragment Analysis

R/utils.outflank.fst.r In dartR.popgen: Analysing 'SNP' and 'Silicodart' Data Generated by Genome-Wide Restriction Fragment Analysis

Defines functions WC_FST_FiniteSample_Diploids_2Alleles WC_FST_FiniteSample_Diploids_2Alleles_NoCorr fstBarCalculator fstBarCalculatorNoCorr WC_FST_FiniteSample_Haploids_2AllelesB_NoSamplingCorrection WC_FST_FiniteSample_Haploids_2AllelesB_MCW

Try the dartR.popgen package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

dartR.popgen
Analysing 'SNP' and 'Silicodart' Data Generated by Genome-Wide Restriction Fragment Analysis

R/utils.outflank.fst.r
In dartR.popgen: Analysing 'SNP' and 'Silicodart' Data Generated by Genome-Wide Restriction Fragment Analysis