MoBiodiv
diff --git a/‎DESCRIPTION
Lines changed: 11 additions & 7 deletions b/‎DESCRIPTION
Lines changed: 11 additions & 7 deletions
diff --git a/‎NAMESPACE
Lines changed: 10 additions & 1 deletion b/‎NAMESPACE
Lines changed: 10 additions & 1 deletion
diff --git a/‎NEWS.md
Lines changed: 21 additions & 2 deletions b/‎NEWS.md
Lines changed: 21 additions & 2 deletions
diff --git a/‎R/beta_C.R
Lines changed: 251 additions & 0 deletions b/‎R/beta_C.R
Lines changed: 251 additions & 0 deletions
diff --git a/‎R/k-NCN_curve_functions.R
Lines changed: 1 addition & 0 deletions b/‎R/k-NCN_curve_functions.R
Lines changed: 1 addition & 0 deletions
diff --git a/‎R/mobr-package.R
Lines changed: 2 additions & 2 deletions b/‎R/mobr-package.R
Lines changed: 2 additions & 2 deletions
@@ -1,13 +1,13 @@
 Package: mobr
 Title: Measurement of Biodiversity
-Version: 2.0.2
+Version: 3.0.0
 Authors@R: c(person("Daniel", "McGlinn", email = "[email protected]", 
                     role = c("aut", "cre")),
              person("Xiao", "Xiao", email = "[email protected]", 
                     role = "aut"),
              person("Brian", "McGill", email = "[email protected]",
                     role = "aut"),
-             person("Felix", "May", email = "felix.may@idiv.de", 
+             person("Felix", "May", email = "felix.may@posteo.de", 
                     role = "aut"),
              person("Thore", "Engel", email = "[email protected]",
                     role = "aut"),
@@ -28,8 +28,9 @@ Description: Functions for calculating metrics for the measurement biodiversity
     and its changes across scales, treatments, and gradients. The methods 
     implemented in this package are described in:
     Chase, J.M., et al. (2018) <doi:10.1111/ele.13151>, 
-    McGlinn, D.J., et al. (2019) <doi:10.1111/2041-210X.13102>, and
-    McGlinn, D.J., et al. (2021) <doi:10.1002/ecy.3233>. 
+    McGlinn, D.J., et al. (2019) <doi:10.1111/2041-210X.13102>,
+    McGlinn, D.J., et al. (2020) <doi:10.1101/851717>, and
+    McGlinn, D.J., et al. (2023) <doi:10.1101/2023.09.19.558467>. 
 Depends:
     R (>= 3.0.2)
 Imports:
@@ -44,15 +45,18 @@ Imports:
     tibble,
     vctrs,
     rlang,
-    geosphere
+    geosphere,
+    scam,
+    sf
 Suggests:
     knitr,
     rmarkdown,
-    testthat
+    testthat,
+    methods
 License: MIT + file LICENSE
 LazyData: true
+RoxygenNote: 7.3.1
 URL: https://github.com/MoBiodiv/mobr
 BugReports: https://github.com/MoBiodiv/mobr/issues
-RoxygenNote: 7.1.1
 Encoding: UTF-8
 VignetteBuilder: knitr
@@ -4,18 +4,26 @@ S3method(plot,mob_out)
 S3method(plot,mob_stats)
 S3method(print,mob_in)
 S3method(subset,mob_in)
+export(Chat)
 export(avg_nn_dist)
+export(calc_C_target)
 export(calc_PIE)
-export(calc_biodiv)
+export(calc_SPIE)
+export(calc_S_C)
+export(calc_beta_div)
 export(calc_chao1)
+export(calc_comm_div)
+export(calc_div)
 export(compare_samp_rarefaction)
 export(get_delta_stats)
 export(get_mob_stats)
 export(get_null_comm)
+export(invChat)
 export(kNCN_average)
 export(make_mob_in)
 export(plot_N)
 export(plot_abu)
+export(plot_comm_div)
 export(plot_rarefaction)
 export(rarefaction)
 import(dplyr)
@@ -45,6 +53,7 @@ importFrom(stats,coef)
 importFrom(stats,dist)
 importFrom(stats,lm)
 importFrom(stats,loess)
+importFrom(stats,optimize)
 importFrom(stats,pf)
 importFrom(stats,predict)
 importFrom(stats,quantile)
 
@@ -1,3 +1,24 @@
+## version 3.0.0
+---
+
+Major update
+### new features
+- `calc_comm_div` now replaces `get_mob_stats`. The ancillary plotting function
+`plot.mob_stats` is now replaced with `plot_comm_div`. We hope to eventually
+add back bootstrapped confidence intervals for the statistics, but that is
+not currently supported. If you would like to know more about this design
+decision, see the discussion here: https://github.com/MoBiodiv/mobr/issues/255. 
+- `plot_rarefaction` is now more versatile, with many new arguments
+that provide options for smoothing or averaging rarefaction curves
+when making comparisons within or between groups, respectively.
+- The R package `beta_C` by Thore Engel has now been absorbed into
+the `mobr` package. Use the function `calc_beta_div`, or `calc_comm_div`
+with `beta` in the `scales` argument, to compute coverage-based beta
+diversity. Note that the index in this case is `S_C` (i.e., richness S for a
+given level of coverage C).
+- A vignette called `beta_div_demo` was added to demonstrate how to compute
+beta diversity using `mobr`.
+
 ## version 2.0.2
 ---
 ### change for CRAN
@@ -19,7 +40,6 @@ others are compared to. This is similar to the implementation in the function
 
 
 ## version 2.0.0
-
 ---
 
 ### new features
@@ -51,7 +71,6 @@ the most computationally efficient solutions
 
 
 ## version 1.0.0
-
 ---
 
 - provided core functionality of mob tools described in McGlinn et al. 
 
@@ -0,0 +1,251 @@
+#' Calculate expected sample coverage C_hat
+#'
+#' Returns the expected sample coverage of a sample `x` at sample size `m`,
+#' typically smaller than the observed one (Chao & Jost, 2012). This code was
+#' copied from iNEXT's internal function \code{iNEXT::Chat.Ind} (Hsieh et al 2016).
+#' 
+#' @param x integer vector (species abundances)
+#' @param m number of individuals (one or more values) at which coverage is
+#' evaluated; separate branches handle `m` below, equal to, and above `sum(x)`.
+#'
+#' @return a numeric value (one per element of `m`) that is the expected coverage.
+#' 
+#' @references 
+#' Chao, A., and L. Jost. 2012. Coverage-based rarefaction and extrapolation:
+#'  standardizing samples by completeness rather than size. Ecology 93:2533–2547.
+#'  
+#' Anne Chao, Nicholas J. Gotelli, T. C. Hsieh, Elizabeth L. Sander, K. H. Ma,
+#'  Robert K. Colwell, and Aaron M. Ellison 2014. Rarefaction and extrapolation
+#'  with Hill numbers: a framework for sampling and estimation in species
+#'  diversity studies.  Ecological Monographs 84:45-67.
+#' 
+#' T. C. Hsieh, K. H. Ma and Anne Chao. 2024. 
+#'  iNEXT: iNterpolation and EXTrapolation for
+#'  species diversity. R package version 3.0.1
+#'  URL: http://chao.stat.nthu.edu.tw/wordpress/software-download/.
+#' 
+#' 
+#' @export
+#'
+#' @examples
+#' data(inv_comm)
+#' # What is the expected coverage at a sample size of 50 at the gamma scale?
+#' Chat(colSums(inv_comm), 50)
+Chat <- function (x, m)
+{
+    x <- x[x > 0]  # keep only entries with positive abundance
+    n <- sum(x)  # observed total number of individuals
+    f1 <- sum(x == 1)  # number of entries with abundance exactly 1
+    f2 <- sum(x == 2)  # number of entries with abundance exactly 2
+    f0.hat <- ifelse(f2 == 0, (n - 1) / n * f1 * (f1 - 1) / 2, (n -
+                                                                    1) / n * f1 ^
+                         2 / 2 / f2)
+    A <- ifelse(f1 > 0, n * f0.hat / (n * f0.hat + f1), 1)  # A is 1 when f1 is 0
+    Sub <- function(m) {  # coverage for a single sample size m
+        if (m < n) {  # m below the observed total
+            xx <- x[(n - x) >= m]  # only entries with n - x >= m enter the sum
+            out <- 1 - sum(xx / n * exp(
+                lgamma(n - xx + 1) - lgamma(n -
+                                                xx - m + 1) - lgamma(n) + lgamma(n - m)
+            ))
+        }
+        if (m == n)  # m equal to the observed total
+            out <- 1 - f1 / n * A
+        if (m > n)  # m above the observed total
+            out <- 1 - f1 / n * A ^ (m - n + 1)
+        out
+    }
+    sapply(m, Sub)  # apply Sub to every element of m
+}
+
+#' Number of individuals corresponding to a desired coverage (inverse C_hat)
+#'
+#' If you wanted to resample a vector to a certain expected sample coverage, how
+#' many individuals would you have to draw? This is C_hat solved for the number
+#' of individuals. This code is a modification of iNEXT's internal function
+#' `invChat.Ind` (Hsieh et al 2016).
+#' 
+#' @param x integer vector (species abundances)
+#' @param C coverage value between 0 and 1
+#'
+#' @return a numeric value (not rounded) which is the number of individuals for
+#' a given level of coverage \code{C}; warns when it exceeds \code{2 * sum(x)}.
+#' @references 
+#' Chao, A., and L. Jost. 2012. Coverage-based rarefaction and extrapolation:
+#'  standardizing samples by completeness rather than size. Ecology 93:2533–2547.
+#'  
+#' Anne Chao, Nicholas J. Gotelli, T. C. Hsieh, Elizabeth L. Sander, K. H. Ma,
+#'  Robert K. Colwell, and Aaron M. Ellison 2014. Rarefaction and extrapolation
+#'  with Hill numbers: a framework for sampling and estimation in species
+#'  diversity studies.  Ecological Monographs 84:45-67.
+#' 
+#' T. C. Hsieh, K. H. Ma and Anne Chao. 2024. 
+#'  iNEXT: iNterpolation and EXTrapolation for
+#'  species diversity. R package version 3.0.1
+#'  URL: http://chao.stat.nthu.edu.tw/wordpress/software-download/.
+#' @seealso \code{\link{calc_S_C}}
+#' @export
+#' @importFrom stats optimize
+#' @examples
+#' data(inv_comm)
+#' # What sample size corresponds to an expected sample coverage of 55%?
+#' invChat(colSums(inv_comm), 0.55)
+#'
+invChat <- function (x, C)
+{
+    m <- NULL  # NOTE(review): not read anywhere below in this function
+    n <- sum(x)  # observed total number of individuals
+    refC <- Chat(x, n)  # coverage at the observed sample size
+    f <- function(m, C)  # absolute gap between coverage at m and the target C
+        abs(Chat(x, m) - C)
+    # interpolation: target lies below the observed coverage, search m in [0, n]
+    if (refC > C) {
+        opt <- stats::optimize(f,
+                        C = C,
+                        lower = 0,
+                        upper = sum(x))
+        mm <- opt$minimum  # m that minimises the gap
+    }
+    # extrapolation: target is at or above the observed coverage (closed form)
+    if (refC <= C) {
+        f1 <- sum(x == 1)  # number of entries with abundance exactly 1
+        f2 <- sum(x == 2)  # number of entries with abundance exactly 2
+        if (f1 > 0 & f2 > 0) {
+            A <- (n - 1) * f1 / ((n - 1) * f1 + 2 * f2)
+        }
+        if (f1 > 1 & f2 == 0) {
+            A <- (n - 1) * (f1 - 1) / ((n - 1) * (f1 - 1) + 2)
+        }
+        if (f1 == 1 & f2 == 0) {
+            A <- 1
+        }
+        if (f1 == 0 & f2 == 0) {
+            A <- 1
+        }
+        mm <- (log(n / f1) + log(1 - C)) / log(A) - 1  # increment beyond n
+        mm <- n + mm
+        # NOTE(review): A is unset if f1 == 0 & f2 > 0; log(A) is 0 when A == 1
+    }
+    if (mm > 2 * n)  # NOTE(review): a non-finite mm (see above) is not guarded here
+        warning(
+            "The maximum size of the extrapolation exceeds double reference sample size, the results for q = 0 may be subject to large prediction bias."
+        )
+    return(mm)
+}
+
+
+#' Calculate species richness for a given coverage level. 
+#'
+#' Computes species richness by coverage-based rarefaction: the target coverage
+#' is converted to a sample size with \code{\link{invChat}}, rounded, and used as
+#' the \code{effort} passed to \code{rarefaction} with \code{method = "IBR"}.
+#' @param x a site by species matrix or a species abundance distribution
+#' @param C_target target coverage between 0 and 1 (default is NULL). If not
+#' provided then target coverage is computed by \code{\link{calc_C_target}}
+#' @param extrapolate logical. Defaults to TRUE in which case richness is 
+#' extrapolated to sample sizes larger than observed in the dataset.
+#' @param interrupt logical (default TRUE). Should the function throw an error
+#'  when \code{C_target} exceeds the maximum recommendable coverage?
+#'
+#' @returns numeric value which is the species richness at a specific level of 
+#' coverage (NA if the sample size is <= 1), with attributes "C" and "N".
+#' @references 
+#' Chao, A., and L. Jost. 2012. Coverage-based rarefaction and extrapolation:
+#'  standardizing samples by completeness rather than size. Ecology 93:2533–2547.
+#'  
+#' Anne Chao, Nicholas J. Gotelli, T. C. Hsieh, Elizabeth L. Sander, K. H. Ma,
+#'  Robert K. Colwell, and Aaron M. Ellison 2014. Rarefaction and extrapolation
+#'  with Hill numbers: a framework for sampling and estimation in species
+#'  diversity studies.  Ecological Monographs 84:45-67.
+#' 
+#' T. C. Hsieh, K. H. Ma and Anne Chao. 2024. 
+#'  iNEXT: iNterpolation and EXTrapolation for
+#'  species diversity. R package version 3.0.1
+#'  URL: http://chao.stat.nthu.edu.tw/wordpress/software-download/.
+#' 
+#' @seealso \code{\link{invChat}}
+#' @export
+#'
+#' @examples
+#' data(tank_comm)
+#' # What is species richness for a coverage value of 60%?
+#' calc_S_C(tank_comm, C_target = 0.6)
+calc_S_C <- function(x,
+                   C_target = NULL,
+                   extrapolate = TRUE,
+                   interrupt = TRUE) {
+    x <- as.matrix(x)
+    if (any(dim(x) == 1))  # a single row or column is used directly as the abundances
+      sad <- as.numeric(x)
+    else  # otherwise abundances are pooled over rows
+      sad <- colSums(x)
+    if (is.null(C_target))  # fall back to the default target coverage
+      C_target <- calc_C_target(x)
+    N <- round(invChat(sad, C_target))  # NOTE(review): runs (and may warn) before the C_max guard
+    C_max = calc_C_target(x, factor = ifelse(extrapolate, 2, 1))  # factor 2 with extrapolation, else 1
+    if (C_target > C_max & interrupt) {  # NOTE(review): scalar test written with elementwise `&`
+        if (extrapolate) {
+          stop(
+            paste0(
+              "Coverage exceeds the maximum possible value recommendable for extrapolation (i.e. C_target = ",
+              round(C_max, 4),
+              "). Reduce the value of C_target."
+            )
+          )
+        } else{
+          stop(
+            paste0(
+              "Coverage exceeds the maximum possible value for interpolation (i.e. C_target = ",
+              round(C_max, 4),
+              "). Use extrapolation or reduce the value of C_target."
+            )
+          )
+        }
+    }
+    if (N > 1) {  # rarefaction is only called for more than one individual
+        S_C = rarefaction(x = sad,
+                            method = "IBR",
+                            effort = N,
+                            extrapolate = extrapolate,
+                            quiet_mode = TRUE)
+    } else {
+        S_C = NA
+    }
+    attr(S_C, "C") = C_target  # record the coverage used
+    attr(S_C, "N") = N  # record the rounded sample size used
+    return(S_C)
+}
+
+#' Calculate the recommended target coverage value for the computation of beta_C 
+#'
+#' Returns the estimated gamma-scale coverage that corresponds to the largest
+#' allowable sample size (i.e. the smallest observed sample size at the alpha
+#' scale multiplied by an extrapolation factor). The default (factor = 2) allows
+#' for extrapolation up to 2 times the observed sample size of the smallest
+#' alpha sample. For factor = 1, only interpolation is applied. Factors larger
+#' than 2 are not recommended.
+#'
+#' @param x a site by species abundance matrix
+#' @param factor numeric. A multiplier applied to the smallest row total (or to
+#' the overall total when `x` has a single row or column). Defaults to 2.
+#'
+#' @return numeric value: the coverage returned by \code{\link{Chat}}
+#' @export
+#'
+#' @examples
+#' data(tank_comm)
+#'
+#' # What is the largest possible C that I can use to calculate beta_C
+#' calc_C_target(tank_comm)
+calc_C_target <- function(x, factor = 2) {
+    x <- as.matrix(x)
+    if (any(dim(x) == 1)) {  # single row or column: x itself is the abundance vector
+        n <- factor * sum(x)  # sample size is factor times the overall total
+        C_target <- Chat(x, n)
+    }
+    else {  # several rows and columns
+        n <- min(factor * rowSums(x))  # factor times the smallest row total
+        C_target <- Chat(colSums(x), n)  # coverage of the pooled (column-summed) abundances
+    }
+    return(C_target)
+}
@@ -13,6 +13,7 @@
 #' @importFrom stats runif
 #' 
 #' @keywords internal
+#' @noRd
 centroid_accumulate = function(x, focal_sample = 1, n = NULL, coords = NULL, latlong = FALSE) {
 
     if ("mob_in" %in% class(x)) {
 
@@ -7,5 +7,5 @@
 #'   abundance, species commonness, and spatial aggregation of conspecifics.
 #' 
 #' @name mobr
-#' @docType package
-NULL
+"_PACKAGE"
+