noaa-akro
diff --git a/‎.Rbuildignore‎
Lines changed: 3 additions & 1 deletion b/‎.Rbuildignore‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 0 deletions b/‎.gitignore‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎DESCRIPTION‎
Lines changed: 10 additions & 4 deletions b/‎DESCRIPTION‎
Lines changed: 10 additions & 4 deletions
diff --git a/‎R/AssembleGAMFormula.R‎
Lines changed: 82 additions & 0 deletions b/‎R/AssembleGAMFormula.R‎
Lines changed: 82 additions & 0 deletions
diff --git a/‎R/AutodetectGAMTerms.R‎
Lines changed: 118 additions & 0 deletions b/‎R/AutodetectGAMTerms.R‎
Lines changed: 118 additions & 0 deletions
@@ -1,7 +1,9 @@
 ^EFHSDM\.Rproj$
 ^\.Rproj\.user$
 ^dev$
-^R/Meatgrinder5\.R$
 ^LICENSE\.md$
 ^doc$
 ^Meta$
+^CONTRIBUTING\.md$
+^\.github$
+^Meatgrinder6_mcs.R
@@ -44,3 +44,5 @@ vignettes/*.pdf
 inst/doc
 /doc/
 /Meta/
+
+Meatgrinder6_mcs.R
@@ -8,20 +8,25 @@ Authors@R:
            comment = c(ORCID = "0000-0003-2663-9243")),
       person(c("James", "T."), "Thorson", email = "james.thorson@noaa.gov", role = c("aut"),
            comment = c(ORCID = "0000-0001-7415-1010")),
-      person("Jodi", "Pirtle", ,email = "jodi.pirtle@noaa.gov", role = c("aut"),
+      person(c("Jodi", "L."), "Pirtle", email = "jodi.pirtle@noaa.gov", role = c("aut"),
            comment = c(ORCID = "0000-0002-4421-8234")),
       person(c("Margaret","C."), "Siple", email = "margaret.siple@noaa.gov", role = c("aut", "com"),
-           comment = c(ORCID = "0000-0002-4260-9856"))     
+           comment = c(ORCID = "0000-0002-4260-9856")),
+      person(c("Mason","J."), "Smith", email = "mason.smith@noaa.gov", role = c("aut", "com"),
+           comment = c(ORCID = "0000-0002-3132-6869")),
+      person(c("Mallarie", "E."), "Yeager", email = "mallarie.yeager@noaa.gov", role = c("aut", "com"),
+           comment = c(ORCID = "0000-0002-5513-2583"))
            )
-Description: This package fits species distribution models (SDMs) to groundfish and crab data from the Eastern Bering Sea, Aleutian Islands, and Gulf of Alaska. These SDMs were used in the 2022 EFH 5-Year Review. 
+Description: This package fits species distribution models (SDMs) to groundfish and crab data from the Eastern Bering Sea, Aleutian Islands, and Gulf of Alaska. These SDMs were used in the 2023 EFH 5-Year Review. 
 License: MIT + file LICENSE
 Encoding: UTF-8
 Roxygen: list(markdown = TRUE)
 RoxygenNote: 7.3.2
 Suggests: 
     knitr,
     rmarkdown,
-    gridExtra
+    gridExtra,
+    testthat (>= 3.0.0)
 VignetteBuilder: knitr
 Imports: 
     ggplot2,
@@ -43,3 +48,4 @@ Depends:
     R (>= 3.5.0)
 LazyData: 
     false
+Config/testthat/edition: 3
@@ -0,0 +1,82 @@
+#' Make a GAM formula
+#'
+#' @description Builds a model formula from a table of GAM terms, such as the
+#'   tables produced by the Autodetect functions. Each row of the table is one
+#'   term, so terms can be dropped simply by removing rows, which is handy for
+#'   things like term selection and deviance explained.
+#'
+#' @param yvar Name of dependent variable for gam models
+#' @param gam.table Data frame of parameters for GAM formula, with one row per
+#'   term and columns `type` ("smooth", "factor", "offset" or "linear"),
+#'   `term`, `term2`, `bs`, `k`, `m` and `m2` (`NA` where not applicable).
+#'   When `hgam = TRUE` this may instead be a list of two such data frames,
+#'   one per formula; if only one table is supplied it is used for both.
+#' @param hgam Logical; do you want an hgam formula
+#'
+#' @return Returns a formula object, or list of formulas for hgam. In the
+#'   hgam case the first formula has `yvar` on the left-hand side and the
+#'   second is one-sided.
+#' @export
+#'
+#' @examples
+#' gam.table <- data.frame(
+#'   type = c("linear", "smooth", "offset"),
+#'   term = c("slope", "bdepth", "logarea"),
+#'   term2 = NA, bs = c(NA, "tp", NA), k = c(NA, 4, NA), m = NA, m2 = NA
+#' )
+#' AssembleGAMFormula(yvar = "abund", gam.table = gam.table)
+AssembleGAMFormula <- function(yvar, gam.table, hgam = FALSE) {
+  # Text that opens each wrapped term type; linear terms are written bare.
+  openers <- c(smooth = "s(", factor = "as.factor(", offset = "offset(")
+
+  # Build the text of the formula term described by row `i` of `g.table`.
+  build_term <- function(g.table, i) {
+    type <- as.character(g.table$type[i])
+    if (is.na(type) || !type %in% c(names(openers), "linear")) {
+      stop("Unrecognized term type in row ", i, " of gam.table: ", type,
+        call. = FALSE
+      )
+    }
+    # Linear terms carry no wrapper or smoother options, so they are resolved
+    # up front instead of depending on text left over from an earlier row.
+    if (type == "linear") {
+      return(as.character(g.table$term[i]))
+    }
+
+    term.text <- paste0(openers[[type]], g.table$term[i])
+    if (!is.na(g.table$term2[i])) {
+      term.text <- paste0(term.text, ",", g.table$term2[i])
+    }
+    if (!is.na(g.table$bs[i])) {
+      term.text <- paste0(term.text, ",bs='", g.table$bs[i], "'")
+    }
+    if (!is.na(g.table$k[i])) {
+      term.text <- paste0(term.text, ",k=", g.table$k[i])
+    }
+    if (!is.na(g.table$m[i])) {
+      # m is a single value, or a pair when m2 is also supplied
+      if (is.na(g.table$m2[i])) {
+        term.text <- paste0(term.text, ",m=", g.table$m[i])
+      } else {
+        term.text <- paste0(
+          term.text, ",m=c(", g.table$m[i], ",", g.table$m2[i], ")"
+        )
+      }
+    }
+    paste0(term.text, ")")
+  }
+
+  # Pick the i-th table out of a list of tables, or use `fallback` when
+  # gam.table is a single data frame or has no usable i-th element.
+  pick_table <- function(i, fallback) {
+    is.table.list <- !is.data.frame(gam.table) && is.list(gam.table)
+    if (is.table.list && length(gam.table) >= i &&
+      is.data.frame(gam.table[[i]])) {
+      gam.table[[i]]
+    } else {
+      fallback
+    }
+  }
+
+  # logic to handle different possibilities to supply for hgam
+  if (hgam) {
+    gam.table1 <- pick_table(1, gam.table)
+    form.list <- list(gam.table1, pick_table(2, gam.table1))
+  } else {
+    form.list <- list(gam.table)
+  }
+
+  out.form <- vector("list", length(form.list))
+  for (f in seq_along(form.list)) {
+    g.table <- form.list[[f]]
+    if (!is.data.frame(g.table) || nrow(g.table) == 0) {
+      stop("gam.table must be a data frame with at least one term",
+        call. = FALSE
+      )
+    }
+
+    out.terms <- vapply(
+      seq_len(nrow(g.table)),
+      function(i) build_term(g.table, i),
+      character(1)
+    )
+
+    # Only the first formula carries the response; later ones are one-sided.
+    lhs <- if (f == 1) yvar else ""
+    out.form[[f]] <- stats::as.formula(
+      paste0(lhs, " ~ ", paste(out.terms, collapse = " + "))
+    )
+  }
+
+  if (length(form.list) == 1) {
+    return(out.form[[1]])
+  }
+  out.form
+}
@@ -0,0 +1,118 @@
+#' Auto-detect GAM terms
+#'
+#' @description This is a useful function that returns a table of the terms in
+#'   a GAM, whether they are a one dimensional (linear) term, a one or two
+#'   dimensional smooth, or a factor. Also detects the offset.
+#'
+#' @details Terms are read from the deparsed text of the model formula. Only
+#'   the left-hand operand of the outermost `+` on the right-hand side is
+#'   parsed, so the final term of the formula is not examined; the offset is
+#'   instead recovered from the names of the model frame (`model$model`).
+#'   NOTE(review): this appears to assume the offset is the last term of the
+#'   formula - confirm against how the formulas are built.
+#'
+#' @param model A fitted GAM model object
+#' @param hgam character describing how to handle hgams; use "d" for the
+#'   density model, "p" for the prob model, or "b" or "all" for both. Only
+#'   used when the model family is "ziplss".
+#'
+#' @return returns a data frame with columns describing the name and type of
+#'   all model components and relevant smoother parameters (`type`, `dims`,
+#'   `term`, `term2`, `bs`, `k`, `m`, `m2`). For a "ziplss" model with both
+#'   formulas requested, a list of two such data frames is returned.
+#' @export
+#'
+#' @examples
+#' \dontrun{
+#' dat <- mgcv::gamSim(1, n = 200)
+#' fit <- mgcv::gam(
+#'   y ~ s(x0, bs = "tp", k = 5) + s(x1, x2) + offset(x3),
+#'   data = dat
+#' )
+#' AutodetectGAMTerms(fit)
+#' }
+AutodetectGAMTerms <- function(model, hgam = "all") {
+  both.codes <- c("b", "both", "all")
+  dens.codes <- c("d", "dens", "density")
+  prob.codes <- c("p", "prob", "probability")
+  is.ziplss <- model$family$family == "ziplss"
+
+  # An unrecognised code would otherwise leave the formula unselected below.
+  if (is.ziplss && !hgam %in% c(both.codes, dens.codes, prob.codes)) {
+    stop(
+      "hgam must be one of: ",
+      paste(c(both.codes, dens.codes, prob.codes), collapse = ", "),
+      call. = FALSE
+    )
+  }
+  n.formulas <- if (is.ziplss && hgam %in% both.codes) 2 else 1
+
+  # Index of the comma-separated piece whose option name (the text before
+  # "=") is `name`; integer(0) when the option is absent.
+  find_option <- function(pieces, name) {
+    option.names <- vapply(
+      strsplit(pieces, "="),
+      function(p) trimws(p[1]),
+      character(1)
+    )
+    which(option.names == name)
+  }
+
+  out.dat <- vector("list", n.formulas)
+  for (f in seq_len(n.formulas)) {
+    # a lot of special handling for ziplss models
+    form1 <- stats::formula(model)
+    if (is.ziplss) {
+      form.spot <- if (hgam %in% both.codes) {
+        f
+      } else if (hgam %in% dens.codes) {
+        1
+      } else {
+        2
+      }
+      form1 <- form1[[form.spot]]
+    }
+
+    # as.character() on the right-hand-side call yields the operator, the
+    # left operand and the right operand; element 2 is the left operand.
+    rhs.text <- as.character(form1[[length(form1)]])
+    term.text <- trimws(strsplit(rhs.text, split = "[+]")[[2]])
+
+    # loop through and figure out the information for the table
+    type.dat <- data.frame(
+      type = rep(NA, length(term.text)), dims = 1, term = NA, term2 = NA,
+      bs = NA, k = NA, m = NA, m2 = NA
+    )
+    for (t in seq_along(term.text)) {
+      x <- term.text[t]
+      x2 <- strsplit(x, split = "[(=)]")[[1]]
+
+      # linear terms
+      if (length(x2) == 1) {
+        type.dat$type[t] <- "linear"
+        type.dat$term[t] <- x2
+        next
+      }
+
+      # smoothed terms
+      if (x2[1] %in% c("s", "te")) {
+        # x2[2] is the text up to the first "=": the variables, followed by
+        # the name of the first named option when the smooth has one. A
+        # smooth with no named options has nothing extra to discount.
+        arg.text <- strsplit(x2[2], split = ", ")[[1]]
+        has.named <- grepl("=", x, fixed = TRUE)
+        dims <- length(arg.text) - if (has.named) 1 else 0
+        for (v in seq_len(dims)) {
+          # columns 3 and 4 are term and term2
+          type.dat[t, 2 + v] <- arg.text[v]
+        }
+        type.dat$type[t] <- "smooth"
+        type.dat$dims[t] <- dims
+
+        formula.options <- strsplit(x, split = ",")[[1]]
+
+        # find smoother basis
+        bs.spot <- find_option(formula.options, "bs")
+        if (length(bs.spot) > 0) {
+          type.dat$bs[t] <-
+            strsplit(formula.options[bs.spot], split = "\"")[[1]][2]
+        }
+
+        # find smoother k
+        k.spot <- find_option(formula.options, "k")
+        if (length(k.spot) > 0) {
+          k.text <- strsplit(formula.options[k.spot], split = "=")[[1]][2]
+          type.dat$k[t] <- trimws(strsplit(k.text, split = "[)]")[[1]])
+        }
+
+        # find penalty m, which can be complicated
+        m.spot <- find_option(formula.options, "m")
+        if (length(m.spot) > 0) {
+          # m = c(a, b) was split at its comma, so the second value sits in
+          # the next piece
+          if ("c" %in% strsplit(formula.options[m.spot], split = "")[[1]]) {
+            m.spot <- c(m.spot, m.spot + 1)
+          }
+          for (j in seq_along(m.spot)) {
+            m.piece <- trimws(formula.options[m.spot][j])
+            if (j == 1) {
+              m.piece <- trimws(strsplit(m.piece, split = "=")[[1]][2])
+            }
+            m.parts <- trimws(strsplit(m.piece, split = "[()]")[[1]])
+            # columns 7 and 8 are m and m2
+            type.dat[t, 6 + j] <-
+              suppressWarnings(stats::na.omit(as.numeric(m.parts))[1])
+          }
+        }
+      }
+
+      # factor terms
+      if (x2[1] == "as.factor") {
+        type.dat$type[t] <- "factor"
+        type.dat$term[t] <- x2[2]
+      }
+    }
+
+    # the offset is read from the model frame names rather than the formula
+    terms2 <- unlist(strsplit(x = names(model$model), split = "[()]"))
+    off.term <- which(terms2 == "offset") + 1
+    if (length(off.term) > 0) {
+      type.dat <- rbind(
+        type.dat,
+        data.frame(
+          type = "offset", dims = 1, term = terms2[off.term], term2 = NA,
+          bs = NA, k = NA, m = NA, m2 = NA
+        )
+      )
+    }
+    out.dat[[f]] <- type.dat
+  }
+
+  # if multiple formulas, return the list; otherwise just the table
+  if (n.formulas > 1) {
+    return(out.dat)
+  }
+  out.dat[[1]]
+}