Changes to make models with and without replicates work with all other functions.

marlonecobos · marlonecobos · commit 690a7b257177 · 2026-01-18T18:45:47.000-05:00
diff --git a/R/fit_selected.R b/R/fit_selected.R
@@ -124,7 +124,7 @@ fit_selected <- function(calibration_results,
   m_ids <- calibration_results$selected_models$ID
   algorithm <- calibration_results$algorithm
 
-  # Fitting models over multiple replicates
+  # Fitting models if they have multiple replicates
   if (n_replicates > 1) {
     if (verbose) {
       message("Fitting replicates...")
@@ -224,6 +224,7 @@ fit_selected <- function(calibration_results,
   if (verbose) {
     message("\nFitting full models...")
   }
+
   # Full models grid setup
   n_models <- length(m_ids)
   dfgrid <- expand.grid(models = m_ids, replicates = 1)
@@ -278,6 +279,11 @@ fit_selected <- function(calibration_results,
     }
   }
 
+  # Stop the cluster for full models
+  if (parallel) {
+    parallel::stopCluster(cl)
+  }
+
   # Assign names to full models
   names(full_models) <- paste0("Model_", m_ids)
 
@@ -286,10 +292,6 @@ fit_selected <- function(calibration_results,
     best_models[[i]]$Full_model <- full_models[[i]]
   }
 
-  # Stop the cluster for full models
-  if (parallel) {
-    parallel::stopCluster(cl)
-  }
 
   # Compute thresholds for predictions
   occ <- calibration_results$calibration_data[
@@ -298,7 +300,7 @@ fit_selected <- function(calibration_results,
   # Predictions and consensus for occurrences
   p_occ <- lapply(names(best_models), function(x) {
     m_x <- best_models[[x]]
-    if (any(grepl("Rep", names(m_x)))) {
+    if (n_replicates > 1) {
       m_x$Full_model <- NULL
     }
 
@@ -308,33 +310,59 @@ fit_selected <- function(calibration_results,
                                                        type = type))
     } else if (algorithm == "glm") {
       p_r <- sapply(m_x, function(i) suppressWarnings(
-        as.numeric(predict_glm_mx(model = i,
-                       newdata = occ, type = type))
+        as.numeric(predict_glm_mx(model = i, newdata = occ, type = type))
         ))
     }
 
-    p_mean <- apply(p_r, 1, mean, na.rm = TRUE)
-    p_median <- apply(p_r, 1, median, na.rm = TRUE)
+    if (n_replicates > 1) {
+      p_mean <- apply(p_r, 1, mean, na.rm = TRUE)
+      p_median <- apply(p_r, 1, median, na.rm = TRUE)
 
-    list(mean = p_mean, median = p_median)
+      list(mean = p_mean, median = p_median, rep = p_r)
+    } else {
+      list(Full_model = p_r[, 1])
+    }
   })
 
   names(p_occ) <- names(best_models)
 
   # Calculate consensus across models
-  mean_consensus <- apply(sapply(p_occ, function(x) x$mean), 1,
-                          mean, na.rm = TRUE)
-  median_consensus <- apply(sapply(p_occ, function(x) x$median), 1,
-                            median, na.rm = TRUE)
+  if (length(p_occ) == 1) {
+    if (n_replicates > 1) {
+      mean_consensus <- p_occ[[1]]$mean
+      median_consensus <- p_occ[[1]]$median
+    } else {
+      mean_consensus <- p_occ[[1]]$Full_model
+      median_consensus <- p_occ[[1]]$Full_model
+    }
+
+  } else {
+    if (n_replicates > 1) {
+      mean_consensus <- apply(sapply(p_occ, function(x) x$mean), 1,
+                              mean, na.rm = TRUE)
+      median_consensus <- apply(do.call(cbind, lapply(p_occ, `[[`, "rep")), 1,
+                                median, na.rm = TRUE)
+    } else {
+      mean_consensus <- apply(sapply(p_occ, function(x) x$Full_model), 1,
+                              mean, na.rm = TRUE)
+      median_consensus <- apply(sapply(p_occ, function(x) x$Full_model), 1,
+                                median, na.rm = TRUE)
+    }
+  }
+
+  p_occ <- lapply(p_occ, function(x) x[names(x) != "rep"])
+
   consensus <- list(mean = mean_consensus, median = median_consensus)
+
   p_occ <- c(p_occ, list(consensus = consensus))
 
   # Calculate thresholds
   p_thr <- lapply(p_occ, function(model) {
     lapply(model, calc_thr,
            thr = calibration_results$summary$omission_rate_thr / 100)
   })
-  #Append type of predictions
+
+  # Append type of predictions
   p_thr$type <- type
 
   #Prepare final data
diff --git a/R/helpers_project_selected_glmnetx.R b/R/helpers_project_selected_glmnetx.R
@@ -68,9 +68,11 @@ var_models_rep_by_gcm <- function(path) {
     mean_replicates <- terra::rast(lapply(1:n_replicates, function(n) {
       rep_n <- terra::mean(rast(lapply(r_x, function(x) x[[n]])))
     }))
-    var_rep_x <- terra::app(mean_replicates, "var")} else {
-      r_x <- terra::rast(model_files)
-      var_rep_x <- terra::app(r_x, "var")}
+    var_rep_x <- terra::app(mean_replicates, "var")
+  } else {
+    r_x <- terra::rast(model_files)
+    var_rep_x <- terra::app(r_x, "var")
+  }
   names(var_rep_x) <- basename(path)
   return(var_rep_x)
 }
@@ -80,7 +82,8 @@ var_models_model_by_gcm <- function(path, consensus) {
                          full.names = TRUE))
   r_x <- r_x[[sapply(r_x, function(r) names(r) == consensus)]]
   if (terra::nlyr(r_x) > 1) {
-  var_x <- terra::app(r_x, "var") } else {
+    var_x <- terra::app(r_x, "var")
+  } else {
     var_x <- r_x * 0
   }
   return(var_x)
@@ -124,7 +127,7 @@ check_pred_scenarios <- function(projection_data, out_dir) {
   #Present
   if ("Present" %in% sc) {
     #Create folder
-    present_dir <- file.path(out_dir, "Present/")
+    present_dir <- file.path(out_dir, "Present")
     present_sc <- names(projection_data[["Present"]])
     suppressWarnings({
       d_present <- data.frame(
@@ -140,7 +143,7 @@ check_pred_scenarios <- function(projection_data, out_dir) {
   #Past
   if ("Past" %in% sc) {
     #Create folder
-    past_dir <- file.path(out_dir, "Past/")
+    past_dir <- file.path(out_dir, "Past")
     #Get grid of projections
     df_past <- do.call(
       rbind,
@@ -172,7 +175,7 @@ check_pred_scenarios <- function(projection_data, out_dir) {
   ####Project to Future scenarios####
   if ("Future" %in% sc) {
     #Create folder
-    future_dir <- file.path(out_dir, "Future/")
+    future_dir <- file.path(out_dir, "Future")
 
     #Create grid of time-ssp-gcm
     df_future <- do.call(
diff --git a/R/projection_variability.R b/R/projection_variability.R
@@ -6,22 +6,23 @@
 #' replicates, model parameterizations, and general circulation models (GCMs).
 #'
 #' @usage
-#' projection_variability(model_projections, by_replicate = TRUE, by_gcm = TRUE,
-#'                        by_model = TRUE, consensus = "median",
-#'                        write_files = FALSE, output_dir = NULL,
-#'                        return_rasters = TRUE, progress_bar = FALSE,
-#'                        verbose = TRUE, overwrite = FALSE)
+#' projection_variability(model_projections, from_replicates = TRUE,
+#'                        from_parameters = TRUE, from_gcms = TRUE,
+#'                        consensus = "median", write_files = FALSE,
+#'                        output_dir = NULL, return_rasters = TRUE,
+#'                        progress_bar = FALSE, verbose = TRUE,
+#'                        overwrite = FALSE)
 #'
 #' @param model_projections a `model_projections` object generated by the
 #' \code{\link{project_selected}}() function. This object contains the file
 #' paths to the raster projection results and the thresholds used for binarizing
 #' the predictions.
-#' @param by_replicate (logical) whether to compute the variance originating
+#' @param from_replicates (logical) whether to compute the variance originating
 #' from replicates.
-#' @param by_gcm (logical) whether to compute the variance originating from
-#' general circulation models (GCMs)
-#' @param by_model (logical) whether to compute the variance originating from
+#' @param from_parameters (logical) whether to compute the variance originating from
 #' model parameterizations.
+#' @param from_gcms (logical) whether to compute the variance originating from
+#' general circulation models (GCMs).
 #' @param consensus (character) (character) the consensus measure to use for
 #' calculating changes. Available options are 'mean', 'median', 'range', and
 #' 'stdev' (standard deviation). Default is 'median'.
@@ -108,19 +109,19 @@
 #'                       out_dir = out_dir)
 #'
 #' # Step 5: Compute variance from distinct sources
-#' v <- projection_variability(model_projections = p, by_replicate = FALSE)
+#' v <- projection_variability(model_projections = p, from_replicates = FALSE)
 #'
-#' #terra::plot(v$Present$by_replicate)  # Variance from replicates, present projection
-#' terra::plot(v$Present$by_model)  # From models
-#' #terra::plot(v$`Future_2041-2060_ssp126`$by_replicate)  # From replicates in future projection
-#' terra::plot(v$`Future_2041-2060_ssp126`$by_model)  # From models
-#' terra::plot(v$`Future_2041-2060_ssp126`$by_gcm)  # From GCMs
+#' #terra::plot(v$Present$from_replicates)  # Variance from replicates, present projection
+#' terra::plot(v$Present$from_parameters)  # From models with distinct parameters
+#' #terra::plot(v$`Future_2041-2060_ssp126`$from_replicates)  # From replicates in future projection
+#' terra::plot(v$`Future_2041-2060_ssp126`$from_parameters)  # From models with distinct parameters
+#' terra::plot(v$`Future_2041-2060_ssp585`$from_gcms)  # From GCMs
 
 
 projection_variability <- function(model_projections,
-                                   by_replicate = TRUE,
-                                   by_gcm = TRUE,
-                                   by_model = TRUE,
+                                   from_replicates = TRUE,
+                                   from_parameters = TRUE,
+                                   from_gcms = TRUE,
                                    consensus = "median",  # MAKE IT WORK WHEN CONSENSUS IS FULL MODEL
                                    write_files = FALSE,
                                    output_dir = NULL,
@@ -140,13 +141,13 @@ projection_variability <- function(model_projections,
   }
 
   if (length(consensus) > 1) {
-    stop("Argument 'consensus' must be a unique value.",
-         "\nAvailable options are: 'median', 'range', 'mean' or 'stdev'.")
+    stop("Argument 'consensus' must be a single value.",
+         "\nOptions are: 'median' or 'mean'.")
   }
-  consensus_out <- setdiff(consensus, c("median", "range", "mean", "stdev"))
+  consensus_out <- setdiff(consensus, c("median", "mean"))
   if (length(consensus_out) > 0) {
     stop("Invalid 'consensus' provided.",
-         "\nAvailable options are: 'median', 'range', 'mean' or 'stdev'.")
+         "\nOptions are: 'median' or 'mean'.")
   }
 
   if (write_files & is.null(output_dir)) {
@@ -167,7 +168,10 @@ projection_variability <- function(model_projections,
   if (write_files) {
     out_dir <- file.path(output_dir, "variance")
     dir.create(out_dir, recursive = TRUE, showWarnings = FALSE)
-  } else {out_dir <- NULL}
+  } else {
+    out_dir <- NULL
+  }
+
   #### Get data ####
   d <- model_projections[["paths"]]
 
@@ -183,9 +187,6 @@ projection_variability <- function(model_projections,
 
   ####Iteration over combinations####
   res <- lapply(1:nrow(uc), function(z) {
-
-    #To test
-    #z = 1
     time <- uc$Time[z]
     period <- uc$Period[z]
     scenario <- uc$Scenario[z]
@@ -199,7 +200,7 @@ projection_variability <- function(model_projections,
     paths <- d_p$output_path
 
     #### By replicate ####
-    if (by_replicate) {
+    if (from_replicates) {
       if (verbose) {
         message("\nCalculating variability from distinct replicates: scenario ",
                 z, " of ", nrow(uc))
@@ -208,42 +209,51 @@ projection_variability <- function(model_projections,
 
       #### By replicates ####
       # Get variance of replicates in each gcm, than get the average across gcms
-      var_rep_by_gcm <- terra::rast(lapply(paths, var_models_rep_by_gcm))
-      var_rep <- terra::mean(var_rep_by_gcm)
-    } else {#End of by_replicate
+      var_rep <- terra::rast(lapply(paths, var_models_rep_by_gcm))
+      var_rep <- terra::mean(var_rep)
+      names(var_rep) <- "from_replicates"
+    } else {#End of from_replicates
       var_rep <- NULL
     }
 
     #### By Model ####
-    if (by_model) {
+    if (from_parameters) {
       if (verbose) {
         message("Calculating variability from distinct models: scenario ",
                 z, " of ", nrow(uc))
       }
 
       # Get variance of models in each gcm, than get the average
-      var_model_by_gcm <- terra::rast(lapply(paths, var_models_model_by_gcm, consensus))
-      var_model <- terra::mean(var_model_by_gcm)
-      names(var_model) <- "by_model"
+      if (names(model_projections$thresholds[[1]])[1] == "Full_model") {
+        var_model <- terra::rast(lapply(paths, var_models_model_by_gcm,
+                                        "Full_model"))
+      } else {
+        var_model <- terra::rast(lapply(paths, var_models_model_by_gcm,
+                                        consensus))
+      }
+
+      var_model <- terra::mean(var_model)
+      names(var_model) <- "from_parameters"
     } else { #End of by model
       var_model <-  NULL
     }
 
 
     ####By GCM####
-    if (by_gcm & period != "Present") {
+    if (from_gcms & period != "Present") {
       if (verbose) {
         message("Calculating variability from distinct GCMs: scenario ",
                 z, " of ", nrow(uc))
       }
 
       var_gcm <- var_models_across_gcm(paths = paths, consensus = consensus)
-      names(var_gcm) <- "by_gcm"
+      names(var_gcm) <- "from_gcms"
     } else {
-      var_gcm <- NULL}#End of by_gcm
+      var_gcm <- NULL
+    }#End of from_gcms
 
-    all_var <- terra::rast(c("by_replicate" = var_rep, "by_model" = var_model,
-                             "by_gcm" = var_gcm))
+    all_var <- terra::rast(c("from_replicates" = var_rep, "from_parameters" = var_model,
+                             "from_gcms" = var_gcm))
 
 
     #Write results
diff --git a/man/projection_variability.Rd b/man/projection_variability.Rd