sigven
diff --git a/‎.bumpversion.cfg
-24 b/‎.bumpversion.cfg
-24
diff --git a/‎.bumpversion.toml
+46 b/‎.bumpversion.toml
+46
diff --git a/‎DESCRIPTION
+1-1 b/‎DESCRIPTION
+1-1
diff --git a/‎R/data.R
+7 b/‎R/data.R
+7
diff --git a/‎R/disease_drug.R
+4-3 b/‎R/disease_drug.R
+4-3
diff --git a/‎R/enrich.R
+109-23 b/‎R/enrich.R
+109-23
diff --git a/‎R/onco_enrichr.R
+8-3 b/‎R/onco_enrichr.R
+8-3
diff --git a/‎R/ppi.R
+2-1 b/‎R/ppi.R
+2-1
diff --git a/‎R/sysdata.rda
17 Bytes b/‎R/sysdata.rda
17 Bytes
@@ -0,0 +1,46 @@
+[tool.bumpversion]
+current_version = "1.5.2"
+search = "{current_version}"
+replace = "{new_version}"
+message = "Bump version: {current_version} → {new_version}"
+regex = false
+ignore_missing_version = false
+ignore_missing_files = false
+commit = true
+parse = """(?x)
+    (?P<major>0|[1-9]\\d*)\\.
+    (?P<minor>0|[1-9]\\d*)\\.
+    (?P<patch>0|[1-9]\\d*)
+    (?:\\.(?P<dev>\\d+))?
+"""
+
+serialize = [
+    "{major}.{minor}.{patch}.{dev}",
+    "{major}.{minor}.{patch}",
+]
+
+[[tool.bumpversion.files]]
+filename = "DESCRIPTION"
+search = "Version: {current_version}"
+replace = "Version: {new_version}"
+
+[[tool.bumpversion.files]]
+filename = "README.md"
+search = "2F{current_version}"
+replace = "2F{new_version}"
+
+[[tool.bumpversion.files]]
+filename = "pkgdown/index.md"
+search = "2F{current_version}"
+replace = "2F{new_version}"
+
+[[tool.bumpversion.files]]
+filename = "vignettes/installation.Rmd"
+search = "{current_version}"
+replace = "{new_version}"
+
+[[tool.bumpversion.files]]
+filename = ".github/workflows/pkgdown.yaml"
+search = "VERSION: '{current_version}'"
+replace = "VERSION: '{new_version}'"
+
@@ -30,7 +30,7 @@ biocViews:
 Imports: dplyr,
          assertthat,
          assertable,
-         clusterProfiler,
+         clusterProfiler (>= 4.13),
          DT, 
          gganatogram, 
          ggpubr,
 
@@ -4,3 +4,10 @@
 #' @format A character vector of 24 color codes
 #'
 "tissue_colors"
+
+#' Format (columns) for clusterProfiler enrichment output
+#'
+#'
+#' @format A character vector of 23 variables
+#'
+"cp_output_cols"
@@ -12,7 +12,7 @@
 #' "refseq_transcript_id", "ensembl_protein", "refseq_protein")
 #' @param ignore_id_err logical indicating if analysis should
 #' continue when unknown query identifiers are encountered
-#' @param incude_gene_summary logical indicating if gene summary (NCBI/UniProt) should be included
+#' @param include_gene_summary logical indicating if gene summary (NCBI/UniProt) should be included
 #' in output data tables
 #' @param tumor_site character indicating primary tumor site of interest
 #'
@@ -118,9 +118,10 @@ cancer_association_rank <- function(
 
   if(NROW(qgenes_match$found) > 2500){
     lgr::lgr$warn( paste0(
-      "Query set must exceeds max limit of 2,500 valid entries - ",
+      "Query set exceeds max limit of 2,500 valid entries - ",
       "limiting input to 2,500 entries"))
-    qgenes_match[['found']] <- head(qgenes_match[['found']], 2500)
+    qgenes_match[['found']] <-
+      utils::head(qgenes_match[['found']], 2500)
   }
 
   lgr::lgr$info( paste0(
 
@@ -55,8 +55,9 @@ get_go_enrichment <- function(query_entrez,
     )
 
   if (simplify == T) {
-    ego <- clusterProfiler::simplify(ego, cutoff=0.8,
-                                     by="p.adjust", select_fun=min)
+    ego <- clusterProfiler::simplify(
+      ego, cutoff=0.8,
+      by="p.adjust", select_fun=min)
   }
 
   df <- as.data.frame(utils::head(ego, 5000))
@@ -67,6 +68,12 @@ get_go_enrichment <- function(query_entrez,
     df <- df |> dplyr::mutate(db = ontology)
   }
   if (nrow(df) > 0) {
+    assertable::assert_colnames(
+      df, c("ID","Description","Count",
+            "GeneRatio","BgRatio","pvalue",
+            "qvalue","geneID"),
+      only_colnames = F, quiet = T)
+
     df <- suppressWarnings(
       df |>
         dplyr::mutate(db = paste0("GO_", .data$db)) |>
@@ -75,8 +82,6 @@ get_go_enrichment <- function(query_entrez,
           go_description = "Description",
           count = "Count",
           gene_ratio = "GeneRatio",
-          rich_factor = "RichFactor",
-          fold_enrichment = "FoldEnrichment",
           z_score = "zScore",
           background_ratio = "BgRatio",
           gene_id = "geneID") |>
@@ -85,9 +90,6 @@ get_go_enrichment <- function(query_entrez,
             paste0('<a href=\'http://amigo.geneontology.org/amigo/term/',
                    .data$go_id,'\' target=\'_blank\'>',
                    .data$go_description,'</a>')) |>
-        tidyr::separate(.data$gene_ratio,
-                        c('num_query_hits','num_query_all'),
-                        sep = "/", remove = F, convert = T) |>
         dplyr::mutate(qvalue = as.numeric(.data$qvalue)) |>
         dplyr::mutate(pvalue = as.numeric(.data$pvalue)) |>
         dplyr::mutate(
@@ -103,20 +105,65 @@ get_go_enrichment <- function(query_entrez,
               !is.na(.data$pvalue),
               as.numeric(formatC(.data$pvalue, format = "e",
                                  digits = 1)),
+              as.numeric(NA)))
+    )
+
+    df <- suppressWarnings(
+      df |>
+        dplyr::mutate(qvalue = as.numeric(.data$qvalue)) |>
+        dplyr::mutate(pvalue = as.numeric(.data$pvalue)) |>
+        dplyr::mutate(
+          qvalue =
+            dplyr::if_else(
+              !is.na(.data$qvalue),
+              as.numeric(formatC(.data$qvalue, format = "e",
+                                 digits = 1)),
               as.numeric(NA))) |>
-        tidyr::separate(.data$background_ratio,
-                        c('num_background_hits','num_background_all'),
-                        sep = "/", remove = F, convert = T) |>
+        dplyr::mutate(
+          pvalue =
+            dplyr::if_else(
+              !is.na(.data$pvalue),
+              as.numeric(formatC(.data$pvalue, format = "e",
+                                 digits = 1)),
+              as.numeric(NA)))
+    )
+
+    df$enrichment_factor <- NA
+    if("FoldEnrichment" %in% colnames(df)){
+      df <- df |>
+        dplyr::mutate(
+          enrichment_factor = round(
+            as.numeric(.data$FoldEnrichment), digits = 2)) |>
+        dplyr::select(-c("FoldEnrichment"))
+    }else{
+      df <- df |>
+        tidyr::separate(
+          .data$gene_ratio,
+          c('num_query_hits','num_query_all'),
+          sep = "/", remove = F, convert = T) |>
+        tidyr::separate(
+          .data$background_ratio,
+          c('num_background_hits','num_background_all'),
+          sep = "/", remove = F, convert = T) |>
         dplyr::mutate(
           enrichment_factor =
-            round(as.numeric((.data$num_query_hits / .data$num_query_all) /
-                               (.data$num_background_hits / .data$num_background_all)),
-                  digits = 1)) |>
+            round(as.numeric((
+              .data$num_query_hits / .data$num_query_all) /
+                (.data$num_background_hits / .data$num_background_all)),
+              digits = 2)) |>
         dplyr::select(-c("num_query_hits",
                          "num_query_all",
                          "num_background_hits",
                          "num_background_all"))
-    )
+
+    }
+    df$rich_factor <- NA
+    if("RichFactor" %in% colnames(df)){
+      df <- df |>
+        dplyr::mutate(
+          rich_factor = as.numeric(.data$RichFactor)) |>
+        dplyr::select(-c("RichFactor"))
+    }
 
     gene2id <- NULL
     if (!is.null(genedb)) {
@@ -164,6 +211,15 @@ get_go_enrichment <- function(query_entrez,
       df$setting_p_value_adj_method <- p_value_adjustment_method
       df$setting_min_geneset_size <- min_geneset_size
       df$setting_max_geneset_size <- max_geneset_size
+
+      for(c in oncoEnrichR::cp_output_cols){
+        if(!(c %in% colnames(df))){
+          df[,c] <- NA
+        }
+      }
+      df <- df |>
+        dplyr::select(
+          dplyr::any_of(oncoEnrichR::cp_output_cols))
     }
   } else {
     df <- NULL
@@ -238,15 +294,18 @@ get_universal_enrichment <- function(query_entrez,
   df <- as.data.frame(utils::head(enr,5000))
   rownames(df) <- NULL
   if (nrow(df) > 0) {
+    assertable::assert_colnames(
+      df, c("ID","Description","Count",
+            "GeneRatio","BgRatio","pvalue",
+            "qvalue","geneID"),
+      only_colnames = F, quiet = T)
     df <- suppressWarnings(
       df |>
         dplyr::rename(
           standard_name = "ID",
           description = "Description",
           count = "Count",
           gene_ratio = "GeneRatio",
-          rich_factor = "RichFactor",
-          fold_enrichment = "FoldEnrichment",
           z_score = "zScore",
           background_ratio = "BgRatio",
           gene_id = "geneID")
@@ -331,6 +390,21 @@ get_universal_enrichment <- function(query_entrez,
               as.numeric(formatC(.data$pvalue, format = "e",
                                  digits = 1)),
               as.numeric(NA))) |>
+        dplyr::mutate(
+          db = dplyr::if_else(is.na(.data$db) &
+                                nchar(dbsource) > 0,
+                              dbsource,
+                              as.character(.data$db)))
+    )
+
+    if("FoldEnrichment" %in% colnames(df)){
+      df <- df |>
+        dplyr::mutate(
+          enrichment_factor = round(
+            as.numeric(.data$FoldEnrichment), digits = 2)) |>
+        dplyr::select(-c("FoldEnrichment"))
+    }else{
+      df <- df |>
         tidyr::separate(
           .data$gene_ratio,
           c('num_query_hits','num_query_all'),
@@ -344,17 +418,20 @@ get_universal_enrichment <- function(query_entrez,
             round(as.numeric((
               .data$num_query_hits / .data$num_query_all) /
                 (.data$num_background_hits / .data$num_background_all)),
-              digits = 1)) |>
+              digits = 2)) |>
         dplyr::select(-c("num_query_hits",
                          "num_query_all",
                          "num_background_hits",
-                         "num_background_all")) |>
+                         "num_background_all"))
+
+    }
+    df$rich_factor <- NA
+    if("RichFactor" %in% colnames(df)){
+      df <- df |>
         dplyr::mutate(
-          db = dplyr::if_else(is.na(.data$db) &
-                                nchar(dbsource) > 0,
-                              dbsource,
-                              as.character(.data$db)))
-    )
+          rich_factor = as.numeric(.data$RichFactor)) |>
+        dplyr::select(-c("RichFactor"))
+    }
 
     gene2id <- NULL
     if (!is.null(genedb)) {
@@ -392,6 +469,15 @@ get_universal_enrichment <- function(query_entrez,
       df$setting_p_value_adj_method <- p_value_adjustment_method
       df$setting_min_geneset_size <- min_geneset_size
       df$setting_max_geneset_size <- max_geneset_size
+
+      for(c in oncoEnrichR::cp_output_cols){
+        if(!(c %in% colnames(df))){
+          df[,c] <- NA
+        }
+      }
+      df <- df |>
+        dplyr::select(
+          dplyr::any_of(oncoEnrichR::cp_output_cols))
     }
   } else {
     df <- NULL
 
@@ -1786,6 +1786,7 @@ onco_enrich <- function(query = NULL,
 #' @param file full filename for report output (e.g. "oe_report.html" or "oe_report.xlsx")
 #' @param ignore_file_extension logical to accept any type of filename extensions (for Galaxy integration)
 #' @param overwrite logical indicating if existing output files may be overwritten
+#' @param render_quarto_quiet logical indicating if Quarto rendering should be done quietly
 #' @param format file format of output (html/excel)
 #' @param ... options for Galaxy/non self-contained HTML. Only applicable for use in Galaxy
 #'
@@ -1797,6 +1798,7 @@ write <- function(report,
                   file = "testReport.html",
                   ignore_file_extension = F,
                   overwrite = F,
+                  render_quarto_quiet = T,
                   format = "html",
                   ...) {
 
@@ -1868,7 +1870,8 @@ write <- function(report,
     return()
   }
 
-  output_directory <- dirname(file)
+  #output_directory <- dirname(file)
+  output_directory <- normalizePath(dirname(file))
 
   if(is.na(html_extern_path) & !embed_resources){
     html_extern_path <- output_directory
@@ -1885,6 +1888,9 @@ write <- function(report,
       lgr::lgr$info(paste0("ERROR: ",val))
       return()
     }
+  }else{
+    lgr::lgr$info(paste0("ERROR: provide absolute (not relative) path to output file"))
+    return()
   }
 
   if (overwrite == F) {
@@ -1956,7 +1962,6 @@ write <- function(report,
       system.file("templates", package = "oncoEnrichR")
 
     ## make temporary directory for quarto report rendering
-    #stringi::stri_rand_strings(10, 1)
     tmp_quarto_dir <- file.path(
       output_directory,
       paste0('quarto_', stringi::stri_rand_strings(1, 15))
@@ -2018,7 +2023,7 @@ write <- function(report,
     quarto::quarto_render(
       input = quarto_main_template_sample,
       execute_dir = tmp_quarto_dir,
-      quiet = T)
+      quiet = render_quarto_quiet)
 
     ## check that supporting libs do not exist in output directory (Galaxy)
     if (galaxy_run == T & embed_resources == F){
 
@@ -19,7 +19,8 @@ get_network_hubs <- function(edges = NULL,
   d <- igraph::graph_from_data_frame(d = edges, directed = F)
 
   ## hub score (Kleinberg"s hub centrality)
-  hscore <- igraph::hub_score(d)
+  #hscore <- igraph::hub_score(d)
+  hscore <- igraph::authority_score(d)
   hub_scores <- data.frame(
     symbol = names(sort(hscore$vector,decreasing = T)),
     hub_score = round(sort(hscore$vector,decreasing = T), digits = 3),