
Commit 002a304

feat: Update run dates, queue, and memory settings; enhance file writing process in AA draws scripts
1 parent 466ce98 commit 002a304

File tree

5 files changed (+329, -61 lines)


src/idd_forecast_mbp/06_upload/03_create_and_combine_aa_draws_parallel.py

Lines changed: 5 additions & 5 deletions
@@ -18,7 +18,7 @@
 
 run_date = "2025_07_24"
 run_date = '2025_08_04'
-run_date = '2025_08_11'
+run_date = '2025_08_28'
 dah_scenarios = rfc.dah_scenarios
 dah_scenarios = ['Baseline', 'Constant']
 dah_scenarios = ['Baseline']
@@ -48,7 +48,7 @@
 
 # Project
 project = "proj_rapidresponse" # Adjust this to your project name if needed
-queue = 'long.q'
+queue = 'all.q'
 
 wf_uuid = uuid.uuid4()
 tool_name = f"{package_name}_create_summaries_{wf_uuid}"
@@ -74,16 +74,16 @@
     }
 )
 
-memory = "80G"
+memory = "100G"
 
 # Define the task template for processing each year batch
 task_template = tool.get_task_template(
     template_name=template_name,
     default_cluster_name="slurm",
     default_compute_resources={
         "memory": memory,
-        "cores": 16,
-        "runtime": "45m",
+        "cores": 10,
+        "runtime": "60m",
         "queue": queue,
         "project": project,
         "stdout": str(stdout_dir),

Lines changed: 185 additions & 0 deletions
@@ -0,0 +1,185 @@
+import getpass
+import uuid
+from jobmon.client.tool import Tool # type: ignore
+from pathlib import Path
+import geopandas as gpd # type: ignore
+from idd_forecast_mbp import constants as rfc
+
+repo_name = rfc.repo_name
+package_name = rfc.package_name
+
+hold_variables = {
+    'malaria': ['DAH', 'flood', 'gdppc', 'suitability'],
+    'dengue': ['gdppc', 'suitability', 'urban'],
+}
+run_hold_variables = False
+
+template_name = f'{repo_name}_06_03_create_and_combine'
+
+run_date = "2025_07_24"
+run_date = '2025_08_04'
+run_date = '2025_08_28'
+dah_scenarios = rfc.dah_scenarios
+dah_scenarios = ['Baseline', 'Constant']
+dah_scenarios = ['Baseline']
+# dah_scenarios = ['reference', 'better', 'worse']
+
+causes = rfc.cause_map
+# causes = ['dengue']
+ssp_scenarios = rfc.ssp_scenarios
+# ssp_scenarios = ['ssp245']
+
+
+# Script directory
+SCRIPT_ROOT = rfc.REPO_ROOT / repo_name / "src" / package_name / "06_upload"
+
+draws = rfc.draws
+
+# Jobmon setup
+user = getpass.getuser()
+
+log_dir = Path("/mnt/team/idd/pub/")
+log_dir.mkdir(parents=True, exist_ok=True)
+# Create directories for stdout and stderr
+stdout_dir = log_dir / "stdout"
+stderr_dir = log_dir / "stderr"
+stdout_dir.mkdir(parents=True, exist_ok=True)
+stderr_dir.mkdir(parents=True, exist_ok=True)
+
+# Project
+project = "proj_rapidresponse" # Adjust this to your project name if needed
+queue = 'all.q'
+
+wf_uuid = uuid.uuid4()
+tool_name = f"{package_name}_create_summaries_{wf_uuid}"
+tool = Tool(name=tool_name)
+
+# Create a workflow
+workflow = tool.create_workflow(
+    name=f"{tool_name}_workflow_{wf_uuid}",
+    max_concurrently_running=10000, # Adjust based on system capacity
+)
+
+# Compute resources
+workflow.set_default_compute_resources_from_dict(
+    cluster_name="slurm",
+    dictionary={
+        "memory": "15G",
+        "cores": 1,
+        "runtime": "60m",
+        "queue": queue,
+        "project": project,
+        "stdout": str(stdout_dir),
+        "stderr": str(stderr_dir),
+    }
+)
+
+memory = "100G"
+
+# Define the task template for processing each year batch
+task_template = tool.get_task_template(
+    template_name=template_name,
+    default_cluster_name="slurm",
+    default_compute_resources={
+        "memory": memory,
+        "cores": 10,
+        "runtime": "60m",
+        "queue": queue,
+        "project": project,
+        "stdout": str(stdout_dir),
+        "stderr": str(stderr_dir),
+    },
+    command_template=(
+        "python {script_root}/create_and_combine_as_draws.py "
+        "--cause {{cause}} "
+        "--ssp_scenario {{ssp_scenario}} "
+        "--dah_scenario {{dah_scenario}} "
+        "--measure {{measure}} "
+        "--hold_variable {{hold_variable}} "
+        "--run_date {{run_date}}"
+    ).format(script_root=SCRIPT_ROOT),
+    node_args=["cause", "ssp_scenario", "dah_scenario", "measure", "hold_variable", "run_date"],
+    task_args=[],
+    op_args=[],
+)
+
+
+tasks = []
+
+for cause in causes:
+    for ssp_scenario in ssp_scenarios:
+        for measure in ['mortality', 'incidence']:
+            if cause == "malaria":
+                for dah_scenario in dah_scenarios:
+                    # Create the primary task
+                    task = task_template.create_task(
+                        cause=cause,
+                        ssp_scenario=ssp_scenario,
+                        dah_scenario=dah_scenario,
+                        measure=measure,
+                        hold_variable='None',
+                        run_date=run_date,
+                    )
+                    tasks.append(task)
+            else:
+                # Create the primary task
+                task = task_template.create_task(
+                    cause=cause,
+                    ssp_scenario=ssp_scenario,
+                    dah_scenario='None',
+                    measure=measure,
+                    hold_variable='None',
+                    run_date=run_date,
+                )
+                tasks.append(task)
+if run_hold_variables:
+    for cause in causes:
+        for hold_variable in hold_variables[cause]:
+            for ssp_scenario in rfc.ssp_scenarios:
+                for measure in ['mortality', 'incidence']:
+                    if cause == "malaria":
+                        for dah_scenario in dah_scenarios:
+                            # Create the primary task
+                            task = task_template.create_task(
+                                cause=cause,
+                                ssp_scenario=ssp_scenario,
+                                dah_scenario=dah_scenario,
+                                measure=measure,
+                                hold_variable=hold_variable,
+                                run_date=run_date
+                            )
+                            tasks.append(task)
+                    else:
+                        # Create the primary task
+                        task = task_template.create_task(
+                            cause=cause,
+                            ssp_scenario=ssp_scenario,
+                            dah_scenario=None,
+                            measure=measure,
+                            hold_variable=hold_variable,
+                            run_date=run_date
+                        )
+                        tasks.append(task)
+
+print(f"Number of tasks: {len(tasks)}")
+
+if tasks:
+    workflow.add_tasks(tasks)
+    print("✅ Tasks successfully added to workflow.")
+else:
+    print("⚠️ No tasks added to workflow. Check task generation.")
+
+try:
+    workflow.bind()
+    print("✅ Workflow successfully bound.")
+    print(f"Running workflow with ID {workflow.workflow_id}.")
+    print("For full information see the Jobmon GUI:")
+    print(f"https://jobmon-gui.ihme.washington.edu/#/workflow/{workflow.workflow_id}")
+except Exception as e:
+    print(f"❌ Workflow binding failed: {e}")
+
+try:
+    status = workflow.run()
+    print(f"Workflow {workflow.workflow_id} completed with status {status}.")
+except Exception as e:
+    print(f"❌ Workflow submission failed: {e}")

src/idd_forecast_mbp/06_upload/06_make_mega_as_draws.ipynb

Lines changed: 68 additions & 9 deletions
@@ -2,7 +2,7 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "id": "cc3b5a3b",
    "metadata": {},
    "outputs": [],
@@ -26,7 +26,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "id": "409b3738",
    "metadata": {},
    "outputs": [],
@@ -37,7 +37,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "id": "172bf6bd",
    "metadata": {},
    "outputs": [],
@@ -53,10 +53,22 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "id": "fe636c87",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "ename": "NameError",
+     "evalue": "name 'ssp_scenario' is not defined",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[31m---------------------------------------------------------------------------\u001b[39m",
+      "\u001b[31mNameError\u001b[39m Traceback (most recent call last)",
+      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[5]\u001b[39m\u001b[32m, line 6\u001b[39m\n\u001b[32m 4\u001b[39m cause_map = rfc.cause_map\n\u001b[32m 5\u001b[39m ssp_scenarios = rfc.ssp_scenarios\n\u001b[32m----> \u001b[39m\u001b[32m6\u001b[39m scenario = ssp_scenarios[\u001b[43mssp_scenario\u001b[49m][\u001b[33m\"\u001b[39m\u001b[33mdhs_scenario\u001b[39m\u001b[33m\"\u001b[39m] \u001b[38;5;66;03m# is the DHS scenario name\u001b[39;00m\n",
+      "\u001b[31mNameError\u001b[39m: name 'ssp_scenario' is not defined"
+     ]
+    }
+   ],
    "source": [
     "ssp_draws = rfc.draws\n",
     "measure_map = rfc.measure_map\n",
@@ -68,10 +80,22 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "id": "a2156f97",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "ename": "NameError",
+     "evalue": "name 'cause' is not defined",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[31m---------------------------------------------------------------------------\u001b[39m",
+      "\u001b[31mNameError\u001b[39m Traceback (most recent call last)",
+      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[6]\u001b[39m\u001b[32m, line 1\u001b[39m\n\u001b[32m----> \u001b[39m\u001b[32m1\u001b[39m \u001b[38;5;28;01mif\u001b[39;00m \u001b[43mcause\u001b[49m == \u001b[33m\"\u001b[39m\u001b[33mmalaria\u001b[39m\u001b[33m\"\u001b[39m:\n\u001b[32m 2\u001b[39m \u001b[38;5;28;01mif\u001b[39;00m hold_variable == \u001b[33m'\u001b[39m\u001b[33mNone\u001b[39m\u001b[33m'\u001b[39m:\n\u001b[32m 3\u001b[39m processed_forecast_ds_path_template = \u001b[33m\"\u001b[39m\u001b[38;5;132;01m{UPLOAD_DATA_PATH}\u001b[39;00m\u001b[33m/full_as_\u001b[39m\u001b[38;5;132;01m{cause}\u001b[39;00m\u001b[33m_measure_\u001b[39m\u001b[38;5;132;01m{measure}\u001b[39;00m\u001b[33m_ssp_scenario_\u001b[39m\u001b[38;5;132;01m{ssp_scenario}\u001b[39;00m\u001b[33m_dah_scenario_\u001b[39m\u001b[38;5;132;01m{dah_scenario}\u001b[39;00m\u001b[33m_draw_\u001b[39m\u001b[38;5;132;01m{draw}\u001b[39;00m\u001b[33m_with_predictions.nc\u001b[39m\u001b[33m\"\u001b[39m\n",
+      "\u001b[31mNameError\u001b[39m: name 'cause' is not defined"
+     ]
+    }
+   ],
    "source": [
     "\n",
     "\n",
@@ -176,7 +200,28 @@
     "file_paths = [get_file_path(draw, cause, measure, ssp_scenario, dah_scenario, vaccinate, hold_variable) \n",
     " for draw in ssp_draws]\n",
     "\n",
-    "print(f\"Loading {len(file_paths)} files...\")\n",
+    "print(f\"Loading {len(file_paths)} files...\")\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "0540081a",
+   "metadata": {},
+   "outputs": [
+    {
+     "ename": "NameError",
+     "evalue": "name 'as_ds' is not defined",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[31m---------------------------------------------------------------------------\u001b[39m",
+      "\u001b[31mNameError\u001b[39m Traceback (most recent call last)",
+      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[1]\u001b[39m\u001b[32m, line 1\u001b[39m\n\u001b[32m----> \u001b[39m\u001b[32m1\u001b[39m \u001b[43mas_ds\u001b[49m\n",
+      "\u001b[31mNameError\u001b[39m: name 'as_ds' is not defined"
+     ]
+    }
+   ],
+   "source": [
     "\n",
     "# Open all files as a single dataset with lazy loading\n",
     "upload_ds = xr.open_mfdataset(\n",
@@ -290,8 +335,22 @@
   }
  ],
 "metadata": {
+  "kernelspec": {
+   "display_name": "forecast-mbp",
+   "language": "python",
+   "name": "python3"
+  },
  "language_info": {
-  "name": "python"
+  "codemirror_mode": {
+   "name": "ipython",
+   "version": 3
+  },
+  "file_extension": ".py",
+  "mimetype": "text/x-python",
+  "name": "python",
+  "nbconvert_exporter": "python",
+  "pygments_lexer": "ipython3",
+  "version": "3.12.9"
  }
 },
 "nbformat": 4,
