
Commit 47870d1

Add option to generate notebook of plots (#11)
* [COPILOT] refactor extraction code to separate module
* format
* [COPILOT] consolidate benchmark and phase configs.
* refactor extraction to create a 'configuration'
* remove unused imports
* fix method sig
* minor fixes
* cleanup
* add basic unit tests
* add back result summary columns
* make callpattern more ergonomic
* condense
* add cli for summarization
* [COPILOT] Add tests
* edits for readability
* change nan check to warning
* format
* add summarize run at the end of the run_benchmark loop
* [COPILOT] extract plotting functions to new module
* [COPILOT] refactor plots
* adjust so that we only create fractions for bottleneck patterns, which are defined in a particular way.
* make bottleneck patterns more strict
* [COPILOT] add nb generation
* adjust organization
* format
* remove duplicate param
* rename callpattern
* add line number to extraction
* add test to ensure we can select correct line
* use pipeline call as ex instead
* format
* updates
* format
1 parent a6bf25c commit 47870d1

File tree

7 files changed: +376 −47 lines


setup.py

Lines changed: 1 addition & 0 deletions
@@ -54,6 +54,7 @@
         "matplotlib",
         "seaborn",
         "scalene",
+        "nbformat>=5.0",
     ]

     setup_requires = ["setuptools_scm"]

src/vivarium_profiling/templates/__init__.py

Lines changed: 6 additions & 0 deletions
@@ -0,0 +1,6 @@
+"""Templates for vivarium_profiling."""
+
+from pathlib import Path
+
+TEMPLATES_DIR = Path(__file__).parent
+ANALYSIS_NOTEBOOK_TEMPLATE = TEMPLATES_DIR / "analysis_template.ipynb"

src/vivarium_profiling/templates/analysis_template.ipynb

Lines changed: 216 additions & 0 deletions
@@ -0,0 +1,216 @@
+{
+  "cells": [
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "072e8e0a",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "import matplotlib.pyplot as plt\n",
+        "from pathlib import Path\n",
+        "from vivarium_profiling.tools.extraction import ExtractionConfig\n",
+        "from vivarium_profiling.tools import plotting\n",
+        "\n",
+        "# Configure matplotlib for notebook\n",
+        "%matplotlib inline"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "b7058668",
+      "metadata": {},
+      "source": [
+        "## Load Data"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "9241f5cb",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load benchmark results\n",
+        "benchmark_results_path = Path(r\"{{BENCHMARK_RESULTS_PATH}}\")\n",
+        "summary_path = Path(r\"{{SUMMARY_PATH}}\")\n",
+        "\n",
+        "raw = pd.read_csv(benchmark_results_path)\n",
+        "summary = pd.read_csv(summary_path)\n",
+        "\n",
+        "# Load extraction config\n",
+        "config = ExtractionConfig()\n",
+        "\n",
+        "print(f\"Loaded {len(raw)} raw benchmark results\")\n",
+        "print(f\"Loaded {len(summary)} model summaries\")\n",
+        "print(f\"\\nRaw data shape: {raw.shape}\")\n",
+        "print(f\"Summary data shape: {summary.shape}\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "4c47df2b",
+      "metadata": {},
+      "source": [
+        "## Performance Analysis\n",
+        "\n",
+        "Overall runtime and memory usage comparison across models."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "22bb73fb",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "plotting.create_figures(\n",
+        "    summary,\n",
+        "    output_dir=None,\n",
+        "    chart_title=\"performance_analysis\",\n",
+        "    time_col=\"rt_s\",\n",
+        "    mem_col=\"mem_mb\",\n",
+        "    time_pdiff_col=\"rt_s_pdiff\",\n",
+        "    save=False\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "7e31e5f0",
+      "metadata": {},
+      "source": [
+        "## Phase Runtime Analysis\n",
+        "\n",
+        "Detailed analysis of individual simulation phases (setup, initialize_simulants, run, finalize, report)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "ee250c94",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Get phase metrics from config\n",
+        "phase_patterns = [p for p in config.patterns if p.cumtime_template == \"rt_{name}_s\"]\n",
+        "\n",
+        "for pattern in phase_patterns:\n",
+        "    time_col = pattern.cumtime_col\n",
+        "    time_pdiff_col = f\"{time_col}_pdiff\"\n",
+        "    \n",
+        "    print(f\"\\n=== {pattern.name.upper()} ===\")\n",
+        "    plotting.create_figures(\n",
+        "        summary,\n",
+        "        output_dir=None,\n",
+        "        chart_title=f\"runtime_analysis_{pattern.name}\",\n",
+        "        time_col=time_col,\n",
+        "        mem_col=None,\n",
+        "        time_pdiff_col=time_pdiff_col,\n",
+        "        save=False\n",
+        "    )"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "7f07476e",
+      "metadata": {},
+      "source": [
+        "## Non-Run Time Analysis\n",
+        "\n",
+        "Analysis of time spent outside the main run phase (setup, initialization, reporting, etc.)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "0bf6f0d7",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "plotting.create_figures(\n",
+        "    summary,\n",
+        "    output_dir=None,\n",
+        "    chart_title=\"runtime_analysis_non_run\",\n",
+        "    time_col=\"rt_non_run_s\",\n",
+        "    mem_col=None,\n",
+        "    time_pdiff_col=\"rt_non_run_s_pdiff\",\n",
+        "    save=False\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "aa16a06d",
+      "metadata": {},
+      "source": [
+        "## Bottleneck Cumulative Time Analysis\n",
+        "\n",
+        "Analysis of cumulative time spent in known bottleneck functions (gather_results, pipeline_call, population_get)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "691b5377",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Get bottleneck patterns from config\n",
+        "bottleneck_patterns = [\n",
+        "    p for p in config.patterns\n",
+        "    if p.extract_cumtime and p.cumtime_col == f\"{p.name}_cumtime\"\n",
+        "]\n",
+        "\n",
+        "for pattern in bottleneck_patterns:\n",
+        "    time_col = pattern.cumtime_col\n",
+        "    time_pdiff_col = f\"{time_col}_pdiff\"\n",
+        "    \n",
+        "    print(f\"\\n=== {pattern.name.upper()} ===\")\n",
+        "    plotting.create_figures(\n",
+        "        summary,\n",
+        "        output_dir=None,\n",
+        "        chart_title=f\"bottleneck_runtime_analysis_{pattern.name}\",\n",
+        "        time_col=time_col,\n",
+        "        mem_col=None,\n",
+        "        time_pdiff_col=time_pdiff_col,\n",
+        "        save=False\n",
+        "    )"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "4f267afb",
+      "metadata": {},
+      "source": [
+        "## Bottleneck Fractions vs Scale Factor\n",
+        "\n",
+        "Fraction of run() time spent in each bottleneck function, plotted against model scale factor."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "ddcc58f6",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "plotting.plot_bottleneck_fractions(\n",
+        "    summary,\n",
+        "    output_dir=None,\n",
+        "    config=config,\n",
+        "    metric=\"median\",\n",
+        "    save=False\n",
+        ")"
+      ]
+    }
+  ],
+  "metadata": {
+    "language_info": {
+      "name": "python"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}

src/vivarium_profiling/tools/cli.py

Lines changed: 13 additions & 1 deletion
@@ -293,10 +293,19 @@ def _expand_model_specs(model_patterns: list[str]) -> list[Path]:
     is_flag=True,
     help="Drop into python debugger if an error occurs.",
 )
+@click.option(
+    "--nb",
+    is_flag=True,
+    help=(
+        "Generate a Jupyter notebook for interactive analysis. "
+        "If summary.csv already exists, skip summary generation."
+    ),
+)
 def summarize(
     benchmark_results: str,
     verbose: int,
     with_debugger: bool,
+    nb: bool,
 ) -> None:
     """Summarize benchmark results and create visualizations.

@@ -311,10 +320,13 @@ def summarize(
     - bottleneck_runtime_analysis_*.png: Bottleneck cumtime charts
     - bottleneck_fraction_*.png: Bottleneck fraction scaling charts

+    If --nb is specified, also creates:
+    - analysis.ipynb: Interactive Jupyter notebook with all plots
+
     Example usage:
         summarize results/profile_2026_01_07/benchmark_results.csv
     """
     configure_logging_to_terminal(verbose)
     benchmark_results_path = Path(benchmark_results)
     main = handle_exceptions(run_summarize_analysis, logger, with_debugger=with_debugger)
-    main(benchmark_results_path)
+    main(benchmark_results_path, nb=nb)
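
For context, a rough sketch of how run_summarize_analysis could consume the new nb flag, based on the option's help text (reuse summary.csv when it already exists, then emit the notebook). The actual implementation is not part of this diff, and the import path for the new notebook module below is hypothetical:

    from pathlib import Path

    # Hypothetical module path; the new file's location is not shown in this diff.
    from vivarium_profiling.tools.notebook import NOTEBOOK_NAME, create_analysis_notebook


    def run_summarize_analysis(benchmark_results_path: Path, nb: bool = False) -> None:
        results_dir = benchmark_results_path.parent
        summary_path = results_dir / "summary.csv"

        # When --nb is passed and summary.csv already exists, skip regenerating it,
        # matching the behavior described in the CLI help text.
        if not (nb and summary_path.exists()):
            ...  # existing summarization + static chart generation (not shown here)

        if nb:
            create_analysis_notebook(
                benchmark_results_path=benchmark_results_path,
                summary_path=summary_path,
                output_path=results_dir / NOTEBOOK_NAME,
            )
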
Lines changed: 56 additions & 0 deletions
@@ -0,0 +1,56 @@
+"""Generate Jupyter notebooks for interactive benchmark analysis."""
+
+from pathlib import Path
+
+import nbformat as nbf
+from loguru import logger
+
+from vivarium_profiling.templates import ANALYSIS_NOTEBOOK_TEMPLATE
+
+NOTEBOOK_NAME = "analysis.ipynb"
+
+
+def create_analysis_notebook(
+    benchmark_results_path: Path,
+    summary_path: Path,
+    output_path: Path,
+) -> None:
+    """Create a Jupyter notebook for interactive benchmark analysis.
+
+    Loads a template notebook and substitutes file paths.
+
+    Parameters
+    ----------
+    benchmark_results_path
+        Path to benchmark_results.csv file.
+    summary_path
+        Path to summary.csv file.
+    output_path
+        Path where the notebook should be saved (e.g., analysis.ipynb).
+    config
+        Extraction configuration (currently unused, kept for API consistency).
+
+    """
+    # Define substitutions
+    substitutions = {
+        "{{BENCHMARK_RESULTS_PATH}}": str(benchmark_results_path),
+        "{{SUMMARY_PATH}}": str(summary_path),
+    }
+
+    # Load template
+    with open(ANALYSIS_NOTEBOOK_TEMPLATE) as f:
+        nb = nbf.read(f, as_version=4)
+
+    # Apply substitutions to all code cells
+    for cell in nb.cells:
+        if cell.cell_type == "code":
+            source = cell.source
+            for placeholder, value in substitutions.items():
+                source = source.replace(placeholder, value)
+            cell.source = source
+
+    # Save the notebook
+    with open(output_path, "w") as f:
+        nbf.write(nb, f)
+
+    logger.info(f"Created analysis notebook: {output_path}")
