Add exploration notebook but with diffusion

sgreenbury · sgreenbury · commit d3c48c82292a · 2025-12-09T17:28:37.000Z
diff --git a/notebooks/00_01_exploration_diffusion_reaction.ipynb b/notebooks/00_01_exploration_diffusion_reaction.ipynb
@@ -0,0 +1,340 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "0",
+   "metadata": {},
+   "source": [
+    "## AutoCast encoder-processor-decoder model API Exploration\n",
+    "\n",
+    "This notebook explores the end-to-end API, using a diffusion-based processor (`DiffusionProcessor`).\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "1",
+   "metadata": {},
+   "source": [
+    "### Example dataset\n",
+    "\n",
+    "We use a simulated dataset to illustrate training and evaluation of models. The simulator is chosen by `simulation_name` in the next cell: `ReactionDiffusion` by default, or `AdvectionDiffusion`, which simulates the advection-diffusion equation in 2D.\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "2",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import pickle\n",
+    "from pathlib import Path\n",
+    "\n",
+    "from autoemulate.simulations.advection_diffusion import AdvectionDiffusion\n",
+    "from autoemulate.simulations.reaction_diffusion import ReactionDiffusion\n",
+    "\n",
+    "simulation_name = \"reaction_diffusion\"\n",
+    "\n",
+    "Sim = (\n",
+    "    ReactionDiffusion if simulation_name == \"reaction_diffusion\" else AdvectionDiffusion\n",
+    ")\n",
+    "sim = Sim(return_timeseries=True, log_level=\"error\")\n",
+    "\n",
+    "\n",
+    "def generate_split(simulator, n_train: int = 50, n_valid: int = 2, n_test: int = 2):\n",
+    "    \"\"\"Generate training, validation, and test splits from the simulator.\"\"\"\n",
+    "    train = simulator.forward_samples_spatiotemporal(n_train)\n",
+    "    valid = simulator.forward_samples_spatiotemporal(n_valid)\n",
+    "    test = simulator.forward_samples_spatiotemporal(n_test)\n",
+    "    return {\"train\": train, \"valid\": valid, \"test\": test}\n",
+    "\n",
+    "\n",
+    "# Cache file path\n",
+    "cache_file = Path(f\"{simulation_name}_cache.pkl\")\n",
+    "\n",
+    "# Load from cache if it exists, otherwise generate and save\n",
+    "if cache_file.exists():\n",
+    "    print(f\"Loading cached simulation data from {cache_file}\")\n",
+    "    with open(cache_file, \"rb\") as f:\n",
+    "        combined_data = pickle.load(f)\n",
+    "else:\n",
+    "    print(\"Generating simulation data...\")\n",
+    "    combined_data = generate_split(sim)\n",
+    "    print(f\"Saving simulation data to {cache_file}\")\n",
+    "    with open(cache_file, \"wb\") as f:\n",
+    "        pickle.dump(combined_data, f)\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3",
+   "metadata": {},
+   "source": [
+    "### Read combined data into datamodule\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from auto_cast.data.datamodule import SpatioTemporalDataModule\n",
+    "\n",
+    "# Window configuration for the datamodule; the model cell below reuses these names.\n",
+    "n_steps_input = 1\n",
+    "n_steps_output = 4\n",
+    "# Derive the stride from n_steps_output instead of repeating the literal, so the\n",
+    "# value passed to the datamodule here and the `stride` the model cell reads cannot\n",
+    "# drift apart when n_steps_output is changed.\n",
+    "stride = n_steps_output\n",
+    "datamodule = SpatioTemporalDataModule(\n",
+    "    data=combined_data,\n",
+    "    data_path=None,\n",
+    "    n_steps_input=n_steps_input,\n",
+    "    n_steps_output=n_steps_output,\n",
+    "    stride=stride,\n",
+    "    batch_size=16,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "5",
+   "metadata": {},
+   "source": [
+    "### Example batch\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "6",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "batch = next(iter(datamodule.train_dataloader()))\n",
+    "\n",
+    "# batch"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "7",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from azula.noise import VPSchedule\n",
+    "\n",
+    "from auto_cast.decoders.identity import IdentityDecoder\n",
+    "from auto_cast.encoders.identity import IdentityEncoder\n",
+    "from auto_cast.models.encoder_decoder import EncoderDecoder\n",
+    "from auto_cast.models.encoder_processor_decoder import EPDTrainProcessor\n",
+    "from auto_cast.nn.unet import TemporalUNetBackbone\n",
+    "from auto_cast.processors.diffusion import DiffusionProcessor\n",
+    "\n",
+    "# from auto_cast.processors.fno import FNOProcessor\n",
+    "\n",
+    "batch = next(iter(datamodule.train_dataloader()))\n",
+    "n_channels = batch.input_fields.shape[-1]\n",
+    "# processor = FNOProcessor(\n",
+    "#     in_channels=n_channels * n_steps_input,\n",
+    "#     out_channels=n_channels * n_steps_output,\n",
+    "#     n_modes=(16, 16),\n",
+    "#     hidden_channels=64,\n",
+    "#     stride=n_steps_output,\n",
+    "#     max_rollout_steps=100,\n",
+    "# )\n",
+    "processor = DiffusionProcessor(\n",
+    "    backbone=TemporalUNetBackbone(\n",
+    "        in_channels=n_channels * n_steps_output,\n",
+    "        out_channels=n_channels * n_steps_output,\n",
+    "        cond_channels=n_channels * n_steps_input,\n",
+    "        mod_features=256,\n",
+    "        hid_channels=(32, 64, 128),\n",
+    "        hid_blocks=(2, 2, 2),\n",
+    "        spatial=2,\n",
+    "        periodic=False,\n",
+    "    ),\n",
+    "    schedule=VPSchedule(),\n",
+    "    n_steps_output=n_steps_output,\n",
+    "    n_channels_out=n_channels,\n",
+    "    stride=n_steps_output\n",
+    ")\n",
+    "# encoder = PermuteConcat(with_constants=False)\n",
+    "# decoder = ChannelsLast(output_channels=n_channels, time_steps=n_steps_output)\n",
+    "\n",
+    "encoder = IdentityEncoder()\n",
+    "decoder = IdentityDecoder()\n",
+    "model = EPDTrainProcessor(\n",
+    "    encoder_decoder=EncoderDecoder(encoder=encoder, decoder=decoder),\n",
+    "    processor=processor,\n",
+    "    stride=stride,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "8",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "model(batch).shape"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "9",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "dl = datamodule.train_dataloader()\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "10",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "batch.input_fields.shape[0]*len(dl)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "11",
+   "metadata": {},
+   "source": [
+    "### Run trainer\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "12",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import lightning as L\n",
+    "\n",
+    "# \"auto\" lets Lightning choose an available accelerator, so the notebook is not tied\n",
+    "# to Apple-silicon (\"mps\") hardware; set \"mps\", \"cuda\" or \"cpu\" to force one.\n",
+    "device = \"auto\"\n",
+    "trainer = L.Trainer(max_epochs=3, accelerator=device, log_every_n_steps=10)\n",
+    "trainer.fit(model, datamodule.train_dataloader(), datamodule.val_dataloader())"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "13",
+   "metadata": {},
+   "source": [
+    "### Run the evaluation\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "14",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "trainer.test(model, datamodule.test_dataloader())"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "15",
+   "metadata": {},
+   "source": [
+    "### Example rollout\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "16",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# A single element is the full trajectory\n",
+    "batch = next(iter(datamodule.rollout_test_dataloader()))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "17",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# First n_steps_input are inputs\n",
+    "print(batch.input_fields.shape)\n",
+    "# Remaining n_steps_output are outputs\n",
+    "print(batch.output_fields.shape)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "18",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Run rollout on one trajectory\n",
+    "preds, trues = model.rollout(batch, free_running_only=True)\n",
+    "\n",
+    "print(preds.shape)\n",
+    "assert trues is not None\n",
+    "print(trues.shape)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "19",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from IPython.display import HTML\n",
+    "\n",
+    "from auto_cast.utils import plot_spatiotemporal_video\n",
+    "\n",
+    "anim = plot_spatiotemporal_video(\n",
+    "    pred=preds,\n",
+    "    true=trues,\n",
+    ")\n",
+    "HTML(anim.to_jshtml())"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "20",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.12"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}