Skip to content

Commit 1a669a4

Browse files
authored
Merge pull request #46 from alan-turing-institute/45-encoder-decoder
- Add U-Net (#5) - Add trainable encoder-decoder (#45) - Add tensor type hints (#47)
2 parents f5dfad9 + 59a4c4b commit 1a669a4

35 files changed

Lines changed: 2940 additions & 174 deletions

notebooks/00_exploration.ipynb

Lines changed: 18 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717
"source": [
1818
"### Example dataset\n",
1919
"\n",
20-
"We use the `AdvectionDiffusion` dataset as an example dataset to illustrate training and evaluation of models. This dataset simulates the advection-diffusion equation in 2D."
20+
"We use the `AdvectionDiffusion` dataset as an example dataset to illustrate training and evaluation of models. This dataset simulates the advection-diffusion equation in 2D.\n"
2121
]
2222
},
2323
{
@@ -27,12 +27,12 @@
2727
"metadata": {},
2828
"outputs": [],
2929
"source": [
30-
"\n",
31-
"from autoemulate.simulations.reaction_diffusion import ReactionDiffusion as Sim\n",
30+
"from autoemulate.simulations.advection_diffusion import AdvectionDiffusion as Sim\n",
3231
"\n",
3332
"sim = Sim(return_timeseries=True, log_level=\"error\")\n",
3433
"\n",
35-
"def generate_split(simulator: Sim, n_train: int = 1, n_valid: int = 1, n_test: int = 1):\n",
34+
"\n",
35+
"def generate_split(simulator: Sim, n_train: int = 10, n_valid: int = 2, n_test: int = 2):\n",
3636
" \"\"\"Generate training, validation, and test splits from the simulator.\"\"\"\n",
3737
" train = simulator.forward_samples_spatiotemporal(n_train)\n",
3838
" valid = simulator.forward_samples_spatiotemporal(n_valid)\n",
@@ -63,7 +63,11 @@
6363
"n_steps_input = 4\n",
6464
"n_steps_output = 1\n",
6565
"datamodule = SpatioTemporalDataModule(\n",
66-
" data=combined_data, data_path=None, n_steps_input=n_steps_input, n_steps_output=n_steps_output, batch_size=16\n",
66+
" data=combined_data,\n",
67+
" data_path=None,\n",
68+
" n_steps_input=n_steps_input,\n",
69+
" n_steps_output=n_steps_output,\n",
70+
" batch_size=16,\n",
6771
")"
6872
]
6973
},
@@ -112,7 +116,9 @@
112116
"decoder = ChannelsLast(output_channels=n_channels, time_steps=n_steps_output)\n",
113117
"\n",
114118
"model = EncoderProcessorDecoder.from_encoder_processor_decoder(\n",
115-
" encoder_decoder=EncoderDecoder(encoder=encoder, decoder=decoder),\n",
119+
" encoder_decoder=EncoderDecoder.from_encoder_decoder(\n",
120+
" encoder=encoder, decoder=decoder\n",
121+
" ),\n",
116122
" processor=processor,\n",
117123
")"
118124
]
@@ -144,8 +150,8 @@
144150
"source": [
145151
"import lightning as L\n",
146152
"\n",
147-
"# device = \"mps\" # \"cpu\"\n",
148-
"device = \"cpu\"\n",
153+
"device = \"mps\" # \"cpu\"\n",
154+
"# device = \"cpu\"\n",
149155
"trainer = L.Trainer(max_epochs=1, accelerator=device, log_every_n_steps=10)\n",
150156
"trainer.fit(model, datamodule.train_dataloader(), datamodule.val_dataloader())"
151157
]
@@ -155,7 +161,7 @@
155161
"id": "11",
156162
"metadata": {},
157163
"source": [
158-
"### Run the evaluation"
164+
"### Run the evaluation\n"
159165
]
160166
},
161167
{
@@ -173,7 +179,7 @@
173179
"id": "13",
174180
"metadata": {},
175181
"source": [
176-
"### Example rollout"
182+
"### Example rollout\n"
177183
]
178184
},
179185
{
@@ -208,7 +214,7 @@
208214
"outputs": [],
209215
"source": [
210216
"# Run rollout on one trajectory\n",
211-
"preds, trues = model.rollout(batch)"
217+
"preds, trues = model.rollout(batch, free_running_only=True)"
212218
]
213219
},
214220
{
@@ -228,6 +234,7 @@
228234
"metadata": {},
229235
"outputs": [],
230236
"source": [
237+
"assert trues is not None\n",
231238
"print(trues.shape)\n"
232239
]
233240
}

notebooks/01_encoder_decoder.ipynb

Lines changed: 181 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,181 @@
1+
{
2+
"cells": [
3+
{
4+
"cell_type": "code",
5+
"execution_count": null,
6+
"id": "0",
7+
"metadata": {},
8+
"outputs": [],
9+
"source": [
10+
"# from autoemulate.simulations.advection_diffusion import AdvectionDiffusion\n",
11+
"from autoemulate.simulations.reaction_diffusion import ReactionDiffusion as Sim\n",
12+
"\n",
13+
"sim = Sim(return_timeseries=True, log_level=\"error\")\n",
14+
"\n",
15+
"\n",
16+
"def generate_split(simulator: Sim, n_train: int = 4, n_valid: int = 2, n_test: int = 2):\n",
17+
" \"\"\"Generate training, validation, and test splits from the simulator.\"\"\"\n",
18+
" train = simulator.forward_samples_spatiotemporal(n_train)\n",
19+
" valid = simulator.forward_samples_spatiotemporal(n_valid)\n",
20+
" test = simulator.forward_samples_spatiotemporal(n_test)\n",
21+
" return {\"train\": train, \"valid\": valid, \"test\": test}\n",
22+
"\n",
23+
"\n",
24+
"combined_data = generate_split(sim)"
25+
]
26+
},
27+
{
28+
"cell_type": "code",
29+
"execution_count": null,
30+
"id": "1",
31+
"metadata": {},
32+
"outputs": [],
33+
"source": [
34+
"from auto_cast.data.datamodule import SpatioTemporalDataModule\n",
35+
"\n",
36+
"datamodule = SpatioTemporalDataModule(\n",
37+
" data=combined_data,\n",
38+
" data_path=None,\n",
39+
" n_steps_input=1,\n",
40+
" n_steps_output=0,\n",
41+
" batch_size=16,\n",
42+
" autoencoder_mode=True,\n",
43+
")"
44+
]
45+
},
46+
{
47+
"cell_type": "code",
48+
"execution_count": null,
49+
"id": "2",
50+
"metadata": {},
51+
"outputs": [],
52+
"source": [
53+
"batch = next(iter(datamodule.train_dataloader()))\n"
54+
]
55+
},
56+
{
57+
"cell_type": "code",
58+
"execution_count": null,
59+
"id": "3",
60+
"metadata": {},
61+
"outputs": [],
62+
"source": [
63+
"# Check input field shape: batch of single frames with two channels\n",
64+
"batch.input_fields.shape"
65+
]
66+
},
67+
{
68+
"cell_type": "code",
69+
"execution_count": null,
70+
"id": "4",
71+
"metadata": {},
72+
"outputs": [],
73+
"source": [
74+
"import torch\n",
75+
"\n",
76+
"torch.allclose(batch.input_fields, batch.output_fields)\n"
77+
]
78+
},
79+
{
80+
"cell_type": "code",
81+
"execution_count": null,
82+
"id": "5",
83+
"metadata": {},
84+
"outputs": [],
85+
"source": [
86+
"from auto_cast.decoders.dc import DCDecoder\n",
87+
"from auto_cast.encoders.dc import DCEncoder\n",
88+
"from auto_cast.models.ae import AE\n",
89+
"\n",
90+
"channels = batch.input_fields.shape[-1]\n",
91+
"\n",
92+
"encoder = DCEncoder(\n",
93+
" in_channels=channels,\n",
94+
" out_channels=16,\n",
95+
" hid_channels=(32, 64),\n",
96+
" spatial=2,\n",
97+
" hid_blocks=(2, 2),\n",
98+
" pixel_shuffle=False,\n",
99+
")\n",
100+
"\n",
101+
"decoder = DCDecoder(\n",
102+
" in_channels=16,\n",
103+
" out_channels=channels,\n",
104+
" hid_channels=(64, 32),\n",
105+
" spatial=2,\n",
106+
" hid_blocks=(2, 2),\n",
107+
" pixel_shuffle=False,\n",
108+
")\n",
109+
"model = AE(encoder=encoder, decoder=decoder)"
110+
]
111+
},
112+
{
113+
"cell_type": "code",
114+
"execution_count": null,
115+
"id": "6",
116+
"metadata": {},
117+
"outputs": [],
118+
"source": [
119+
"import lightning as L\n",
120+
"\n",
121+
"device = \"mps\" # \"cpu\"\n",
122+
"trainer = L.Trainer(max_epochs=5, accelerator=device, log_every_n_steps=10)\n",
123+
"trainer.fit(model, datamodule.train_dataloader(), datamodule.val_dataloader())"
124+
]
125+
},
126+
{
127+
"cell_type": "code",
128+
"execution_count": null,
129+
"id": "7",
130+
"metadata": {},
131+
"outputs": [],
132+
"source": [
133+
"import matplotlib.pyplot as plt\n",
134+
"\n",
135+
"for idx, batch in enumerate(datamodule.test_dataloader()):\n",
136+
" inputs = batch.input_fields.to(device)\n",
137+
" outputs, latents = model.forward_with_latent(batch)\n",
138+
" print(\"Input shape:\", inputs.shape)\n",
139+
" print(\"Output shape:\", outputs.shape)\n",
140+
" print(\"Latent shape:\", latents.shape)\n",
141+
" fig, axs = plt.subplots(1, 4, figsize=(8, 4))\n",
142+
" axs[0].imshow(inputs[0, 0, :, :, 0].cpu().numpy(), cmap=\"viridis\")\n",
143+
" axs[0].set_title(\"Input\")\n",
144+
" axs[1].imshow(outputs[0, 0, :, :, 0].detach().cpu().numpy(), cmap=\"viridis\")\n",
145+
" axs[1].set_title(\"Reconstruction\")\n",
146+
" axs[2].imshow(\n",
147+
" outputs[0, 0, :, :, 0].detach().cpu().numpy()\n",
148+
" - inputs[0, 0, :, :, 0].cpu().numpy(),\n",
149+
" cmap=\"viridis\",\n",
150+
" )\n",
151+
" axs[2].set_title(\"Difference\")\n",
152+
" axs[3].imshow(latents[0, 0, :, :, 0].detach().cpu().numpy(), cmap=\"viridis\")\n",
153+
" axs[3].set_title(f\"Latent dim {0}\")\n",
154+
" plt.show()\n",
155+
" if idx >= 3:\n",
156+
" break"
157+
]
158+
}
159+
],
160+
"metadata": {
161+
"kernelspec": {
162+
"display_name": ".venv",
163+
"language": "python",
164+
"name": "python3"
165+
},
166+
"language_info": {
167+
"codemirror_mode": {
168+
"name": "ipython",
169+
"version": 3
170+
},
171+
"file_extension": ".py",
172+
"mimetype": "text/x-python",
173+
"name": "python",
174+
"nbconvert_exporter": "python",
175+
"pygments_lexer": "ipython3",
176+
"version": "3.12.12"
177+
}
178+
},
179+
"nbformat": 4,
180+
"nbformat_minor": 5
181+
}

pyproject.toml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,8 +9,10 @@ authors = [
99
requires-python = ">=3.11,<3.13"
1010
dependencies = [
1111
"autoemulate>=1.2.0",
12+
"azula>=0.7.0",
1213
"einops>=0.8.1",
1314
"h5py>=3.15.1",
15+
"jaxtyping>=0.3.3",
1416
"lightning>=2.5.6",
1517
"neuraloperator>=2.0.0",
1618
"the-well>=1.1.0",
@@ -19,6 +21,7 @@ dependencies = [
1921

2022
[project.optional-dependencies]
2123
dev = [
24+
"beartype>=0.22.8",
2225
"ipykernel>=7.1.0",
2326
"pytest>=9.0.1",
2427
"pytest-cov>=7.0.0",

src/auto_cast/__init__.py

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,6 @@
1-
def main() -> None: # noqa: D103
2-
print("Hello from auto-cast!")
1+
import os
2+
3+
if os.getenv("RUNTIME_TYPECHECKING", "True").lower() in ["1", "true"]:
4+
from beartype.claw import beartype_this_package
5+
6+
beartype_this_package()

0 commit comments

Comments
 (0)