NVIDIA
diff --git a/sub-packages/bionemo-moco/examples/entropic_time_scheduler_tutorial_cfm.ipynb b/sub-packages/bionemo-moco/examples/entropic_time_scheduler_tutorial_cfm.ipynb
Lines changed: 49 additions & 46 deletions
@@ -34,10 +34,8 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import torch \n",
-    "import math\n",
-    "import numpy as np \n",
     "import matplotlib.pyplot as plt\n",
+    "import torch\n",
     "from sklearn.datasets import make_moons"
    ]
   },
@@ -126,6 +124,8 @@
    ],
    "source": [
     "normalize = True\n",
+    "\n",
+    "\n",
     "def sample_moons(n, normalize=False):\n",
     "    x1, _ = make_moons(n_samples=n, noise=0.05)\n",
     "    x1 = torch.Tensor(x1)\n",
@@ -134,6 +134,7 @@
     "        x1 = (x1 - x1.mean(0)) / x1.std(0) * 2\n",
     "    return x1\n",
     "\n",
+    "\n",
     "x1 = sample_moons(1000)\n",
     "plt.scatter(x1[:, 0], x1[:, 1])"
    ]
@@ -211,11 +212,10 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import torch\n",
     "import matplotlib.pyplot as plt\n",
-    "from bionemo.moco.schedules.inference_time_schedules import (\n",
-    "    LinearInferenceSchedule, TimeDirection\n",
-    ")"
+    "import torch\n",
+    "\n",
+    "from bionemo.moco.schedules.inference_time_schedules import LinearInferenceSchedule, TimeDirection"
    ]
   },
   {
@@ -245,12 +245,13 @@
    "source": [
     "%%time\n",
     "# ---------- parameters ----------\n",
-    "dim           = 2\n",
-    "shape         = (batch_size, dim)\n",
-    "_FLOW_STEPS   = 100           # number of steps\n",
-    "display_int   = 10            # show every n-th step\n",
+    "dim = 2\n",
+    "shape = (batch_size, dim)\n",
+    "_FLOW_STEPS = 100  # number of steps\n",
+    "display_int = 10  # show every n-th step\n",
     "# --------------------------------\n",
     "\n",
+    "\n",
     "def square_centre_limits(ax, pts, pad_frac: float = 0.05):\n",
     "    \"\"\"Make the axes square and centred on the data.\n",
     "\n",
@@ -261,18 +262,16 @@
     "    \"\"\"\n",
     "    x, y = pts[:, 0], pts[:, 1]\n",
     "    x_mid, y_mid = (x.max() + x.min()) / 2, (y.max() + y.min()) / 2\n",
-    "    half_range   = max(x.max() - x.min(), y.max() - y.min()) / 2\n",
-    "    half_range  *= (1 + pad_frac)          # add a small margin\n",
+    "    half_range = max(x.max() - x.min(), y.max() - y.min()) / 2\n",
+    "    half_range *= 1 + pad_frac  # add a small margin\n",
     "    ax.set_xlim(x_mid - half_range, x_mid + half_range)\n",
     "    ax.set_ylim(y_mid - half_range, y_mid + half_range)\n",
     "\n",
+    "\n",
     "# define schedule\n",
-    "inference_sched = LinearInferenceSchedule(\n",
-    "    nsteps=_FLOW_STEPS,\n",
-    "    direction=TimeDirection.UNIFIED\n",
-    ")\n",
-    "schedule = inference_sched.generate_schedule().to(DEVICE)   # len = _FLOW_STEPS\n",
-    "dts      = inference_sched.discretize().to(DEVICE)          # len = _FLOW_STEPS\n",
+    "inference_sched = LinearInferenceSchedule(nsteps=_FLOW_STEPS, direction=TimeDirection.UNIFIED)\n",
+    "schedule = inference_sched.generate_schedule().to(DEVICE)  # len = _FLOW_STEPS\n",
+    "dts = inference_sched.discretize().to(DEVICE)  # len = _FLOW_STEPS\n",
     "\n",
     "# always show t=0 and t=1\n",
     "display_indices = sorted(set(range(0, _FLOW_STEPS + 1, display_int)) | {0, _FLOW_STEPS})\n",
@@ -281,22 +280,23 @@
     "with torch.no_grad():\n",
     "    # start from the prior used in training\n",
     "    x = cfm.sample_prior(shape).to(DEVICE)\n",
-    "    \n",
+    "\n",
     "    fig, axes = plt.subplots(1, n_plots, figsize=(4 * n_plots, 4))\n",
     "    for ax in axes:\n",
-    "        ax.set_aspect('equal', 'box')\n",
-    "        ax.set_xticks([]); ax.set_yticks([])\n",
+    "        ax.set_aspect(\"equal\", \"box\")\n",
+    "        ax.set_xticks([])\n",
+    "        ax.set_yticks([])\n",
     "\n",
     "    plot_idx = 0\n",
     "    axes[plot_idx].scatter(x[:, 0].cpu(), x[:, 1].cpu(), s=2)\n",
-    "    axes[plot_idx].set_title('t = 0.00')\n",
+    "    axes[plot_idx].set_title(\"t = 0.00\")\n",
     "    square_centre_limits(axes[plot_idx], x.cpu())\n",
     "\n",
     "    # sampling loop\n",
     "    for step, (dt, t) in enumerate(zip(dts, schedule)):\n",
     "        full_t = inference_sched.pad_time(batch_size, t, device=DEVICE)\n",
-    "        v_t    = model(torch.cat([x, full_t[:, None]], dim=-1))\n",
-    "        x      = cfm.step(v_t, x, dt, t=full_t)\n",
+    "        v_t = model(torch.cat([x, full_t[:, None]], dim=-1))\n",
+    "        x = cfm.step(v_t, x, dt, t=full_t)\n",
     "\n",
     "        # time after the step (always exists, even at the very end)\n",
     "        t_next = (t + dt).item()\n",
@@ -305,11 +305,11 @@
     "            plot_idx += 1\n",
     "            ax = axes[plot_idx]\n",
     "            ax.scatter(x[:, 0].cpu(), x[:, 1].cpu(), s=2)\n",
-    "            ax.set_title(f't = {t_next:.2f}')\n",
+    "            ax.set_title(f\"t = {t_next:.2f}\")\n",
     "            square_centre_limits(ax, x.cpu())\n",
     "\n",
     "plt.tight_layout(pad=0.8)\n",
-    "plt.show()\n"
+    "plt.show()"
    ]
   },
   {
@@ -325,12 +325,11 @@
    "metadata": {},
    "outputs": [],
    "source": [
+    "import matplotlib.pyplot as plt\n",
     "import torch\n",
     "from torch import Tensor\n",
-    "import matplotlib.pyplot as plt\n",
-    "from bionemo.moco.schedules.inference_time_schedules import (\n",
-    "    EntropicInferenceSchedule, TimeDirection\n",
-    ")"
+    "\n",
+    "from bionemo.moco.schedules.inference_time_schedules import EntropicInferenceSchedule, TimeDirection"
    ]
   },
   {
@@ -367,10 +366,11 @@
    ],
    "source": [
     "%%time\n",
-    "_FLOW_STEPS   = 100\n",
-    "display_int   = 10 # controls every \"n\" steps to display\n",
+    "_FLOW_STEPS = 100\n",
+    "display_int = 10  # controls every \"n\" steps to display\n",
     "shape = (batch_size, dim)\n",
     "\n",
+    "\n",
     "# Predictor function wrapper.\n",
     "# The scheduler needs a function `model(t, x)` and this wrapper handles the formatting.\n",
     "def predictor_fn(t: Tensor, x: Tensor) -> Tensor:\n",
@@ -379,62 +379,65 @@
     "        t = t.unsqueeze(-1)\n",
     "    if t.shape[0] != x.shape[0]:\n",
     "        t = t.expand(x.shape[0], -1)\n",
-    "    \n",
+    "\n",
     "    model_input = torch.cat([x, t], dim=-1)\n",
     "    return model(model_input)\n",
     "\n",
+    "\n",
     "def x_0_sampler_fn(n_samples: int) -> Tensor:\n",
     "    return cfm.sample_prior((n_samples, dim))\n",
     "\n",
+    "\n",
     "def x_1_sampler_fn(n_samples: int) -> Tensor:\n",
     "    return sample_moons(n_samples)\n",
     "\n",
+    "\n",
     "inference_sched = EntropicInferenceSchedule(\n",
     "    predictor=predictor_fn,\n",
     "    x_0_sampler=x_0_sampler_fn,\n",
     "    x_1_sampler=x_1_sampler_fn,\n",
     "    nsteps=_FLOW_STEPS,\n",
-    "    n_approx_entropy_points=30,      # More points -> more accurate schedule, but slower to generate\n",
+    "    n_approx_entropy_points=30,  # More points -> more accurate schedule, but slower to generate\n",
     "    batch_size=batch_size,\n",
     "    direction=TimeDirection.UNIFIED,\n",
     "    device=DEVICE,\n",
     ")\n",
     "print(\"Generating entropic schedule...\")\n",
-    "schedule = inference_sched.generate_schedule().to(DEVICE)  \n",
-    "dts      = inference_sched.discretize().to(DEVICE)\n",
+    "schedule = inference_sched.generate_schedule().to(DEVICE)\n",
+    "dts = inference_sched.discretize().to(DEVICE)\n",
     "print(\"Schedule generated.\")\n",
     "\n",
     "display_indices = sorted(set(range(0, _FLOW_STEPS + 1, display_int)) | {0, _FLOW_STEPS})\n",
     "n_plots = len(display_indices)\n",
     "\n",
     "with torch.no_grad():\n",
-    "\n",
     "    x = cfm.sample_prior((batch_size, dim)).to(DEVICE)\n",
     "\n",
     "    fig, axes = plt.subplots(1, n_plots, figsize=(4 * n_plots, 4))\n",
     "    for ax in axes:\n",
-    "        ax.set_aspect('equal', 'box')\n",
-    "        ax.set_xticks([]); ax.set_yticks([])\n",
+    "        ax.set_aspect(\"equal\", \"box\")\n",
+    "        ax.set_xticks([])\n",
+    "        ax.set_yticks([])\n",
     "\n",
     "    plot_idx = 0\n",
     "    axes[plot_idx].scatter(x[:, 0].cpu(), x[:, 1].cpu(), s=2)\n",
-    "    axes[plot_idx].set_title('t = 0.00')\n",
-    "    square_centre_limits(axes[plot_idx], x.cpu()) \n",
+    "    axes[plot_idx].set_title(\"t = 0.00\")\n",
+    "    square_centre_limits(axes[plot_idx], x.cpu())\n",
     "\n",
     "    # integration loop & viz\n",
     "    for step, (dt, t) in enumerate(zip(dts, schedule)):\n",
     "        full_t = inference_sched.pad_time(batch_size, t, device=DEVICE)\n",
-    "        v_t    = model(torch.cat([x, full_t[:, None]], dim=-1))\n",
-    "        x      = cfm.step(v_t, x, dt, t=full_t)\n",
+    "        v_t = model(torch.cat([x, full_t[:, None]], dim=-1))\n",
+    "        x = cfm.step(v_t, x, dt, t=full_t)\n",
     "\n",
     "        t_next = (t + dt).item()\n",
     "\n",
     "        if (step + 1) in display_indices:\n",
     "            plot_idx += 1\n",
     "            ax = axes[plot_idx]\n",
     "            ax.scatter(x[:, 0].cpu(), x[:, 1].cpu(), s=2)\n",
-    "            ax.set_title(f't = {t_next:.2f}')\n",
-    "            square_centre_limits(ax, x.cpu()) \n",
+    "            ax.set_title(f\"t = {t_next:.2f}\")\n",
+    "            square_centre_limits(ax, x.cpu())\n",
     "\n",
     "plt.tight_layout(pad=0.8)\n",
     "plt.show()"