diff --git a/flake.nix b/flake.nix
index 960b841e4..6d6deda94 100644
--- a/flake.nix
+++ b/flake.nix
@@ -57,6 +57,11 @@
       inputs.nixpkgs.follows = "nixpkgs";
     };
 
+    # Provides only `room-server` for images/dev/symphony-codex (through
+    # `pkgs.symphony-room-server` in lib/overlay.nix). The Elixir runtime
+    # itself lives in packages/symphony now; room-server's source moved to
+    # the ix monorepo, so this pin stays on the last symphony rev that still
+    # builds it and retires once the image's room-server seam moves too.
     symphony = {
       url = "github:indexable-inc/symphony/main";
       inputs.nixpkgs.follows = "nixpkgs";
diff --git a/lib/per-system.nix b/lib/per-system.nix
index ab650f8d4..473d9531d 100644
--- a/lib/per-system.nix
+++ b/lib/per-system.nix
@@ -633,6 +633,11 @@ let
               printf '%s\n' '${forced}' > "$out"
             '';
           run-records-session = repoPackages.run.passthru.tests.recordsSession;
+          # Symphony's required quality lane (compile -Werror, mix format,
+          # credo, mix test) as a sandboxed derivation; see
+          # packages/symphony/default.nix. The advisory lane (dialyzer,
+          # sobelow, deps.audit) stays a local `mix quality` run.
+          symphony-elixir = repoPackages.symphony.passthru.tests.elixir;
           # Deterministic alloc-count gate for indexbench: runs the counting-
           # allocator demo bench once through `indexbench assert` and fails if its
           # allocation count exceeds the declared budget. Reproducible, unlike
@@ -809,5 +814,19 @@ in
         pkgs.jemalloc
       ];
     };
+
+    # Dev loop for packages/symphony: the Elixir/OTP pairing the runtime pins
+    # (1.19 on 28) plus the host tools bin/run-nix expects. codex is the plain
+    # nixpkgs CLI; authenticate it before `nix run .#symphony`.
+    symphony = pkgs.mkShellNoCC {
+      packages = [
+        (ix.languages.elixir.toolchain pkgs { version = "1.19"; })
+        (ix.languages.erlang.toolchain pkgs { version = "28"; })
+        pkgs.codex
+        pkgs.gh
+        pkgs.git
+        pkgs.openssh
+      ];
+    };
   };
 }
diff --git a/modules/services/symphony/default.nix b/modules/services/symphony/default.nix
new file mode 100644
index 000000000..a4bc8c19e
--- /dev/null
+++ b/modules/services/symphony/default.nix
@@ -0,0 +1,353 @@
+# NixOS service module for the Symphony runtime.
+#
+# Minimal opinionated systemd unit. Reads secrets from an EnvironmentFile
+# you control, so you can wire any secret manager (sops-nix, agenix,
+# Bitwarden Secrets Manager, AWS Secrets Manager, etc.) underneath. For
+# Bitwarden Secrets Manager specifically, set `secretsCommand` to a
+# `bws run -- ...` invocation; the unit will wrap ExecStart with it.
+{
+  config,
+  lib,
+  pkgs,
+  ...
+}:
+let
+  inherit (lib)
+    mkEnableOption
+    mkIf
+    mkOption
+    optionalString
+    types
+    ;
+
+  cfg = config.services.symphony;
+in
+{
+  options.services.symphony = {
+    enable = mkEnableOption "Symphony runtime";
+
+    package = mkOption {
+      type = types.package;
+      description = "Symphony package providing bin/symphony, which the unit runs as ExecStart (this flake's `symphony` package).";
+    };
+
+    user = mkOption {
+      type = types.str;
+      default = "symphony";
+      description = "Unix user the service runs as. The default `symphony` system user and group are created by this module; any other value must name an existing user with a same-named group.";
+    };
+
+    stateDir = mkOption {
+      type = types.path;
+      default = "/var/lib/symphony";
+      description = "Directory for runs, workspaces, logs, and the staged runtime copy.";
+    };
+
+    httpPort = mkOption {
+      type = types.port;
+      default = 4040;
+      description = "Phoenix HTTP listener port.";
+    };
+
+    primaryRepo = mkOption {
+      type = types.nullOr types.path;
+      default = null;
+      description = "Absolute path to the primary repository checkout (SYMPHONY_PRIMARY_REPO).";
+    };
+
+    repoRoot = mkOption {
+      type = types.nullOr types.path;
+      default = null;
+      description = "Optional parent directory of sibling repository checkouts (SYMPHONY_REPO_ROOT). Defaults to the parent of primaryRepo.";
+    };
+
+    workflowPack = mkOption {
+      type = types.str;
+      default = "example";
+      description = "Built-in workflow pack name; ignored when packDir is set.";
+    };
+
+    packDir = mkOption {
+      type = types.nullOr types.path;
+      default = null;
+      description = "Absolute path to an external workflow pack (SYMPHONY_PACK_DIR). Takes precedence over workflowPack.";
+    };
+
+    roomRegistryUrl = mkOption {
+      type = types.nullOr types.str;
+      default = null;
+      description = ''
+        Central room.ix.dev base URL each run's room-server registers its
+        backend with (SYMPHONY_ROOM_REGISTRY_URL). Drives both the room UI's
+        transcript view and the Slack "Run details" deep link. Unset disables
+        registration and the Slack link. The matching write token is a secret;
+        supply SYMPHONY_ROOM_REGISTRY_TOKEN via environmentFile.
+      '';
+    };
+
+    roomAdvertiseHost = mkOption {
+      type = types.nullOr types.str;
+      default = null;
+      description = ''
+        Address a provisioned per-run room-server binds and advertises so
+        room.ix.dev can reach it to proxy the run's transcript
+        (SYMPHONY_ROOM_ADVERTISE_HOST). Set to this host's tailnet address when
+        room.ix.dev runs elsewhere; unset keeps the loopback default, reachable
+        only when room.ix.dev shares the host.
+      '';
+    };
+
+    roomServerUrl = mkOption {
+      type = types.nullOr types.str;
+      default = null;
+      description = ''
+        Standing room-server URL for `:local` / `{:room, url}` placements that
+        do not provision their own per-run server (SYMPHONY_ROOM_SERVER_URL).
+      '';
+    };
+
+    extraEnvironment = mkOption {
+      type = types.attrsOf types.str;
+      default = { };
+      description = ''
+        Additional environment variables exported to the service. Use for
+        non-secret config: LINEAR_WORKSPACE_SLUG, SYMPHONY_BOT_USERNAME,
+        SYMPHONY_BOT_EMAIL, SYMPHONY_GITHUB_APP_OWNER_REPO,
+        SYMPHONY_GITHUB_STATS_QUERY, SYMPHONY_SLACK_NOTIFY_CHANNEL, etc.
+      '';
+    };
+
+    environmentFile = mkOption {
+      type = types.nullOr types.path;
+      default = null;
+      description = ''
+        Path to a systemd EnvironmentFile holding secrets:
+        LINEAR_API_KEY, GITHUB_TOKEN, LINEAR_WEBHOOK_SECRET,
+        GITHUB_WEBHOOK_SECRET, SLACK_SIGNING_SECRET, SLACK_BOT_OAUTH_TOKEN,
+        SYMPHONY_GITHUB_APP_PRIVATE_KEY_BASE64, SYMPHONY_ROOM_REGISTRY_TOKEN,
+        etc.
+        Wire this to whichever secret manager you use (sops-nix, agenix, ...).
+        Leave null if you use secretsCommand instead.
+      '';
+    };
+
+    secretsCommand = mkOption {
+      type = types.nullOr (types.listOf types.str);
+      default = null;
+      example = [
+        "bws"
+        "run"
+        "--project-id"
+        "symphony-prod"
+        "--"
+      ];
+      description = ''
+        Optional command that wraps ExecStart and injects secrets into the
+        environment. Designed for Bitwarden Secrets Manager (`bws run --
+        ...`) or any compatible secret-injecting CLI. The wrapper command
+        must exec its trailing arguments. Place the bws binary on the
+        service's PATH via `path = [ pkgs.bws ];` or by adding it to
+        runtimeInputs of the symphony package.
+
+        When set, the unit also expects BWS_ACCESS_TOKEN (or equivalent)
+        to be exported via environmentFile or extraEnvironment.
+      '';
+    };
+
+    path = mkOption {
+      type = types.listOf types.package;
+      default = [ ];
+      description = "Extra packages on the service PATH (e.g. pkgs.bws when using secretsCommand).";
+    };
+
+    hostRuntime = mkOption {
+      default = { };
+      description = ''
+        The host codex placement. When enabled, a workflow node that
+        declares `location: host` (or the run's resolved fallback) runs
+        codex directly on this machine as a real OS user, with no VM. The
+        per-run room-server and the codex process it spawns run as
+        `hostRuntime.user` in that user's home directory, launched as
+        transient `systemd-run --uid` units. This option wires the polkit
+        grant, PATH, and environment the placement needs. It stays inert
+        until `hostRuntime.enable` is set.
+      '';
+      type = types.submodule {
+        options = {
+          enable = mkEnableOption "the host codex placement";
+
+          user = mkOption {
+            type = types.str;
+            default = "";
+            description = "OS user codex runs as for host placement (SYMPHONY_HOST_USER). Must already exist with a home directory.";
+          };
+
+          group = mkOption {
+            type = types.nullOr types.str;
+            default = null;
+            description = "OS group for host runs (SYMPHONY_HOST_GROUP); omitted uses the user's primary group.";
+          };
+
+          workspacesDir = mkOption {
+            type = types.nullOr types.path;
+            default = null;
+            description = "Parent directory for run checkouts (SYMPHONY_HOST_WORKSPACES_DIR); defaults to <user home>/symphony-workspaces.";
+          };
+
+          roomServerPackage = mkOption {
+            type = types.nullOr types.package;
+            default = null;
+            description = "Package providing the codex-wrapped room-server launched as the host user (this flake's room-server output). Used by the per-run host placement.";
+          };
+
+          keep = mkOption {
+            type = types.bool;
+            default = false;
+            description = "Leave the unit and checkout in place after the turn for inspection (SYMPHONY_HOST_KEEP).";
+          };
+        };
+      };
+    };
+  };
+
+  config = mkIf cfg.enable {
+    assertions = [
+      {
+        assertion = !cfg.hostRuntime.enable || cfg.hostRuntime.user != "";
+        message = "services.symphony.hostRuntime.user must be set when hostRuntime.enable is true.";
+      }
+      {
+        assertion = !cfg.hostRuntime.enable || cfg.hostRuntime.roomServerPackage != null;
+        message = "services.symphony.hostRuntime.roomServerPackage must be set when hostRuntime.enable is true.";
+      }
+    ];
+
+    # The host runtime calls systemd's StartTransientUnit over D-Bus to run
+    # codex as another user. A non-root service needs polkit authorization
+    # for that. Scope the grant to the "symphony-host-" unit-name prefix so
+    # the service cannot manage unrelated system units. See systemd-run(1)
+    # and the polkit systemd1 actions documented at
+    # https://www.freedesktop.org/software/systemd/man/latest/org.freedesktop.systemd1.html
+    security.polkit = lib.mkIf cfg.hostRuntime.enable {
+      enable = true;
+      extraConfig = ''
+        polkit.addRule(function(action, subject) {
+          if (subject.user == "${cfg.user}" &&
+              action.id == "org.freedesktop.systemd1.manage-units") {
+            var unit = action.lookup("unit");
+            if (unit && unit.indexOf("symphony-host-") == 0) {
+              return polkit.Result.YES;
+            }
+          }
+        });
+      '';
+    };
+
+    users.users = lib.mkIf (cfg.user == "symphony") {
+      symphony = {
+        isSystemUser = true;
+        group = "symphony";
+        home = cfg.stateDir;
+      };
+    };
+
+    users.groups = lib.mkIf (cfg.user == "symphony") {
+      symphony = { };
+    };
+
+    systemd.tmpfiles.rules = [
+      "d ${cfg.stateDir} 0750 ${cfg.user} ${cfg.user} -"
+      "d ${cfg.stateDir}/workspaces 0750 ${cfg.user} ${cfg.user} -"
+      "d ${cfg.stateDir}/runs 0750 ${cfg.user} ${cfg.user} -"
+      "d ${cfg.stateDir}/log 0750 ${cfg.user} ${cfg.user} -"
+    ];
+
+    systemd.services.symphony = {
+      description = "Symphony runtime";
+      wantedBy = [ "multi-user.target" ];
+      after = [ "network-online.target" ];
+      wants = [ "network-online.target" ];
+
+      path =
+        cfg.path
+        ++ lib.optionals cfg.hostRuntime.enable [
+          pkgs.systemd
+          pkgs.getent
+          cfg.hostRuntime.roomServerPackage
+        ];
+
+      environment = {
+        SYMPHONY_STATE_DIR = cfg.stateDir;
+        SYMPHONY_WORKSPACES_DIR = "${cfg.stateDir}/workspaces";
+        SYMPHONY_RUNS_DIR = "${cfg.stateDir}/runs";
+        SYMPHONY_LOGS_ROOT = "${cfg.stateDir}/log";
+        SYMPHONY_HTTP_PORT = toString cfg.httpPort;
+        SYMPHONY_WORKFLOW_PACK = cfg.workflowPack;
+      }
+      // (lib.optionalAttrs (cfg.primaryRepo != null) {
+        SYMPHONY_PRIMARY_REPO = toString cfg.primaryRepo;
+      })
+      // (lib.optionalAttrs (cfg.repoRoot != null) {
+        SYMPHONY_REPO_ROOT = toString cfg.repoRoot;
+      })
+      // (lib.optionalAttrs (cfg.packDir != null) {
+        SYMPHONY_PACK_DIR = toString cfg.packDir;
+      })
+      // (lib.optionalAttrs (cfg.roomRegistryUrl != null) {
+        SYMPHONY_ROOM_REGISTRY_URL = cfg.roomRegistryUrl;
+      })
+      // (lib.optionalAttrs (cfg.roomAdvertiseHost != null) {
+        SYMPHONY_ROOM_ADVERTISE_HOST = cfg.roomAdvertiseHost;
+      })
+      // (lib.optionalAttrs (cfg.roomServerUrl != null) {
+        SYMPHONY_ROOM_SERVER_URL = cfg.roomServerUrl;
+      })
+      // (lib.optionalAttrs cfg.hostRuntime.enable (
+        {
+          SYMPHONY_HOST_USER = cfg.hostRuntime.user;
+          SYMPHONY_HOST_ROOM_SERVER_COMMAND = lib.getExe cfg.hostRuntime.roomServerPackage;
+        }
+        // (lib.optionalAttrs (cfg.hostRuntime.group != null) {
+          SYMPHONY_HOST_GROUP = cfg.hostRuntime.group;
+        })
+        // (lib.optionalAttrs (cfg.hostRuntime.workspacesDir != null) {
+          SYMPHONY_HOST_WORKSPACES_DIR = toString cfg.hostRuntime.workspacesDir;
+        })
+        // (lib.optionalAttrs cfg.hostRuntime.keep {
+          SYMPHONY_HOST_KEEP = "true";
+        })
+      ))
+      // cfg.extraEnvironment;
+
+      serviceConfig = {
+        Type = "simple";
+        User = cfg.user;
+        Group = cfg.user;
+        ExecStart =
+          let
+            symphonyBin = "${cfg.package}/bin/symphony";
+            wrapper = optionalString (cfg.secretsCommand != null) (
+              lib.escapeShellArgs cfg.secretsCommand + " "
+            );
+          in
+          "${wrapper}${symphonyBin}";
+        Restart = "on-failure";
+        RestartSec = "10s";
+        StateDirectory = lib.mkIf (lib.hasPrefix "/var/lib/" cfg.stateDir) (
+          lib.removePrefix "/var/lib/" cfg.stateDir
+        );
+        # Symphony spawns codex subprocesses and clones git repos, so
+        # most sandboxing options need to stay permissive. Only enable
+        # the cheap, safe ones.
+        NoNewPrivileges = true;
+        PrivateTmp = true;
+        ProtectKernelTunables = true;
+        ProtectKernelModules = true;
+        ProtectControlGroups = true;
+      }
+      // (lib.optionalAttrs (cfg.environmentFile != null) {
+        EnvironmentFile = cfg.environmentFile;
+      });
+    };
+  };
+}
diff --git a/packages/symphony/.env.example b/packages/symphony/.env.example
new file mode 100644
index 000000000..f8b0ff477
--- /dev/null
+++ b/packages/symphony/.env.example
@@ -0,0 +1,78 @@
+# --- Core runtime -----------------------------------------------------------
+SYMPHONY_PRIMARY_REPO=
+SYMPHONY_WORKFLOW_PACK=example
+# Or, to load an external pack:
+# SYMPHONY_PACK_DIR=/path/to/your/pack
+SYMPHONY_HTTP_PORT=4040
+SYMPHONY_STATE_DIR=/var/lib/symphony
+SYMPHONY_WORKSPACES_DIR=
+SYMPHONY_REPO_ROOT=
+
+# --- Codex placement --------------------------------------------------------
+# Each agent node names its placement in the .sym workflow with `location:`
+# (local|room|ixvm|host). SYMPHONY_PLACEMENT_FALLBACK names the placement a
+# run retries on when `ixvm` fails to provision (host|local|none; default host).
+# SYMPHONY_PLACEMENT_FALLBACK=host
+# Host placement: runs codex on this machine as a real OS user, no VM.
+# SYMPHONY_HOST_USER=hari
+# SYMPHONY_HOST_GROUP=
+# SYMPHONY_HOST_WORKSPACES_DIR=
+# SYMPHONY_HOST_KEEP=false
+
+# --- Claude models ----------------------------------------------------------
+# A skill whose codex_model names a Claude model (e.g. claude-opus-4-8) runs
+# through headless Claude Code instead of codex, with --dangerously-skip-permissions.
+# Auth is the Anthropic API key below.
+ANTHROPIC_API_KEY=
+# SYMPHONY_CLAUDE_COMMAND=claude
+
+# --- Integrations -----------------------------------------------------------
+LINEAR_API_KEY=
+LINEAR_TEAM_KEY=
+LINEAR_WORKSPACE_SLUG=
+LINEAR_WEBHOOK_SECRET=
+
+GITHUB_TOKEN=
+GITHUB_WEBHOOK_SECRET=
+
+SLACK_BOT_OAUTH_TOKEN=
+SLACK_SIGNING_SECRET=
+SYMPHONY_SLACK_NOTIFY_CHANNEL=
+# Post failed cron runs to Slack (digest, quality, idiomatic, babysit-dispatch
+# and other scheduled workflows). Defaults to true.
+SYMPHONY_SLACK_NOTIFY_CRON_FAILURES=
+# Comma-separated workflow names whose successful cron runs also post, e.g.
+# "digest,quality". Use "*" to post every cron success (expect high-frequency
+# dispatchers like babysit-dispatch too). Defaults to none, so cron successes
+# stay quiet.
+SYMPHONY_SLACK_NOTIFY_CRON_WORKFLOWS=
+
+# --- Dashboard / links ------------------------------------------------------
+SYMPHONY_GITHUB_STATS_QUERY=
+
+# --- Activity room (optional) -----------------------------------------------
+# room.ix.dev is the central room UI that aggregates run transcripts. Each run's
+# room-server registers its backend here so the UI can show (and the Slack
+# "Run details" button can deep-link to) the run's transcript. Leave
+# SYMPHONY_ROOM_REGISTRY_URL unset to disable registration and the Slack link.
+SYMPHONY_ROOM_REGISTRY_URL=
+# Bearer token the central room server requires for backend registration
+# writes (matches the room-server's ROOM_BACKEND_TOKEN). Optional.
+SYMPHONY_ROOM_REGISTRY_TOKEN=
+# Address a provisioned per-run room-server binds and advertises so room.ix.dev
+# can reach it to proxy the run's transcript. Set to this host's tailnet
+# address when room.ix.dev runs elsewhere; unset keeps the loopback default
+# (only reachable when room.ix.dev shares the host).
+SYMPHONY_ROOM_ADVERTISE_HOST=
+# A standing room-server URL for `:local` / `{:room, url}` placements that do
+# not provision their own per-run server.
+SYMPHONY_ROOM_SERVER_URL=
+
+# --- Optional GitHub App ----------------------------------------------------
+# Skills mint installation tokens via SymphonyElixir.GithubApp when these are
+# set. The private key is base64-encoded so it fits in a single-line env file.
+SYMPHONY_GITHUB_APP_ID=
+SYMPHONY_GITHUB_APP_PRIVATE_KEY_BASE64=
+SYMPHONY_GITHUB_APP_OWNER_REPO=
+SYMPHONY_BOT_USERNAME=
+SYMPHONY_BOT_EMAIL=
diff --git a/packages/symphony/.gitignore b/packages/symphony/.gitignore
new file mode 100644
index 000000000..f4c68754a
--- /dev/null
+++ b/packages/symphony/.gitignore
@@ -0,0 +1,11 @@
+.env
+.env.*
+!.env.example
+log/
+tmp/
+room.db
+room.db-shm
+room.db-wal
+workspaces/
+runs/
+.worktrees/
diff --git a/packages/symphony/AGENTS.md b/packages/symphony/AGENTS.md
new file mode 100644
index 000000000..4e3ed2ad3
--- /dev/null
+++ b/packages/symphony/AGENTS.md
@@ -0,0 +1,73 @@
+# symphony
+
+An Elixir runtime that orchestrates Codex agent sessions across one or
+more git repositories. Workflows are written in the `.sym` surface
+language, lowered to an IR run graph the runtime walks; hot-reloaded
+`.sym` workflows and markdown skills are the configuration surface. The
+room stack (`room-server` and the Tauri/Svelte client) lives in the IX
+monorepo; this package is the Elixir runtime that drives it over HTTP.
+
+Repo-wide standards (writing style, Nix style, commit conventions) come
+from the index root AGENTS.md. This file holds only the invariants that
+are specific to symphony.
+
+Do not commit secrets. Tokens for Linear, GitHub, Slack, Codex, or any
+other external system must be supplied through the runtime environment or
+host secret manager. The bundled `.env.example` lists the keys the
+runtime reads.
+
+## Self-contained operations
+
+Symphony's runtime behavior must not depend on out-of-repo changes to
+function. In particular, scheduled work (cron triggers, dispatchers,
+auto-healing loops) belongs inside the runtime, driven by Symphony's own
+cron scheduler. Do not introduce systemd timers, host nix modules, or any
+out-of-repo schedulers as load-bearing pieces of a symphony feature. A
+fresh symphony deploy should bring up all of its scheduled work without
+needing a paired change in any other repo.
+
+## Workflow packs
+
+The runtime is pack-agnostic. The bundled `workflows/example/` pack is the
+public default and is intentionally narrow (a single manual-trigger inspect
+skill). Deployers point `SYMPHONY_PACK_DIR` at their own pack to drive real
+work. Keep core changes pack-agnostic: no workflow names, repo slugs,
+label strings, or ticket schemes hardcoded in `elixir/lib/`.
+
+## Elixir style
+
+The Elixir runtime is the entry point for symphony itself; the room
+stack it drives lives in the IX monorepo and is not owned here. Keep
+`elixir/lib/` pack-agnostic, with workflow shape carried in `.sym` /
+markdown under the active pack directory rather than hardcoded in source.
+
+Prefer Mix tasks and supervised processes over loose scripts. A new
+scheduled job is a child of Symphony's cron supervisor, not a host-level
+timer.
+
+## Tests
+
+Tests should protect behavior that can regress across boundaries:
+module merges, generated units, pack rendering, and runtime contracts
+(including the engine wire fixtures in `contracts/fixtures` shared with
+the room-server in IX). Avoid asserting facts already obvious from the
+literal config under test.
+
+The required lane (compile with warnings as errors, format, credo,
+`mix test`) runs sandboxed as the `symphony-elixir` flake check; the
+advisory lane is `make quality` in `elixir/`. See `docs/quality.md`.
+
+## Layout
+
+```
+default.nix                # symphony launcher package + the elixir check
+elixir/                    # Symphony runtime (.sym/IR orchestrator)
+workflows/                 # pack-agnostic example pack
+contracts/fixtures/        # engine wire fixtures shared with room-server (IX)
+docs/                      # package-owned reference
+../../modules/services/symphony/  # NixOS module for the runtime
+```
+
+Folders should preserve conceptual paths. When siblings share a real
+domain, nest them under that domain instead of flattening the name
+into repeated dashed prefixes.
diff --git a/packages/symphony/CLAUDE.md b/packages/symphony/CLAUDE.md
new file mode 120000
index 000000000..47dc3e3d8
--- /dev/null
+++ b/packages/symphony/CLAUDE.md
@@ -0,0 +1 @@
+AGENTS.md
\ No newline at end of file
diff --git a/packages/symphony/LICENSE b/packages/symphony/LICENSE
new file mode 100644
index 000000000..376f10496
--- /dev/null
+++ b/packages/symphony/LICENSE
@@ -0,0 +1,201 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or Derivative
+          Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work, excluding
+          those notices that do not pertain to any part of the Derivative
+          Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright [yyyy] [name of copyright owner]
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/packages/symphony/README.md b/packages/symphony/README.md
new file mode 100644
index 000000000..afeac2147
--- /dev/null
+++ b/packages/symphony/README.md
@@ -0,0 +1,45 @@
+<p align="center">
+  <img src="assets/logo.svg" width="80" alt="Symphony" />
+</p>
+
+# symphony
+
+> [!IMPORTANT]
+> Symphony is highly experimental software. Use it at your own risk: it can spawn Codex sessions, create branches, open PRs, and mutate Linear/GitHub state when credentials allow it.
+
+Symphony is a boring DAG runtime for deterministic agent workflows. Workflows are written in the `.sym` surface language, lowered to an IR run graph, and walked by a supervised Elixir/OTP runtime with a LiveView dashboard, cron/Slack/Linear/GitHub triggers, and per-run git worktrees. It moved here from the dedicated [indexable-inc/symphony](https://github.com/indexable-inc/symphony) repo (rev `c9e7092`).
+
+Run it from this repo:
+
+```sh
+nix run .#symphony
+```
+
+The launcher refuses to start unless `codex` is on PATH; it does not check credentials, so authenticate `codex` beforehand. It stages this source tree under `~/.local/state/symphony`, fetches mix deps, and boots the dashboard on http://127.0.0.1:4040. Point `SYMPHONY_PRIMARY_REPO` at a local checkout first; [docs/setup.md](docs/setup.md) and [.env.example](.env.example) cover the full configuration surface.
+
+<img alt="Symphony dashboard" src="https://github.com/user-attachments/assets/eb06f062-3b2d-41a4-a679-94c5c2f847aa" />
+
+## Layout
+
+- [`elixir/`](elixir/): the runtime (DSL parser, IR, runtime supervisor, Phoenix dashboard, triggers).
+- [`workflows/example/`](workflows/example/): the bundled pack, intentionally narrow (one manual-trigger `inspect` workflow plus its read-only skill). Real deployments point `SYMPHONY_PACK_DIR` at their own pack.
+- [`contracts/fixtures/`](contracts/fixtures/): engine wire fixtures shared with the room-server in the ix monorepo. The Elixir contract tests read them from `../../contracts`, so this directory stays beside `elixir/`.
+- [`bin/run-nix`](bin/run-nix): the production entrypoint the `symphony` package wraps.
+- [`docs/`](docs/): setup, engine contract, and quality-gate reference.
+
+## Neighbors
+
+- The room stack symphony drives over HTTP (`room-server` and the room UI) lives in the ix monorepo (`crates/room`, `packages/room`).
+- `location: ixvm` placements provision VMs from the [`symphony-codex`](../../images/dev/symphony-codex/) image, which carries `room-server` on PATH.
+- Deployment goes through the [`symphony` NixOS module](../../modules/services/symphony/) (`services.symphony.*`), with secrets supplied via `environmentFile` or `secretsCommand`.
+
+## Developing
+
+```sh
+nix develop .#symphony   # Elixir 1.19 / OTP 28, plus codex, gh, git
+cd packages/symphony/elixir
+make all                 # setup, compile -Werror, fmt-check, credo
+mix test
+```
+
+CI runs the same required lane sandboxed as the `symphony-elixir` flake check (see [default.nix](default.nix)); after changing `elixir/mix.lock`, refresh the `fetchMixDeps` hash there. The advisory lane (`make quality`: sobelow, deps.audit, dialyzer, coveralls) stays a local run; see [docs/quality.md](docs/quality.md).
diff --git a/packages/symphony/assets/logo.svg b/packages/symphony/assets/logo.svg
new file mode 100644
index 000000000..30ee45cb5
--- /dev/null
+++ b/packages/symphony/assets/logo.svg
@@ -0,0 +1,6 @@
+<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" width="512" height="512">
+	<rect width="512" height="512" fill="#1a1a1a"/>
+	<svg x="64" y="64" width="384" height="384" viewBox="0 0 24 24">
+		<path d="M12 2L2 7l10 5 10-5-10-5zM2 17l10 5 10-5M2 12l10 5 10-5" fill="#f0f0f0"/>
+	</svg>
+</svg>
diff --git a/packages/symphony/bin/run-nix b/packages/symphony/bin/run-nix
new file mode 100755
index 000000000..f19588fda
--- /dev/null
+++ b/packages/symphony/bin/run-nix
@@ -0,0 +1,63 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+REPO_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
+
+SYMPHONY_STATE_DIR="${SYMPHONY_STATE_DIR:-$HOME/.local/state/symphony}"
+SYMPHONY_RUNTIME_DIR="${SYMPHONY_RUNTIME_DIR:-$SYMPHONY_STATE_DIR/runtime}"
+SYMPHONY_LOGS_ROOT="${SYMPHONY_LOGS_ROOT:-$SYMPHONY_STATE_DIR/log}"
+SYMPHONY_HTTP_PORT="${SYMPHONY_HTTP_PORT:-${SYMPHONY_PORT:-4040}}"
+
+# The new DAG runtime calls this SYMPHONY_WORKSPACES_DIR; the older
+# escript called it SYMPHONY_WORKSPACE_ROOT. Accept either, prefer the
+# new name.
+SYMPHONY_WORKSPACES_DIR="${SYMPHONY_WORKSPACES_DIR:-${SYMPHONY_WORKSPACE_ROOT:-$SYMPHONY_STATE_DIR/workspaces}}"
+
+# Run history (per-run JSON snapshots that drive the dashboard). The
+# default in SymphonyElixir.Config is $SYMPHONY_ROOT/runs, but
+# SYMPHONY_ROOT here points at the runtime copy which gets wiped on
+# every restart. Anchor runs/ at the stable state dir so the dashboard
+# shows historical runs after rebuilds.
+SYMPHONY_RUNS_DIR="${SYMPHONY_RUNS_DIR:-$SYMPHONY_STATE_DIR/runs}"
+
+if ! command -v codex >/dev/null 2>&1; then
+  echo "codex is required on PATH and must already be authenticated" >&2
+  exit 1
+fi
+
+mkdir -p "$SYMPHONY_STATE_DIR" "$SYMPHONY_WORKSPACES_DIR" "$SYMPHONY_LOGS_ROOT" "$SYMPHONY_RUNS_DIR"
+
+# Stage the repo into the runtime dir so mix can write _build there
+# without touching the source checkout (which is read-only when invoked
+# from nix store, and live-edited when invoked from a working tree).
+rm -rf "$SYMPHONY_RUNTIME_DIR.tmp"
+mkdir -p "$SYMPHONY_RUNTIME_DIR.tmp"
+cp -R "$REPO_ROOT/." "$SYMPHONY_RUNTIME_DIR.tmp/"
+chmod -R u+w "$SYMPHONY_RUNTIME_DIR.tmp"
+rm -rf "$SYMPHONY_RUNTIME_DIR"
+mv "$SYMPHONY_RUNTIME_DIR.tmp" "$SYMPHONY_RUNTIME_DIR"
+
+# SYMPHONY_ROOT is read by SymphonyElixir.Config at boot to anchor the
+# catalogs (workflows/ and skills/ live there) and to resolve relative
+# paths. Anchor it at the runtime copy so a live edit of REPO_ROOT does
+# not get half-loaded mid-run.
+export SYMPHONY_ROOT="$SYMPHONY_RUNTIME_DIR"
+export SYMPHONY_WORKSPACES_DIR
+export SYMPHONY_RUNS_DIR
+export SYMPHONY_LOGS_ROOT
+export SYMPHONY_HTTP_PORT
+
+cd "$SYMPHONY_RUNTIME_DIR/elixir"
+
+# Production runs use MIX_ENV=prod; default to prod for the systemd
+# unit invocation. Callers can override (e.g. dev iteration).
+export MIX_ENV="${MIX_ENV:-prod}"
+
+mix deps.get --only "$MIX_ENV"
+mix compile --warnings-as-errors
+
+# mix run --no-halt starts SymphonyElixir.Application (which boots the
+# Catalog, WorkflowCatalog, the run supervisor, the LiveView endpoint,
+# and the triggers) and stays in the foreground so systemd can supervise
+# it.
+exec mix run --no-halt
diff --git a/packages/symphony/contracts/fixtures/agent_turn_response.json b/packages/symphony/contracts/fixtures/agent_turn_response.json
new file mode 100644
index 000000000..d959ec61a
--- /dev/null
+++ b/packages/symphony/contracts/fixtures/agent_turn_response.json
@@ -0,0 +1,12 @@
+{
+  "threadId": "thread_abc",
+  "outcome": { "kind": "ok" },
+  "eventCount": 4,
+  "usage": {
+    "tokensIn": 1200,
+    "tokensOut": 340,
+    "cacheRead": 800,
+    "cacheCreation": 64,
+    "costUsd": 0.0123
+  }
+}
diff --git a/packages/symphony/contracts/fixtures/engine_event.json b/packages/symphony/contracts/fixtures/engine_event.json
new file mode 100644
index 000000000..fefc03d9a
--- /dev/null
+++ b/packages/symphony/contracts/fixtures/engine_event.json
@@ -0,0 +1,5 @@
+{
+  "turnId": "thread_abc",
+  "seq": 7,
+  "body": { "type": "textDelta", "text": "hello" }
+}
diff --git a/packages/symphony/contracts/fixtures/turn_request.json b/packages/symphony/contracts/fixtures/turn_request.json
new file mode 100644
index 000000000..afbb16a44
--- /dev/null
+++ b/packages/symphony/contracts/fixtures/turn_request.json
@@ -0,0 +1,11 @@
+{
+  "engine": "codex",
+  "model": "gpt-5.3-codex",
+  "effort": "medium",
+  "permissions": "workspace_write",
+  "cwd": "/workspace/run_x/primary",
+  "prompt": "write FOO to ./hello.txt and stop",
+  "tools": [],
+  "runId": "run_x",
+  "nodeId": "n0"
+}
diff --git a/packages/symphony/default.nix b/packages/symphony/default.nix
new file mode 100644
index 000000000..43af867ce
--- /dev/null
+++ b/packages/symphony/default.nix
@@ -0,0 +1,176 @@
+# Symphony: the Elixir control plane for `.sym` agent workflows, absorbed
+# from the dedicated indexable-inc/symphony repo at
+# c9e709208c3ae161e24f625b9f3808a288c859ed. The launcher stages this source
+# tree into the state dir at start and runs it with `mix run --no-halt`
+# (see bin/run-nix), so the package is a closure around the source rather
+# than a compiled BEAM release; production keeps deploying the same way it
+# did from the standalone flake's `packages.default`.
+#
+# The room stack symphony drives over HTTP (room-server and the room UI)
+# lives in the ix monorepo. The `room-server` binary baked into
+# `images/dev/symphony-codex` still resolves from the pinned `symphony`
+# flake input (see flake.nix); only the runtime moved here.
+{
+  lib,
+  pkgs,
+  ix,
+  writeNushellApplication,
+}:
+let
+  # mise.toml pins Elixir 1.19 on OTP 28; the launcher and the check build
+  # against the same pairing so a deploy never runs code the gate did not.
+  elixir = ix.languages.elixir.toolchain pkgs { version = "1.19"; };
+  erlang = ix.languages.erlang.toolchain pkgs { version = "28"; };
+
+  # The tree bin/run-nix stages at service start: the mix project, the
+  # bundled example pack, and the engine wire fixtures. contracts/ sits
+  # beside elixir/ because the contract tests resolve it relatively
+  # (test/symphony_elixir/engine/contract_fixtures_test.exs).
+  src = lib.fileset.toSource {
+    root = ./.;
+    fileset = lib.fileset.unions [
+      ./bin
+      ./contracts
+      ./elixir
+      ./workflows
+    ];
+  };
+
+  # Test-env mix deps as a fixed-output derivation so the sandboxed check
+  # runs offline. Refresh the hash whenever elixir/mix.lock changes.
+  mixFodDeps = pkgs.beamPackages.fetchMixDeps {
+    pname = "symphony-elixir-deps";
+    version = "0.2.0"; # keep in sync with elixir/mix.exs
+    src = lib.fileset.toSource {
+      root = ./elixir;
+      fileset = lib.fileset.unions [
+        ./elixir/mix.exs
+        ./elixir/mix.lock
+      ];
+    };
+    inherit elixir;
+    mixEnv = "test";
+    hash = "sha256-TLRGNPIm3zQKeFt54wrdirYYK81ribfsV92/NVLdQSM=";
+  };
+
+  # mix.lock pins lazy_html (a C++ NIF over lexbor) as a test-only dep for
+  # LiveView's HTML assertions. Compiling it either downloads this exact
+  # precompiled NIF over mix's httpc or git-clones lexbor, and the sandbox
+  # allows neither, so the check below seeds elixir_make's artifact cache
+  # with the upstream release tarball; elixir_make still verifies it against
+  # the checksum.exs pinned inside the dep before unpacking. Refresh the
+  # url/hash when a mix.lock bump moves lazy_html.
+  lazyHtmlNif = pkgs.fetchurl {
+    url = "https://github.com/dashbitco/lazy_html/releases/download/v0.1.10/lazy_html-nif-2.16-x86_64-linux-gnu-0.1.10.tar.gz";
+    hash = "sha256-Ni0JKbP6OJqQ8rT08VnF/KWjiyigoVUjqSZ3LRU9dBo=";
+  };
+
+  # The required quality lane the standalone repo ran per PR (make ci:
+  # compile --warnings-as-errors, format --check-formatted, credo, test),
+  # now a sandboxed derivation wired into `checks` through per-system.nix.
+  # The advisory lane (dialyzer, sobelow, mix_audit, coveralls) stays a
+  # local `make quality` run; see docs/quality.md.
+  elixirCheck = pkgs.stdenv.mkDerivation {
+    pname = "symphony-elixir-check";
+    version = "0.2.0";
+    inherit src;
+    sourceRoot = "source/elixir";
+
+    nativeBuildInputs = [
+      erlang
+      elixir
+      (pkgs.beamPackages.hex.override { inherit elixir; })
+      pkgs.git
+    ];
+    strictDeps = true;
+
+    env = {
+      MIX_ENV = "test";
+      HEX_OFFLINE = "1";
+      LANG = "C.UTF-8";
+      LC_CTYPE = "C.UTF-8";
+      # rebar-built deps (telemetry) make mix install rebar over the network
+      # unless the binaries are pinned, same as fetchMixDeps/mixRelease do.
+      MIX_REBAR = "${pkgs.beamPackages.rebar}/bin/rebar";
+      MIX_REBAR3 = "${pkgs.beamPackages.rebar3}/bin/rebar3";
+      # The precompiled lazy_html .so is a generic linux-gnu build, so the
+      # BEAM needs libstdc++ findable at dlopen time when the test suite
+      # loads the NIF.
+      LD_LIBRARY_PATH = lib.makeLibraryPath [ pkgs.stdenv.cc.cc.lib ];
+    };
+
+    # Same deps wiring as nixpkgs mixRelease: deps come from the fixed-output
+    # fetch, copied writable because deps.compile builds in place. The
+    # elixir_make cache seed short-circuits the lazy_html NIF download (see
+    # lazyHtmlNif above; mix/tasks/compile.elixir_make.ex reuses an existing
+    # archive instead of fetching).
+    postUnpack = ''
+      export MIX_HOME="$TEMPDIR/mix"
+      export HEX_HOME="$TEMPDIR/hex"
+      export MIX_DEPS_PATH="$TEMPDIR/deps"
+      cp --no-preserve=mode -R "${mixFodDeps}" "$MIX_DEPS_PATH"
+
+      export ELIXIR_MAKE_CACHE_DIR="$TEMPDIR/elixir-make-cache"
+      mkdir -p "$ELIXIR_MAKE_CACHE_DIR"
+      cp "${lazyHtmlNif}" "$ELIXIR_MAKE_CACHE_DIR/${lazyHtmlNif.name}"
+    '';
+
+    configurePhase = ''
+      runHook preConfigure
+      mix deps.compile --no-deps-check --skip-umbrella-children
+      ln -s "$MIX_DEPS_PATH" ./deps
+      runHook postConfigure
+    '';
+
+    buildPhase = ''
+      runHook preBuild
+      mix compile --no-deps-check --warnings-as-errors
+      runHook postBuild
+    '';
+
+    doCheck = true;
+    checkPhase = ''
+      runHook preCheck
+      mix format --check-formatted
+      mix credo
+      mix test --no-deps-check
+      runHook postCheck
+    '';
+
+    installPhase = ''
+      runHook preInstall
+      mkdir -p "$out"
+      runHook postInstall
+    '';
+  };
+in
+(writeNushellApplication {
+  name = "symphony";
+  meta = {
+    description = "Elixir runtime for .sym agent workflows (control plane, LiveView dashboard, triggers)";
+    license = lib.licenses.asl20;
+  };
+  # codex is intentionally absent: bin/run-nix requires an authenticated
+  # codex on the operator's PATH and refuses to start otherwise, so the
+  # binary and its credentials stay host-owned.
+  runtimeInputs = [
+    pkgs.bash
+    pkgs.cacert
+    pkgs.coreutils
+    elixir
+    erlang
+    pkgs.gh
+    pkgs.git
+    pkgs.openssh
+  ];
+  text = ''
+    def --wrapped main [...args] {
+      exec ${src}/bin/run-nix ...$args
+    }
+  '';
+}).overrideAttrs
+  (old: {
+    passthru = (old.passthru or { }) // {
+      tests.elixir = elixirCheck;
+    };
+  })
diff --git a/packages/symphony/docs/engine-contract.md b/packages/symphony/docs/engine-contract.md
new file mode 100644
index 000000000..a003ccb3c
--- /dev/null
+++ b/packages/symphony/docs/engine-contract.md
@@ -0,0 +1,117 @@
+# Engine contract
+
+This is the source of truth for the wire shapes shared between the Elixir
+runtime and the Rust room-server. It is the WS-0 seam of the overhaul: the
+DSL, the runtime, and the room-server all code against these shapes, so a
+change here is a deliberate cross-language change with a golden fixture to
+prove both sides still agree.
+
+Two layers own these shapes:
+
+- `crates/room/src/engine.rs` (Rust, in the IX monorepo): `TurnRequest`,
+  `EngineEvent`, `TurnStatus`, `EngineAnswer`, and the `Engine` trait.
+- `elixir/lib/symphony_elixir/engine/` and `ir/` (Elixir): the
+  `Engine.Envelope` that lowers to a `TurnRequest`, and the `IR.*`
+  durable run state that the runtime persists.
+
+Golden fixtures live in `contracts/fixtures/`. `turn_request.json` is the
+shape Elixir produces and Rust consumes, so both sides assert it: the Rust
+test in `crates/room/tests/engine_contract.rs` (in the IX monorepo) and the Elixir test
+in `elixir/test/symphony_elixir/engine/contract_fixtures_test.exs`. A field
+rename fails a check on both sides rather than silently at runtime.
+`engine_event.json` is the shape Rust produces and Elixir will consume; only
+the Rust side parses it today, because the Elixir `EngineEvent` decoder
+lands with the streaming client (the synchronous `/api/agent/turns` path
+returns an `AgentTurnResponse`, not an event stream).
+`agent_turn_response.json` is the synchronous turn result Rust produces and
+Elixir consumes, so both sides assert it: Rust deserializes the fixture and
+Elixir feeds it through `Engine.Client.submit_turn/3` and checks the lowered
+`cost`.
+
+## Casing and tagging
+
+- Field names are camelCase on the wire (`turnId`, `runId`), matching the
+  existing room-server JSON.
+- Enum bodies carry a `type` tag (`EngineEventBody`) or a `kind` tag
+  (`TurnOutcome`, `EngineAnswer`).
+- Scalar enums serialize as a lowercase or snake_case string
+  (`engine: "claude"`, `permissions: "danger_full_access"`).
+
+## TurnRequest
+
+The engine-agnostic turn the Elixir `Engine.Client` submits. The room-server
+adapter lowers it to engine-native flags.
+
+```json
+{
+  "engine": "codex",
+  "model": "gpt-5.3-codex",
+  "effort": "medium",
+  "permissions": "workspace_write",
+  "cwd": "/workspace/run_x/primary",
+  "prompt": "write FOO to ./hello.txt and stop",
+  "tools": [],
+  "runId": "run_x",
+  "nodeId": "n0"
+}
+```
+
+`effort` is omitted entirely when the envelope leaves it unset (the engine
+picks its default). `permissions` is one of `read_only`, `workspace_write`,
+`danger_full_access`; each adapter lowers it (Codex to sandbox + approval
+policy, Claude to a permission mode or `--dangerously-skip-permissions`).
+
+## EngineEvent
+
+One normalized event for one turn. `EngineEventBody` is the superset of
+what Codex emits; Claude is a subset producer and simply never emits
+`approvalRequest` or `toolCallRequest` (it self-executes its tools under
+`--dangerously-skip-permissions`).
+
+```json
+{ "turnId": "thread_abc", "seq": 7, "body": { "type": "textDelta", "text": "hello" } }
+```
+
+Body variants: `turnStarted`, `textDelta`, `reasoningDelta`,
+`toolCallStarted`, `toolCallOutput`, `fileChanged`, `statusChanged`,
+`usage`, `approvalRequest`, `toolCallRequest`, `turnCompleted`.
+
+## AgentTurnResponse
+
+The synchronous result of `POST /api/agent/turns`. The room-server awaits
+the whole turn and returns its terminal outcome, the thread id it assigned,
+the event count, and the turn's terminal `usage` totals. Both engines emit
+cumulative `Usage` events, so the response carries the last one as the
+whole-turn total; `Engine.Client` lowers it to the `IR.Attempt.cost` shape
+(`usd`, `tokens_in`, `tokens_out`, `cache_read`, `cache_creation`).
+
+```json
+{
+  "threadId": "thread_abc",
+  "outcome": { "kind": "ok" },
+  "eventCount": 4,
+  "usage": {
+    "tokensIn": 1200,
+    "tokensOut": 340,
+    "cacheRead": 800,
+    "cacheCreation": 64,
+    "costUsd": 0.0123
+  }
+}
+```
+
+A current server always sends `usage` (a turn that emitted none serializes a
+zeroed total); `costUsd` is omitted when the engine did not price the turn,
+so a present `usd` always means a real number. A response with no `usage`
+(from an older server) lowers to a nil cost so the attempt records "unknown"
+rather than a sham zero.
+
+## Envelope to TurnRequest
+
+`Engine.Envelope` (Elixir) is the authored, validated shape; `Engine.Client`
+lowers it to a `TurnRequest` (`request_body/2`). The envelope adds `location`
+(`:local`, `:ixvm`, `{:host, name}`, `{:room, url}`), which the client
+resolves to the room-server URL and does not put on the wire. The Elixir
+fixture test asserts `request_body/2` reproduces `turn_request.json`
+byte-for-byte after a JSON round-trip, so the lowering and the shared
+fixture cannot drift apart.
diff --git a/packages/symphony/docs/quality.md b/packages/symphony/docs/quality.md
new file mode 100644
index 000000000..10b23cbde
--- /dev/null
+++ b/packages/symphony/docs/quality.md
@@ -0,0 +1,71 @@
+# Quality gate
+
+Symphony runs a quality gate that reports formatting, lint, static security,
+dependency-audit, type, and coverage findings. It is informational today and
+does not block PRs. Run it locally with one command:
+
+```sh
+cd elixir
+make quality
+```
+
+That target runs `mix quality` (format check, Credo strict, Sobelow, deps
+audit, Dialyzer) followed by `mix coveralls`. None of these are part of the
+required lane: that lane (compile with warnings as errors, format check,
+credo, `mix test`) runs sandboxed in index CI as the `symphony-elixir` flake
+check (see `../default.nix`).
+
+## Tools
+
+- `mix format --check-formatted`: fails if any file is not formatted to the
+  rules in `elixir/.formatter.exs` (200-column lines).
+- `mix credo --strict`: lint and refactoring analysis. Strict mode surfaces all
+  priorities, including the low-priority refactor checks pinned in
+  `elixir/.credo.exs`.
+- `mix sobelow --config`: static security scanner for Phoenix apps, reading
+  `elixir/.sobelow-conf`. Reports common web vulnerabilities (XSS, CSRF,
+  config, traversal). Reporting only: it does not set an `exit` threshold.
+- `mix deps.audit`: checks the dependency tree in `mix.lock` against the
+  Elixir security advisory database (`mix_audit`).
+- `mix dialyzer`: success-typing analysis (`dialyxir`). The PLT is built under
+  `elixir/priv/plts/` (gitignored).
+- `mix coveralls`: test-suite line coverage total (`excoveralls`).
+
+## CI
+
+The standalone repo ran the advisory lane as its own GitHub workflow. In
+index, only the required lane is wired into CI (the `symphony-elixir` flake
+check); the advisory lane is a local `make quality` run. Sobelow, deps.audit,
+Dialyzer, and coveralls all want network access or large mutable caches, so a
+sandboxed derivation is a bad fit for them today.
+
+## Phased rollout
+
+The gate ships in two phases so it never blocks PRs while the codebase is still
+being brought into compliance.
+
+### Phase A (landed in the standalone repo, WS-8): tooling plus non-blocking reporting
+
+Install the tools, add the `quality` Make target and alias, and surface a
+violations summary. Nothing here makes the required lane stricter. The point
+is to see the violations, not to enforce them yet.
+
+### Phase B (WS-9, after the overhaul cutover): enforce
+
+Phase B lands only after the top-down overhaul cutover, once the module set is
+final, so we do not spend effort on modules the cutover deletes. Steps:
+
+1. One-time Styler reformat, then enable the Styler formatter plugin in
+   `.formatter.exs`.
+2. Add Boundary as a dep and `use Boundary` annotations encoding the layer
+   rules: DSL -> IR -> Runtime -> `Engine.Client`; `Engine.Client` is the only
+   door to the room-server; `bridge`/`state`/`http` never name a concrete
+   engine.
+3. Fix the `credo --strict` and Dialyzer violations.
+4. Fold the enforceable parts into the `symphony-elixir` flake check so they
+   gate PRs.
+
+Boundary is deferred until post-cutover on purpose. The module topology is
+still changing in the overhaul, so annotating modules now would encode layer
+rules onto modules the cutover removes. Boundary annotations land in Phase B
+against the final module set.
diff --git a/packages/symphony/docs/setup.md b/packages/symphony/docs/setup.md
new file mode 100644
index 000000000..bda51d70c
--- /dev/null
+++ b/packages/symphony/docs/setup.md
@@ -0,0 +1,135 @@
+# Setup
+
+## Local development
+
+```bash
+git clone https://github.com/indexable-inc/index
+cd index
+
+export SYMPHONY_PRIMARY_REPO=/path/to/your/repo
+nix run .#symphony
+```
+
+Open http://127.0.0.1:4040 for the dashboard.
+
+The bundled `workflows/example` pack ships a single manual-trigger `.sym`
+workflow (`workflows/inspect.sym`) with a read-only `inspect` skill that does
+not push anything anywhere. It is intended as a starting point you can copy
+into your own pack.
+
+## Running a real workflow pack
+
+Drop your pack directory (a `workflows/` of `.sym` files, a `skills/` of
+markdown, and a `repositories.yaml`) anywhere on the host and point Symphony
+at it:
+
+```bash
+export SYMPHONY_PACK_DIR=/path/to/your/pack
+export SYMPHONY_PRIMARY_REPO=/path/to/your/primary/repo
+nix run github:indexable-inc/index#symphony
+```
+
+Required runtime credentials depend on which triggers and tools your pack
+uses; see `.env.example` and `elixir/lib/symphony_elixir/config.ex` for the
+full env var list.
+
+Symphony treats the workflow pack as read-only runtime input. Put mutable run
+state under `SYMPHONY_RUNS_DIR` and worktrees under `SYMPHONY_WORKSPACES_DIR`;
+both default under the runtime state directory when using the Nix wrapper.
+
+Common ones:
+
+- `LINEAR_API_KEY` (Linear graphql tool + webhook enqueue)
+- `GITHUB_TOKEN` (dashboard statistics)
+- `LINEAR_WEBHOOK_SECRET`, `GITHUB_WEBHOOK_SECRET`, `SLACK_SIGNING_SECRET`
+  (webhook receivers)
+- `SYMPHONY_GITHUB_APP_ID`, `SYMPHONY_GITHUB_APP_PRIVATE_KEY_BASE64`,
+  `SYMPHONY_GITHUB_APP_OWNER_REPO` (commit/push as a bot identity)
+- `SYMPHONY_BOT_USERNAME`, `SYMPHONY_BOT_EMAIL` (git author when the App is
+  configured)
+
+Codex must already be installed and authenticated on the host.
+
+## Choosing a placement
+
+Each agent node picks where its codex session runs with a `location:` field in
+the `.sym` workflow:
+
+```
+implement <- agent {
+  engine: codex
+  model: "gpt-5.3-codex"
+  permissions: workspace_write
+  location: host   # or: ixvm, room, local
+  prompt: skill "implement"
+}
+```
+
+`host` runs codex directly on the Symphony machine as a real OS user
+(`SYMPHONY_HOST_USER`) inside that user's home directory, with no VM, so the
+agent can read and write that user's files. `ixvm` runs it inside a
+short-lived iXVM. Both stand up a per-run room-server and register it so the
+room UI can attach. `local` and `room` use the default
+`SYMPHONY_ROOM_SERVER_URL`.
+
+When a node's `ixvm` placement fails to provision before the first turn, the
+run retries on the placement named by `SYMPHONY_PLACEMENT_FALLBACK` (defaults
+to `host`). On NixOS, set `services.symphony.hostRuntime` to wire the polkit
+grant, PATH, and `SYMPHONY_HOST_USER` the host placement needs:
+
+```nix
+services.symphony.hostRuntime = {
+  enable = true;
+  user = "hari";
+  # room-server now lives in the IX monorepo; provide its wrapped binary.
+  roomServerPackage = ix.packages.${pkgs.stdenv.hostPlatform.system}.room-server;
+};
+```
+
+## Choosing an engine: Codex or Claude
+
+An agent node names its engine directly in the `.sym` workflow with the
+`engine:` field (`codex` or `claude`); the room-server's engine host runs the
+turn through the matching adapter.
+
+```
+report <- agent {
+  engine: claude
+  model: haiku
+  permissions: read_only
+  prompt: inline "write a status report"
+}
+```
+
+A Claude model means `claude-*` or the `opus` / `sonnet` / `haiku` aliases.
+Claude turns are billed against `ANTHROPIC_API_KEY`. The codex-only `sandbox`
+/ `approval_policy` skill fields do not apply to Claude turns.
+
+## Production deployment (NixOS)
+
+```nix
+{
+  inputs.index.url = "github:indexable-inc/index";
+
+  outputs = { self, nixpkgs, index, ... }: {
+    nixosConfigurations.host = nixpkgs.lib.nixosSystem {
+      modules = [
+        index.nixosModules.symphony
+        ({ pkgs, ... }: {
+          services.symphony = {
+            enable = true;
+            package = index.packages.${pkgs.stdenv.hostPlatform.system}.symphony;
+            packDir = "/var/lib/symphony-pack";
+            primaryRepo = "/var/lib/repos/my-app";
+            environmentFile = "/run/secrets/symphony.env";
+          };
+        })
+      ];
+    };
+  };
+}
+```
+
+Pair the module with whichever secret store you prefer (sops-nix, agenix,
+Bitwarden Secrets Manager via `secretsCommand`, etc). See the module options
+in `modules/services/symphony/default.nix` at the repo root.
diff --git a/packages/symphony/elixir/.credo.exs b/packages/symphony/elixir/.credo.exs
new file mode 100644
index 000000000..d0cc61a0e
--- /dev/null
+++ b/packages/symphony/elixir/.credo.exs
@@ -0,0 +1,30 @@
+%{
+  configs: [
+    %{
+      name: "default",
+      files: %{
+        included: ["lib/", "test/", "config/", "mix.exs"],
+        excluded: []
+      },
+      strict: false,
+      color: true,
+      checks: [
+        # Make refactoring suggestions informational rather than CI-failing.
+        # CI catches real correctness issues via mix compile --warnings-as-errors;
+        # credo's refactor suggestions are useful local feedback but should not
+        # gate the build on every threshold tweak.
+        {Credo.Check.Refactor.CyclomaticComplexity, max_complexity: 12, priority: :low},
+        {Credo.Check.Refactor.Nesting, max_nesting: 3, priority: :low},
+        {Credo.Check.Refactor.WithClauses, priority: :low},
+        {Credo.Check.Refactor.RedundantWithClauseResult, priority: :low},
+        {Credo.Check.Refactor.CondStatements, priority: :low},
+        {Credo.Check.Readability.WithSingleClause, priority: :low},
+        # Config is intentionally a wide snapshot of env vars. Splitting into
+        # nested substructs would just push the same field count into nested
+        # types without making boot-time wiring clearer, and would break the
+        # field-name == opt-key round-trip the snapshot relies on.
+        {Credo.Check.Warning.StructFieldAmount, max_fields: 60}
+      ]
+    }
+  ]
+}
diff --git a/packages/symphony/elixir/.formatter.exs b/packages/symphony/elixir/.formatter.exs
new file mode 100644
index 000000000..59e60a5c2
--- /dev/null
+++ b/packages/symphony/elixir/.formatter.exs
@@ -0,0 +1,5 @@
+# Used by "mix format"
+[
+  inputs: ["{mix,.formatter}.exs", "{config,lib,test}/**/*.{ex,exs}"],
+  line_length: 200
+]
diff --git a/packages/symphony/elixir/.gitattributes b/packages/symphony/elixir/.gitattributes
new file mode 100644
index 000000000..6db95539d
--- /dev/null
+++ b/packages/symphony/elixir/.gitattributes
@@ -0,0 +1 @@
+test/fixtures/status_dashboard_snapshots/* linguist-generated=true
diff --git a/packages/symphony/elixir/.gitignore b/packages/symphony/elixir/.gitignore
new file mode 100644
index 000000000..f5c8fbfa8
--- /dev/null
+++ b/packages/symphony/elixir/.gitignore
@@ -0,0 +1,56 @@
+# The directory Mix will write compiled artifacts to.
+/_build/
+
+# If you run "mix test --cover", coverage assets end up here.
+/cover/
+
+# Dialyzer PLT files (mix.exs sets plt_core_path/plt_local_path here).
+/priv/plts/
+
+# The directory Mix downloads your dependencies sources to.
+/deps/
+
+# Where third-party dependencies like ExDoc output generated docs.
+/doc/
+
+# Temporary files, for example, from tests.
+/tmp/
+
+# Generated browser assets.
+/priv/static/assets/
+
+# Local runtime logs.
+/log/
+/logs/
+
+# If the VM crashes, it generates a dump, let's ignore it too.
+erl_crash.dump
+
+# Elixir language server and tooling.
+/.elixir_ls/
+/.fetch/
+
+# Editor / OS temporary files.
+.DS_Store
+*.swp
+*.swo
+*~
+
+# IDE folders.
+.idea/
+.vscode/
+/bin/
+
+# Local environment and auth artifacts.
+.env
+.env.*
+.secrets
+.credentials
+status.txt
+.codex/original-user-prompt.txt
+
+# Also ignore archive artifacts (built via "mix archive.build").
+*.ez
+
+# Ignore package tarball (built via "mix hex.build").
+symphony_elixir-*.tar
diff --git a/packages/symphony/elixir/.sobelow-conf b/packages/symphony/elixir/.sobelow-conf
new file mode 100644
index 000000000..3e2793fb1
--- /dev/null
+++ b/packages/symphony/elixir/.sobelow-conf
@@ -0,0 +1,14 @@
+# Sobelow static security scanner config.
+# https://hexdocs.pm/sobelow/Mix.Tasks.Sobelow.html
+#
+# `mix sobelow --config` reads this file. WS-8 runs sobelow as an
+# informational gate only, so do not set `exit: "low"` here; that would turn
+# any finding into a nonzero exit and could gate a PR once the quality job is
+# promoted to required in WS-9. Keep this scan reporting-only until then.
+[
+  verbose: false,
+  private: false,
+  skip: false,
+  router: "lib/symphony_elixir_web/router.ex",
+  format: "txt"
+]
diff --git a/packages/symphony/elixir/AGENTS.md b/packages/symphony/elixir/AGENTS.md
new file mode 100644
index 000000000..71cef3269
--- /dev/null
+++ b/packages/symphony/elixir/AGENTS.md
@@ -0,0 +1,65 @@
+# Symphony Elixir
+
+This directory contains the Elixir/OTP runtime that lowers `.sym`
+workflows to an IR run graph and walks it. See `../README.md` for the
+project overview, file layout, env vars, and API.
+
+## Environment
+
+- Elixir: `1.19.x` (OTP 28), pinned in `mise.toml`.
+- Install deps: `mix deps.get`.
+- Main quality gate: `make all` (which runs `make setup`, `make build`,
+  `make fmt-check`, `make lint`, `make test`).
+
+## Codebase-Specific Conventions
+
+- Runtime config is loaded from the process environment at boot via
+  `SymphonyElixir.Config`. Prefer adding new knobs there rather than
+  reading `System.get_env/1` ad hoc.
+- Workflows (`workflows/*.sym`) are hot-reloaded by
+  `SymphonyElixir.WorkflowCatalog` and skills (`skills/*.md`) by
+  `SymphonyElixir.Catalog`, both on a 1s tick; no restart needed for
+  content changes.
+- Workspace safety is critical:
+  - Never run a Codex turn with cwd inside the source repo. Every run
+    gets a fresh `git worktree add` under `SYMPHONY_WORKSPACES_DIR`.
+  - `SymphonyElixir.PathSafety.canonicalize/1` is the gate; any new
+    code that resolves a workspace-relative path should route through
+    it.
+- Runtime behavior is stateful and concurrency-sensitive: preserve
+  retry, resume-on-boot, and workspace-cleanup semantics in
+  `SymphonyElixir.Runtime` and `SymphonyElixir.IR.Store`.
+
+## Tests and Validation
+
+Run targeted tests while iterating, then run full gates before
+handoff:
+
+```bash
+make all
+mix test
+```
+
+## Required Rules
+
+- Public functions (`def`) in `lib/` should have an adjacent `@spec`.
+- `defp` specs are optional.
+- `@impl` callback implementations are exempt from the `@spec` rule.
+- Keep changes narrowly scoped; avoid unrelated refactors in the same
+  PR.
+- Follow existing module/style patterns in `lib/symphony_elixir/*`.
+
+## CI
+
+The sandboxed `symphony-elixir` flake check runs the required lane
+(compile with warnings as errors, `mix format --check-formatted`,
+`mix credo`, `mix test`) against the deps pinned in `mix.lock`; see
+`../default.nix`. After changing `mix.lock`, refresh the
+`fetchMixDeps` hash there.
+
+## Docs Update Policy
+
+If behavior/config changes, update docs in the same PR:
+
+- `../README.md` for the project concept, file layout, env vars, API.
+- `../docs/setup.md` for host setup / runtime credentials.
diff --git a/packages/symphony/elixir/Makefile b/packages/symphony/elixir/Makefile
new file mode 100644
index 000000000..68e15ec3a
--- /dev/null
+++ b/packages/symphony/elixir/Makefile
@@ -0,0 +1,46 @@
+.PHONY: help all setup deps build fmt fmt-check lint test ci quality
+
+MIX ?= mix
+
+help:
+	@echo "Targets: all, setup, deps, build, fmt, fmt-check, lint, test, ci, quality"
+
+setup:
+	$(MIX) local.hex --force --if-missing
+	$(MIX) local.rebar --force --if-missing
+	$(MIX) setup
+
+deps:
+	$(MIX) deps.get
+
+build:
+	$(MIX) build
+
+fmt:
+	$(MIX) format
+
+fmt-check:
+	$(MIX) format --check-formatted
+
+lint:
+	$(MIX) lint
+
+test:
+	$(MIX) test
+
+ci:
+	$(MAKE) setup
+	$(MAKE) build
+	$(MAKE) fmt-check
+	$(MAKE) lint
+	$(MAKE) test
+
+all: ci
+
+# Non-required reporting gate (WS-8). Intentionally separate from ci/all so it
+# never blocks PRs while the codebase is brought into compliance (WS-9).
+# Depends on setup so a clean CI runner has Hex, rebar, and fetched deps
+# before the tools run; without it `mix quality` aborts on a missing SCM.
+quality: setup
+	$(MIX) quality
+	$(MIX) coveralls
diff --git a/packages/symphony/elixir/config/config.exs b/packages/symphony/elixir/config/config.exs
new file mode 100644
index 000000000..d1f0c98f5
--- /dev/null
+++ b/packages/symphony/elixir/config/config.exs
@@ -0,0 +1,18 @@
+import Config
+
+config :phoenix, :json_library, Jason
+
+config :symphony_elixir, SymphonyElixirWeb.Endpoint,
+  adapter: Bandit.PhoenixAdapter,
+  url: [host: "localhost"],
+  render_errors: [
+    formats: [html: SymphonyElixirWeb.ErrorHTML, json: SymphonyElixirWeb.ErrorJSON],
+    layout: false
+  ],
+  pubsub_server: SymphonyElixir.PubSub,
+  live_view: [signing_salt: "symphony-live-view"],
+  check_origin: false,
+  server: true,
+  http: [ip: {127, 0, 0, 1}, port: 4040]
+
+import_config "#{config_env()}.exs"
diff --git a/packages/symphony/elixir/config/dev.exs b/packages/symphony/elixir/config/dev.exs
new file mode 100644
index 000000000..becde7693
--- /dev/null
+++ b/packages/symphony/elixir/config/dev.exs
@@ -0,0 +1 @@
+import Config
diff --git a/packages/symphony/elixir/config/prod.exs b/packages/symphony/elixir/config/prod.exs
new file mode 100644
index 000000000..becde7693
--- /dev/null
+++ b/packages/symphony/elixir/config/prod.exs
@@ -0,0 +1 @@
+import Config
diff --git a/packages/symphony/elixir/config/runtime.exs b/packages/symphony/elixir/config/runtime.exs
new file mode 100644
index 000000000..20c936f93
--- /dev/null
+++ b/packages/symphony/elixir/config/runtime.exs
@@ -0,0 +1,22 @@
+import Config
+
+# Runtime config. Boot reads these from the environment so a single binary can
+# move between hosts without recompiling.
+
+secret_key_base =
+  System.get_env("SYMPHONY_SECRET_KEY_BASE") ||
+    Base.encode64(:crypto.strong_rand_bytes(48), padding: false)
+
+config :symphony_elixir, SymphonyElixirWeb.Endpoint, secret_key_base: secret_key_base
+
+if config_env() != :test do
+  port_string = System.get_env("SYMPHONY_HTTP_PORT", "4040")
+
+  # TCP ports are 16-bit: reject values above 65535 here, with a clear message,
+  # instead of letting the listener fail at bind time. 0 stays valid, as before.
+  port =
+    case Integer.parse(port_string) do
+      {value, ""} when value in 0..65_535 -> value
+      _ -> raise "SYMPHONY_HTTP_PORT must be an integer in 0..65535, got #{inspect(port_string)}"
+    end
+  config :symphony_elixir, SymphonyElixirWeb.Endpoint, http: [ip: {127, 0, 0, 1}, port: port]
+end
diff --git a/packages/symphony/elixir/config/test.exs b/packages/symphony/elixir/config/test.exs
new file mode 100644
index 000000000..25bcfc719
--- /dev/null
+++ b/packages/symphony/elixir/config/test.exs
@@ -0,0 +1,13 @@
+import Config
+
+# Tests do not need to bind a real HTTP socket. Letting the endpoint
+# bind 127.0.0.1:4040 means `mix test` fails whenever a real symphony
+# is already running on the same host. Set `server: false` so the
+# Bandit adapter is skipped; LiveView and Plug logic that the test
+# suite touches still work without a live listener.
+config :symphony_elixir, SymphonyElixirWeb.Endpoint, server: false
+
+# Tests start the bits they need from test_helper.exs. The full supervision
+# tree depends on SYMPHONY_ROOT and friends being set, which test runners
+# should not have to inherit from the host env.
+config :symphony_elixir, auto_start: false
diff --git a/packages/symphony/elixir/docs/logging.md b/packages/symphony/elixir/docs/logging.md
new file mode 100644
index 000000000..2708fe72b
--- /dev/null
+++ b/packages/symphony/elixir/docs/logging.md
@@ -0,0 +1,40 @@
+# Logging Best Practices
+
+This guide defines logging conventions for Symphony so Codex can diagnose failures quickly.
+
+## Goals
+
+- Make logs searchable by issue and session.
+- Capture enough execution context to identify root cause without reruns.
+- Keep messages stable so dashboards/alerts are reliable.
+
+## Required Context Fields
+
+When logging issue-related work, include both identifiers:
+
+- `issue_id`: Linear internal UUID (stable foreign key).
+- `issue_identifier`: human ticket key (for example `MT-620`).
+
+When logging Codex execution lifecycle events, include:
+
+- `session_id`: combined Codex thread/turn identifier.
+
+## Message Design
+
+- Use explicit `key=value` pairs in message text for high-signal fields.
+- Prefer deterministic wording for recurring lifecycle events.
+- Include the action outcome (`completed`, `failed`, `retrying`) and the reason/error when available.
+- Avoid logging large payloads unless required for debugging.
+
+## Scope Guidance
+
+- `AgentRunner`: log start/completion/failure with issue context, plus `session_id` when known.
+- `Orchestrator`: log dispatch, retry, terminal/non-active transitions, and worker exits with issue context. Include `session_id` whenever running-entry data has it.
+- `Runtime` / `Runtime.RoomEngineClient`: log node turn start/completion/error with run context and the engine `thread_id`.
+
+## Checklist For New Logs
+
+- Is this event tied to a Linear issue? Include `issue_id` and `issue_identifier`.
+- Is this event tied to a Codex session? Include `session_id`.
+- Is the failure reason present and concise?
+- Is the message format consistent with existing lifecycle logs?
diff --git a/packages/symphony/elixir/docs/token_accounting.md b/packages/symphony/elixir/docs/token_accounting.md
new file mode 100644
index 000000000..2c6e107be
--- /dev/null
+++ b/packages/symphony/elixir/docs/token_accounting.md
@@ -0,0 +1,304 @@
+# Codex Token Accounting
+
+This document explains how Codex reports token usage through the app-server protocol and how Symphony should account for it.
+
+It is based on the current Codex source in `codex-rs`, especially:
+
+- `app-server/README.md`
+- `protocol/src/protocol.rs`
+- `app-server/src/bespoke_event_handling.rs`
+- `app-server-protocol/src/protocol/v2.rs`
+- `exec/src/event_processor_with_jsonl_output.rs`
+- `state/src/extract.rs`
+
+## Short Version
+
+- `last_token_usage` means "the latest increment".
+- `total_token_usage` means "the cumulative total so far".
+- `thread/tokenUsage/updated` is the live streaming notification for token usage.
+- `turn/completed` carries final turn state, and turn-level usage is exposed separately from the live thread token stream.
+- Generic `usage` fields are event-specific. Do not assume every `usage` payload is a cumulative thread total.
+
+## Primary Source Semantics
+
+Codex defines `TokenUsageInfo` like this:
+
+```rust
+pub struct TokenUsageInfo {
+    pub total_token_usage: TokenUsage,
+    pub last_token_usage: TokenUsage,
+    pub model_context_window: Option<i64>,
+}
+```
+
+The important behavior is in `append_last_usage`:
+
+```rust
+pub fn append_last_usage(&mut self, last: &TokenUsage) {
+    self.total_token_usage.add_assign(last);
+    self.last_token_usage = last.clone();
+}
+```
+
+That gives the core semantics:
+
+- `last_token_usage`: the newest chunk of usage that was just added
+- `total_token_usage`: the accumulated total after adding that chunk
+
+This is the most important accounting rule in the Codex source.
+
+## Event Types
+
+### `codex/event/token_count`
+
+Codex core emits token count events containing `TokenUsageInfo`.
+
+These events can carry:
+
+- `info.total_token_usage`
+- `info.last_token_usage`
+- `info.model_context_window`
+
+Symphony sees these events wrapped inside the app-server message stream.
+
+Meaning:
+
+- `total_token_usage` is an absolute cumulative snapshot
+- `last_token_usage` is the delta that produced that snapshot
+
+### `thread/tokenUsage/updated`
+
+The app-server converts token count events into a dedicated thread-scoped notification:
+
+```rust
+let notification = ThreadTokenUsageUpdatedNotification {
+    thread_id: conversation_id.to_string(),
+    turn_id,
+    token_usage,
+};
+```
+
+`ThreadTokenUsage` is defined as:
+
+```rust
+pub struct ThreadTokenUsage {
+    pub total: TokenUsageBreakdown,
+    pub last: TokenUsageBreakdown,
+    pub model_context_window: Option<i64>,
+}
+```
+
+And it is populated directly from `TokenUsageInfo`:
+
+```rust
+impl From<CoreTokenUsageInfo> for ThreadTokenUsage {
+    fn from(value: CoreTokenUsageInfo) -> Self {
+        Self {
+            total: value.total_token_usage.into(),
+            last: value.last_token_usage.into(),
+            model_context_window: value.model_context_window,
+        }
+    }
+}
+```
+
+Meaning:
+
+- `thread/tokenUsage/updated` is the canonical live notification for token usage
+- `tokenUsage.total` is an absolute thread total
+- `tokenUsage.last` is the latest increment that produced that total
+
+The app-server README is explicit: token usage streams separately via `thread/tokenUsage/updated`.
+
+### `turn/completed`
+
+The app-server README says `turn/completed` carries final turn state and token usage.
+
+There are two important details:
+
+1. The app-server protocol `turn/completed` notification contains a final `turn` object.
+2. The `exec` event processor also emits a turn-completed event that includes a `usage` struct.
+
+In the `exec` event processor, the turn-completed usage is built from the most recent captured `total_token_usage`:
+
+```rust
+if let Some(info) = &ev.info {
+    self.last_total_token_usage = Some(info.total_token_usage.clone());
+}
+```
+
+Then on turn completion:
+
+```rust
+let usage = if let Some(u) = &self.last_total_token_usage {
+    Usage {
+        input_tokens: u.input_tokens,
+        cached_input_tokens: u.cached_input_tokens,
+        output_tokens: u.output_tokens,
+    }
+}
+```
+
+Important consequence:
+
+- a turn-completed `usage` payload is not the same schema as `ThreadTokenUsage`
+- it should be interpreted in the context of the specific event that emitted it
+- it must not be blindly mixed with `thread/tokenUsage/updated` accounting
+
+### Generic `usage`
+
+Codex uses the word `usage` in multiple places.
+
+That does not mean all `usage` maps have the same semantics.
+
+Examples:
+
+- `thread/tokenUsage/updated.tokenUsage.total`: absolute cumulative thread total
+- `thread/tokenUsage/updated.tokenUsage.last`: latest delta
+- turn-completed `usage`: event-specific completion usage payload
+
+Rule:
+
+- never classify a `usage` map by name alone
+- classify it by event type and payload path
+
+## What The Metrics Mean
+
+### Absolute totals
+
+These are safe high-water-mark style counters:
+
+- `info.total_token_usage`
+- `tokenUsage.total` on `thread/tokenUsage/updated`
+
+Use these when you want:
+
+- live dashboard totals
+- stable per-thread accumulation
+- recovery after missed intermediate events
+
+### Deltas
+
+These are incremental additions:
+
+- `info.last_token_usage`
+- `tokenUsage.last` on `thread/tokenUsage/updated`
+
+Use these only when (Symphony's own strategy, below, ignores them for totals):
+
+- no absolute total is available
+- you are explicitly handling additive updates
+
+### Context window
+
+`model_context_window` is not spend. It is the model's context limit.
+
+Codex also has logic that can "fill to context window", which sets:
+
+- `total_token_usage.total_tokens = context_window`
+- `last_token_usage.total_tokens = delta`
+
+So `total_tokens` can reflect context-window normalization behavior, not just a raw upstream token report.
+
+For Symphony, `model_context_window` should be displayed or logged separately from spend.
+
+## Recommended Accounting Strategy For Symphony
+
+Track usage per active Codex thread.
+
+For each thread, keep:
+
+- `absolute_total`: latest accepted absolute total snapshot
+- `accumulated_total`: the total you expose in UI/API
+- `last_seen_turn_id`
+
+### Preferred source order
+
+When a token-related event arrives, use this precedence:
+
+1. `thread/tokenUsage/updated.tokenUsage.total`
+2. `TokenCountEvent.info.total_token_usage`
+
+Ignore these for accounting:
+
+- `thread/tokenUsage/updated.tokenUsage.last`
+- `TokenCountEvent.info.last_token_usage`
+- generic `usage` maps
+- turn-completed `usage`
+
+Do not treat generic `params.usage` as equivalent to a cumulative thread total unless the event type makes that meaning explicit.
+
+### Algorithm
+
+#### If an absolute total is present
+
+- Treat it as a thread-level snapshot.
+- If it is greater than or equal to the stored `absolute_total`, replace the stored absolute total; otherwise keep the stored high-water mark.
+- Set exposed totals from that absolute snapshot.
+- Do not add the corresponding delta again.
+
+#### If no absolute total is present
+
+- Ignore the event for accounting.
+- Keep the last accepted absolute high-water mark unchanged.
+
+### Why this matters
+
+If you misclassify a per-turn `usage` payload as an absolute thread total, later turns can appear to stall because a smaller per-turn number is compared against a larger cumulative baseline.
+
+## What Symphony Should And Should Not Do
+
+### Do
+
+- Prefer `thread/tokenUsage/updated` for live reporting.
+- Treat `tokenUsage.total` as authoritative for thread totals.
+- Key accounting by `thread_id`, not just issue id.
+- Expect one thread to span multiple turns when Symphony reuses a live Codex thread.
+
+### Do not
+
+- Do not treat every `usage` map as absolute.
+- Do not count `tokenUsage.last` or `last_token_usage` into dashboard totals.
+- Do not add turn-completed `usage` on top of already-counted live thread totals unless you can prove it represents missing spend.
+- Do not reset accounting just because a new turn starts on the same thread.
+
+## Practical Interpretation For Symphony Logs
+
+When reading raw app-server events:
+
+- `codex/event/token_count`
+  - useful if you are inspecting nested `info.total_token_usage`
+- `thread/tokenUsage/updated`
+  - best source for live dashboard and API totals
+- `turn/completed`
+  - best used as end-of-turn state, not as an unconditional additive token event
+
+## Why `total_token_usage` Is The Durable Choice
+
+Codex itself consistently prefers cumulative totals when it needs durable state:
+
+- the state extractor stores `info.total_token_usage.total_tokens`
+- the exec event processor caches the last `total_token_usage` and uses that on turn completion
+
+That is a strong signal for Symphony:
+
+- use absolute totals as the main accounting surface
+- ignore last/delta values for totals
+
+## Recommended Symphony Documentation Contract
+
+If Symphony documents token reporting externally, the contract should be:
+
+- Live token totals come from Codex thread-scoped cumulative usage.
+- Incremental usage may also be emitted, but Symphony does not use it for totals.
+- Turn-completed usage is event-specific and should not be assumed to be a fresh additive increment.
+- Reporting is thread-based, and multiple turns can occur on one thread.
+
+## Implementation Checklist
+
+- Prefer `thread/tokenUsage/updated.tokenUsage.total`
+- Fallback to `info.total_token_usage`
+- Ignore `last` for totals
+- Key totals by `thread_id`
+- Do not classify generic `usage` by field name alone
+- Do not double-count turn-completed usage after live updates
diff --git a/packages/symphony/elixir/lib/symphony_elixir.ex b/packages/symphony/elixir/lib/symphony_elixir.ex
new file mode 100644
index 000000000..91e387cf4
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir.ex
@@ -0,0 +1,16 @@
+defmodule SymphonyElixir do
+  @moduledoc """
+  Symphony runs workflows of agent invocations.
+
+  - A `workflows/<name>.sym` file declares the nodes and edges of a workflow
+    in the `.sym` surface language, lowered to an IR run graph.
+  - A `skills/<name>.md` file declares the system prompt, codex policy, and
+    tool surface a `skill "name"` prompt resolves to.
+  - A trigger (Linear label, manual API call, cron tick, Slack, GitHub)
+    starts a run.
+  - Each run gets a fresh workspace from the primary repository's configured
+    default branch.
+  - The IR runtime walks the graph, executing one node at a time through the
+    engine host.
+  """
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/application.ex b/packages/symphony/elixir/lib/symphony_elixir/application.ex
new file mode 100644
index 000000000..7c3e953e9
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/application.ex
@@ -0,0 +1,84 @@
+defmodule SymphonyElixir.Application do
+  @moduledoc """
+  OTP application entrypoint. Boot order of the default control-plane role
+  (one_for_one; `SYMPHONY_ROLE=worker` boots only a small worker subset):
+
+      Phoenix.PubSub            in-process eventbus
+      Task.Supervisor           short-lived tasks (codex turns, trigger work)
+      Config                    boot-time env snapshot
+      GithubApp                 mints and caches GitHub App installation tokens
+      Catalog                   watches skills/*.md, hot-reloads
+      WorkflowCatalog           watches workflows/*.sym, hot-reloads the DSL ingress index
+      CronState                 persists per-workflow last_fired_at for cron workflows
+      Runtime.Registry          name registry for per-run runtimes
+      Runtime.Placement         per-run room-server placement registry (ixvm/host)
+      Runtime.RuntimeRegistry   runtime-worker registry that backs :remote placement
+      Runtime.Supervisor        DynamicSupervisor for runs
+      Triggers.Slack            polls Slack for completed huddles (opt-in)
+      Triggers.Cron             fires cron-triggered workflows on a wall-clock cadence
+      Endpoint                  Phoenix HTTP + LiveView; also receives Linear webhooks
+  """
+
+  use Application
+
+  @impl true
+  def start(_type, _args) do
+    if Application.get_env(:symphony_elixir, :auto_start, true) do
+      start_supervised()
+    else
+      Supervisor.start_link([], strategy: :one_for_one, name: SymphonyElixir.Supervisor)
+    end
+  end
+
+  defp start_supervised do
+    :ok = SymphonyElixir.LogFile.configure()
+
+    role = role()
+    children = children_for(role)
+
+    with {:ok, pid} <- Supervisor.start_link(children, strategy: :one_for_one, name: SymphonyElixir.Supervisor) do
+      if role == :control_plane, do: SymphonyElixir.Runtime.Supervisor.resume_pending()
+      {:ok, pid}
+    end
+  end
+
+  # The role selects the child list, so it is needed before the tree (Config
+  # included) has started; read it straight from the env rather than from the
+  # Config snapshot. Anything other than "worker" (including unset) means
+  # control plane.
+  defp role do
+    requested = System.get_env("SYMPHONY_ROLE")
+    if requested == "worker", do: :worker, else: :control_plane
+  end
+
+  # The full control plane: triggers, webhooks, the run engine, the placement
+  # registry, and the runtime-worker registry that backs :remote placement.
+  defp children_for(:control_plane) do
+    [
+      {Phoenix.PubSub, name: SymphonyElixir.PubSub},
+      {Task.Supervisor, name: SymphonyElixir.TaskSupervisor},
+      SymphonyElixir.Config,
+      SymphonyElixir.GithubApp,
+      SymphonyElixir.Catalog,
+      SymphonyElixir.WorkflowCatalog,
+      SymphonyElixir.CronState,
+      {Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry},
+      SymphonyElixir.Runtime.Placement,
+      SymphonyElixir.Runtime.RuntimeRegistry,
+      SymphonyElixir.Runtime.Supervisor,
+      SymphonyElixir.Triggers.Slack,
+      SymphonyElixir.Triggers.Cron,
+      SymphonyElixirWeb.Endpoint
+    ]
+  end
+
+  # A runtime worker: just enough to dial the control plane and provision
+  # per-run room-servers on this host. No DB, triggers, engine, or HTTP surface.
+  defp children_for(:worker) do
+    [
+      {Task.Supervisor, name: SymphonyElixir.TaskSupervisor},
+      SymphonyElixir.Config,
+      SymphonyElixir.Runtime.WorkerClient
+    ]
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/catalog.ex b/packages/symphony/elixir/lib/symphony_elixir/catalog.ex
new file mode 100644
index 000000000..6e8c97f98
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/catalog.ex
@@ -0,0 +1,132 @@
+defmodule SymphonyElixir.Catalog do
+  @moduledoc """
+  Watches `skills/*.md` and publishes the latest parsed skills. Polls every
+  `catalog_poll_ms` (default 1s) and compares hashes.
+
+  Reload semantics:
+
+  - A new file appears: parsed and added.
+  - An existing file's bytes change: re-parsed; old version is replaced.
+  - A file is deleted: removed from the catalog.
+  - A parse error: logged on every poll, never crashes; the previously-loaded
+    version (if any) stays in place until the bytes parse again.
+
+  Skill resolution is load-bearing for the IR engine path:
+  `Runtime.RoomEngineClient` resolves a node's `skill "name"` prompt through
+  `Catalog.skill/1`, which expands shared `{{partial:_}}` includes at load
+  time. The YAML/DAG stack also watched `dags/`; that surface was deleted in
+  the `.sym`/IR cutover (ENG-1828), so this catalog now watches skills only.
+
+  Active runs snapshot the skills they resolve at run start; reloads here
+  affect only NEW runs.
+  """
+
+  use GenServer
+  require Logger
+
+  alias SymphonyElixir.{Config, Skill}
+
+  @table :symphony_catalog
+
+  defstruct [:skills_dir, :poll_ms]
+
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []) do
+    GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+  end
+
+  @spec skill(String.t()) :: {:ok, Skill.t()} | {:error, :not_found}
+  def skill(name) when is_binary(name) do
+    case :ets.lookup(@table, {:skill, name}) do
+      [{_key, skill}] -> {:ok, skill}
+      [] -> {:error, :not_found}
+    end
+  end
+
+  @spec skills() :: [Skill.t()]
+  def skills do
+    rows = :ets.match_object(@table, {{:skill, :_}, :_})
+    for {_key, skill} <- rows, do: skill
+  end
+
+  @impl true
+  def init(_opts) do
+    :ets.new(@table, [:named_table, :public, read_concurrency: true])
+    config = Config.get()
+
+    state = %__MODULE__{
+      skills_dir: config.skills_dir,
+      poll_ms: config.catalog_poll_ms
+    }
+
+    schedule_scan(0)
+    {:ok, state}
+  end
+
+  @impl true
+  def handle_info(:scan, %__MODULE__{} = state) do
+    scan_dir(state.skills_dir, :skill, &Skill.load/1)
+    schedule_scan(state.poll_ms)
+    {:noreply, state}
+  end
+
+  defp schedule_scan(after_ms) do
+    Process.send_after(self(), :scan, after_ms)
+  end
+
+  defp scan_dir(dir, :skill, loader) do
+    files = Path.wildcard(Path.join(dir, "*.md"))
+
+    seen_names =
+      Enum.reduce(files, MapSet.new(), fn path, acc ->
+        name = Path.basename(path, Path.extname(path))
+        load_if_changed(:skill, name, path, loader)
+        MapSet.put(acc, name)
+      end)
+
+    remove_missing(:skill, seen_names)
+  end
+
+  # Re-parse `path` only when its bytes differ from the version already in the
+  # table; read and parse failures are logged and leave any prior entry intact.
+  defp load_if_changed(kind, name, path, loader) do
+    with {:ok, raw} <- File.read(path),
+         digest = :crypto.hash(:sha256, raw),
+         true <- digest != current_hash(kind, name) do
+      reload(kind, name, path, loader, digest)
+    else
+      false -> :ok
+      {:error, reason} -> Logger.warning("Catalog failed to read #{path}: #{inspect(reason)}")
+    end
+  end
+
+  # Parse `path` via `loader` and publish the result under `{kind, name}`.
+  defp reload(kind, name, path, loader, digest) do
+    case loader.(path) do
+      {:ok, parsed} ->
+        :ets.insert(@table, {{kind, name}, parsed})
+        Logger.info("Catalog loaded #{kind}=#{name} hash=#{Base.encode16(digest, case: :lower) |> binary_part(0, 8)}")
+
+      {:error, reason} ->
+        Logger.warning("Catalog failed to load #{kind}=#{name}: #{inspect(reason)}")
+    end
+  end
+
+  defp current_hash(kind, name) do
+    case :ets.lookup(@table, {kind, name}) do
+      [{_key, %{body_hash: hash}}] -> hash
+      _ -> nil
+    end
+  end
+
+  defp remove_missing(kind, seen_names) do
+    @table
+    |> :ets.match_object({{kind, :_}, :_})
+    |> Enum.each(fn {{^kind, name} = key, _value} ->
+      unless MapSet.member?(seen_names, name) do
+        :ets.delete(@table, key)
+        Logger.info("Catalog removed #{kind}=#{name} (file deleted)")
+      end
+    end)
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/claude/code.ex b/packages/symphony/elixir/lib/symphony_elixir/claude/code.ex
new file mode 100644
index 000000000..64060e833
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/claude/code.ex
@@ -0,0 +1,209 @@
+defmodule SymphonyElixir.Claude.Code do
+  @moduledoc """
+  Runs one workflow node as a headless Claude Code session in the run's
+  workspace, used when a skill's `codex_model` names a Claude model
+  (`claude-*`, or the `opus` / `sonnet` / `haiku` aliases); every other
+  model goes to Codex.
+
+  This is the in-process Claude runner the YAML/DAG `NodeExecutor` used.
+  The `.sym`/IR engine path runs Claude turns through the room-server's
+  `engine_claude` adapter instead, so this module is not on the IR hot
+  path. It is kept (not deleted with the rest of the old stack) because it
+  is the only in-process Claude turn runner and removing it would orphan
+  Claude support outside the room-server; revisit once the IR path proves
+  Claude parity end to end on the room-server engine host.
+
+  There is no app-server protocol, no VM, and no Symphony dynamic-tool
+  surface here. This module spawns the `claude` CLI once, non-interactively,
+  and reads back a single JSON result:
+
+      printf '%s' "$prompt" | claude --print --output-format json \\
+        --dangerously-skip-permissions --model claude-opus-4-8
+
+  - `--print` runs Claude Code non-interactively and exits.
+  - `--dangerously-skip-permissions` lets the agent edit files and run
+    tools with no approval prompts. A Claude model is the opt-in for that;
+    there is no per-tool gate the way codex has `approval_policy`.
+  - `--output-format json` emits one result object on stdout whose
+    `result`, `session_id`, and `is_error` fields we surface.
+  - `--model` is the skill's `codex_model` value, passed through verbatim.
+
+  The agent uses Claude Code's own tools (Bash, Edit, Read, ...) plus
+  whatever CLIs are on PATH inside the workspace (`git`, `gh`). The
+  GitHub App bot identity stamped into the checkout therefore applies to
+  claude runs exactly as it does to codex runs.
+
+  Auth is the Anthropic API key in `ANTHROPIC_API_KEY`, the same secret
+  surface every other integration token flows through. It is injected
+  into the subprocess env, never onto the command line, so it cannot
+  leak into logs or run records.
+
+  The prompt and model travel through the subprocess environment
+  (`SYMPHONY_CLAUDE_PROMPT`, `SYMPHONY_CLAUDE_MODEL`) and the prompt is piped
+  on stdin rather than passed positionally, so a leading dash cannot corrupt
+  the command line. Env strings still count toward the OS exec size limits.
+
+  Bad fit if: `ANTHROPIC_API_KEY` is unset (the run errors with
+  `:anthropic_api_key_not_configured`), or the Symphony service runs as
+  root, where `--dangerously-skip-permissions` refuses to start.
+
+  This engine ignores any placement: a Claude model run through this
+  in-process path has no per-run room-server.
+  """
+
+  alias SymphonyElixir.Config
+
+  require Logger
+
+  @prompt_env "SYMPHONY_CLAUDE_PROMPT"
+  @model_env "SYMPHONY_CLAUDE_MODEL"
+
+  # One hour, matching the codex turn timeout. A workflow node that has
+  # not produced its result JSON by then is treated as hung.
+  @default_turn_timeout_ms 60 * 60 * 1000
+
+  @type env_pair :: {String.t(), String.t()}
+  @type context :: %{optional(:identifier) => String.t(), optional(:title) => String.t()}
+
+  @spec run(Path.t(), String.t(), context(), keyword()) :: {:ok, map()} | {:error, term()}
+  def run(workspace, prompt, _context, opts)
+      when is_binary(workspace) and is_binary(prompt) and is_list(opts) do
+    config = Keyword.fetch!(opts, :config)
+    model = Keyword.fetch!(opts, :model)
+    turn_timeout_ms = Keyword.get(opts, :turn_timeout_ms, @default_turn_timeout_ms)
+    extra_env = Keyword.get(opts, :extra_env, [])
+
+    with {:ok, api_key} <- fetch_api_key(config),
+         {:ok, bash} <- find_bash(),
+         :ok <- ensure_workspace(workspace) do
+      env =
+        env_charlists(
+          extra_env ++
+            [
+              {"ANTHROPIC_API_KEY", api_key},
+              {@prompt_env, prompt},
+              {@model_env, model}
+            ]
+        )
+
+      port =
+        Port.open(
+          {:spawn_executable, String.to_charlist(bash)},
+          [
+            :binary,
+            :exit_status,
+            args: [~c"-c", String.to_charlist(command(config.claude_command))],
+            cd: String.to_charlist(workspace),
+            env: env
+          ]
+        )
+
+      deadline = System.monotonic_time(:millisecond) + turn_timeout_ms
+      collect(port, deadline, turn_timeout_ms, [])
+    end
+  end
+
+  # Builds the script handed to `bash -c`. Prompt and model are read back from
+  # the environment inside double quotes (no word splitting, no globbing), and
+  # the prompt reaches the CLI on stdin, so it never appears in any argv.
+  @doc false
+  @spec command(String.t()) :: String.t()
+  def command(claude_command) when is_binary(claude_command) do
+    feed_prompt = ~s(printf '%s' "$#{@prompt_env}")
+    flags = ~s(--print --output-format json --dangerously-skip-permissions --model "$#{@model_env}")
+
+    "#{feed_prompt} | #{claude_command} #{flags}"
+  end
+
+  defp fetch_api_key(%Config{anthropic_api_key: key}) when is_binary(key) and key != "", do: {:ok, key}
+  defp fetch_api_key(%Config{}), do: {:error, :anthropic_api_key_not_configured}
+
+  defp find_bash do
+    case System.find_executable("bash") do
+      nil -> {:error, :bash_not_found}
+      bash -> {:ok, bash}
+    end
+  end
+
+  defp ensure_workspace(workspace) do
+    if File.dir?(workspace), do: :ok, else: {:error, {:workspace_not_directory, workspace}}
+  end
+
+  defp env_charlists(env) when is_list(env) do
+    Enum.map(env, fn {k, v} when is_binary(k) and is_binary(v) ->
+      {String.to_charlist(k), String.to_charlist(v)}
+    end)
+  end
+
+  # Claude Code's json output format prints exactly one object on stdout
+  # at the end of the turn, so we buffer everything and parse on exit
+  # rather than streaming. stderr is left on the BEAM's stderr (no
+  # :stderr_to_stdout) so progress and diagnostics reach journald without
+  # polluting the JSON we have to decode.
+  defp collect(port, deadline, timeout_ms, chunks) do
+    remaining_ms = max(deadline - System.monotonic_time(:millisecond), 0)
+
+    receive do
+      {^port, {:data, data}} ->
+        collect(port, deadline, timeout_ms, [data | chunks])
+
+      {^port, {:exit_status, 0}} ->
+        parse_result(output(chunks))
+
+      {^port, {:exit_status, status}} ->
+        {:error, {:claude_exit, status, tail(output(chunks))}}
+    after
+      remaining_ms ->
+        kill_port(port)
+        {:error, {:claude_turn_timeout, timeout_ms}}
+    end
+  end
+
+  defp parse_result(stdout) do
+    case Jason.decode(last_json_line(stdout)) do
+      {:ok, %{"is_error" => false} = result} ->
+        {:ok,
+         %{
+           kind: :claude,
+           session_id: Map.get(result, "session_id"),
+           result: Map.get(result, "result"),
+           total_cost_usd: Map.get(result, "total_cost_usd")
+         }}
+
+      {:ok, %{"is_error" => true} = result} ->
+        {:error, {:claude_turn_failed, Map.get(result, "subtype"), Map.get(result, "result")}}
+
+      {:ok, other} ->
+        {:error, {:claude_invalid_result, other}}
+
+      {:error, _reason} ->
+        {:error, {:claude_unparseable_output, tail(stdout)}}
+    end
+  end
+
+  # Defensive: a stray non-JSON line on stdout (a tool that ignores the json
+  # contract, a shell notice) should not mask the result object, which json
+  # mode prints last. Returns the last line that is not whitespace-only, or "".
+  defp last_json_line(stdout) do
+    stdout
+    |> String.split("\n", trim: true)
+    |> Enum.reject(&(String.trim(&1) == ""))
+    |> List.last("")
+  end
+
+  defp output(chunks), do: chunks |> Enum.reverse() |> IO.iodata_to_binary()
+
+  defp tail(text) when is_binary(text), do: String.slice(text, max(String.length(text) - 2_000, 0), 2_000)
+
+  defp kill_port(port) do
+    case Port.info(port, :os_pid) do
+      {:os_pid, os_pid} -> System.cmd("kill", ["-KILL", Integer.to_string(os_pid)], stderr_to_stdout: true)
+      _ -> :ok
+    end
+
+    if Port.info(port) != nil, do: Port.close(port)
+    :ok
+  rescue
+    _ -> :ok
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/codex/provision.ex b/packages/symphony/elixir/lib/symphony_elixir/codex/provision.ex
new file mode 100644
index 000000000..60d77f710
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/codex/provision.ex
@@ -0,0 +1,534 @@
+defmodule SymphonyElixir.Codex.Provision do
+  @moduledoc """
+  Shared building blocks for the runtimes that prepare a checkout and a
+  room-server outside the BEAM (`Codex.IxVm` and `Codex.Host`).
+
+  Both runtimes clone the same repositories with the same bot-identity and
+  GitHub auth stamping, export the same environment into the remote
+  room-server/Codex process, and poll the same `/api/health` endpoint. The
+  only thing that differs is where the script runs (an iXVM shell versus a
+  privilege-dropped local unit). Keeping the clone, env, and health logic
+  here means the load-bearing git auth header has a single owner.
+  """
+
+  alias SymphonyElixir.{Config, RepositoryCatalog}
+
+  @ix_workspace_root "/workspace/symphony"
+  @ix_room_state_root "/var/lib/symphony-room"
+
+  # The room state and workspace roots the host runtime uses inside the
+  # target user's home. Shared so `Codex.Host` and `Runtime.Placement`
+  # land the checkout and state in the same place.
+  @host_room_state_subdir ".local/state/symphony-room"
+  @host_default_workspaces_subdir "symphony-workspaces"
+
+  @doc """
+  Wrap `value` in single quotes, rewriting every embedded single quote as
+  `'\\''`, so it can be interpolated into a `bash -lc` script as one
+  literal word.
+  """
+  @spec sh(String.t()) :: String.t()
+  def sh(value) when is_binary(value) do
+    escaped = String.replace(value, "'", "'\\''")
+    "'" <> escaped <> "'"
+  end
+
+  @doc """
+  The per-run directory under the iXVM workspace root. Every checkout for
+  the run lives below it, and the room-server runs from the primary
+  repo's checkout inside this tree.
+  """
+  @spec ix_run_root(String.t()) :: Path.t()
+  def ix_run_root(run_id) do
+    Path.join([@ix_workspace_root, run_id])
+  end
+
+  @doc "The primary repo's checkout inside the iXVM run root; the engine turn runs there."
+  @spec ix_primary_workspace(Config.t(), String.t()) :: Path.t()
+  def ix_primary_workspace(%Config{} = config, run_id) do
+    run_root = ix_run_root(run_id)
+    primary = RepositoryCatalog.primary(config)
+    Path.join(run_root, primary.name)
+  end
+
+  @doc """
+  Build the `ix new` argv that provisions a room-server VM for a run.
+  The load-bearing shape (l7-proxy port, region, ipv4, env injection) is
+  assembled here so `Codex.IxVm` and `Runtime.Placement` produce the same
+  command and the redaction in `sanitize_ix_args/1` keeps matching it.
+  """
+  @spec create_vm_args(Config.t(), String.t(), [{String.t(), String.t()}]) :: [String.t()]
+  def create_vm_args(%Config{} = config, vm_name, env) when is_binary(vm_name) and is_list(env) do
+    %Config{ix_image: image, ix_room_port: room_port, ix_region: region, ix_room_connect: connect} = config
+
+    base = ["new", image, "--name", vm_name, "--l7-proxy-port", to_string(room_port), "--no-shell"]
+
+    base
+    |> append_region(region)
+    |> append_ipv4(connect)
+    |> append_env(env)
+  end
+
+  @doc """
+  Render the `bash -lc` script that creates the VM-side run root and
+  clones the run's repositories into it on the `symphony/<run_id>`
+  branch. `opts[:bot_token]` wins over `config.github_token` for the clone
+  auth. Running the script through `ix shell` is the caller's job.
+  """
+  @spec ix_workspace_script(Config.t(), String.t(), keyword()) :: String.t()
+  def ix_workspace_script(%Config{} = config, run_id, opts) when is_list(opts) do
+    run_root = ix_run_root(run_id)
+    token = Keyword.get(opts, :bot_token) || config.github_token
+    clone_blocks = repo_blocks(config, run_root, "symphony/#{run_id}", token)
+
+    # The trailing "" keeps the final newline the script has always ended with.
+    Enum.join(["set -euo pipefail", "mkdir -p #{sh(run_root)}", clone_blocks, ""], "\n")
+  end
+
+  @doc """
+  Render the `bash -lc` script that starts the per-run room-server inside
+  the VM: create the state dir, stop any process named exactly
+  `room-server` (`pkill -x`), export the runtime env, then launch the
+  configured command in the background with its log under `/tmp`. Kept in
+  one place so `Codex.IxVm` and `Runtime.Placement` start it identically.
+  """
+  @spec ix_room_start_script(Config.t(), String.t(), keyword()) :: String.t()
+  def ix_room_start_script(%Config{} = config, run_id, opts) when is_list(opts) do
+    quoted_state_dir = @ix_room_state_root |> Path.join(run_id) |> sh()
+    exports = config |> runtime_env(opts) |> env_export_lines()
+    server = config.ix_room_server_command
+    port = config.ix_room_port
+
+    """
+    set -euo pipefail
+    mkdir -p #{quoted_state_dir}
+    pkill -x room-server || true
+    #{exports}
+    nohup #{server} --host 0.0.0.0 --port #{port} --state-dir #{quoted_state_dir} --no-wt > /tmp/symphony-room-server.log 2>&1 &
+    """
+  end
+
+  @doc """
+  Return `{mapping, url}` for a VM's port-forward tunnel: the
+  `localport:vmport` mapping and the loopback URL it exposes. The local
+  port is `ix_local_port_base` plus a hash of the VM name in `0..999`, so
+  different VM names usually land on different loopback ports.
+  """
+  @spec port_forward_mapping(Config.t(), String.t()) :: {String.t(), String.t()}
+  def port_forward_mapping(%Config{} = config, vm_name) when is_binary(vm_name) do
+    offset = :erlang.phash2(vm_name, 1000)
+    local_port = config.ix_local_port_base + offset
+
+    mapping = "#{local_port}:#{config.ix_room_port}"
+    url = "http://127.0.0.1:#{local_port}"
+    {mapping, url}
+  end
+
+  @doc "Build the `ix port-forward <vm> <localport:vmport>` argv."
+  @spec port_forward_args(String.t(), String.t()) :: [String.t()]
+  def port_forward_args(vm_name, mapping) when is_binary(vm_name) and is_binary(mapping) do
+    ["port-forward" | [vm_name, mapping]]
+  end
+
+  @doc "Build the `ix rm --force <vm>` argv."
+  @spec rm_vm_args(String.t()) :: [String.t()]
+  def rm_vm_args(vm_name) when is_binary(vm_name) do
+    ["rm", "--force"] ++ [vm_name]
+  end
+
+  @doc "Build the `ix ls --json` argv used to find a VM by name."
+  @spec list_vms_args() :: [String.t()]
+  def list_vms_args do
+    ~w(ls --json)
+  end
+
+  @doc "Build the `ix shell <vm> -- bash -lc <script>` argv that runs a setup script in a VM."
+  @spec shell_args(String.t(), String.t()) :: [String.t()]
+  def shell_args(vm_name, script) when is_binary(vm_name) and is_binary(script) do
+    ["shell", vm_name, "--"] ++ ["bash", "-lc", script]
+  end
+
+  @doc """
+  Derive a VM name for a run/node pair: lower-case, restricted to
+  `[a-z0-9-]`, at most 63 characters, and ending in a hash of the pair so
+  distinct nodes stay distinct after the slug is truncated. Shared so the
+  legacy and IR paths name VMs the same way.
+  """
+  @spec vm_name(String.t(), String.t()) :: String.t()
+  def vm_name(run_id, node_id) when is_binary(run_id) and is_binary(node_id) do
+    sanitized =
+      "sym-#{run_id}-#{node_id}"
+      |> String.downcase()
+      |> String.replace(~r/[^a-z0-9-]+/, "-")
+      |> String.trim("-")
+
+    name =
+      sanitized
+      |> append_name_hash(run_id, node_id)
+      |> String.slice(0, 63)
+      |> String.trim("-")
+
+    case name do
+      "" -> "sym-#{:erlang.unique_integer([:positive])}"
+      _ -> name
+    end
+  end
+
+  @doc """
+  Redact secrets from an `ix` argv before it is logged or written to a run
+  record. The value of every `--env NAME=VALUE` pair is dropped, and every
+  other argument is passed through the sensitive-`export` redaction used
+  for shell scripts. Shared so the legacy and IR placement paths redact
+  the same way.
+  """
+  @spec sanitize_ix_args([String.t()]) :: [String.t()]
+  def sanitize_ix_args(args) when is_list(args) do
+    args
+    |> redact_args([])
+    |> Enum.reverse()
+  end
+
+  # Walk the argv front to back, building the redacted copy in reverse.
+  defp redact_args([], redacted), do: redacted
+
+  defp redact_args(["--env", assignment | remaining], redacted) do
+    redact_args(remaining, [redact_env_assignment(assignment), "--env" | redacted])
+  end
+
+  defp redact_args([arg | remaining], redacted) do
+    redact_args(remaining, [redact_sensitive_exports(arg) | redacted])
+  end
+
+  # Keep only the name of a `NAME=VALUE` assignment; a bare `NAME` is
+  # rendered the same way.
+  defp redact_env_assignment(assignment) do
+    [name | _value] = String.split(assignment, "=", parts: 2)
+    name <> "=<redacted>"
+  end
+
+  # Redact secrets embedded in a shell-script argument:
+  #
+  #   * `export NAME='value'` where NAME contains TOKEN, KEY or SECRET. The
+  #     value pattern follows the quoting `sh/1` produces, including the
+  #     `'\''` sequence for an embedded single quote, so the whole value is
+  #     dropped rather than only the part before the first quote.
+  #   * the credential of an `Authorization: <scheme> <credential>` header,
+  #     which the clone script writes as a git `extraheader`.
+  defp redact_sensitive_exports(arg) do
+    exports_redacted =
+      Regex.replace(
+        ~r/export ([A-Z0-9_]*(?:TOKEN|KEY|SECRET)[A-Z0-9_]*)='[^']*(?:'\\''[^']*)*'/,
+        arg,
+        "export \\1='<redacted>'"
+      )
+
+    Regex.replace(~r/(Authorization: [A-Za-z]+) [^'"\s]+/, exports_redacted, "\\1 <redacted>")
+  end
+
+  # Add `--region <region>` unless the region is unset or blank.
+  defp append_region(args, region) when region in [nil, ""], do: args
+
+  defp append_region(args, region) when is_binary(region) do
+    args ++ ["--region", region]
+  end
+
+  # Add `--ipv4` only for the "direct_ipv4" connect mode.
+  defp append_ipv4(args, mode) do
+    if mode == "direct_ipv4", do: args ++ ["--ipv4"], else: args
+  end
+
+  # Add one `--env KEY=VALUE` pair per entry, in the order given.
+  defp append_env(args, env) do
+    flags = Enum.flat_map(env, fn {key, value} -> ["--env", "#{key}=#{value}"] end)
+    args ++ flags
+  end
+
+  # Cut the slug to 52 characters (trimming stray dashes) and append `-`
+  # plus the first 10 hex characters of sha256("<run_id>:<node_id>").
+  defp append_name_hash(slug, run_id, node_id) do
+    digest = :crypto.hash(:sha256, run_id <> ":" <> node_id)
+    suffix = digest |> Base.encode16(case: :lower) |> String.slice(0, 10)
+    prefix = slug |> String.slice(0, 52) |> String.trim("-")
+
+    prefix <> "-" <> suffix
+  end
+
+  # --- host (systemd-run) ---------------------------------------------
+  #
+  # The host runtime drops privileges to `SYMPHONY_HOST_USER` and runs the
+  # checkout plus the per-run room-server as transient `systemd-run` units.
+  # The argv shape (the `--collect`/`--uid`/`--setenv` base, the named
+  # `--unit=`, the sync `--pipe --wait` form) lives here so `Codex.Host`
+  # (legacy per-node) and `Runtime.Placement` (IR per-run) build identical
+  # commands and the polkit grant keeps matching the unit name.
+
+  @doc """
+  The directory that holds a host run's checkouts. When
+  `SYMPHONY_HOST_WORKSPACES_DIR` is configured (non-empty) it is
+  `<dir>/<run_id>`; otherwise it is `<home>/symphony-workspaces/<run_id>`.
+  The clone lands here owned by the target user.
+  """
+  @spec host_run_root(Config.t(), Path.t(), String.t()) :: Path.t()
+  def host_run_root(%Config{host_workspaces_dir: dir}, _home, run_id) when is_binary(dir) and dir != "" do
+    Path.join([dir, run_id])
+  end
+
+  def host_run_root(%Config{}, home, run_id) when is_binary(home) do
+    home
+    |> Path.join(@host_default_workspaces_subdir)
+    |> Path.join(run_id)
+  end
+
+  @doc """
+  The primary repo's checkout under a host run root; the engine turn runs
+  there. With an explicit `repositories` list the entry flagged `primary?`
+  is used (raising when there is none); otherwise the catalog's primary
+  repo is used.
+  """
+  @spec host_primary_workspace(Config.t(), Path.t(), String.t(), [RepositoryCatalog.t()] | nil) :: Path.t()
+  def host_primary_workspace(%Config{} = config, run_root, _run_id, repositories \\ nil) when is_binary(run_root) do
+    primary =
+      if is_nil(repositories) do
+        RepositoryCatalog.primary(config)
+      else
+        Enum.find(repositories, fn repo -> repo.primary? end) ||
+          raise "remote provision repositories must define one primary repo"
+      end
+
+    Path.join(run_root, primary.name)
+  end
+
+  @doc "The room-server state dir for one run, under the target user's home."
+  @spec host_room_state_dir(Path.t(), String.t()) :: Path.t()
+  def host_room_state_dir(home, run_id) when is_binary(home) do
+    home
+    |> Path.join(@host_room_state_subdir)
+    |> Path.join(run_id)
+  end
+
+  @doc """
+  The `systemd-run` unit-name base for a run/node pair:
+  `symphony-host-` followed by the first 16 hex characters of
+  sha256("<run_id>:<node_id>"). The prefix is what the polkit grant in
+  `modules/services/symphony` is scoped to, so the non-root service may
+  manage the unit. Callers append the `.service` suffix and any role
+  suffix (`-setup`, `-clean`).
+  """
+  @spec host_unit_base(String.t(), String.t()) :: String.t()
+  def host_unit_base(run_id, node_id) when is_binary(run_id) and is_binary(node_id) do
+    digest = :crypto.hash(:sha256, run_id <> ":" <> node_id)
+    suffix = digest |> Base.encode16(case: :lower) |> String.slice(0, 16)
+
+    "symphony-host-#{suffix}"
+  end
+
+  @doc """
+  Build the `systemd-run` argv that runs `command` to completion as the
+  target user in a named transient unit. `--pipe --wait` streams stdio
+  back and propagates the exit code; `--collect` reaps the unit even on
+  failure. Used for the workspace clone and the cleanup `rm`.
+  """
+  @spec host_run_sync_args(Config.t(), String.t(), Path.t(), String.t(), [{String.t(), String.t()}], [String.t()]) ::
+          [String.t()]
+  def host_run_sync_args(%Config{} = config, user, home, unit, env, command)
+      when is_binary(user) and is_binary(home) and is_binary(unit) and is_list(env) and is_list(command) do
+    unit_flags = ["--unit=" <> unit, "--pipe", "--wait", "--"]
+
+    Enum.concat([host_base_run_args(config, user, home, env), unit_flags, command])
+  end
+
+  @doc """
+  Build the `systemd-run` argv that starts a long-lived `command` as the
+  target user in a named transient unit, returning once systemd accepts
+  it. Used for the per-run room-server; teardown stops the unit by name.
+  """
+  @spec host_run_unit_args(Config.t(), String.t(), Path.t(), String.t(), [{String.t(), String.t()}], [String.t()]) ::
+          [String.t()]
+  def host_run_unit_args(%Config{} = config, user, home, unit, env, command)
+      when is_binary(user) and is_binary(home) and is_binary(unit) and is_list(env) and is_list(command) do
+    unit_flags = ["--unit=" <> unit, "--"]
+
+    Enum.concat([host_base_run_args(config, user, home, env), unit_flags, command])
+  end
+
+  # Flags shared by every host unit: `--collect`, the target uid, the
+  # working directory, an optional `--gid`, then one `--setenv=` per
+  # environment entry.
+  defp host_base_run_args(%Config{host_group: group}, user, home, env) do
+    identity = host_append_group(["--collect", "--uid=" <> user, "--working-directory=" <> home], group)
+
+    identity ++ Enum.map(env, fn {key, value} -> "--setenv=#{key}=#{value}" end)
+  end
+
+  # Add `--gid=<group>` only when a non-empty group is configured.
+  defp host_append_group(args, group) do
+    if is_binary(group) and group != "", do: args ++ ["--gid=" <> group], else: args
+  end
+
+  @doc """
+  Render the `bash -lc` script that prepares a host run: create the room
+  state dir and the run root, then clone the run's repositories on the
+  `symphony/<run_id>` branch. Running it through a
+  `systemd-run --pipe --wait` unit is the caller's job.
+  """
+  @spec host_workspace_script(
+          Config.t(),
+          Path.t(),
+          Path.t(),
+          String.t(),
+          String.t() | nil,
+          [RepositoryCatalog.t()] | nil
+        ) :: String.t()
+  def host_workspace_script(%Config{} = config, run_root, state_dir, run_id, token, repositories \\ nil)
+      when is_binary(run_root) and is_binary(state_dir) and is_binary(run_id) do
+    clone_blocks = repo_blocks(config, run_root, "symphony/#{run_id}", token, repositories)
+    mkdir_line = "mkdir -p #{sh(state_dir)} #{sh(run_root)}"
+
+    # The trailing "" keeps the final newline the script has always ended with.
+    Enum.join(["set -euo pipefail", mkdir_line, clone_blocks, ""], "\n")
+  end
+
+  @doc "Render the `rm -rf <run_root>` script run by the host cleanup unit."
+  @spec host_cleanup_script(Path.t()) :: String.t()
+  def host_cleanup_script(run_root) when is_binary(run_root) do
+    "rm -rf " <> sh(run_root)
+  end
+
+  @doc """
+  The room-server argv for the host runtime: the configured command split
+  on whitespace (its head resolved to an absolute path when it can be
+  found) plus the bind host/port and state dir. A blank command falls back
+  to `room-server`, which is resolved the same way. The room-server runs
+  on loopback only; the caller picks the port. `--no-wt` opts out of the
+  WebTransport listener: a host-placed engine host only serves the HTTP
+  `/api` surface, and the fixed WT port would collide across the many
+  per-run servers that share one host.
+  """
+  @spec host_room_server_command(Config.t(), String.t(), pos_integer(), Path.t()) :: [String.t()]
+  def host_room_server_command(%Config{host_room_server_command: command}, host, port, state_dir)
+      when is_binary(host) and is_integer(port) and is_binary(state_dir) do
+    {head, extra_args} =
+      case String.split(command, ~r/\s+/, trim: true) do
+        [head | extra_args] -> {head, extra_args}
+        [] -> {"room-server", []}
+      end
+
+    # Resolve after choosing the head so the fallback gets the same
+    # absolute-path treatment as a configured command; keep the bare name
+    # when it cannot be found.
+    exe = System.find_executable(head) || head
+
+    [exe | extra_args] ++
+      ["--host", host, "--port", Integer.to_string(port), "--state-dir", state_dir, "--no-wt"]
+  end
+
+  @doc """
+  Extract the home directory (the sixth `:`-separated field) from the
+  first line of `getent passwd` output. Returns
+  `{:error, {:host_user_unknown, user}}` when there is no line or it has
+  fewer than six fields, and `{:error, {:host_user_no_home, user}}` when
+  the home field is empty. Shared so both host paths resolve the same
+  `$HOME` for the checkout and room state.
+  """
+  @spec parse_passwd_home(String.t(), String.t()) :: {:ok, Path.t()} | {:error, term()}
+  def parse_passwd_home(output, user) when is_binary(output) and is_binary(user) do
+    case String.split(output, "\n", trim: true) do
+      [] ->
+        {:error, {:host_user_unknown, user}}
+
+      [entry | _more] ->
+        case String.split(entry, ":") do
+          [_name, _passwd, _uid, _gid, _gecos, "" | _shell] ->
+            {:error, {:host_user_no_home, user}}
+
+          [_name, _passwd, _uid, _gid, _gecos, home | _shell] ->
+            {:ok, home}
+
+          _too_short ->
+            {:error, {:host_user_unknown, user}}
+        end
+    end
+  end
+
+  @doc """
+  Redact secrets from a `systemd-run` argv before it is logged or written
+  to a run record: the value of every `--setenv=NAME=value` argument is
+  replaced with `<redacted>`; all other arguments pass through unchanged.
+  Shared so the legacy and IR host paths redact the same way.
+  """
+  @spec sanitize_setenv_args([String.t()]) :: [String.t()]
+  def sanitize_setenv_args(args) when is_list(args) do
+    Enum.map(args, fn
+      "--setenv=" <> assignment = arg ->
+        case String.split(assignment, "=", parts: 2) do
+          [name, _value] -> "--setenv=" <> name <> "=<redacted>"
+          _no_value -> arg
+        end
+
+      arg when is_binary(arg) ->
+        arg
+    end)
+  end
+
+  @doc """
+  Clone every repository in the active catalog (or the explicit
+  `repositories` list) into `run_root`, on a run-scoped `branch`, stamping
+  the bot identity and (when `token` is a non-empty string) a GitHub Basic
+  auth header so plain `git push` authors as the App. A `nil` or empty
+  token yields unauthenticated clones, matching how `runtime_env/2` treats
+  an empty token as absent. Returns the concatenated `bash` blocks; the
+  caller owns the surrounding `set -euo pipefail` and the `mkdir -p` of
+  `run_root`.
+  """
+  @spec repo_blocks(Config.t(), Path.t(), String.t(), String.t() | nil, [RepositoryCatalog.t()] | nil) :: String.t()
+  def repo_blocks(%Config{} = config, run_root, branch, token, repositories \\ nil) do
+    # An empty token would still encode to a credential-less header, so it
+    # is treated as "no token" rather than stamped into the checkout.
+    basic =
+      case token do
+        value when is_binary(value) and value != "" -> Base.encode64("x-access-token:" <> value)
+        _ -> nil
+      end
+
+    (repositories || RepositoryCatalog.all(config))
+    |> Enum.map_join("\n", &clone_repo_block(&1, run_root, branch, basic, config))
+  end
+
+  # Render the shell block for one repository: remove any previous
+  # checkout, shallow-clone the default branch, create the run branch,
+  # stamp the git identity, and (when `basic` is present) persist the auth
+  # header in the checkout's local git config. `:` stands in as a no-op
+  # where there is nothing to run.
+  defp clone_repo_block(repo, run_root, branch, basic, config) do
+    target = Path.join(run_root, repo.name)
+    remote = "https://github.com/#{repo.owner_repo}.git"
+
+    {clone_auth, extraheader} =
+      case basic do
+        credential when is_binary(credential) ->
+          header = sh("Authorization: Basic " <> credential)
+
+          {"-c http.https://github.com/.extraheader=#{header}",
+           "git -C #{sh(target)} config --local http.https://github.com/.extraheader #{header}"}
+
+        _ ->
+          {"", ":"}
+      end
+
+    """
+    rm -rf #{sh(target)}
+    git #{clone_auth} clone --depth 1 --branch #{sh(repo.default_branch)} #{sh(remote)} #{sh(target)}
+    git -C #{sh(target)} checkout -b #{sh(branch)}
+    #{git_identity_lines(target, config)}
+    #{extraheader}
+    """
+  end
+
+  # The `git config` lines that set the bot's user.name and user.email for
+  # a checkout, skipping unset values; `:` when neither is configured.
+  defp git_identity_lines(target, %Config{} = config) do
+    settings = [
+      {"user.name", config.github_app_bot_username},
+      {"user.email", config.github_app_bot_email}
+    ]
+
+    lines = for {key, value} <- settings, line = git_config_line(target, key, value), do: line
+
+    if lines == [], do: ":", else: Enum.join(lines, "\n")
+  end
+
+  # One `git -C <target> config --local <key> <value>` line, or nil when
+  # the value is unset or empty.
+  defp git_config_line(_target, _key, value) when value in [nil, ""], do: nil
+
+  defp git_config_line(target, key, value) do
+    Enum.join(["git", "-C", sh(target), "config", "--local", sh(key), sh(value)], " ")
+  end
+
+  @doc """
+  The environment for the remote room-server (and the Codex process it
+  spawns): the bot `GITHUB_TOKEN`/`GH_TOKEN` first, then every name listed
+  in `SYMPHONY_IX_ENV_PASSTHROUGH` that is set to a non-empty value on the
+  Symphony host.
+
+  The GitHub token is `opts[:bot_token]` when the runtime minted a GitHub
+  App installation token for the run, and the static `config.github_token`
+  only when no App token is available. `gh pr create` authors as whoever
+  owns `GH_TOKEN` regardless of the workspace `user.email`, so the same
+  `:bot_token` that stamps the clone auth header in `repo_blocks/4` must
+  own the room-server's `GITHUB_TOKEN`/`GH_TOKEN`; otherwise an agent PR is
+  authored by the static host token. Because the GitHub vars come first
+  and duplicates keep their first occurrence, a passthrough entry of the
+  same name cannot shadow the bot identity.
+  """
+  @spec runtime_env(Config.t(), keyword()) :: [{String.t(), String.t()}]
+  def runtime_env(%Config{} = config, opts) when is_list(opts) do
+    github_env =
+      case Keyword.get(opts, :bot_token) || config.github_token do
+        token when is_binary(token) and token != "" ->
+          for name <- ["GITHUB_TOKEN", "GH_TOKEN"], do: {name, token}
+
+        _ ->
+          []
+      end
+
+    passthrough =
+      for name <- config.ix_env_passthrough,
+          value = System.get_env(name),
+          value != "",
+          do: {name, value}
+
+    Enum.uniq_by(github_env ++ passthrough, &elem(&1, 0))
+  end
+
+  @doc """
+  Render one `export KEY='value'` line per entry for a `bash -lc` script.
+  An empty environment renders as `:` (a no-op) so the surrounding script
+  stays valid.
+  """
+  @spec env_export_lines([{String.t(), String.t()}]) :: String.t()
+  def env_export_lines([]), do: ":"
+
+  def env_export_lines(env) do
+    env
+    |> Enum.map(fn {key, value} -> "export #{key}=" <> sh(value) end)
+    |> Enum.join("\n")
+  end
+
+  @type context :: %{optional(:identifier) => String.t(), optional(:title) => String.t()}
+
+  @doc "Stable registry id for a run's node-scoped room backend: `symphony:<run_id>:<node_id>`."
+  @spec backend_id(String.t(), String.t()) :: String.t()
+  def backend_id(run_id, node_id) do
+    Enum.join(["symphony", run_id, node_id], ":")
+  end
+
+  @doc """
+  Human-facing backend name shown in the room backend picker. Uses
+  `<identifier>: <title> / <node>` when both are strings,
+  `<identifier> / <node>` when only the identifier is, and
+  `<run_id> / <node>` otherwise.
+  """
+  @spec backend_name(context(), String.t(), String.t()) :: String.t()
+  def backend_name(context, run_id, node_id) do
+    case context do
+      %{identifier: id, title: title} when is_binary(id) and is_binary(title) ->
+        "#{id}: #{title} / #{node_id}"
+
+      %{identifier: id} when is_binary(id) ->
+        "#{id} / #{node_id}"
+
+      _ ->
+        "#{run_id} / #{node_id}"
+    end
+  end
+
+  @doc """
+  Poll `<url>/api/health` until it answers with a 2xx status or
+  `timeout_ms` has elapsed on the monotonic clock.
+  """
+  @spec wait_for_room(String.t(), pos_integer()) :: :ok | {:error, term()}
+  def wait_for_room(url, timeout_ms) do
+    started_at = System.monotonic_time(:millisecond)
+    do_wait_for_room(url, started_at + timeout_ms, nil)
+  end
+
+  # One polling step. Returns :ok on a 2xx answer, or
+  # `{:error, {:room_health_timeout, url, last_error}}` once the monotonic
+  # `deadline` has passed, where `last_error` is the most recent non-2xx
+  # status/body or transport error (nil if no request was made).
+  defp do_wait_for_room(url, deadline, last_error) do
+    if System.monotonic_time(:millisecond) >= deadline do
+      {:error, {:room_health_timeout, url, last_error}}
+    else
+      # This loop is the retry policy, so Req's own retry-with-backoff is
+      # switched off; otherwise a single poll can stall well past its 2s
+      # timeouts and past the deadline.
+      case Req.get(url <> "/api/health", retry: false, receive_timeout: 2_000, connect_options: [timeout: 2_000]) do
+        {:ok, %{status: status}} when status in 200..299 ->
+          :ok
+
+        {:ok, %{status: status, body: body}} ->
+          pause_before_next_room_poll(deadline)
+          do_wait_for_room(url, deadline, {:status, status, body})
+
+        {:error, reason} ->
+          pause_before_next_room_poll(deadline)
+          do_wait_for_room(url, deadline, reason)
+      end
+    end
+  end
+
+  # Sleep up to one second between polls, but never beyond the deadline.
+  defp pause_before_next_room_poll(deadline) do
+    remaining_ms = max(deadline - System.monotonic_time(:millisecond), 0)
+    Process.sleep(min(1_000, remaining_ms))
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/codex/room_registry.ex b/packages/symphony/elixir/lib/symphony_elixir/codex/room_registry.ex
new file mode 100644
index 000000000..45f4105c0
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/codex/room_registry.ex
@@ -0,0 +1,60 @@
+defmodule SymphonyElixir.Codex.RoomRegistry do
+  @moduledoc """
+  Announces per-VM Room servers to a central Room instance and withdraws
+  them again.
+
+  Symphony creates the short-lived iXVMs, so it owns the moment a VM's
+  Room server becomes reachable. The central Room service only stores that
+  fact and proxies read paths for the browser UI.
+
+  Both calls are no-ops when no registry URL is configured. Any other
+  failure (unexpected status or transport error) is logged as a warning
+  and still answered with `:ok`.
+  """
+
+  alias SymphonyElixir.Config
+
+  require Logger
+
+  # Timeouts applied to every registry request.
+  @timeouts [connect_options: [timeout: 5_000], receive_timeout: 5_000]
+
+  @spec register(Config.t(), map()) :: :ok
+  def register(%Config{room: %{registry_url: nil}}, _backend), do: :ok
+
+  def register(%Config{} = config, backend) when is_map(backend) do
+    request_opts = [headers: headers(config), json: backend] ++ @timeouts
+
+    config
+    |> url("/api/backends")
+    |> Req.post(request_opts)
+    |> settle("register", [])
+  end
+
+  @spec unregister(Config.t(), String.t()) :: :ok
+  def unregister(%Config{room: %{registry_url: nil}}, _id), do: :ok
+
+  def unregister(%Config{} = config, id) when is_binary(id) do
+    request_opts = [headers: headers(config)] ++ @timeouts
+
+    # A 404 means the backend is already gone, which is the desired state.
+    config
+    |> url("/api/backends/" <> URI.encode(id))
+    |> Req.delete(request_opts)
+    |> settle("unregister", [404])
+  end
+
+  # Turn a Req result into :ok, warning on anything that is neither a 2xx
+  # nor one of the `tolerated` statuses.
+  defp settle({:ok, %{status: status}}, _action, _tolerated) when status in 200..299, do: :ok
+
+  defp settle({:ok, %{status: status, body: body}}, action, tolerated) do
+    if status in tolerated, do: :ok, else: warn(action, {:status, status, body})
+  end
+
+  defp settle({:error, reason}, action, _tolerated), do: warn(action, reason)
+
+  # Join the registry base URL (without trailing slashes) and `path`.
+  defp url(%Config{room: %{registry_url: registry_url}}, path) do
+    registry_url
+    |> String.trim_trailing("/")
+    |> Kernel.<>(path)
+  end
+
+  # Bearer auth header when a registry token is configured.
+  defp headers(%Config{room: %{registry_token: token}}) do
+    case token do
+      nil -> []
+      _ -> [{"authorization", "Bearer " <> token}]
+    end
+  end
+
+  defp warn(action, reason) do
+    Logger.warning("RoomRegistry: #{action} failed: #{inspect(reason)}")
+    :ok
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/command.ex b/packages/symphony/elixir/lib/symphony_elixir/command.ex
new file mode 100644
index 000000000..a665d5241
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/command.ex
@@ -0,0 +1,61 @@
+defmodule SymphonyElixir.Command do
+  @moduledoc false
+
+  # Runs one external executable to completion under a deadline, capturing
+  # stdout and stderr together as a single binary.
+
+  @type result :: {:ok, String.t()} | {:error, {:exit, non_neg_integer(), String.t()} | {:timeout, pos_integer(), String.t()} | {:start_failed, String.t()}}
+
+  # Returns `{:ok, output}` on exit status 0, `{:error, {:exit, status,
+  # output}}` on any other status, `{:error, {:timeout, timeout_ms,
+  # output}}` when the deadline passes first, and `{:error,
+  # {:start_failed, message}}` when the call raises (for example when the
+  # executable cannot be spawned).
+  @spec run(Path.t(), [String.t()], pos_integer()) :: result()
+  def run(executable, args, timeout_ms) when is_binary(executable) and is_list(args) and timeout_ms > 0 do
+    port =
+      Port.open({:spawn_executable, executable}, [
+        :binary,
+        :exit_status,
+        :stderr_to_stdout,
+        args: args
+      ])
+
+    deadline = System.monotonic_time(:millisecond) + timeout_ms
+    collect(port, deadline, timeout_ms, [])
+  rescue
+    error -> {:error, {:start_failed, Exception.message(error)}}
+  end
+
+  # Accumulate port output until the process exits or the deadline passes.
+  defp collect(port, deadline, timeout_ms, chunks) do
+    remaining_ms = max(deadline - System.monotonic_time(:millisecond), 0)
+
+    receive do
+      {^port, {:data, data}} ->
+        collect(port, deadline, timeout_ms, [data | chunks])
+
+      {^port, {:exit_status, 0}} ->
+        {:ok, output(chunks)}
+
+      {^port, {:exit_status, status}} ->
+        {:error, {:exit, status, output(chunks)}}
+    after
+      remaining_ms ->
+        close_port(port)
+        # Data or an exit status may already be queued from before the
+        # port closed; drop it so it does not linger in the caller's
+        # mailbox.
+        flush_port_messages(port)
+        {:error, {:timeout, timeout_ms, output(chunks)}}
+    end
+  end
+
+  defp output(chunks), do: chunks |> Enum.reverse() |> IO.iodata_to_binary()
+
+  # Signal the OS process, then close the port. The signal step rescues
+  # its own failures, so a `kill` that cannot run never prevents the port
+  # from being closed.
+  defp close_port(port) do
+    kill_os_process(port)
+    if Port.info(port) != nil, do: Port.close(port)
+    :ok
+  rescue
+    _ -> :ok
+  end
+
+  # Port.close/1 on a :spawn_executable port closes the stdio pipes but
+  # leaves the spawned OS process running. For a long-lived child like
+  # `ix new` (placement's ix_create_timeout_ms is 120s) the process keeps
+  # running well past the timeout and orphans accumulate, so signal the
+  # process before closing the port. Mirrors Placement.real_stop_port_forward/1.
+  defp kill_os_process(port) do
+    case Port.info(port, :os_pid) do
+      {:os_pid, os_pid} when is_integer(os_pid) ->
+        System.cmd("kill", ["-TERM", Integer.to_string(os_pid)], stderr_to_stdout: true)
+        :ok
+
+      _ ->
+        :ok
+    end
+  rescue
+    _ -> :ok
+  end
+
+  # Discard every message from `port` that is already in the mailbox.
+  defp flush_port_messages(port) do
+    receive do
+      {^port, _message} -> flush_port_messages(port)
+    after
+      0 -> :ok
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/config.ex b/packages/symphony/elixir/lib/symphony_elixir/config.ex
new file mode 100644
index 000000000..754381c58
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/config.ex
@@ -0,0 +1,680 @@
+defmodule SymphonyElixir.Config do
+  @moduledoc """
+  Boot-time snapshot of process-environment configuration.
+
+  Env vars are read once on startup. To pick up changes, restart the BEAM.
+  Skill files are hot-reloaded by `SymphonyElixir.Catalog` and workflow
+  files by `SymphonyElixir.WorkflowCatalog`; this module owns only the
+  values that genuinely require a process restart (network endpoints,
+  on-disk paths, polling cadence).
+
+  Required for any work to happen:
+
+      SYMPHONY_ROOT           absolute path of the symphony repo
+      SYMPHONY_PRIMARY_REPO   absolute path of the primary repo used as the local source
+
+  Workflow pack selection:
+
+      SYMPHONY_PACK_DIR       absolute path of an external pack directory; takes precedence
+                              over SYMPHONY_WORKFLOW_PACK when set
+      SYMPHONY_WORKFLOW_PACK  defaults to "example"; selects workflows/<pack> inside the
+                              symphony repo when SYMPHONY_PACK_DIR is unset
+      SYMPHONY_WORKFLOWS_DIR  defaults to <pack_dir>/workflows
+      SYMPHONY_SKILLS_DIR     defaults to <pack_dir>/skills
+      SYMPHONY_REPOSITORIES_FILE defaults to <pack_dir>/repositories.yaml
+
+  Runtime paths:
+
+      SYMPHONY_WORKSPACES_DIR defaults to $SYMPHONY_ROOT/workspaces
+      SYMPHONY_REPO_ROOT      optional local checkout parent used for fast shared clones.
+                              Defaults to the parent directory of SYMPHONY_PRIMARY_REPO.
+      SYMPHONY_RUNS_DIR       defaults to $SYMPHONY_ROOT/runs
+      SYMPHONY_CODEX_COMMAND  defaults to "codex app-server"
+      SYMPHONY_ROOM_SERVER_URL the default room-server base URL for runs whose
+                              node placement is `:local` or `:room`. Per-run
+                              `:ixvm`/`:host` placements resolve their own URL
+                              through `Runtime.Placement`.
+      SYMPHONY_ROOM_REGISTRY_URL optional central room-server URL that receives
+                              per-VM backend registrations
+      SYMPHONY_ROOM_REGISTRY_TOKEN optional bearer token for registry writes
+      SYMPHONY_IX_COMMAND     defaults to "ix"
+      SYMPHONY_IX_IMAGE       defaults to "ix/symphony-codex:latest"
+      SYMPHONY_IX_ROOM_SERVER_COMMAND defaults to "room-server"
+      SYMPHONY_IX_REGION      optional; omitted lets ix choose its default
+      SYMPHONY_IX_ROOM_PORT   defaults to 8080
+      SYMPHONY_IX_ROOM_CONNECT defaults to "direct"; set "port_forward" to
+                              tunnel localhost from the Symphony host
+      SYMPHONY_IX_LOCAL_PORT_BASE defaults to 18080 for port_forward mode
+      SYMPHONY_IX_KEEP_VM     defaults to false; true leaves VMs around after
+                              the turn for inspection
+      SYMPHONY_IX_CREATE_TIMEOUT_MS defaults to 120000 (2 minutes); the
+                              maximum time to wait for `ix new` before the
+                              run falls back to the configured placement
+                              fallback. Set lower for faster fallback when
+                              the ix control plane is degraded.
+      SYMPHONY_IX_ENV_PASSTHROUGH comma-separated env names copied into the
+                              remote room-server/Codex process (applies to both
+                              the ixvm and host runtimes)
+
+  Host placement (a node's `location: host` on the IR engine path):
+
+      SYMPHONY_HOST_USER      OS user the host placement runs codex as.
+                              Required for host placement; absent fails setup
+                              and retries per SYMPHONY_PLACEMENT_FALLBACK.
+      SYMPHONY_HOST_GROUP     optional OS group; omitted uses the user's
+                              primary group.
+      SYMPHONY_HOST_WORKSPACES_DIR optional parent for run checkouts; defaults
+                              to <user home>/symphony-workspaces.
+      SYMPHONY_HOST_ROOM_SERVER_COMMAND defaults to "room-server"; the
+                              per-run room-server launched as the host user.
+      SYMPHONY_HOST_SYSTEMD_RUN_COMMAND defaults to "systemd-run".
+      SYMPHONY_HOST_KEEP      defaults to false; true leaves the unit and
+                              checkout in place after the turn for inspection.
+
+  Placement fallback (IR engine path):
+
+      SYMPHONY_PLACEMENT_FALLBACK one of host|remote|local|none, defaulting to
+                              "host"; the placement a run retries on when its
+                              declared `ixvm` placement fails to provision
+                              before the first agent turn. "host" reprovisions
+                              the per-run room-server as a systemd-run unit on
+                              this host; "local" drops to the in-process server
+                              (the dev convenience); "none" leaves the run to
+                              fail against the missing placement, no fallback.
+
+  Claude models (any skill whose codex_model names a Claude model, e.g.
+  claude-opus-4-8, runs through Claude Code instead of codex):
+
+      ANTHROPIC_API_KEY       Anthropic API key billed for Claude Code turns.
+                              Required for any Claude-model node; absent fails
+                              the node with :anthropic_api_key_not_configured.
+      SYMPHONY_CLAUDE_COMMAND defaults to "claude"; the Claude Code CLI invoked
+                              non-interactively (`--print`).
+      SYMPHONY_CATALOG_POLL_MS defaults to 1000
+
+  Integrations:
+
+      LINEAR_API_KEY          enables the Linear graphql tool and webhook enqueue
+      LINEAR_TEAM_KEY         optional, used by skills that want to scope queries
+      LINEAR_WORKSPACE_SLUG   optional; used to build linear.app issue URLs in
+                              dashboards and notifications (e.g. "myorg" yields
+                              https://linear.app/myorg/issue/ABC-1)
+      LINEAR_WEBHOOK_SECRET   required to accept POST /api/v1/triggers/linear; absent rejects 401
+      GITHUB_WEBHOOK_SECRET   required to accept POST /api/v1/triggers/github; absent rejects 401
+      GITHUB_TOKEN            enables GitHub-backed dashboard statistics; falls back to GH_TOKEN when unset
+      SLACK_BOT_OAUTH_TOKEN   enables the Slack huddle trigger; absent disables it
+      SLACK_SIGNING_SECRET    required to accept Slack event webhooks
+      SYMPHONY_SLACK_POLL_MS  defaults to 60000
+      SYMPHONY_SLACK_NOTIFY_CHANNEL optional; set empty to disable post-run notifications
+      SYMPHONY_SLACK_NOTIFY_CRON_FAILURES post failed cron runs to Slack; defaults to true
+      SYMPHONY_SLACK_NOTIFY_CRON_WORKFLOWS comma-separated workflow names whose cron successes also post, or "*" for every cron success; defaults to none
+      SYMPHONY_ROOM_REGISTRY_URL central room.ix.dev a run's room-server registers with; also the Slack run-detail link base
+      SYMPHONY_ROOM_REGISTRY_TOKEN optional bearer token for room backend registration writes
+      SYMPHONY_ROOM_ADVERTISE_HOST optional; address a provisioned room-server binds/advertises so room.ix.dev can reach it
+      SYMPHONY_ROOM_SERVER_URL optional standing room-server URL for :local / {:room, url} placements
+      SYMPHONY_CRON_POLL_MS   defaults to 60000; cadence of the cron trigger tick
+      SYMPHONY_CRON_STATE_PATH defaults to runs_dir/cron_state.json
+      SYMPHONY_SUBRUN_MAX_DEPTH defaults to 8; the deepest nested-subrun chain a
+                              run may spawn before a `subrun` is rejected, the
+                              backstop against unbounded recursion that a cycle
+                              guard alone cannot catch (mutually recursive but
+                              not self-referential workflows)
+
+  GitHub App (optional; when configured, skills push under the App identity):
+
+      SYMPHONY_GITHUB_APP_ID                   numeric GitHub App id. When unset,
+                                               skills push under whatever ambient PAT is on PATH.
+      SYMPHONY_GITHUB_APP_PRIVATE_KEY_BASE64   base64 of the App's PEM private key.
+      SYMPHONY_GITHUB_APP_OWNER_REPO           repo used for App installation lookup
+                                               (e.g. "owner/repo").
+      SYMPHONY_BOT_USERNAME                    git user.name to stamp on commits made by
+                                               skill nodes (e.g. "my-app[bot]"). Required
+                                               when SYMPHONY_GITHUB_APP_ID is set.
+      SYMPHONY_BOT_EMAIL                       git user.email to stamp on commits.
+
+  Statistics dashboard (optional):
+
+      SYMPHONY_GITHUB_STATS_QUERY              GitHub search query the statistics dashboard
+                                               uses to enumerate bot-authored PRs. Absent
+                                               disables the GitHub side of the dashboard.
+  """
+
+  use GenServer
+
+  @table :symphony_config
+
+  defstruct [
+    :root,
+    :workflow_pack,
+    :pack_dir,
+    :primary_repo,
+    :workflows_dir,
+    :skills_dir,
+    :repositories_file,
+    :workspaces_dir,
+    :repo_root,
+    :runs_dir,
+    :codex_command,
+    # Central room.ix.dev connection settings, grouped into one map so the
+    # struct stays under the lint's field ceiling. Keys: :server_url (standing
+    # server), :registry_url / :registry_token (where a per-run server registers
+    # its backend), :advertise_host (address a provisioned server advertises).
+    :room,
+    :ix_command,
+    :ix_image,
+    :ix_room_server_command,
+    :ix_region,
+    :ix_room_port,
+    :ix_room_connect,
+    :ix_local_port_base,
+    :ix_keep_vm?,
+    :ix_create_timeout_ms,
+    :ix_env_passthrough,
+    :host_user,
+    :host_group,
+    :host_workspaces_dir,
+    :host_room_server_command,
+    :host_systemd_run_command,
+    :host_keep?,
+    :placement_fallback,
+    # Remote runtime worker connection settings, grouped into one map for the
+    # same field-ceiling reason. Keys: :control_plane_url, :worker_id,
+    # :worker_labels, :worker_room_host. The `:worker` role itself is read
+    # from the env in Application, not from here.
+    :worker,
+    :worker_select_label,
+    :anthropic_api_key,
+    :claude_command,
+    :catalog_poll_ms,
+    :linear_api_key,
+    :linear_endpoint,
+    :linear_team_key,
+    :linear_workspace_slug,
+    :linear_webhook_secret,
+    :github_webhook_secret,
+    :github_token,
+    :slack_bot_token,
+    :slack_signing_secret,
+    :slack_endpoint,
+    :slack_poll_ms,
+    :slack_notify_channel,
+    :slack_notify_cron_failures,
+    :slack_notify_cron_workflows,
+    :cron_state_path,
+    :cron_poll_ms,
+    :subrun_max_depth,
+    :github_app_id,
+    :github_app_private_key_pem,
+    :github_app_owner_repo,
+    :github_app_bot_username,
+    :github_app_bot_email,
+    :github_stats_query
+  ]
+  # Shape of the boot-time snapshot that get/0 returns.
+  @type t :: %__MODULE__{
+          root: Path.t(),
+          workflow_pack: String.t(),
+          pack_dir: Path.t(),
+          primary_repo: Path.t() | nil,
+          workflows_dir: Path.t(),
+          skills_dir: Path.t(),
+          repositories_file: Path.t(),
+          workspaces_dir: Path.t(),
+          repo_root: Path.t() | nil,
+          runs_dir: Path.t(),
+          codex_command: String.t(),
+          room: %{
+            server_url: String.t() | nil,
+            registry_url: String.t() | nil,
+            registry_token: String.t() | nil,
+            advertise_host: String.t() | nil
+          },
+          ix_command: String.t(),
+          ix_image: String.t(),
+          ix_room_server_command: String.t(),
+          ix_region: String.t() | nil,
+          ix_room_port: pos_integer(),
+          ix_room_connect: String.t(),
+          ix_local_port_base: pos_integer(),
+          ix_keep_vm?: boolean(),
+          ix_create_timeout_ms: pos_integer(),
+          ix_env_passthrough: [String.t()],
+          host_user: String.t() | nil,
+          host_group: String.t() | nil,
+          host_workspaces_dir: Path.t() | nil,
+          host_room_server_command: String.t(),
+          host_systemd_run_command: String.t(),
+          host_keep?: boolean(),
+          placement_fallback: :host | :remote | :local | :none,
+          worker: %{
+            control_plane_url: String.t() | nil,
+            worker_id: String.t() | nil,
+            worker_labels: [String.t()],
+            worker_room_host: String.t() | nil
+          },
+          worker_select_label: String.t() | nil,
+          anthropic_api_key: String.t() | nil,
+          claude_command: String.t(),
+          catalog_poll_ms: pos_integer(),
+          linear_api_key: String.t() | nil,
+          linear_endpoint: String.t(),
+          linear_team_key: String.t() | nil,
+          linear_workspace_slug: String.t() | nil,
+          linear_webhook_secret: String.t() | nil,
+          github_webhook_secret: String.t() | nil,
+          github_token: String.t() | nil,
+          slack_bot_token: String.t() | nil,
+          slack_signing_secret: String.t() | nil,
+          slack_endpoint: String.t(),
+          slack_poll_ms: pos_integer(),
+          slack_notify_channel: String.t() | nil,
+          slack_notify_cron_failures: boolean(),
+          slack_notify_cron_workflows: [String.t()],
+          cron_state_path: Path.t(),
+          cron_poll_ms: pos_integer(),
+          subrun_max_depth: pos_integer(),
+          github_app_id: String.t() | nil,
+          github_app_private_key_pem: String.t() | nil,
+          github_app_owner_repo: String.t() | nil,
+          github_app_bot_username: String.t() | nil,
+          github_app_bot_email: String.t() | nil,
+          github_stats_query: String.t() | nil
+        }
+
+  # Starts the config server registered under the module name. Entries in `opts` take precedence over
+  # the corresponding env vars when init/1 builds the snapshot.
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []), do: GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+
+  # Boot snapshot. :ets.lookup_element/3 raises ArgumentError for a missing table or key; both surface as "not started".
+  @spec get() :: t()
+  def get do
+    :ets.lookup_element(@table, :snapshot, 2)
+  rescue
+    ArgumentError -> raise "SymphonyElixir.Config not started"
+  end
+
+  # Creates the named table, builds and validates the snapshot, then publishes it under :snapshot for get/0.
+  @impl true
+  def init(opts) do
+    table = :ets.new(@table, [:named_table, :public, read_concurrency: true])
+    snapshot = build_snapshot(opts)
+
+    :ok = ensure_dirs!(snapshot)
+    :ets.insert(table, {:snapshot, snapshot})
+    {:ok, snapshot}
+  end
+
+  # Resolves every setting once, preferring an explicit `opts` entry over the process environment and
+  # falling back to the documented default. Only :root is mandatory (require_env!/1 raises without it);
+  # derived paths (pack, workflows, skills, runs, cron state) default relative to earlier results.
+  defp build_snapshot(opts) do
+    root = Keyword.get_lazy(opts, :root, fn -> require_env!("SYMPHONY_ROOT") end)
+    root = Path.expand(root)
+    workflow_pack = string_env(opts, :workflow_pack, "SYMPHONY_WORKFLOW_PACK", "example")
+
+    # path_env/4 treats "" as unset, so an empty SYMPHONY_PRIMARY_REPO yields nil instead of expanding to the cwd.
+    primary_repo = path_env(opts, :primary_repo, "SYMPHONY_PRIMARY_REPO", nil)
+
+    pack_dir =
+      path_env(
+        opts,
+        :pack_dir,
+        "SYMPHONY_PACK_DIR",
+        Path.join([root, "workflows", workflow_pack])
+      )
+
+    workflows_dir = path_env(opts, :workflows_dir, "SYMPHONY_WORKFLOWS_DIR", Path.join(pack_dir, "workflows"))
+    skills_dir = path_env(opts, :skills_dir, "SYMPHONY_SKILLS_DIR", Path.join(pack_dir, "skills"))
+
+    repositories_file =
+      path_env(opts, :repositories_file, "SYMPHONY_REPOSITORIES_FILE", Path.join(pack_dir, "repositories.yaml"))
+
+    workspaces_dir = path_env(opts, :workspaces_dir, "SYMPHONY_WORKSPACES_DIR", Path.join(root, "workspaces"))
+    repo_root = repo_root_env(opts, primary_repo)
+    runs_dir = path_env(opts, :runs_dir, "SYMPHONY_RUNS_DIR", Path.join(root, "runs"))
+
+    codex_command = string_env(opts, :codex_command, "SYMPHONY_CODEX_COMMAND", "codex app-server")
+    room_server_url = Keyword.get(opts, :room_server_url) || System.get_env("SYMPHONY_ROOM_SERVER_URL")
+
+    room_registry_url =
+      empty_to_nil(Keyword.get(opts, :room_registry_url) || System.get_env("SYMPHONY_ROOM_REGISTRY_URL"))
+
+    room_registry_token =
+      empty_to_nil(Keyword.get(opts, :room_registry_token) || System.get_env("SYMPHONY_ROOM_REGISTRY_TOKEN"))
+
+    # The address a provisioned per-run room-server binds and advertises so the
+    # central room.ix.dev can reach it to proxy reads. Unset keeps the loopback
+    # default (only reachable when room.ix.dev shares the host).
+    room_advertise_host =
+      empty_to_nil(Keyword.get(opts, :room_advertise_host) || System.get_env("SYMPHONY_ROOM_ADVERTISE_HOST"))
+
+    room = %{
+      server_url: empty_to_nil(room_server_url),
+      registry_url: room_registry_url,
+      registry_token: room_registry_token,
+      advertise_host: room_advertise_host
+    }
+
+    ix_command = string_env(opts, :ix_command, "SYMPHONY_IX_COMMAND", "ix")
+
+    ix_image = string_env(opts, :ix_image, "SYMPHONY_IX_IMAGE", "ix/symphony-codex:latest")
+
+    ix_room_server_command =
+      string_env(
+        opts,
+        :ix_room_server_command,
+        "SYMPHONY_IX_ROOM_SERVER_COMMAND",
+        "room-server"
+      )
+
+    ix_region = empty_to_nil(Keyword.get(opts, :ix_region) || System.get_env("SYMPHONY_IX_REGION"))
+    ix_room_port = int_env(opts, :ix_room_port, "SYMPHONY_IX_ROOM_PORT", 8080)
+    ix_room_connect = string_env(opts, :ix_room_connect, "SYMPHONY_IX_ROOM_CONNECT", "direct")
+    ix_local_port_base = int_env(opts, :ix_local_port_base, "SYMPHONY_IX_LOCAL_PORT_BASE", 18_080)
+    ix_keep_vm? = bool_env(opts, :ix_keep_vm?, "SYMPHONY_IX_KEEP_VM", false)
+    ix_create_timeout_ms = int_env(opts, :ix_create_timeout_ms, "SYMPHONY_IX_CREATE_TIMEOUT_MS", 120_000)
+    ix_env_passthrough = csv_env(opts, :ix_env_passthrough, "SYMPHONY_IX_ENV_PASSTHROUGH", ["OPENAI_API_KEY", "CODEX_API_KEY"])
+
+    host_user = empty_to_nil(Keyword.get(opts, :host_user) || System.get_env("SYMPHONY_HOST_USER"))
+    host_group = empty_to_nil(Keyword.get(opts, :host_group) || System.get_env("SYMPHONY_HOST_GROUP"))
+
+    host_workspaces_dir =
+      empty_to_nil(Keyword.get(opts, :host_workspaces_dir) || System.get_env("SYMPHONY_HOST_WORKSPACES_DIR"))
+
+    host_room_server_command =
+      string_env(opts, :host_room_server_command, "SYMPHONY_HOST_ROOM_SERVER_COMMAND", "room-server")
+
+    host_systemd_run_command =
+      string_env(opts, :host_systemd_run_command, "SYMPHONY_HOST_SYSTEMD_RUN_COMMAND", "systemd-run")
+
+    host_keep? = bool_env(opts, :host_keep?, "SYMPHONY_HOST_KEEP", false)
+    placement_fallback = placement_fallback_env(opts)
+
+    worker = %{
+      control_plane_url: empty_to_nil(Keyword.get(opts, :control_plane_url) || System.get_env("SYMPHONY_CONTROL_PLANE_URL")),
+      worker_id: empty_to_nil(Keyword.get(opts, :worker_id) || System.get_env("SYMPHONY_WORKER_ID")),
+      worker_labels: csv_env(opts, :worker_labels, "SYMPHONY_WORKER_LABELS", []),
+      worker_room_host: empty_to_nil(Keyword.get(opts, :worker_room_host) || System.get_env("SYMPHONY_WORKER_ROOM_HOST"))
+    }
+
+    worker_select_label = empty_to_nil(Keyword.get(opts, :worker_select_label) || System.get_env("SYMPHONY_WORKER_SELECT_LABEL"))
+
+    anthropic_api_key = empty_to_nil(Keyword.get(opts, :anthropic_api_key) || System.get_env("ANTHROPIC_API_KEY"))
+    claude_command = string_env(opts, :claude_command, "SYMPHONY_CLAUDE_COMMAND", "claude")
+
+    catalog_poll_ms = int_env(opts, :catalog_poll_ms, "SYMPHONY_CATALOG_POLL_MS", 1_000)
+
+    linear_api_key = Keyword.get(opts, :linear_api_key) || System.get_env("LINEAR_API_KEY")
+    linear_endpoint = string_env(opts, :linear_endpoint, "LINEAR_API_ENDPOINT", "https://api.linear.app/graphql")
+    linear_team_key = Keyword.get(opts, :linear_team_key) || System.get_env("LINEAR_TEAM_KEY")
+    linear_workspace_slug = Keyword.get(opts, :linear_workspace_slug) || System.get_env("LINEAR_WORKSPACE_SLUG")
+
+    linear_webhook_secret =
+      Keyword.get(opts, :linear_webhook_secret) || System.get_env("LINEAR_WEBHOOK_SECRET")
+
+    github_webhook_secret =
+      Keyword.get(opts, :github_webhook_secret) || System.get_env("GITHUB_WEBHOOK_SECRET")
+
+    github_token = Keyword.get(opts, :github_token) || System.get_env("GITHUB_TOKEN") || System.get_env("GH_TOKEN")
+
+    slack_bot_token = Keyword.get(opts, :slack_bot_token) || System.get_env("SLACK_BOT_OAUTH_TOKEN")
+    slack_signing_secret = Keyword.get(opts, :slack_signing_secret) || System.get_env("SLACK_SIGNING_SECRET")
+    slack_endpoint = string_env(opts, :slack_endpoint, "SLACK_API_ENDPOINT", "https://slack.com/api")
+    slack_poll_ms = int_env(opts, :slack_poll_ms, "SYMPHONY_SLACK_POLL_MS", 60_000)
+
+    slack_notify_channel =
+      Keyword.get(opts, :slack_notify_channel) ||
+        System.get_env("SYMPHONY_SLACK_NOTIFY_CHANNEL")
+
+    slack_notify_cron_failures =
+      bool_env(opts, :slack_notify_cron_failures, "SYMPHONY_SLACK_NOTIFY_CRON_FAILURES", true)
+
+    slack_notify_cron_workflows =
+      csv_env(opts, :slack_notify_cron_workflows, "SYMPHONY_SLACK_NOTIFY_CRON_WORKFLOWS", [])
+
+    cron_state_path =
+      path_env(opts, :cron_state_path, "SYMPHONY_CRON_STATE_PATH", Path.join(runs_dir, "cron_state.json"))
+
+    cron_poll_ms = int_env(opts, :cron_poll_ms, "SYMPHONY_CRON_POLL_MS", 60_000)
+    subrun_max_depth = int_env(opts, :subrun_max_depth, "SYMPHONY_SUBRUN_MAX_DEPTH", 8)
+
+    github_app_id =
+      empty_to_nil(Keyword.get(opts, :github_app_id) || System.get_env("SYMPHONY_GITHUB_APP_ID"))
+
+    github_app_private_key_pem = load_github_app_private_key(opts)
+
+    github_app_owner_repo =
+      empty_to_nil(
+        Keyword.get(opts, :github_app_owner_repo) ||
+          System.get_env("SYMPHONY_GITHUB_APP_OWNER_REPO")
+      )
+
+    github_app_bot_username =
+      empty_to_nil(Keyword.get(opts, :github_app_bot_username) || System.get_env("SYMPHONY_BOT_USERNAME"))
+
+    github_app_bot_email =
+      empty_to_nil(Keyword.get(opts, :github_app_bot_email) || System.get_env("SYMPHONY_BOT_EMAIL"))
+
+    github_stats_query =
+      empty_to_nil(Keyword.get(opts, :github_stats_query) || System.get_env("SYMPHONY_GITHUB_STATS_QUERY"))
+
+    %__MODULE__{
+      root: root,
+      workflow_pack: workflow_pack,
+      pack_dir: pack_dir,
+      primary_repo: primary_repo,
+      workflows_dir: workflows_dir,
+      skills_dir: skills_dir,
+      repositories_file: repositories_file,
+      workspaces_dir: workspaces_dir,
+      repo_root: repo_root,
+      runs_dir: runs_dir,
+      codex_command: codex_command,
+      room: room,
+      ix_command: ix_command,
+      ix_image: ix_image,
+      ix_room_server_command: ix_room_server_command,
+      ix_region: ix_region,
+      ix_room_port: ix_room_port,
+      ix_room_connect: ix_room_connect,
+      ix_local_port_base: ix_local_port_base,
+      ix_keep_vm?: ix_keep_vm?,
+      ix_create_timeout_ms: ix_create_timeout_ms,
+      ix_env_passthrough: ix_env_passthrough,
+      host_user: host_user,
+      host_group: host_group,
+      host_workspaces_dir: host_workspaces_dir,
+      host_room_server_command: host_room_server_command,
+      host_systemd_run_command: host_systemd_run_command,
+      host_keep?: host_keep?,
+      placement_fallback: placement_fallback,
+      worker: worker,
+      worker_select_label: worker_select_label,
+      anthropic_api_key: anthropic_api_key,
+      claude_command: claude_command,
+      catalog_poll_ms: catalog_poll_ms,
+      linear_api_key: empty_to_nil(linear_api_key),
+      linear_endpoint: linear_endpoint,
+      linear_team_key: empty_to_nil(linear_team_key),
+      linear_workspace_slug: empty_to_nil(linear_workspace_slug),
+      linear_webhook_secret: empty_to_nil(linear_webhook_secret),
+      github_webhook_secret: empty_to_nil(github_webhook_secret),
+      github_token: empty_to_nil(github_token),
+      slack_bot_token: empty_to_nil(slack_bot_token),
+      slack_signing_secret: empty_to_nil(slack_signing_secret),
+      slack_endpoint: slack_endpoint,
+      slack_poll_ms: slack_poll_ms,
+      slack_notify_channel: empty_to_nil(slack_notify_channel),
+      slack_notify_cron_failures: slack_notify_cron_failures,
+      slack_notify_cron_workflows: slack_notify_cron_workflows,
+      cron_state_path: cron_state_path,
+      cron_poll_ms: cron_poll_ms,
+      subrun_max_depth: subrun_max_depth,
+      github_app_id: github_app_id,
+      github_app_private_key_pem: github_app_private_key_pem,
+      github_app_owner_repo: github_app_owner_repo,
+      github_app_bot_username: github_app_bot_username,
+      github_app_bot_email: github_app_bot_email,
+      github_stats_query: github_stats_query
+    }
+  end
+
+  # Decodes SYMPHONY_GITHUB_APP_PRIVATE_KEY_BASE64 (or the :github_app_private_key_base64
+  # opt, which wins) once at boot. Secret stores hold the base64 form because the
+  # secret file is a single-line KEY=VALUE shape that cannot carry the literal
+  # PEM newlines. Decoding here hands the plain PEM string to GithubApp so it
+  # never has to re-decode per mint. An unset or empty value yields nil and a
+  # value that is not valid base64 raises.
+  defp load_github_app_private_key(opts) do
+    raw =
+      Keyword.get(opts, :github_app_private_key_base64) ||
+        System.get_env("SYMPHONY_GITHUB_APP_PRIVATE_KEY_BASE64")
+
+    raw |> empty_to_nil() |> decode_github_app_private_key!()
+  end
+
+  # nil means no key was supplied. Whitespace inside the encoded value is
+  # ignored while decoding.
+  defp decode_github_app_private_key!(nil), do: nil
+
+  defp decode_github_app_private_key!(base64) do
+    case Base.decode64(base64, ignore: :whitespace) do
+      {:ok, pem} -> pem
+      :error -> raise "SYMPHONY_GITHUB_APP_PRIVATE_KEY_BASE64 is not valid base64"
+    end
+  end
+
+  # Pack assets (pack, workflows and skills directories, repositories file) must already exist, otherwise
+  # the validators raise; the workspaces and runs directories are created when missing.
+  defp ensure_dirs!(%__MODULE__{workspaces_dir: workspaces_dir, runs_dir: runs_dir} = snapshot) do
+    validate_pack_asset_dir!("SYMPHONY_PACK_DIR", snapshot.pack_dir)
+    validate_pack_asset_dir!("SYMPHONY_WORKFLOWS_DIR", snapshot.workflows_dir)
+    validate_pack_asset_dir!("SYMPHONY_SKILLS_DIR", snapshot.skills_dir)
+    validate_pack_asset_file!("SYMPHONY_REPOSITORIES_FILE", snapshot.repositories_file)
+
+    Enum.each([workspaces_dir, runs_dir], &File.mkdir_p!/1)
+
+    :ok
+  end
+
+  # Raises unless `path` is an existing directory; `env_name` only labels the error message.
+  # Returns nil when the check passes.
+  defp validate_pack_asset_dir!(env_name, path) do
+    if not File.dir?(path), do: raise("#{env_name} must point at an existing directory, got #{inspect(path)}")
+  end
+
+  # Raises unless `path` is an existing regular file; `env_name` only labels the error message.
+  # Returns nil when the check passes.
+  defp validate_pack_asset_file!(env_name, path) do
+    if not File.regular?(path), do: raise("#{env_name} must point at an existing file, got #{inspect(path)}")
+  end
+
+  # opts entry first, then the env var; nil or "" yields `default` as given, anything else is expanded.
+  defp path_env(opts, key, env_name, default) do
+    case Keyword.get(opts, key) || System.get_env(env_name) do
+      unset when unset in [nil, ""] -> default
+      raw -> Path.expand(raw)
+    end
+  end
+
+  # opts entry first, then the env var. nil or "" yields `default`; any other value is returned
+  # untouched.
+  defp string_env(opts, key, env_name, default) do
+    value = Keyword.get(opts, key) || System.get_env(env_name)
+
+    if value in [nil, ""], do: default, else: value
+  end
+
+  defp repo_root_env(opts, primary_repo) do
+    case {Keyword.get(opts, :repo_root) || System.get_env("SYMPHONY_REPO_ROOT"), primary_repo} do
+      {nil, repo} when is_binary(repo) -> Path.dirname(repo)
+      {unset, _repo} when unset in [nil, ""] -> nil
+      {explicit, _repo} -> Path.expand(explicit)
+    end
+  end
+
+  # Positive-integer setting: opts entry first, then the env var. nil or "" counts as unset and yields
+  # `default` ("" used to reach Integer.parse/1 and abort boot, unlike the other *_env helpers here).
+  # Any other value must be a positive integer or a string holding exactly one; everything else,
+  # including 0, negatives and non-integer opts values, raises with the env var named.
+  defp int_env(opts, key, env_name, default) do
+    value = Keyword.get(opts, key) || System.get_env(env_name)
+    parsed = if is_binary(value), do: Integer.parse(value), else: value
+
+    case parsed do
+      _ when value in [nil, ""] -> default
+      {int, ""} when int > 0 -> int
+      int when is_integer(int) and int > 0 -> int
+      _ -> raise "#{env_name} must be a positive integer, got #{inspect(value)}"
+    end
+  end
+
+  # A boolean opts entry wins outright. With no opts entry the env var decides: nil or "" yields
+  # `default`, anything else goes through parse_bool_env!/2. A non-boolean, non-nil opts value matches
+  # no clause and raises CaseClauseError.
+  defp bool_env(opts, key, env_name, default) do
+    case Keyword.get(opts, key) do
+      flag when is_boolean(flag) -> flag
+      nil -> env_bool(System.get_env(env_name), env_name, default)
+    end
+  end
+
+  # Env-var half of bool_env/4.
+  defp env_bool(unset, _env_name, default) when unset in [nil, ""], do: default
+  defp env_bool(raw, env_name, _default), do: parse_bool_env!(env_name, raw)
+
+  # Only the eight literals below parse (matching is case-sensitive); anything else raises, naming the env var.
+  defp parse_bool_env!(env_name, value) do
+    enabled? = value in ["1", "true", "yes", "on"]
+    disabled? = value in ["0", "false", "no", "off"]
+    if enabled? or disabled?, do: enabled?, else: raise("#{env_name} must be boolean-ish, got #{inspect(value)}")
+  end
+
+  # The `ixvm -> fallback` target, read once at boot. Accepts one of
+  # :host | :remote | :local | :none, given either as that atom or as its
+  # string name. Unset or "" defaults to :host, so a run whose ixvm
+  # provisioning fails still completes on a per-run systemd-run room-server
+  # rather than aborting; :local is the dev convenience and :none disables
+  # the fallback. Any other value raises.
+  defp placement_fallback_env(opts) do
+    choice = Keyword.get(opts, :placement_fallback) || System.get_env("SYMPHONY_PLACEMENT_FALLBACK")
+
+    cond do
+      choice in [:host, :remote, :local, :none] -> choice
+      choice in [nil, ""] -> :host
+      choice in ["host", "remote", "local", "none"] -> String.to_existing_atom(choice)
+      true -> raise "SYMPHONY_PLACEMENT_FALLBACK must be one of host|remote|local|none, got #{inspect(choice)}"
+    end
+  end
+
+  # List setting: opts entry first, then the env var. A list is returned as-is.
+  # A string is split on commas, each entry is trimmed and blank entries are
+  # dropped, so an empty string produces [] rather than `default`. Anything
+  # else, including an unset value, yields `default`.
+  # Example: " a, ,b ," becomes ["a", "b"].
+  defp csv_env(opts, key, env_name, default) do
+    case Keyword.get(opts, key) || System.get_env(env_name) do
+      items when is_list(items) ->
+        items
+
+      csv when is_binary(csv) ->
+        for entry <- String.split(csv, ","), item = String.trim(entry), item != "", do: item
+
+      _unset ->
+        default
+    end
+  end
+
+  # Reads a mandatory env var; raises with distinct messages for "unset" and "set but empty".
+  defp require_env!(name) do
+    value = System.get_env(name)
+    if is_nil(value), do: raise("#{name} must be set")
+    if value == "", do: raise("#{name} must not be empty")
+    value
+  end
+
+  # Collapses "" to nil so an empty setting reads as unset; every other value passes through unchanged.
+  defp empty_to_nil(value) when value in [nil, ""], do: nil
+  defp empty_to_nil(value), do: value
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/cron_expression.ex b/packages/symphony/elixir/lib/symphony_elixir/cron_expression.ex
new file mode 100644
index 000000000..4225eee8b
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/cron_expression.ex
@@ -0,0 +1,241 @@
+defmodule SymphonyElixir.CronExpression do
+  @moduledoc """
+  Tiny cron parser and next-fire calculator for the `cron` trigger kind.
+
+  Accepts:
+
+  - Standard 5-field cron strings: `minute hour day-of-month month day-of-week`.
+    Each field supports `*`, a single integer, a comma-separated list
+    (`1,3,5`), a range (`1-5`), and the step form (`*/15`, `0-30/5`).
+  - Nicknames: `@yearly`, `@annually`, `@monthly`, `@weekly`, `@daily`,
+    `@midnight`, `@hourly`.
+
+  Time is treated as UTC. Day-of-week is 0..6 with 0=Sunday, matching
+  POSIX cron.
+
+  When both `day-of-month` and `day-of-week` are restricted (neither is
+  `*`), the match is the OR of the two, again matching POSIX cron. When
+  exactly one is restricted, only that one constrains the match. When
+  both are `*`, any day matches.
+
+  ## Usage
+
+      {:ok, parsed} = CronExpression.parse("@monthly")
+      CronExpression.next_fire_after(parsed, DateTime.utc_now())
+      # => {:ok, %DateTime{...}}  (the first minute of the next month, UTC)
+
+  `next_fire_after/2` returns the first matching minute strictly after
+  the given moment. It steps minute-by-minute and bails out after two
+  years, treating an exhausted search as `{:error, :no_match_within_window}`.
+  """
+
+  @two_years_in_minutes 525_600 * 2
+
+  @type field :: MapSet.t(non_neg_integer())
+
+  @type t :: %{
+          required(:source) => String.t(),
+          required(:minute) => field(),
+          required(:hour) => field(),
+          required(:dom) => field(),
+          required(:month) => field(),
+          required(:dow) => field(),
+          required(:dom_restricted?) => boolean(),
+          required(:dow_restricted?) => boolean()
+        }
+
+  @nicknames %{
+    "@yearly" => "0 0 1 1 *",
+    "@annually" => "0 0 1 1 *",
+    "@monthly" => "0 0 1 * *",
+    "@weekly" => "0 0 * * 0",
+    "@daily" => "0 0 * * *",
+    "@midnight" => "0 0 * * *",
+    "@hourly" => "0 * * * *"
+  }
+
+  @spec parse(String.t()) :: {:ok, t()} | {:error, term()}
+  def parse(expr) when is_binary(expr) do
+    # A nickname expands to its 5-field form; `source` keeps what was written.
+    source = String.trim(expr)
+
+    @nicknames
+    |> Map.get(source, source)
+    |> do_parse(source)
+  end
+
+  def parse(_), do: {:error, :invalid_cron_expression}
+
+  # Parses the nickname-expanded five-field form. `source` is stored on the
+  # result and reported when the field count is wrong.
+  defp do_parse(expanded, source) do
+    with [minute, hour, dom, month, dow] <- String.split(expanded, ~r/\s+/, trim: true),
+         {:ok, minutes} <- parse_field(minute, 0..59),
+         {:ok, hours} <- parse_field(hour, 0..23),
+         {:ok, days} <- parse_field(dom, 1..31),
+         {:ok, months} <- parse_field(month, 1..12),
+         {:ok, weekdays} <- parse_field(dow, 0..6) do
+      parsed = %{
+        source: source,
+        minute: minutes,
+        hour: hours,
+        dom: days,
+        month: months,
+        dow: weekdays,
+        dom_restricted?: dom != "*",
+        dow_restricted?: dow != "*"
+      }
+      {:ok, parsed}
+    else
+      {:error, _} = failure -> failure
+      _wrong_field_count -> {:error, {:invalid_cron_expression, source}}
+    end
+  end
+
+  # Parses one comma-separated field into its set of allowed values. Empty
+  # items are kept so `,`, `1,` and `1,,2` fail instead of being ignored.
+  defp parse_field(field, range) do
+    Enum.reduce_while(String.split(field, ","), {:ok, MapSet.new()}, fn part, {:ok, acc} ->
+      case parse_part(part, range) do
+        {:ok, values} -> {:cont, {:ok, MapSet.union(acc, values)}}
+        {:error, _} = err -> {:halt, err}
+      end
+    end)
+  end
+
+  # One list item, optionally carrying a `/<step>` suffix. The base is `*`,
+  # a single integer, or a range; a step thins the base's values.
+  defp parse_part(part, range) do
+    case String.split(part, "/", parts: 2) do
+      [base] ->
+        parse_base(base, range)
+
+      [base, step_text] ->
+        with {:ok, step} <- parse_step(step_text),
+             {:ok, allowed} <- parse_base(base, range) do
+          stepped = allowed |> Enum.sort() |> apply_step(step)
+          {:ok, MapSet.new(stepped)}
+        end
+    end
+  end
+
+  # Accepts a whole, strictly positive integer with nothing trailing it.
+  defp parse_step(s) do
+    invalid = {:error, {:invalid_step, s}}
+
+    with {n, ""} when n > 0 <- Integer.parse(s), do: {:ok, n}, else: (_ -> invalid)
+  end
+
+  # The part of a list item before any `/step`: `*` for the field's whole
+  # range, `lo-hi` for an inclusive span, or a single value.
+  defp parse_base("*", range), do: {:ok, MapSet.new(range)}
+
+  defp parse_base(base, range) do
+    case String.split(base, "-", parts: 2) do
+      [single] ->
+        with {:ok, n} <- parse_int_in(single, range), do: {:ok, MapSet.new([n])}
+
+      [low_text, high_text] ->
+        with {:ok, lo} <- parse_int_in(low_text, range),
+             {:ok, hi} <- parse_int_in(high_text, range) do
+          span(lo, hi, base)
+        end
+    end
+  end
+
+  # Both bounds are already known to be in range; a span must also run
+  # low-to-high, so `5-1` is an error rather than a wrap-around.
+  defp span(lo, hi, _base) when lo <= hi, do: {:ok, MapSet.new(lo..hi)}
+  defp span(_lo, _hi, base), do: {:error, {:invalid_range, base}}
+
+  # Parses `s` as a whole integer inside `range`; the range error carries the bounds.
+  defp parse_int_in(s, range) do
+    with {n, ""} <- Integer.parse(s), true <- n in range do
+      {:ok, n}
+    else
+      false -> {:error, {:out_of_range, s, Enum.min(range), Enum.max(range)}}
+      _ -> {:error, {:invalid_integer, s}}
+    end
+  end
+
+  # Thins an ascending list to every `step`-th value, counted from its
+  # first element, which is always kept. Spacing is measured on the values
+  # themselves, not on list positions.
+  defp apply_step([], step) when step > 0, do: []
+
+  defp apply_step([first | _] = sorted_values, step) when step > 0 do
+    Enum.filter(sorted_values, fn value ->
+      rem(value - first, step) == 0
+    end)
+  end
+
+  @doc """
+  Finds the first minute strictly later than `from` that the expression
+  matches, as `{:ok, datetime}`. `from` is shifted to UTC and floored to
+  the minute first, so the search runs at one-minute resolution.
+
+  Returns `{:error, :no_match_within_window}` when the search gives up.
+  """
+  @spec next_fire_after(t(), DateTime.t()) :: {:ok, DateTime.t()} | {:error, term()}
+  def next_fire_after(%{} = parsed, %DateTime{} = from) do
+    # Start one minute past the floored `from` so `from` is never returned.
+    from
+    |> DateTime.shift_zone!("Etc/UTC")
+    |> truncate_to_minute()
+    |> DateTime.add(60, :second)
+    |> step(parsed, 0)
+  end
+
+  # Scans forward a minute at a time from `dt`; `n` counts minutes already spent of the two-year budget.
+  defp step(%DateTime{} = dt, parsed, n) do
+    dt
+    |> Stream.iterate(&DateTime.add(&1, 60, :second))
+    |> Stream.take(max(@two_years_in_minutes - n + 1, 0))
+    |> Enum.find(&matches?(parsed, &1))
+    |> case do
+      nil -> {:error, :no_match_within_window}
+      hit -> {:ok, hit}
+    end
+  end
+
+  @doc """
+  Reports whether the minute of `dt`, taken in UTC, satisfies every field of the parsed expression.
+  """
+  @spec matches?(t(), DateTime.t()) :: boolean()
+  def matches?(parsed, %DateTime{} = dt) do
+    utc = DateTime.shift_zone!(dt, "Etc/UTC")
+
+    checks = [
+      MapSet.member?(parsed.minute, utc.minute),
+      MapSet.member?(parsed.hour, utc.hour),
+      MapSet.member?(parsed.month, utc.month),
+      day_matches?(parsed, DateTime.to_date(utc))
+    ]
+
+    Enum.all?(checks)
+  end
+
+  # POSIX cron day rule, keyed on which day fields were written as
+  # something other than `*`. Neither: every day matches. Exactly one: that
+  # field alone decides. Both: a day matching EITHER field matches (OR, not
+  # AND).
+  defp day_matches?(parsed, %Date{} = date) do
+    dom_match = MapSet.member?(parsed.dom, date.day)
+    dow_match = MapSet.member?(parsed.dow, day_of_week_sunday0(date))
+
+    case {parsed.dom_restricted?, parsed.dow_restricted?} do
+      {true, true} -> dom_match or dow_match
+      {true, _} -> dom_match
+      {_, true} -> dow_match
+      _ -> true
+    end
+  end
+
+  # Cron numbers weekdays 0..6 from Sunday. Counting the week from Sunday
+  # gives 1..7 with Sunday=1, so subtracting one lands on cron's numbering.
+  defp day_of_week_sunday0(%Date{} = d), do: Date.day_of_week(d, :sunday) - 1
+
+  # Zeroes the seconds and the sub-second part (value and precision),
+  # leaving the start of the minute.
+  defp truncate_to_minute(%DateTime{} = dt), do: Map.merge(dt, %{second: 0, microsecond: {0, 0}})
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/cron_state.ex b/packages/symphony/elixir/lib/symphony_elixir/cron_state.ex
new file mode 100644
index 000000000..322d0cba9
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/cron_state.ex
@@ -0,0 +1,138 @@
+defmodule SymphonyElixir.CronState do
+  @moduledoc """
+  Persistent per-workflow fire history for cron-triggered `.sym`
+  workflows.
+
+  Owns a single JSON file at `config.cron_state_path` (defaults to
+  `runs/cron_state.json`) mapping `name => last_fired_at_iso`. The key is
+  the cron producer's choice of identity; it is the workflow basename now
+  that `Triggers.Cron` resolves through `WorkflowCatalog`. Writes go
+  through this GenServer; reads come straight out of ETS for the hot-path
+  tick.
+
+  Survives BEAM restarts. On boot the file is loaded into ETS; missing
+  file means nothing has fired yet.
+
+  Public API:
+
+      get_last_fired(name)         -> DateTime.t() | nil
+      record_fire(name, at)        -> :ok | {:error, term()}
+      list_all()                   -> %{name => DateTime.t()}
+      seed_if_unset(name, at)      -> :ok  (idempotent, atomic)
+
+  `seed_if_unset/2` exists so `Triggers.Cron` can mark a newly observed
+  workflow as 'last fired = now' without firing it on the boot tick. That
+  is the same shape as `systemd Persistent=false` for first observation;
+  subsequent missed windows DO trigger one catch-up fire.
+  """
+
+  use GenServer
+  require Logger
+
+  alias SymphonyElixir.Config
+
+  @table :symphony_cron_state
+
+  # Starts the server registered under this module's name; `opts` is handed
+  # to `init/1` unchanged.
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []), do: GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+
+  # Reads the last recorded fire time for `name` directly from the ETS
+  # table, without calling the server. Returns nil when nothing usable is
+  # stored under that name.
+  @spec get_last_fired(String.t()) :: DateTime.t() | nil
+  def get_last_fired(name) when is_binary(name) do
+    with [{^name, %DateTime{} = dt}] <- :ets.lookup(@table, name), do: dt, else: (_ -> nil)
+  end
+
+  # Records `at` as the latest fire time for `name` through the server and
+  # returns the server's reply.
+  @spec record_fire(String.t(), DateTime.t()) :: :ok | {:error, term()}
+  def record_fire(name, %DateTime{} = at) when is_binary(name), do: GenServer.call(__MODULE__, {:record, name, at})
+
+  # Asks the server to store `at` for `name` only if `name` has no entry
+  # yet; an existing entry is left alone.
+  @spec seed_if_unset(String.t(), DateTime.t()) :: :ok
+  def seed_if_unset(name, %DateTime{} = at) when is_binary(name), do: GenServer.call(__MODULE__, {:seed_if_unset, name, at})
+
+  # Snapshot of every stored entry as a map keyed by name, read directly
+  # from the ETS table.
+  @spec list_all() :: %{String.t() => DateTime.t()}
+  def list_all do
+    Map.new(:ets.tab2list(@table))
+  end
+
+  @impl true
+  def init(_opts) do
+    :ets.new(@table, [:named_table, :public, read_concurrency: true])
+    state = %{path: Config.get().cron_state_path}
+    load_from_disk(state.path)
+    {:ok, state}
+  end
+
+  # Updates the in-memory entry, then rewrites the state file and replies
+  # with the write's result. The ETS entry is kept even when the write fails.
+  @impl true
+  def handle_call({:record, name, %DateTime{} = at}, _from, state) do
+    :ets.insert(@table, {name, at})
+    persisted = write_to_disk(state.path)
+
+    {:reply, persisted, state}
+  end
+
+  # Seeds `name` only when it has no entry yet; `:ets.insert_new/2` tests
+  # and inserts in one step. The reply stays :ok either way, but a failed
+  # write is logged, since a seed that never reaches disk is lost on restart.
+  @impl true
+  def handle_call({:seed_if_unset, name, %DateTime{} = at}, _from, state) do
+    with true <- :ets.insert_new(@table, {name, at}),
+         {:error, reason} <- write_to_disk(state.path) do
+      Logger.warning("CronState failed to persist seed for #{name}: #{inspect(reason)}")
+    end
+
+    {:reply, :ok, state}
+  end
+
+  # Replays the persisted `name => ISO-8601 timestamp` object into ETS. A
+  # missing file is normal (nothing has fired yet); any other problem is
+  # logged and skipped so a damaged file cannot stop the server from
+  # booting.
+  defp load_from_disk(path) do
+    with {:ok, raw} <- File.read(path),
+         {:ok, %{} = entries} <- Jason.decode(raw) do
+      Enum.each(entries, &load_entry/1)
+    else
+      {:error, :enoent} -> :ok
+      {:ok, other} -> Logger.warning("CronState file at #{path} is not a JSON object, ignoring: #{inspect(other)}")
+      {:error, reason} when is_atom(reason) -> Logger.warning("CronState failed to read #{path}: #{inspect(reason)}")
+      {:error, reason} -> Logger.warning("CronState failed to decode #{path}: #{inspect(reason)}")
+    end
+  end
+
+  # Only a JSON string can hold a timestamp. `to_string/1` raises on a
+  # nested object, so non-string values are rejected up front.
+  defp load_entry({name, iso}) do
+    with true <- is_binary(iso),
+         {:ok, dt, _offset} <- DateTime.from_iso8601(iso) do
+      :ets.insert(@table, {name, dt})
+    else
+      _ -> Logger.warning("CronState dropped invalid timestamp for #{name}: #{inspect(iso)}")
+    end
+  end
+
+  # Serializes the whole table as pretty-printed JSON, writes it to
+  # `<path>.tmp`, then renames that over `path`. Returns :ok, or the
+  # {:error, reason} of the first step that failed.
+  defp write_to_disk(path) do
+    tmp = path <> ".tmp"
+    entries = :ets.tab2list(@table)
+    payload = Map.new(entries, fn {name, %DateTime{} = dt} -> {name, DateTime.to_iso8601(dt)} end)
+
+    with {:ok, encoded} <- Jason.encode(payload, pretty: true),
+         :ok <- File.mkdir_p(Path.dirname(path)),
+         :ok <- File.write(tmp, encoded) do
+      File.rename(tmp, path)
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/dsl/ast.ex b/packages/symphony/elixir/lib/symphony_elixir/dsl/ast.ex
new file mode 100644
index 000000000..fb09da161
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/dsl/ast.ex
@@ -0,0 +1,272 @@
+defmodule SymphonyElixir.DSL.AST do
+  @moduledoc """
+  Reified data constructors for the workflow surface language.
+
+  The DSL has three representations (see the overhaul plan, Pillar 1):
+
+      .sym source --parse--> reified AST --interpret/expand--> IR graph
+
+  This module is the middle one. Every combinator is plain data, never a
+  host closure. A closure could not be serialized into the durable
+  `RunGraph`, inspected in the dashboard, or replayed deterministically
+  after a restart, so the whole surface is reified as structs the
+  interpreter walks.
+
+  ## Grammar
+
+  A workflow is a `do`-block: an ordered list of statements. The block is
+  monadic in the sense that a binding introduces a name that later
+  statements read, and reading a name is what creates a data dependency.
+  Two statements whose inputs do not reference each other have no edge and
+  the interpreter is free to schedule them in parallel.
+
+      workflow   := do { stmt* }
+      stmt       := bind | let | expr
+      bind       := name "<-" expr          # name binds the effect's output
+      let        := name "="  pure          # name binds a pure value
+      expr       := effect | pure
+
+  ### Effects (become IR nodes)
+
+  Only effectful constructors materialize as `IR.Node`s. They are the
+  things that talk to the world: an engine turn, a shell script, a child
+  run.
+
+      agent  envelope: <map>, prompt: <prompt_ref>, inputs: %{name => pure}
+      exec   script: <pure>, inputs: %{name => pure}, timeout: <pure>?
+      subrun source: <pure>, inputs: %{name => pure}
+
+  An `agent` carries an `Engine.Envelope` spec as a plain map (validated
+  downstream by `Engine.Envelope.from_map/1`) plus a `prompt_ref`:
+
+      prompt_ref := {:skill, name, bindings} | {:inline, text}
+
+  ### Higher-order combinators (dynamic expansion)
+
+  These take a gating input and a body. When the gate's input is
+  unresolved the interpreter emits a placeholder node (`:gate` or
+  `:map_fanout`); when the input resolves it re-runs `expand` and emits
+  the body deterministically.
+
+      when     cond: <pure-over-bindings>, body: <expr>
+      every_nth n: <pos_integer>, counter: <counter-name>, body: <expr>
+      map      over: <pure-list>, as: <name>, body: <expr>
+
+  `when` runs its body only if `cond` is truthy. `every_nth` runs its body
+  on every nth expansion of a persisted, named counter (a pure function of
+  that counter, so replay is deterministic: no wall clock, no RNG).
+  `map` fans the body out once per element of `over`, binding each element
+  to `as` inside the body.
+
+  ### Pure expressions (evaluated at expand time, never become nodes)
+
+      pure := literal | var | field | concat | list
+      literal := string | integer | float | boolean | nil
+      var     := {:var, name}                 # read a binding
+      field   := {:field, pure, path}         # e.g. `area session` -> nested read
+      concat  := {:concat, [pure]}            # string interpolation / joining
+      list    := {:list, [pure]}
+
+  Pure expressions are computed inside the interpreter. `{:field, {:var,
+  "session"}, ["area"]}` reads `known_outputs["session"]["area"]` at
+  expand time; it never becomes a trivial IR node.
+
+  ## Stable AST ids
+
+  Every constructor carries an `id` so the interpreter can derive a stable
+  IR node id and the runtime can record which AST construct an expansion
+  came from. The parser assigns ids positionally; `with_id/2` is the
+  single writer so the scheme stays in one place.
+  """
+
+  @typedoc "A bind introduces `name` from an effectful expression's output."
+  @type bind :: {:bind, String.t(), expr()}
+
+  @typedoc "A let introduces `name` from a pure value computed at expand time."
+  @type let :: {:let, String.t(), pure()}
+
+  @typedoc """
+  The declaration that fires a workflow, parsed from the `on <trigger>`
+  header clause. The normalized shape matches the runtime's trigger maps so
+  the catalog can index a workflow by `kind` and a producer can match an
+  event against it. `nil` when the header omits `on` (a workflow only an
+  operator starts by name).
+  """
+  @type trigger :: %{required(:kind) => atom(), optional(atom()) => term()} | nil
+
+  @typedoc "A workflow is an ordered list of statements in a do-block, with an optional trigger."
+  @type workflow :: %{
+          kind: :workflow,
+          id: String.t(),
+          name: String.t() | nil,
+          trigger: trigger(),
+          statements: [statement()]
+        }
+
+  @type statement :: bind() | let() | expr()
+
+  @typedoc "Effectful constructors materialize as IR nodes; pure ones do not."
+  @type expr :: effect() | pure()
+
+  @type effect ::
+          agent()
+          | exec()
+          | subrun()
+          | when_()
+          | every_nth()
+          | map_()
+
+  @type agent :: %{
+          kind: :agent,
+          id: String.t(),
+          envelope: map(),
+          prompt: prompt_ref(),
+          inputs: %{optional(String.t()) => pure()}
+        }
+
+  @type exec :: %{
+          kind: :exec,
+          id: String.t(),
+          script: pure(),
+          timeout: pure() | nil,
+          inputs: %{optional(String.t()) => pure()}
+        }
+
+  @type subrun :: %{
+          kind: :subrun,
+          id: String.t(),
+          source: pure(),
+          inputs: %{optional(String.t()) => pure()}
+        }
+
+  @type when_ :: %{
+          kind: :when,
+          id: String.t(),
+          cond: pure(),
+          body: expr()
+        }
+
+  @type every_nth :: %{
+          kind: :every_nth,
+          id: String.t(),
+          n: pos_integer(),
+          counter: String.t(),
+          body: expr()
+        }
+
+  @type map_ :: %{
+          kind: :map,
+          id: String.t(),
+          over: pure(),
+          as: String.t(),
+          body: expr()
+        }
+
+  @type prompt_ref ::
+          {:skill, String.t(), %{optional(String.t()) => pure()}}
+          | {:inline, pure()}
+
+  @type pure ::
+          {:literal, term()}
+          | {:var, String.t()}
+          | {:field, pure(), [String.t()]}
+          | {:concat, [pure()]}
+          | {:list, [pure()]}
+
+  @effect_kinds [:agent, :exec, :subrun, :when, :every_nth, :map]
+
+  @doc "The effectful constructor kinds. Only these become IR nodes."
+  @spec effect_kinds() :: [atom()]
+  def effect_kinds, do: @effect_kinds
+
+  @doc "Whether the term is a map whose `kind` is one of the effectful constructor kinds (and so emits a node)."
+  @spec effect?(term()) :: boolean()
+  def effect?(%{kind: kind}), do: kind in @effect_kinds
+  def effect?(_), do: false
+
+  @doc "Whether the term has the outer shape of a pure value (evaluated, never a node). Nested parts are not checked."
+  @spec pure?(term()) :: boolean()
+  def pure?({:field, _, _}), do: true
+  def pure?({tag, _}) when tag in [:literal, :var], do: true
+  def pure?({tag, items}) when tag in [:concat, :list], do: is_list(items)
+  def pure?(_), do: false
+
+  # --- constructors -------------------------------------------------------
+
+  @doc "Build a workflow do-block from an ordered statement list and an optional trigger (a map, or nil). `id` must be a string; `name` is stored as given."
+  @spec workflow(String.t() | nil, trigger(), [statement()], String.t()) :: workflow()
+  def workflow(name, trigger, statements, id)
+      when is_list(statements) and is_binary(id) and (is_nil(trigger) or is_map(trigger)) do
+    %{kind: :workflow, id: id, name: name, trigger: trigger, statements: statements}
+  end
+
+  @doc "A `name <- effect` binding."
+  @spec bind(String.t(), expr()) :: bind()
+  def bind(name, expr) when is_binary(name), do: {:bind, name, expr}
+
+  @doc "A `name = pure` binding."
+  @spec let(String.t(), pure()) :: let()
+  def let(name, pure) when is_binary(name), do: {:let, name, pure}
+
+  @doc "An agent-call node carrying an envelope spec map and a prompt ref. `envelope` and `inputs` must be maps and `id` a string; `prompt` is stored as given."
+  @spec agent(map(), prompt_ref(), %{optional(String.t()) => pure()}, String.t()) :: agent()
+  def agent(envelope, prompt, inputs, id)
+      when is_map(envelope) and is_map(inputs) and is_binary(id) do
+    %{kind: :agent, id: id, envelope: envelope, prompt: prompt, inputs: inputs}
+  end
+
+  @doc "An exec (shell script) node. `inputs` must be a map and `id` a string; `script` and `timeout` (which may be nil) are stored as given."
+  @spec exec(pure(), pure() | nil, %{optional(String.t()) => pure()}, String.t()) :: exec()
+  def exec(script, timeout, inputs, id) when is_map(inputs) and is_binary(id) do
+    %{kind: :exec, id: id, script: script, timeout: timeout, inputs: inputs}
+  end
+
+  @doc "A subrun (first-class child run) node. `inputs` must be a map and `id` a string; `source` is stored as given."
+  @spec subrun(pure(), %{optional(String.t()) => pure()}, String.t()) :: subrun()
+  def subrun(source, inputs, id) when is_map(inputs) and is_binary(id) do
+    %{kind: :subrun, id: id, source: source, inputs: inputs}
+  end
+
+  @doc "A `when cond do body` conditional combinator. Only `id` is guarded (a string); `cond` and `body` are stored as given."
+  @spec when_(pure(), expr(), String.t()) :: when_()
+  def when_(cond, body, id) when is_binary(id) do
+    %{kind: :when, id: id, cond: cond, body: body}
+  end
+
+  @doc "An `every_nth n counter do body` gate keyed on a persisted counter. `n` must be a positive integer, `counter` and `id` strings; `body` is stored as given."
+  @spec every_nth(pos_integer(), String.t(), expr(), String.t()) :: every_nth()
+  def every_nth(n, counter, body, id)
+      when is_integer(n) and n > 0 and is_binary(counter) and is_binary(id) do
+    %{kind: :every_nth, id: id, n: n, counter: counter, body: body}
+  end
+
+  @doc "A `map over as elem do body` fan-out combinator. `as` and `id` must be strings; `over` and `body` are stored as given."
+  @spec map_(pure(), String.t(), expr(), String.t()) :: map_()
+  def map_(over, as, body, id) when is_binary(as) and is_binary(id) do
+    %{kind: :map, id: id, over: over, as: as, body: body}
+  end
+
+  # --- pure value constructors -------------------------------------------
+
+  @spec literal(term()) :: pure()
+  def literal(value), do: {:literal, value}
+
+  @spec var(String.t()) :: pure()
+  def var(name) when is_binary(name), do: {:var, name}
+
+  @spec field(pure(), [String.t()]) :: pure()
+  def field(base, path) when is_list(path), do: {:field, base, path}
+
+  @spec concat([pure()]) :: pure()
+  def concat(parts) when is_list(parts), do: {:concat, parts}
+
+  @spec list([pure()]) :: pure()
+  def list(items) when is_list(items), do: {:list, items}
+
+  @doc """
+  Attach an id to a constructor map. The single writer of the id scheme so
+  the parser and any future builder cannot drift apart.
+  """
+  @spec with_id(map(), String.t()) :: map()
+  def with_id(node, id) when is_map(node) and is_binary(id), do: Map.put(node, :id, id)
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/dsl/interpreter.ex b/packages/symphony/elixir/lib/symphony_elixir/dsl/interpreter.ex
new file mode 100644
index 000000000..90ce73567
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/dsl/interpreter.ex
@@ -0,0 +1,674 @@
+defmodule SymphonyElixir.DSL.Interpreter do
+  @moduledoc """
+  Expand a reified `SymphonyElixir.DSL.AST` into a delta of durable
+  `SymphonyElixir.IR.Node`s. This is the eval step of eval-as-emission and
+  the deepest module in the DSL front end.
+
+      expand(ast, known_outputs, expansion_log) ->
+        {ir_delta, pending, new_log}
+
+  - `ir_delta` is the list of `IR.Node` structs to materialize on this
+    pass. Re-running `expand` with more `known_outputs` yields the next
+    delta; the runtime folds each delta into the `RunGraph`.
+  - `pending` is the set of unresolved AST points still awaiting inputs,
+    as plain data: `{:awaiting, ast_node_id, needed_node_ids}`. The
+    runtime uses it to know an effect cannot be materialized until those
+    upstream node outputs arrive.
+  - `new_log` is the `expansion_log` extended with one event per dynamic
+    expansion that fired on this pass (a `when` that opened, an
+    `every_nth` that fired, a `map` that fanned out). The order is
+    load-bearing for deterministic replay.
+
+  ## Rules (from the overhaul plan, Pillar 1)
+
+  1. Only effectful constructors (`agent`, `exec`, `subrun`) become IR
+     nodes. Pure computation (string concat, `${session.area}` field
+     access) is evaluated inside the interpreter at expand time and never
+     fills the graph with trivial nodes.
+  2. `IR.Node.deps` is derived from `inputs` via
+     `IR.Node.deps_from_inputs/1`. A `{:node, id, path}` input is the only
+     thing that makes an edge; the interpreter never hand-writes `deps`.
+  3. Dynamic constructs (`when`, `every_nth`, `map`) emit a placeholder
+     node (`:gate` or `:map_fanout`) when their gating input is
+     unresolved, and emit children deterministically when re-expanded with
+     the resolved output.
+  4. Determinism: gates are pure functions of `known_outputs` and the
+     persisted counters recovered from `expansion_log`. No wall clock, no
+     RNG. The same `(ast, known_outputs, expansion_log)` always yields the
+     same `ir_delta`, which is the invariant the runtime replays on
+     restart.
+
+  ## Input resolution
+
+  Each input value reduces to a single `IR.Node.input_ref`:
+
+  - A fully-literal pure value folds to `{:literal, computed}`.
+  - A single `${node.path}` read of an effect binding becomes
+    `{:node, id, path}`, the one shape that creates a dependency edge.
+  - A `concat`/`list` that mixes literals with a node read cannot be one
+    ref. The effect carrying it is deferred (reported in `pending`) until
+    every referenced node output is in `known_outputs`, then the value
+    folds to a literal on re-expansion.
+  """
+
+  alias SymphonyElixir.DSL.AST
+  alias SymphonyElixir.IR.Node
+
+  @type known_outputs :: %{optional(String.t()) => term()}
+  @type pending :: {:awaiting, String.t(), [String.t()]}
+  @type expansion_log :: [map()]
+
+  @type result :: {[Node.t()], [pending()], expansion_log()}
+
+  @doc """
+  Runs one expansion pass over the workflow's statements against the outputs
+  known so far and the prior expansion log. Pure: equal inputs give equal results.
+  """
+  @spec expand(AST.workflow(), known_outputs(), expansion_log()) :: result()
+  def expand(%{kind: :workflow, statements: statements}, known_outputs \\ %{}, expansion_log \\ [])
+      when is_map(known_outputs) and is_list(expansion_log) do
+    initial = %{
+      env: %{},
+      nodes: [],
+      pending: [],
+      log: [],
+      counters: counters_from_log(expansion_log),
+      prior_ticks: prior_ticks_from_log(expansion_log),
+      known: known_outputs
+    }
+
+    %{nodes: nodes, pending: pending, log: fresh_events} = Enum.reduce(statements, initial, &expand_statement/2)
+
+    # Each collected list is reversed on the way out; this pass's events are
+    # appended after the prior log, never interleaved with it.
+    {Enum.reverse(nodes), Enum.reverse(pending), expansion_log ++ Enum.reverse(fresh_events)}
+  end
+
+  # --- statements ---------------------------------------------------------
+
+  # A `let` binds a pure value. A resolvable value is stored as `{:value, v}`;
+  # a read of one node output is stored as `{:node_field, id, path}` so later
+  # effects still see the edge; anything else is kept as `{:deferred, pure}`.
+  defp expand_statement({:let, name, pure}, acc) do
+    case resolve_value(pure, acc.env, acc.known) do
+      {:value, value} -> put_env(acc, name, {:value, value})
+      {:node, id, path} -> put_env(acc, name, {:node_field, id, path})
+      :deferred -> put_env(acc, name, {:deferred, pure})
+    end
+  end
+
+  defp expand_statement({:bind, name, expr}, acc) do
+    expand_effect(expr, name, acc)
+  end
+
+  defp expand_statement(expr, acc) when is_map(expr) do
+    expand_effect(expr, nil, acc)
+  end
+
+  # --- effects ------------------------------------------------------------
+
+  # Agent call: no expansion key; prompt inputs are overlaid by the explicit ones (explicit wins on a clash).
+  defp expand_effect(%{kind: :agent} = agent, bind_name, acc) do
+    origin = agent.id
+    id = node_id(origin, nil)
+    {prompt_ref, prompt} = resolve_prompt(agent.prompt, origin, acc)
+    {explicit_inputs, explicit_pending} = resolve_inputs(agent.inputs, origin, acc)
+
+    node =
+      Node.new(
+        id: id,
+        ast_origin: origin,
+        kind: :agent,
+        envelope: agent.envelope,
+        prompt_ref: prompt_ref,
+        inputs: Map.merge(prompt.inputs, explicit_inputs),
+        expansion_key: nil,
+        state: :pending
+      )
+
+    waiting_on = Enum.uniq(prompt.pending ++ explicit_pending)
+
+    acc
+    |> add_node(node)
+    |> add_pending_if(origin, waiting_on)
+    |> bind_node(bind_name, id)
+  end
+
+  # Exec: the script is carried as the "script" input; later merges (extra inputs, then timeout) win on a clash.
+  defp expand_effect(%{kind: :exec} = exec, bind_name, acc) do
+    origin = exec.id
+    id = node_id(origin, nil)
+    {script_inputs, script_pending} = resolve_named_inputs(%{"script" => exec.script}, origin, acc)
+    {extra_inputs, extra_pending} = resolve_inputs(exec.inputs, origin, acc)
+    {timeout_inputs, timeout_pending} = resolve_timeout(exec.timeout, origin, acc)
+
+    node =
+      Node.new(
+        id: id,
+        ast_origin: origin,
+        kind: :exec,
+        inputs: script_inputs |> Map.merge(extra_inputs) |> Map.merge(timeout_inputs),
+        expansion_key: nil,
+        state: :pending
+      )
+
+    waiting_on = Enum.uniq(script_pending ++ extra_pending ++ timeout_pending)
+
+    acc
+    |> add_node(node)
+    |> add_pending_if(origin, waiting_on)
+    |> bind_node(bind_name, id)
+  end
+
+  # Subrun: the child source is carried as the "source" input; explicit inputs win on a clash.
+  defp expand_effect(%{kind: :subrun} = subrun, bind_name, acc) do
+    origin = subrun.id
+    id = node_id(origin, nil)
+    {source_inputs, source_pending} = resolve_named_inputs(%{"source" => subrun.source}, origin, acc)
+    {extra_inputs, extra_pending} = resolve_inputs(subrun.inputs, origin, acc)
+
+    node =
+      Node.new(
+        id: id,
+        ast_origin: origin,
+        kind: :subrun,
+        inputs: Map.merge(source_inputs, extra_inputs),
+        expansion_key: nil,
+        state: :pending
+      )
+
+    waiting_on = Enum.uniq(source_pending ++ extra_pending)
+
+    acc
+    |> add_node(node)
+    |> add_pending_if(origin, waiting_on)
+    |> bind_node(bind_name, id)
+  end
+
+  # `when cond { body }`: a gate that emits its body only if `cond` is
+  # truthy. A resolved `cond` is decided now and the decision is logged
+  # either way (`opened: true` with the body's child ids, or `opened: false`
+  # with none). An unresolved `cond` takes the `:gate` placeholder path via
+  # `emit_gate/5`, passed the node ref it waits on, or nil when deferred.
+  defp expand_effect(%{kind: :when} = node, bind_name, acc) do
+    case resolve_value(node.cond, acc.env, acc.known) do
+      {:value, cond_value} ->
+        if truthy?(cond_value) do
+          acc
+          |> log_expansion(node.id, %{gate: :when, opened: true}, child_ids(node.body, node.id))
+          |> expand_gate_body(node.body, node.id, bind_name)
+        else
+          log_expansion(acc, node.id, %{gate: :when, opened: false}, [])
+        end
+
+      {:node, dep_id, path} ->
+        emit_gate(acc, node, dep_id, path, bind_name)
+
+      :deferred ->
+        emit_gate(acc, node, nil, [], bind_name)
+    end
+  end
+
+  # `every n of counter { body }` is a deterministic gate: it fires when
+  # the next tick of a persisted counter is a multiple of n, and the
+  # counter comes from the expansion log, never from a wall clock.
+  #
+  # A construct ticks once per run, yet `expand_dynamic/1` re-runs `expand`
+  # several times within one run (at init, then after each node success)
+  # with the grown log fed back in. Advancing the tick on every pass would
+  # drift it forward inside a single run, and a cold replay could not
+  # reproduce the live graph. A decision already recorded in
+  # `acc.prior_ticks` is therefore replayed as is; only a construct with
+  # no recorded decision computes a fresh tick.
+  defp expand_effect(%{kind: :every_nth} = node, bind_name, acc) do
+    recorded = Map.get(acc.prior_ticks, counter_key(node.id, node.counter))
+    case recorded do
+      # Nothing recorded for this construct yet: compute a fresh tick.
+      nil -> evaluate_every_nth(node, bind_name, acc)
+      # Recorded skip: this pass emits nothing either.
+      %{fired: false} -> acc
+      # Recorded fire: expand the body again, without logging a second tick.
+      %{fired: true} -> expand_gate_body(acc, node.body, node.id, bind_name)
+    end
+  end
+
+  # `map over as elem { body }` fans the body out once per element of
+  # `over`. An unresolved `over` materializes a `:map_fanout` placeholder
+  # through `emit_map_placeholder/5`; a resolved list goes to
+  # `emit_fanout/4`, which emits one keyed child per element.
+  defp expand_effect(%{kind: :map} = node, bind_name, acc) do
+    case resolve_value(node.over, acc.env, acc.known) do
+      :deferred ->
+        emit_map_placeholder(acc, node, nil, [], bind_name)
+
+      {:node, dep_id, path} ->
+        emit_map_placeholder(acc, node, dep_id, path, bind_name)
+
+      {:value, elements} when is_list(elements) ->
+        emit_fanout(acc, node, elements, bind_name)
+
+      {:value, mismatch} ->
+        # `over` resolved to something that is not a list. Log it as an
+        # empty fan-out (no children) instead of raising.
+        log_expansion(acc, node.id, %{gate: :map, over: :not_a_list, value: mismatch}, [])
+    end
+  end
+
+  # Compute a fresh `every_nth` tick from the counters recovered across
+  # prior runs' logs and log the decision, fired or skipped. Reached only
+  # when the prior log holds no decision for this construct. A zero `n`
+  # never fires: the guard keeps `rem/2` from raising on `every 0 of ...`.
+  defp evaluate_every_nth(node, bind_name, acc) do
+    ticks_so_far = Map.get(acc.counters, counter_key(node.id, node.counter), 0)
+    tick = ticks_so_far + 1
+
+    if node.n != 0 and rem(tick, node.n) == 0 do
+      acc
+      |> log_expansion(node.id, %{gate: :every_nth, counter: node.counter, tick: tick, fired: true}, child_ids(node.body, node.id))
+      |> expand_gate_body(node.body, node.id, bind_name)
+    else
+      log_expansion(acc, node.id, %{gate: :every_nth, counter: node.counter, tick: tick, fired: false}, [])
+    end
+  end
+
+  # --- dynamic placeholders ----------------------------------------------
+
+  # Materialize the `:gate` placeholder for a `when` whose condition is not
+  # resolvable yet. The placeholder takes the gate's own id (nil expansion
+  # key) and, when `dep_id` is set, one "gate" input edge to that node.
+  defp emit_gate(acc, node, dep_id, path, bind_name) do
+    gate_id = node_id(node.id, nil)
+    edges = gate_inputs(dep_id, path)
+
+    attrs = [
+      id: gate_id,
+      ast_origin: node.id,
+      kind: :gate,
+      inputs: edges,
+      expansion_key: nil,
+      state: :pending
+    ]
+
+    waiting = add_pending_if(add_node(acc, Node.new(attrs)), node.id, deps_of(edges))
+    bind_node(waiting, bind_name, gate_id)
+  end
+
+  # Materialize the `:map_fanout` placeholder for a `map` whose `over` is
+  # not resolvable yet. It has the same shape as a gate placeholder apart
+  # from its kind; a bound name points at the placeholder's id.
+  defp emit_map_placeholder(acc, node, dep_id, path, bind_name) do
+    fanout_id = node_id(node.id, nil)
+    edges = gate_inputs(dep_id, path)
+
+    attrs = [
+      id: fanout_id,
+      ast_origin: node.id,
+      kind: :map_fanout,
+      inputs: edges,
+      expansion_key: nil,
+      state: :pending
+    ]
+
+    waiting = add_pending_if(add_node(acc, Node.new(attrs)), node.id, deps_of(edges))
+    bind_node(waiting, bind_name, fanout_id)
+  end
+
+  # Fan a resolved list out into one keyed child per element. Each child is
+  # expanded with `node.as` bound to its element under the expansion key
+  # `{:fanout, node.id, index}`, and the env is put back afterwards so the
+  # element binding does not leak. The gate name is ignored: a fan-out is a
+  # bag of children, so `name <- map ...` has no single node to point at.
+  # The log event records the element count and the child ids.
+  defp emit_fanout(acc, node, list, _bind_name) do
+    indexed = Enum.with_index(list)
+    origin = child_origin(node.body, node.id)
+
+    emitted_ids = for {_elem, index} <- indexed, do: node_id(origin, {:fanout, node.id, index})
+
+    expanded =
+      Enum.reduce(indexed, acc, fn {elem, index}, inner ->
+        key = {:fanout, node.id, index}
+        scoped = with_env(inner, Map.put(inner.env, node.as, {:value, elem}))
+
+        scoped
+        |> expand_keyed_body(node.body, key)
+        |> restore_env(inner.env)
+      end)
+
+    log_expansion(expanded, node.id, %{gate: :map, count: length(list)}, emitted_ids)
+  end
+
+  # Expand the body of a resolved `when`/`every_nth` gate. When the gate
+  # itself is bound (`result <- when ${x} { ... }`), `result` has to point
+  # at the node the body emits, since the gate's placeholder is gone once
+  # the gate resolves; otherwise a downstream `${result...}` read would
+  # lose its edge.
+  defp expand_gate_body(acc, {:bind, inner, effect}, _gate_id, bind_name) do
+    expanded = expand_effect(effect, inner, acc)
+    source = Map.get(expanded.env, inner)
+
+    # `result <- when ... { n <- effect }`: alias the gate name to whatever
+    # `n` is bound to. A nil gate name or an unbound `n` changes nothing.
+    if is_nil(bind_name) or is_nil(source) do
+      expanded
+    else
+      put_env(expanded, bind_name, source)
+    end
+  end
+
+  defp expand_gate_body(acc, {:let, _name, _pure} = body, _gate_id, _bind_name) do
+    expand_statement(body, acc)
+  end
+
+  # A bare effect body (`result <- when ${x} { effect }`) passes the gate
+  # name on, so the effect's own expansion does the binding.
+  defp expand_gate_body(acc, effect, _gate_id, bind_name) when is_map(effect) do
+    expand_effect(effect, bind_name, acc)
+  end
+
+  # Expand a fan-out body under `key`: drop any `name <-` wrapper, then
+  # hand the bare expression to `expand_with_key/3`.
+  defp expand_keyed_body(acc, body, key), do: expand_with_key(strip_binding(body), key, acc)
+
+  # --- input resolution ---------------------------------------------------
+
+  # Resolve an inputs map (name => pure) into IR input refs plus the list
+  # of node ids any deferred input still waits on. Empty maps short-circuit.
+  defp resolve_inputs(inputs, _origin, _acc) when map_size(inputs) == 0, do: {%{}, []}
+
+  defp resolve_inputs(inputs, origin, acc), do: resolve_named_inputs(inputs, origin, acc)
+
+  # A value becomes a `{:literal, v}` ref and a node read a `{:node, id, path}`
+  # ref; a deferred pure adds no ref, only the node ids it waits on.
+  defp resolve_named_inputs(inputs, _origin, acc) do
+    Enum.reduce(inputs, {%{}, []}, fn {name, pure}, {refs, waiting} ->
+      case resolve_value(pure, acc.env, acc.known) do
+        :deferred -> {refs, deferred_node_ids(pure, acc.env) ++ waiting}
+        {:node, id, path} -> {Map.put(refs, name, {:node, id, path}), waiting}
+        {:value, literal} -> {Map.put(refs, name, {:literal, literal}), waiting}
+      end
+    end)
+  end
+
+  # An absent timeout contributes nothing; a present one resolves like any
+  # other named input, under the "timeout" key.
+  defp resolve_timeout(nil, _origin, _acc), do: {%{}, []}
+
+  defp resolve_timeout(pure, origin, acc), do: resolve_named_inputs(%{"timeout" => pure}, origin, acc)
+
+  # Turn a prompt into the `prompt_ref` the IR layer expects,
+  # `{:skill, name, bindings} | {:inline, text}`, plus the inputs and
+  # pending node ids that give its node reads their dependency edges.
+  # Skill bindings resolve like named inputs; the ref keeps a best-effort
+  # literal snapshot of them.
+  defp resolve_prompt({:skill, name, bindings}, origin, acc) do
+    {edges, waiting} = resolve_named_inputs(bindings, origin, acc)
+    prompt_ref = {:skill, name, bindings_literal(bindings, acc)}
+    {prompt_ref, %{inputs: edges, pending: waiting}}
+  end
+
+  # Inline text is known only once its pure resolves to a value. A node read
+  # rides along as the "prompt" input; a deferred pure lists what it waits on.
+  defp resolve_prompt({:inline, pure}, _origin, acc) do
+    case resolve_value(pure, acc.env, acc.known) do
+      {:value, text} -> {{:inline, to_text(text)}, %{inputs: %{}, pending: []}}
+      {:node, id, path} -> {{:inline, nil}, %{inputs: %{"prompt" => {:node, id, path}}, pending: []}}
+      :deferred -> {{:inline, nil}, %{inputs: %{}, pending: deferred_node_ids(pure, acc.env)}}
+    end
+  end
+
+  # Best-effort literal snapshot of skill bindings for the prompt_ref: a
+  # binding that resolves to a value stores it, any other keeps its AST form.
+  defp bindings_literal(bindings, acc) do
+    snapshot = fn
+      {:value, resolved}, _pure -> resolved
+      _unresolved, pure -> pure
+    end
+
+    Map.new(bindings, fn {name, pure} -> {name, snapshot.(resolve_value(pure, acc.env, acc.known), pure)} end)
+  end
+
+  # --- pure evaluation ----------------------------------------------------
+
+  @typedoc "A resolved pure value, an edge to a node output, or unresolvable yet."
+  @type resolution :: {:value, term()} | {:node, String.t(), [String.t()]} | :deferred
+
+  @spec resolve_value(AST.pure(), map(), known_outputs()) :: resolution()
+  defp resolve_value({:literal, value}, _env, _known), do: {:value, value}
+
+  # A name missing from the env is deferred rather than an error.
+  defp resolve_value({:var, name}, env, known) do
+    case Map.get(env, name) do
+      nil -> :deferred
+      {:value, _} = bound -> bound
+      {:node, id} -> resolve_node(id, [], known)
+      {:node_field, id, path} -> resolve_node(id, path, known)
+      {:deferred, pure} -> resolve_value(pure, env, known)
+    end
+  end
+
+  defp resolve_value({:field, base, path}, env, known) do
+    case resolve_value(base, env, known) do
+      :deferred -> :deferred
+      {:value, value} -> {:value, dig(value, path)}
+      {:node, id, base_path} -> {:node, id, base_path ++ path}
+    end
+  end
+
+  # Concatenation joins the text form of every part, with no separator.
+  defp resolve_value({:concat, parts}, env, known) do
+    resolve_aggregate(parts, env, known, fn texts -> Enum.map_join(texts, "", &to_text/1) end)
+  end
+
+  defp resolve_value({:list, items}, env, known), do: resolve_aggregate(items, env, known, & &1)
+
+  # An aggregate folds to a single value only when every part resolves to
+  # a value. Any node read or deferred part defers the whole aggregate,
+  # because a mix cannot be expressed as one input_ref.
+  defp resolve_aggregate(parts, env, known, combine) do
+    resolved = Enum.map(parts, &resolve_value(&1, env, known))
+
+    folded =
+      Enum.reduce_while(resolved, [], fn
+        {:value, v}, values -> {:cont, [v | values]}
+        _unresolved, _values -> {:halt, :deferred}
+      end)
+
+    case folded do
+      :deferred -> :deferred
+      values -> {:value, combine.(Enum.reverse(values))}
+    end
+  end
+
+  # A node whose output is already known reads through as a value dug to
+  # `path`; an unknown node stays an edge to its future output.
+  defp resolve_node(id, path, known) do
+    case Map.fetch(known, id) do
+      :error -> {:node, id, path}
+      {:ok, output} -> {:value, dig(output, path)}
+    end
+  end
+
+  # Read a (possibly nested) field; a missing key yields nil, a stored false is kept.
+  defp dig(value, []), do: value
+
+  defp dig(value, [key | rest]) when is_map(value) do
+    dig(Map.get_lazy(value, key, fn -> Map.get(value, to_atom(key)) end), rest)
+  end
+
+  defp dig(_value, _path), do: nil
+
+  # Never mints an atom: an unknown name keys no map, so the string (a miss) is returned.
+  defp to_atom(key) when is_binary(key) do
+    String.to_existing_atom(key)
+  rescue
+    ArgumentError -> key
+  end
+
+  # --- helpers ------------------------------------------------------------
+
+  defp gate_inputs(nil, _path), do: %{}
+  defp gate_inputs(waits_on, field_path), do: %{"gate" => {:node, waits_on, field_path}}
+
+  defp deps_of(edges), do: Node.deps_from_inputs(edges)
+
+  # Only `false` and `nil` close a gate; every other value is truthy,
+  # including 0, "" and [].
+  defp truthy?(value), do: value not in [false, nil]
+
+  # Text form of a value for prompts and concatenation (binaries pass through).
+  defp to_text(value), do: to_string(value)
+
+  # Node ids a deferred pure still waits on: each binding it references
+  # that points at a node (whole output or one field), following
+  # `{:deferred, inner}` bindings through to the nodes they read.
+  defp deferred_node_ids(pure, env) do
+    waiting_on = fn
+      {:node, id} -> [id]
+      {:node_field, id, _path} -> [id]
+      {:deferred, inner} -> deferred_node_ids(inner, env)
+      _other -> []
+    end
+
+    pure |> referenced_bindings() |> Enum.flat_map(&waiting_on.(Map.get(env, &1))) |> Enum.uniq()
+  end
+
+  # Names of the env bindings a pure expression reads, in source order.
+  defp referenced_bindings({:literal, _}), do: []
+  defp referenced_bindings({:var, name}), do: [name]
+  defp referenced_bindings({:field, base, _path}), do: referenced_bindings(base)
+  defp referenced_bindings({tag, parts}) when tag in [:concat, :list], do: Enum.flat_map(parts, &referenced_bindings/1)
+
+  # --- accumulator plumbing ----------------------------------------------
+
+  # Nodes, pending entries and log events are all prepended (newest first).
+  defp add_node(acc, node), do: %{acc | nodes: [node | acc.nodes]}
+
+  defp add_pending_if(acc, _origin, []), do: acc
+  defp add_pending_if(acc, origin, needed), do: %{acc | pending: [{:awaiting, origin, Enum.uniq(needed)} | acc.pending]}
+
+  defp put_env(acc, name, source), do: %{acc | env: Map.put(acc.env, name, source)}
+
+  # An unnamed (nil) binding is a no-op; a named one points at the node id.
+  defp bind_node(acc, nil, _id), do: acc
+  defp bind_node(acc, name, id), do: put_env(acc, name, {:node, id})
+
+  # Both swap the whole env; the two names mark entering and leaving a scope.
+  defp with_env(acc, env), do: %{acc | env: env}
+  defp restore_env(acc, env), do: %{acc | env: env}
+
+  # Record one expansion decision: its origin, what was observed, what was emitted.
+  defp log_expansion(acc, origin, observed, emitted) do
+    %{acc | log: [%{origin: origin, observed: observed, emitted: emitted} | acc.log]}
+  end
+
+  # Stable, content-derived id. A nil key reuses the ast origin as is; any
+  # other key appends 8 hex chars of a SHA-256 over the `{origin, key}` term.
+  defp node_id(ast_origin, nil), do: ast_origin
+
+  defp node_id(ast_origin, key) do
+    hex = Base.encode16(:crypto.hash(:sha256, :erlang.term_to_binary({ast_origin, key})), case: :lower)
+    ast_origin <> "-" <> binary_part(hex, 0, 8)
+  end
+
+  # The ast origin a combinator body's node is keyed on: the body's own id
+  # (looking through a `name <-` binding), or the gate's id when the body
+  # carries none.
+  defp child_origin(%{id: id}, _gate_id), do: id
+  defp child_origin({:bind, _name, %{id: id}}, _gate_id), do: id
+  defp child_origin(_body, gate_id), do: gate_id
+
+  # The single unkeyed node id a gate body is logged as emitting.
+  defp child_ids(body, gate_id), do: [node_id(child_origin(body, gate_id), nil)]
+
+  defp strip_binding({:bind, _name, expr}), do: expr
+  defp strip_binding(expr), do: expr
+
+  # Re-expand a single statement under a fan-out expansion key so each
+  # emitted child gets a distinct, stable id.
+  defp expand_with_key(expr, key, acc) when is_map(expr), do: expand_effect_keyed(expr, key, acc)
+
+  # Emit the keyed node for an `agent`, `exec` or `subrun` body. Its id
+  # mixes the ast origin with `key`; inputs, prompt and envelope come from
+  # `keyed_node_parts/2`. The node is added and its pending ids recorded,
+  # but it is not bound to any name, and the other effect kinds have no
+  # clause here.
+  defp expand_effect_keyed(%{kind: kind} = expr, key, acc)
+       when kind in [:agent, :exec, :subrun] do
+    {inputs, pending_ids, prompt_ref, envelope} = keyed_node_parts(expr, acc)
+    keyed_id = node_id(expr.id, key)
+
+    keyed =
+      Node.new(
+        id: keyed_id,
+        ast_origin: expr.id,
+        kind: kind,
+        envelope: envelope,
+        prompt_ref: prompt_ref,
+        inputs: inputs,
+        expansion_key: key,
+        state: :pending
+      )
+
+    add_pending_if(add_node(acc, keyed), expr.id, pending_ids)
+  end
+
+  # Per-kind pieces of a keyed node as `{inputs, pending_ids, prompt_ref,
+  # envelope}`. Only an agent has a prompt_ref and an envelope.
+  defp keyed_node_parts(%{kind: :agent} = agent, acc) do
+    {prompt_ref, %{inputs: prompt_edges, pending: prompt_waits}} = resolve_prompt(agent.prompt, agent.id, acc)
+    {explicit_edges, explicit_waits} = resolve_inputs(agent.inputs, agent.id, acc)
+    {Map.merge(prompt_edges, explicit_edges), Enum.uniq(prompt_waits ++ explicit_waits), prompt_ref, agent.envelope}
+  end
+
+  defp keyed_node_parts(%{kind: :exec} = exec, acc) do
+    {script_edges, script_waits} = resolve_named_inputs(%{"script" => exec.script}, exec.id, acc)
+    {extra_edges, extra_waits} = resolve_inputs(exec.inputs, exec.id, acc)
+    {timeout_edges, timeout_waits} = resolve_timeout(exec.timeout, exec.id, acc)
+    edges = Enum.reduce([extra_edges, timeout_edges], script_edges, &Map.merge(&2, &1))
+    {edges, Enum.uniq(script_waits ++ extra_waits ++ timeout_waits), nil, nil}
+  end
+
+  defp keyed_node_parts(%{kind: :subrun} = subrun, acc) do
+    {source_edges, source_waits} = resolve_named_inputs(%{"source" => subrun.source}, subrun.id, acc)
+    {extra_edges, extra_waits} = resolve_inputs(subrun.inputs, subrun.id, acc)
+    {Map.merge(source_edges, extra_edges), Enum.uniq(source_waits ++ extra_waits), nil, nil}
+  end
+
+  # --- expansion-log counters --------------------------------------------
+
+  # Recover each every_nth counter's tick total from the prior log so a
+  # replay reconstructs the identical gate decisions without a live tick.
+  # Every recorded evaluation counts as one tick, fired or skipped: the
+  # gate fires on the nth tick, so the skips between fires must be counted
+  # too. Events of any other shape are ignored. Totals are keyed by
+  # `counter_key/2`.
+  defp counters_from_log(log) do
+    Enum.reduce(log, %{}, fn
+      %{origin: origin, observed: %{gate: :every_nth, counter: counter}}, totals ->
+        Map.update(totals, counter_key(origin, counter), 1, &(&1 + 1))
+
+      _other, totals ->
+        totals
+    end)
+  end
+
+  # The recorded tick decision per `every_nth` construct in the prior log.
+  # A re-expansion within the same run reproduces this decision instead of
+  # advancing the tick, which keeps the gate idempotent across the several
+  # `expand_dynamic/1` passes one run makes. When a construct has several
+  # events, the one latest in list order wins.
+  # NOTE(review): that is the most recent decision only if `log` is ordered
+  # oldest first; `log_expansion/4` prepends, so confirm the order passed in.
+  defp prior_ticks_from_log(log) do
+    Enum.reduce(log, %{}, fn
+      %{origin: origin, observed: %{gate: :every_nth, counter: counter, fired: fired}}, decisions ->
+        Map.put(decisions, counter_key(origin, counter), %{fired: fired})
+
+      _other, decisions ->
+        decisions
+    end)
+  end
+
+  defp counter_key(origin, counter), do: {origin, counter}
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/dsl/parser.ex b/packages/symphony/elixir/lib/symphony_elixir/dsl/parser.ex
new file mode 100644
index 000000000..6f0611593
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/dsl/parser.ex
@@ -0,0 +1,704 @@
+defmodule SymphonyElixir.DSL.Parser do
+  @moduledoc """
+  Parse a standalone `.sym` workflow surface into a reified
+  `SymphonyElixir.DSL.AST`.
+
+  `parse/1` returns `{:ok, ast}` or `{:error, diagnostic}` where the
+  diagnostic carries a source span (line and column) so an operator can
+  jump straight to the offending token. The surface is monadic in spirit:
+  a `name <- effect` binding introduces a data dependency, and statements
+  whose inputs do not reference each other are independent (the
+  interpreter is then free to run them in parallel).
+
+  ## Surface syntax
+
+      workflow "release" {
+        session <- agent {
+          engine: codex
+          model: "gpt-5.3-codex"
+          permissions: workspace_write
+          location: local
+          prompt: skill "inspect" { repo: "symphony" }
+        }
+
+        summary <- agent {
+          engine: claude
+          model: haiku
+          prompt: inline "summarize ${session.report}"
+        }
+
+        when ${summary.ok} {
+          notice <- exec "./scripts/notify.sh" timeout 30
+        }
+
+        every 3 of build_counter {
+          gc <- exec "./scripts/gc.sh"
+        }
+
+        map ${session.repos} as repo {
+          child <- subrun "audit.sym" { target: ${repo} }
+        }
+      }
+
+  A statement is `name <- <effect>`, `name = <pure>`, or a bare effect.
+  An effect is `agent { ... }`, `exec <string> [timeout <int>] [{ ... }]`,
+  `subrun <string> [{ ... }]`, `when <pure> { stmt* }`,
+  `every <int> of <counter> { stmt* }`, or
+  `map <pure> as <name> { stmt* }`.
+
+  Pure values are string literals (`"..."`, with `${path}` interpolation),
+  integers, floats, `true`/`false`/`null`, bracketed lists `[a, b]`, and
+  interpolation references `${name.field.path}`.
+
+  ## Diagnostics
+
+  A failed parse returns `{:error, diagnostic}`, where `diagnostic` is
+  `%{message: String.t(), line: pos_integer, column: pos_integer,
+  file: String.t() | nil, got: term()}`. Line and column are 1-based and
+  point at the token that failed, recovered from the tokenizer's per-token
+  span so the message lands on the real source position rather than a byte
+  offset. `file` is the source filename a caller passed to `parse/2`; it is `nil` for an
+  anonymous string parse and is filled in by the `WorkflowCatalog` so an author sees which `.sym` broke.
+  """
+
+  alias SymphonyElixir.DSL.AST
+  alias SymphonyElixir.DSL.Parser.Lexer
+
+  @type diagnostic :: %{
+          message: String.t(),
+          line: pos_integer(),
+          column: pos_integer(),
+          file: String.t() | nil,
+          got: term()
+        }
+
+  # Source of truth for the `on <kind>` vocabulary: one surface keyword per
+  # `parse_trigger_kind/2` dispatch clause. The schema endpoint and the run
+  # form offer exactly the kinds listed here, so adding a kind means one
+  # entry in this list plus its dispatch clause, and it reaches the UI
+  # without a form edit.
+  @trigger_kinds [:manual, :cron, :linear, :slack_huddle, :slack_mention, :github_pr_label]
+
+  @doc "The trigger kinds the `on` clause accepts, as surface keywords."
+  @spec trigger_kinds() :: [atom()]
+  def trigger_kinds, do: @trigger_kinds
+
+  @doc """
+  Parse `.sym` source into a workflow AST.
+
+  `opts` accepts `:file`, the source filename stamped onto a diagnostic so
+  an author sees which `.sym` broke; it defaults to `nil` for an anonymous
+  string parse. Returns `{:ok, ast}` when the source tokenizes, parses as a
+  workflow and `skip_to_end/1` accepts what follows it, and
+  `{:error, diagnostic}` otherwise.
+  """
+  @spec parse(String.t(), keyword()) :: {:ok, AST.workflow()} | {:error, diagnostic()}
+  def parse(source, opts \\ []) when is_binary(source) and is_list(opts) do
+    file = Keyword.get(opts, :file)
+
+    case Lexer.tokenize(source) do
+      # The lexer fails before a parse state exists, so it cannot know the
+      # file. Stamp it here so a tokenizer error (unterminated string, stray
+      # character) has the same located shape as a parser error.
+      {:error, diag} ->
+        {:error, Map.put(diag, :file, file)}
+
+      {:ok, tokens} ->
+        state = %{tokens: tokens, counter: 0, file: file}
+
+        # Parser and trailing-input errors are returned exactly as the
+        # parser produced them; the parse state already carries `file`.
+        with {:ok, ast, rest} <- parse_workflow(state),
+             :ok <- skip_to_end(rest) do
+          {:ok, ast}
+        end
+    end
+  end
+
+  # --- workflow / statements ---------------------------------------------
+
+  # The workflow keeps the fixed id "workflow", outside the effect counter,
+  # so the first effect is `agent-0`; only effects consume positional ids.
+  defp parse_workflow(state) do
+    with {:ok, _, after_kw} <- expect(state, :keyword, "workflow"),
+         {:ok, name_tok, after_name} <- optional_string(after_kw),
+         {:ok, trigger, after_trigger} <- parse_optional_trigger(after_name),
+         {:ok, _, body_start} <- expect(after_trigger, :lbrace, "{"),
+         {:ok, statements, body_end} <- parse_statements(body_start, []),
+         {:ok, _, rest} <- expect(body_end, :rbrace, "}") do
+      name = if name_tok, do: name_tok.value, else: nil
+      {:ok, AST.workflow(name, trigger, statements, "workflow"), rest}
+    end
+  end
+
+  # --- trigger header -----------------------------------------------------
+
+  # `on <kind> <params>` declares what fires the workflow. The header is
+  # optional: without an `on` clause the trigger is nil. `on`, the kind and
+  # the param names are plain identifiers, so the lexer needs no trigger
+  # vocabulary.
+  defp parse_optional_trigger(state) do
+    case peek(state) do
+      %{type: :ident, value: "on"} -> state |> advance() |> parse_trigger()
+      _no_header -> {:ok, nil, state}
+    end
+  end
+
+  # The token after `on` must be an identifier naming the kind; dispatch on
+  # its spelling.
+  defp parse_trigger(state) do
+    case peek(state) do
+      %{type: :ident, value: kind} -> parse_trigger_kind(kind, advance(state))
+      unexpected -> error(state, "expected a trigger kind after `on`", token_value(unexpected))
+    end
+  end
+
+  # One clause per surface kind; the map's `kind` atom can differ from the keyword.
+  defp parse_trigger_kind("manual", state), do: {:ok, %{kind: :manual}, state}
+
+  defp parse_trigger_kind("cron", state) do
+    with {:ok, schedule, after_schedule} <- trigger_string(state, "cron schedule") do
+      {timezone, after_tz} = optional_labeled_string(after_schedule, "tz", "UTC")
+      {input, rest} = parse_optional_trigger_input(after_tz)
+      {:ok, %{kind: :cron, schedule: String.trim(schedule), timezone: timezone, input: input}, rest}
+    end
+  end
+
+  defp parse_trigger_kind("linear", state) do
+    with {:ok, label, rest} <- labeled_string(state, "label") do
+      {:ok, %{kind: :linear, label: normalize_label(label)}, rest}
+    end
+  end
+
+  defp parse_trigger_kind("slack_huddle", state) do
+    with {:ok, channel, rest} <- labeled_string(state, "channel") do
+      {:ok, %{kind: :slack_huddle_completed, channel: String.trim(channel)}, rest}
+    end
+  end
+
+  defp parse_trigger_kind("slack_mention", state) do
+    with {:ok, channel, rest} <- labeled_string(state, "channel") do
+      {:ok, %{kind: :slack_app_mention, channel: String.trim(channel)}, rest}
+    end
+  end
+
+  defp parse_trigger_kind("github_pr_label", state) do
+    with {:ok, repo, after_repo} <- labeled_string(state, "repo"),
+         {:ok, label, rest} <- labeled_string(after_repo, "label") do
+      {:ok, %{kind: :github_pr_label, repo: String.trim(repo), label: normalize_label(label)}, rest}
+    end
+  end
+
+  defp parse_trigger_kind(other, state), do: error(state, "unknown trigger kind #{inspect(other)}", other)
+
+  # `<name> "<value>"`: a labeled string param such as `label "..."` or
+  # `repo "..."`. The label is a bare identifier and must be present; the
+  # value is the string that follows it.
+  defp labeled_string(state, label) do
+    with {:ok, _label_tok, after_label} <- expect_ident_value(state, label) do
+      trigger_string(after_label, label)
+    end
+  end
+
+  # `<label> "<value>"` when present, trimmed; otherwise `default`. A label
+  # that is not followed by a string also yields `default` and consumes
+  # nothing, so the dangling label is left for whatever parses next to
+  # report.
+  defp optional_labeled_string(state, label, default) do
+    with %{type: :ident, value: ^label} <- peek(state),
+         {:ok, value, rest} <- trigger_string(advance(state), label) do
+      {String.trim(value), rest}
+    else
+      _absent_or_malformed -> {default, state}
+    end
+  end
+
+  # Optional `input { ... }` block of a cron trigger, collapsed to plain
+  # data by `literal_input_map/1`. No `input` keyword, or a block that
+  # fails to parse, yields an empty map and consumes nothing, leaving the
+  # tokens for whatever parses next.
+  defp parse_optional_trigger_input(state) do
+    with %{type: :ident, value: "input"} <- peek(state),
+         {:ok, pairs, rest} <- parse_inputs_block(advance(state)) do
+      {literal_input_map(pairs), rest}
+    else
+      _absent_or_malformed -> {%{}, state}
+    end
+  end
+
+  # The cron input block is authored as literal pure values; unwrap each
+  # `{:literal, v}` to plain `v` so the trigger map round-trips through
+  # JSON. A value of any other shape is kept exactly as parsed.
+  defp literal_input_map(pairs) do
+    Map.new(pairs, fn {key, pure} ->
+      plain = with {:literal, value} <- pure, do: value
+      {key, plain}
+    end)
+  end
+
+  defp expect_ident_value(state, value) do
+    case peek(state) do
+      %{type: :ident, value: ^value} = ident_tok -> {:ok, ident_tok, advance(state)}
+      unexpected -> error(state, "expected #{inspect(value)}", token_value(unexpected))
+    end
+  end
+
+  defp trigger_string(state, what) do
+    case peek(state) do
+      %{type: :string} = string_tok -> {:ok, flatten_string(string_tok.value), advance(state)}
+      unexpected -> error(state, "expected a string for #{what}", token_value(unexpected))
+    end
+  end
+
+  defp normalize_label(label), do: String.downcase(String.trim(label))
+
+  # Collect statements until a closing brace or the end of input and return
+  # them in source order. The terminator is not consumed, and the first
+  # statement that fails to parse ends the loop with its error.
+  defp parse_statements(state, acc) do
+    next = peek(state)
+
+    if next == :eof or match?(%{type: :rbrace}, next) do
+      {:ok, Enum.reverse(acc), state}
+    else
+      with {:ok, stmt, rest} <- parse_statement(state) do
+        parse_statements(rest, [stmt | acc])
+      end
+    end
+  end
+
+  # A statement is `name <- effect`, `name = pure`, or a bare effect. Only
+  # an identifier followed by `<-` or `=` is a binding; every other opening
+  # (including an identifier followed by anything else) is handed to
+  # `parse_expr/1` from the statement's first token, so nothing has been
+  # consumed when the expression parser runs. A failure inside the bound
+  # expression or pure is returned as is.
+  defp parse_statement(state) do
+    with %{type: :ident} = ident <- peek(state),
+         after_name = advance(state),
+         %{type: marker} when marker in [:larrow, :equals] <- peek(after_name) do
+      body = advance(after_name)
+
+      case marker do
+        :larrow ->
+          with {:ok, expr, rest} <- parse_expr(body) do
+            {:ok, AST.bind(ident.value, expr), rest}
+          end
+
+        :equals ->
+          with {:ok, pure, rest} <- parse_pure(body) do
+            {:ok, AST.let(ident.value, pure), rest}
+          end
+      end
+    else
+      _not_a_binding -> parse_expr(state)
+    end
+  end
+
+  # --- expressions (effects and pures) -----------------------------------
+
+  # Dispatch on the token at the head; rejects report via `token_value/1` like sibling parsers.
+  defp parse_expr(state), do: parse_expr_at(peek(state), state)
+
+  defp parse_expr_at(%{type: :keyword, value: "agent"}, state), do: parse_agent(state)
+  defp parse_expr_at(%{type: :keyword, value: "exec"}, state), do: parse_exec(state)
+  defp parse_expr_at(%{type: :keyword, value: "subrun"}, state), do: parse_subrun(state)
+  defp parse_expr_at(%{type: :keyword, value: "when"}, state), do: parse_when(state)
+  defp parse_expr_at(%{type: :keyword, value: "every"}, state), do: parse_every(state)
+  defp parse_expr_at(%{type: :keyword, value: "map"}, state), do: parse_map(state)
+  defp parse_expr_at(%{type: :keyword, value: kw}, state),
+    do: error(state, "unexpected keyword #{inspect(kw)} in expression position", kw)
+  defp parse_expr_at(:eof, state), do: error(state, "unexpected end of input where an expression was expected", :eof)
+  defp parse_expr_at(other, state), do: error(state, "expected an effect (agent/exec/subrun/when/every/map)", token_value(other))
+
+  # Each effect reserves its id before its body is parsed, so ids follow
+  # source pre-order (a gate's id precedes its child's) and a re-parse of
+  # identical source rebuilds the same ids. `require_prompt/2` is given the
+  # state at the `agent` keyword, not the state after the closing brace.
+  defp parse_agent(state) do
+    {id, state} = next_id(state, "agent")
+
+    with {:ok, _, after_kw} <- expect(state, :keyword, "agent"),
+         {:ok, _, body_start} <- expect(after_kw, :lbrace, "{"),
+         {:ok, fields, body_end} <- parse_agent_fields(body_start, %{prompt: nil, inputs: %{}, envelope: %{}}),
+         {:ok, _, rest} <- expect(body_end, :rbrace, "}"),
+         {:ok, prompt} <- require_prompt(fields, state) do
+      {:ok, AST.agent(fields.envelope, prompt, fields.inputs, id), rest}
+    end
+  end
+
+  @envelope_keys ~w(engine model effort permissions location)
+
+  # Agent fields may be separated by newlines or commas; a comma in front
+  # of a field is skipped so both layouts parse the same.
+  defp parse_agent_fields(%{tokens: [%{type: :comma} | _]} = state, acc) do
+    parse_agent_fields(advance(state), acc)
+  end
+
+  defp parse_agent_fields(state, acc) do
+    case peek(state) do
+      %{type: :rbrace} ->
+        {:ok, acc, state}
+
+      %{type: :ident, value: "prompt"} ->
+        with {:ok, _, after_key} <- expect(state, :ident, "prompt"),
+             {:ok, _, after_colon} <- expect(after_key, :colon, ":"),
+             {:ok, prompt, rest} <- parse_prompt(after_colon) do
+          parse_agent_fields(rest, Map.replace!(acc, :prompt, prompt))
+        end
+
+      %{type: :ident, value: "inputs"} ->
+        with {:ok, _, after_key} <- expect(state, :ident, "inputs"),
+             {:ok, _, after_colon} <- expect(after_key, :colon, ":"),
+             {:ok, inputs, rest} <- parse_inputs_block(after_colon) do
+          parse_agent_fields(rest, Map.replace!(acc, :inputs, inputs))
+        end
+
+      %{type: :ident, value: key} when key in @envelope_keys ->
+        with {:ok, _, after_key} <- expect(state, :ident, key),
+             {:ok, _, after_colon} <- expect(after_key, :colon, ":"),
+             {:ok, value, rest} <- parse_envelope_value(after_colon, key) do
+          parse_agent_fields(rest, put_in(acc.envelope[key], value))
+        end
+
+      %{type: :ident, value: unknown} ->
+        error(state, "unknown agent field #{inspect(unknown)}", unknown)
+
+      unexpected ->
+        error(state, "expected an agent field name", token_value(unexpected))
+    end
+  end
+
+  # Envelope scalars are bare words (engine: codex) or strings
+  # (model: "gpt-5.3-codex"). A bare word may be an identifier or a keyword
+  # token; a string is flattened first. Values are kept as plain values for
+  # `Engine.Envelope.from_map/1` to validate downstream.
+  defp parse_envelope_value(state, _key) do
+    case peek(state) do
+      %{type: :string, value: v} -> {:ok, flatten_string(v), advance(state)}
+      %{type: kind, value: word} when kind in [:ident, :keyword] -> {:ok, word, advance(state)}
+      unexpected -> error(state, "expected an envelope value", token_value(unexpected))
+    end
+  end
+
+  # A prompt is `skill "<name>"` with an optional `{ ... }` bindings block
+  # (no block means empty bindings), or `inline <pure>`.
+  defp parse_prompt(state) do
+    case peek(state) do
+      %{type: :keyword, value: "inline"} ->
+        with {:ok, _, after_kw} <- expect(state, :keyword, "inline"),
+             {:ok, pure, rest} <- parse_pure(after_kw) do
+          {:ok, {:inline, pure}, rest}
+        end
+
+      %{type: :keyword, value: "skill"} ->
+        with {:ok, _, after_kw} <- expect(state, :keyword, "skill"),
+             {:ok, name_tok, after_name} <- expect_string(after_kw) do
+          if match?(%{type: :lbrace}, peek(after_name)) do
+            with {:ok, bindings, rest} <- parse_inputs_block(after_name) do
+              {:ok, {:skill, name_tok.value, bindings}, rest}
+            end
+          else
+            {:ok, {:skill, name_tok.value, %{}}, after_name}
+          end
+        end
+
+      unexpected ->
+        error(state, "expected a prompt (skill \"name\" or inline \"text\")", token_value(unexpected))
+    end
+  end
+
+  # exec <script> [timeout <int>] [{ inputs }]
+  #
+  # Returns `{:ok, exec_node, state}` or the first `{:error, diagnostic}`
+  # hit along the way.
+  defp parse_exec(state) do
+    {id, state} = next_id(state, "exec")
+
+    with {:ok, _, s1} <- expect(state, :keyword, "exec"),
+         {:ok, script, s2} <- parse_pure(s1),
+         {:ok, timeout, s3} <- parse_exec_timeout(s2),
+         {:ok, inputs, s4} <- parse_optional_inputs(s3) do
+      {:ok, AST.exec(script, timeout, inputs, id), s4}
+    end
+  end
+
+  # `parse_optional_timeout/1` yields `{nil, state}` both when there is no
+  # `timeout` clause and when `timeout` is not followed by an integer. The
+  # second case used to be dropped silently, leaving the stray keyword for
+  # whatever parses next to trip over with an unrelated message. Report it
+  # here, at the keyword, instead.
+  defp parse_exec_timeout(state) do
+    case {parse_optional_timeout(state), peek(state)} do
+      {{nil, _}, %{type: :keyword, value: "timeout"}} ->
+        error(state, "expected an integer after timeout", token_value(peek(advance(state))))
+
+      {{timeout, rest}, _} ->
+        {:ok, timeout, rest}
+    end
+  end
+
+  # Consume `timeout <int>` when both tokens are present and return the
+  # integer as a literal. In every other case, including a `timeout` keyword
+  # with no integer after it, nothing is consumed and the timeout is nil.
+  defp parse_optional_timeout(state) do
+    with %{type: :keyword, value: "timeout"} <- peek(state),
+         after_kw = advance(state),
+         %{type: :int, value: n} <- peek(after_kw) do
+      {AST.literal(n), advance(after_kw)}
+    else
+      _ -> {nil, state}
+    end
+  end
+
+  # subrun <source> [{ inputs }]
+  defp parse_subrun(state) do
+    {node_id, state} = next_id(state, "subrun")
+
+    with {:ok, _kw, after_kw} <- expect(state, :keyword, "subrun"),
+         {:ok, source, after_source} <- parse_pure(after_kw),
+         {:ok, inputs, rest} <- parse_optional_inputs(after_source) do
+      {:ok, AST.subrun(source, inputs, node_id), rest}
+    end
+  end
+
+  # when <condition> { <one statement> }
+  defp parse_when(state) do
+    {node_id, state} = next_id(state, "when")
+
+    with {:ok, _kw, after_kw} <- expect(state, :keyword, "when"),
+         {:ok, condition, after_condition} <- parse_pure(after_kw),
+         {:ok, body, rest} <- parse_block_single(after_condition) do
+      {:ok, AST.when_(condition, body, node_id), rest}
+    end
+  end
+
+  # every <int> of <counter> { <one statement> }
+  defp parse_every(state) do
+    {node_id, state} = next_id(state, "every")
+
+    with {:ok, _kw, after_kw} <- expect(state, :keyword, "every"),
+         {:ok, nth, after_nth} <- expect_int(after_kw),
+         {:ok, _of, after_of} <- expect(after_nth, :keyword, "of"),
+         {:ok, counter, after_counter} <- expect_ident(after_of),
+         {:ok, body, rest} <- parse_block_single(after_counter) do
+      {:ok, AST.every_nth(nth.value, counter.value, body, node_id), rest}
+    end
+  end
+
+  # map <collection> as <name> { <one statement> }
+  defp parse_map(state) do
+    {node_id, state} = next_id(state, "map")
+
+    with {:ok, _kw, after_kw} <- expect(state, :keyword, "map"),
+         {:ok, collection, after_collection} <- parse_pure(after_kw),
+         {:ok, _as, after_as} <- expect(after_collection, :keyword, "as"),
+         {:ok, binding, after_binding} <- expect_ident(after_as),
+         {:ok, body, rest} <- parse_block_single(after_binding) do
+      {:ok, AST.map_(collection, binding.value, body, node_id), rest}
+    end
+  end
+
+  # Parse `{ <statement> }`: a brace block holding exactly one statement.
+  # Per the original design note, a single statement keeps the gate's
+  # emitted child unambiguous, and a body that needs more than one effect
+  # nests another do-block.
+  defp parse_block_single(state) do
+    with {:ok, _open, inside} <- expect(state, :lbrace, "{"),
+         {:ok, statement, after_statement} <- parse_statement(inside),
+         {:ok, _close, rest} <- expect(after_statement, :rbrace, "}") do
+      {:ok, statement, rest}
+    end
+  end
+
+  # --- inputs blocks ------------------------------------------------------
+
+  # Parse an inputs block when the next token opens one; otherwise yield an
+  # empty map and leave the state untouched.
+  defp parse_optional_inputs(state) do
+    if match?(%{type: :lbrace}, peek(state)) do
+      parse_inputs_block(state)
+    else
+      {:ok, %{}, state}
+    end
+  end
+
+  # Parse `{ key: value, ... }` into a map of input name to pure value.
+  defp parse_inputs_block(state) do
+    with {:ok, _open, inside} <- expect(state, :lbrace, "{"),
+         {:ok, inputs, after_pairs} <- parse_input_pairs(inside, %{}),
+         {:ok, _close, rest} <- expect(after_pairs, :rbrace, "}") do
+      {:ok, inputs, rest}
+    end
+  end
+
+  # Accumulate `key: value` pairs into `acc` until the closing `}` is next.
+  # The `}` itself is left for the caller to consume.
+  #
+  # The comma between pairs is optional. A repeated key overwrites the
+  # earlier value (`Map.put/3`), so the last occurrence wins.
+  defp parse_input_pairs(state, acc) do
+    case peek(state) do
+      %{type: :rbrace} ->
+        {:ok, acc, state}
+
+      %{type: :ident, value: key} ->
+        with {:ok, _, s1} <- expect(state, :ident, key),
+             {:ok, _, s2} <- expect(s1, :colon, ":"),
+             {:ok, value, s3} <- parse_pure(s2) do
+          # Only the advanced state matters; whether a comma was present does not.
+          {_separator, s4} = skip_optional_comma(s3)
+          parse_input_pairs(s4, Map.put(acc, key, value))
+        end
+
+      other ->
+        error(state, "expected an input key", token_value(other))
+    end
+  end
+
+  # Step over one comma if it is the next token. The first element reports
+  # which case occurred (`:comma` or `:none`).
+  defp skip_optional_comma(state) do
+    if match?(%{type: :comma}, peek(state)) do
+      {:comma, advance(state)}
+    else
+      {:none, state}
+    end
+  end
+
+  # --- pure values --------------------------------------------------------
+
+  # Parse one pure value: a string (possibly interpolated), a number, one of
+  # the `true` / `false` / `null` keywords, a bare `${ref}`, or a list.
+  defp parse_pure(state) do
+    case peek(state) do
+      %{type: :lbracket} ->
+        parse_list(state)
+
+      %{type: :interp, value: path} ->
+        {:ok, interp_to_pure(path), advance(state)}
+
+      %{type: :string} = tok ->
+        {:ok, string_to_pure(tok.value), advance(state)}
+
+      %{type: numeric, value: number} when numeric in [:int, :float] ->
+        {:ok, AST.literal(number), advance(state)}
+
+      %{type: :keyword, value: word} when word in ["true", "false", "null"] ->
+        constant = Map.fetch!(%{"true" => true, "false" => false, "null" => nil}, word)
+        {:ok, AST.literal(constant), advance(state)}
+
+      unexpected ->
+        error(state, "expected a value (string, number, boolean, list, or ${ref})", token_value(unexpected))
+    end
+  end
+
+  # Parse `[ item, item, ... ]` into a list node.
+  defp parse_list(state) do
+    case expect(state, :lbracket, "[") do
+      {:ok, _open, inside} -> parse_list_items(inside, [])
+      failure -> failure
+    end
+  end
+
+  # Collect list items (newest first in `acc`) until the closing `]`, which
+  # is consumed here. A comma after an item is optional, so a trailing comma
+  # before `]` is accepted.
+  defp parse_list_items(state, acc) do
+    case peek(state) do
+      %{type: :rbracket} ->
+        {:ok, AST.list(Enum.reverse(acc)), advance(state)}
+
+      _ ->
+        with {:ok, item, after_item} <- parse_pure(state) do
+          {_separator, next} = skip_optional_comma(after_item)
+          # A `]` right after the item is handled by the first clause on recursion.
+          parse_list_items(next, [item | acc])
+        end
+    end
+  end
+
+  # Lower a string token's segment list to a pure value. An empty string
+  # and a single literal segment become a plain literal; anything carrying
+  # a `${path}` reference (or several segments) becomes a concat of literal
+  # and field segments for later resolution.
+  defp string_to_pure([]), do: AST.literal("")
+  defp string_to_pure([{:lit, text}]), do: AST.literal(text)
+  defp string_to_pure(parts) when is_list(parts), do: AST.concat(Enum.map(parts, &segment_to_pure/1))
+
+  # One string segment to its pure value: literal text stays a literal, a
+  # reference becomes a variable or field read.
+  defp segment_to_pure({:lit, text}) do
+    AST.literal(text)
+  end
+
+  defp segment_to_pure({:ref, path}) do
+    interp_to_pure(path)
+  end
+
+  # A one-element path (`${name}`) is the binding itself; a longer path
+  # (`${name.a.b}`) is a field read of binding `name` at `[a, b]`.
+  defp interp_to_pure([name]) do
+    AST.var(name)
+  end
+
+  defp interp_to_pure([name | path]) do
+    AST.field(AST.var(name), path)
+  end
+
+  # --- token helpers ------------------------------------------------------
+
+  # An agent must declare a prompt: return it, or a diagnostic at the
+  # current position when the accumulated fields carry none.
+  defp require_prompt(%{prompt: prompt}, _state) when not is_nil(prompt) do
+    {:ok, prompt}
+  end
+
+  defp require_prompt(%{prompt: nil}, state) do
+    error(state, "agent is missing a prompt field", :missing_prompt)
+  end
+
+  # Consume a string token if one is next, flattening its segments to plain
+  # text; otherwise return nil without consuming anything.
+  defp optional_string(state) do
+    token = peek(state)
+
+    if match?(%{type: :string}, token) do
+      {:ok, Map.update!(token, :value, &flatten_string/1), advance(state)}
+    else
+      {:ok, nil, state}
+    end
+  end
+
+  # Require a string token and return it with its segments flattened to
+  # plain text. Workflow and skill names are flat literals, so any
+  # interpolation is rendered back to its `${...}` source form rather than
+  # resolved.
+  defp expect_string(state) do
+    token = peek(state)
+
+    if match?(%{type: :string}, token) do
+      {:ok, Map.update!(token, :value, &flatten_string/1), advance(state)}
+    else
+      error(state, "expected a string", token_value(token))
+    end
+  end
+
+  # Render a segment list back to text: literals as-is, references in their
+  # `${a.b}` source form.
+  defp flatten_string(parts) do
+    render = fn
+      {:lit, text} -> text
+      {:ref, path} -> "${" <> Enum.join(path, ".") <> "}"
+    end
+
+    Enum.map_join(parts, "", render)
+  end
+
+  # Require an integer token (any value) and consume it.
+  defp expect_int(state) do
+    token = peek(state)
+
+    if match?(%{type: :int}, token) do
+      {:ok, token, advance(state)}
+    else
+      error(state, "expected an integer", token_value(token))
+    end
+  end
+
+  # Require an identifier token (any name) and consume it.
+  defp expect_ident(state) do
+    token = peek(state)
+
+    if match?(%{type: :ident}, token) do
+      {:ok, token, advance(state)}
+    else
+      error(state, "expected an identifier", token_value(token))
+    end
+  end
+
+  # Require the next token to be `type` and consume it; `literal` is the
+  # text quoted in the diagnostic.
+  #
+  # For `:keyword` and `:ident` tokens the value must also equal `literal`.
+  # Matching on type alone let any keyword stand in for another, so
+  # `every 3 as c { ... }` parsed where `of` is required. Other token types
+  # are still matched by type only, as before.
+  defp expect(state, type, literal) do
+    case peek(state) do
+      %{type: ^type, value: ^literal} = tok -> {:ok, tok, advance(state)}
+      %{type: ^type} = tok when type not in [:keyword, :ident] -> {:ok, tok, advance(state)}
+      other -> error(state, "expected #{inspect(literal)}", token_value(other))
+    end
+  end
+
+  # Succeed only when every token has been consumed; anything left over is
+  # reported as trailing input.
+  defp skip_to_end(state) do
+    token = peek(state)
+
+    if token == :eof do
+      :ok
+    else
+      error(state, "unexpected trailing input", token_value(token))
+    end
+  end
+
+  # The next token without consuming it, or `:eof` when none remain.
+  defp peek(%{tokens: []}) do
+    :eof
+  end
+
+  defp peek(%{tokens: [next | _]}) do
+    next
+  end
+
+  # Drop the next token. Advancing past the end is a no-op.
+  defp advance(%{tokens: []} = state) do
+    state
+  end
+
+  defp advance(%{tokens: [_consumed | remaining]} = state) do
+    %{state | tokens: remaining}
+  end
+
+  # What to report as "got" in a diagnostic: a token's value, `:eof` at end
+  # of input, or the term itself when it carries no `:value`.
+  defp token_value(:eof) do
+    :eof
+  end
+
+  defp token_value(%{value: value}) do
+    value
+  end
+
+  defp token_value(other) do
+    other
+  end
+
+  # Hand out the next positional id, `"<kind>-<n>"`, and bump the counter.
+  # The id depends only on how many ids were drawn before it, so re-parsing
+  # the same source yields the same ids. The original note adds that the
+  # interpreter combines this id with an expansion key to derive the final
+  # IR.Node id, which is what makes a deterministic replay stable.
+  defp next_id(state, kind) do
+    current = Map.fetch!(state, :counter)
+    {"#{kind}-#{current}", Map.replace!(state, :counter, current + 1)}
+  end
+
+  # Build an `{:error, diagnostic}` located at the next unconsumed token.
+  # `:file` is nil when the state carries none.
+  defp error(state, message, got) do
+    {line, column} = span_at(state)
+
+    diagnostic = %{
+      message: message,
+      line: line,
+      column: column,
+      file: Map.get(state, :file),
+      got: got
+    }
+
+    {:error, diagnostic}
+  end
+
+  # Position of the next unconsumed token. With no tokens left there is no
+  # position to read, so end-of-input diagnostics fall back to 1:1.
+  defp span_at(%{tokens: []}) do
+    {1, 1}
+  end
+
+  defp span_at(%{tokens: [%{line: line, column: column} | _]}) do
+    {line, column}
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/dsl/parser/lexer.ex b/packages/symphony/elixir/lib/symphony_elixir/dsl/parser/lexer.ex
new file mode 100644
index 000000000..bd6f8078d
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/dsl/parser/lexer.ex
@@ -0,0 +1,222 @@
+defmodule SymphonyElixir.DSL.Parser.Lexer do
+  @moduledoc """
+  Tokenize `.sym` source into a flat token list, each token carrying its
+  1-based line and column so the parser can attach a precise span to any
+  diagnostic.
+
+  The lexer owns three non-obvious decisions:
+
+  - String literals are emitted as a list of `{:lit, text}` and `{:ref,
+    path}` segments. `"summarize ${session.report}"` becomes `[{:lit,
+    "summarize "}, {:ref, ["session", "report"]}]`, so the parser can
+    lower interpolation to a `concat` of pure values without re-scanning.
+  - A bare `${path}` outside a string is its own `:interp` token, the
+    common shape for `when ${gate.ok} { ... }`.
+  - `#` starts a line comment to end of line. Comments and whitespace
+    advance the position counters but emit no token.
+  """
+
+  @keywords ~w(workflow agent exec subrun when every of map as skill inline timeout true false null)
+
+  @type segment :: {:lit, String.t()} | {:ref, [String.t()]}
+
+  @type token :: %{
+          type: atom(),
+          value: term(),
+          line: pos_integer(),
+          column: pos_integer()
+        }
+
+  @doc """
+  Tokenize `source` into a flat list of tokens in source order.
+
+  Returns `{:ok, tokens}` or `{:error, diagnostic}`, where the diagnostic is
+  a map with `:message`, `:line`, `:column`, and `:got`.
+
+  The scanners match one UTF-8 codepoint at a time, so a source containing
+  invalid UTF-8 would match no clause and raise instead of returning an
+  error. It is rejected up front; the diagnostic points at 1:1 because the
+  offending byte is not located.
+  """
+  @spec tokenize(String.t()) :: {:ok, [token()]} | {:error, map()}
+  def tokenize(source) when is_binary(source) do
+    if String.valid?(source) do
+      do_tokenize(source, 1, 1, [])
+    else
+      {:error, %{message: "source is not valid UTF-8", line: 1, column: 1, got: :invalid_utf8}}
+    end
+  end
+
+  # Main scanning loop. `line` / `col` are the 1-based position of the first
+  # character of the remaining input; `acc` holds the tokens emitted so far,
+  # newest first. Clause order matters: `<-` and `${` must be tried before
+  # the single-character and catch-all clauses.
+
+  # End of input: restore source order.
+  defp do_tokenize("", _line, _col, acc), do: {:ok, Enum.reverse(acc)}
+
+  # A newline starts the next line at column 1.
+  defp do_tokenize(<<"\n", rest::binary>>, line, _col, acc),
+    do: do_tokenize(rest, line + 1, 1, acc)
+
+  # Space, tab, and carriage return each advance one column and emit nothing.
+  defp do_tokenize(<<c::utf8, rest::binary>>, line, col, acc) when c in [?\s, ?\t, ?\r],
+    do: do_tokenize(rest, line, col + 1, acc)
+
+  # `#` comment: skip to (not past) the newline; the comment text is discarded.
+  defp do_tokenize(<<"#", rest::binary>>, line, col, acc) do
+    {_comment, rest_after, advanced} = take_line(rest, col + 1)
+    do_tokenize(rest_after, line, advanced, acc)
+  end
+
+  # Punctuation. Each token records the position of its first character.
+  defp do_tokenize(<<"<-", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 2, [tok(:larrow, "<-", line, col) | acc])
+
+  defp do_tokenize(<<"{", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 1, [tok(:lbrace, "{", line, col) | acc])
+
+  defp do_tokenize(<<"}", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 1, [tok(:rbrace, "}", line, col) | acc])
+
+  defp do_tokenize(<<"[", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 1, [tok(:lbracket, "[", line, col) | acc])
+
+  defp do_tokenize(<<"]", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 1, [tok(:rbracket, "]", line, col) | acc])
+
+  defp do_tokenize(<<":", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 1, [tok(:colon, ":", line, col) | acc])
+
+  defp do_tokenize(<<",", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 1, [tok(:comma, ",", line, col) | acc])
+
+  defp do_tokenize(<<"=", rest::binary>>, line, col, acc),
+    do: do_tokenize(rest, line, col + 1, [tok(:equals, "=", line, col) | acc])
+
+  # String literal: the token's value is the segment list from scan_string/5
+  # and its position is that of the opening quote.
+  defp do_tokenize(<<"\"", rest::binary>>, line, col, acc) do
+    case scan_string(rest, line, col + 1, [], []) do
+      {:ok, segments, rest_after, new_line, new_col} ->
+        do_tokenize(rest_after, new_line, new_col, [tok(:string, segments, line, col) | acc])
+
+      {:error, _} = err ->
+        err
+    end
+  end
+
+  # Bare `${path}` outside a string: an :interp token whose value is the path.
+  defp do_tokenize(<<"${", rest::binary>>, line, col, acc) do
+    case scan_interp(rest, line, col + 2) do
+      {:ok, path, rest_after, new_col} ->
+        do_tokenize(rest_after, line, new_col, [tok(:interp, path, line, col) | acc])
+
+      {:error, _} = err ->
+        err
+    end
+  end
+
+  # A leading digit starts a number; there is no clause for a leading sign.
+  defp do_tokenize(<<c::utf8, _::binary>> = bin, line, col, acc) when c in ?0..?9 do
+    {number, rest, advanced} = scan_number(bin, col)
+    do_tokenize(rest, line, advanced, [number_token(number, line, col) | acc])
+  end
+
+  # A word is a keyword when listed in @keywords, an identifier otherwise.
+  defp do_tokenize(<<c::utf8, _::binary>> = bin, line, col, acc)
+       when c in ?a..?z or c in ?A..?Z or c == ?_ do
+    {word, rest, advanced} = scan_ident(bin, col)
+    type = if word in @keywords, do: :keyword, else: :ident
+    do_tokenize(rest, line, advanced, [tok(type, word, line, col) | acc])
+  end
+
+  # Any other codepoint is an error at its own position.
+  defp do_tokenize(<<c::utf8, _::binary>>, line, col, _acc) do
+    {:error, %{message: "unexpected character #{inspect(<<c::utf8>>)}", line: line, column: col, got: <<c::utf8>>}}
+  end
+
+  # --- scanners -----------------------------------------------------------
+
+  # Read up to, but not including, the next newline (or end of input).
+  # Returns `{text, rest, col}` where `col` has advanced once per codepoint.
+  defp take_line(bin, col) do
+    take_line(bin, col, [])
+  end
+
+  defp take_line("", col, acc) do
+    {IO.iodata_to_binary(Enum.reverse(acc)), "", col}
+  end
+
+  defp take_line(<<"\n", _::binary>> = rest, col, acc) do
+    {IO.iodata_to_binary(Enum.reverse(acc)), rest, col}
+  end
+
+  defp take_line(<<c::utf8, rest::binary>>, col, acc) do
+    take_line(rest, col + 1, [<<c::utf8>> | acc])
+  end
+
+  # Scan the body of a double-quoted string (opening quote already consumed)
+  # into interpolation segments. `lit` accumulates the current literal run,
+  # newest first; `segs` holds the finished segments, newest first. A `${`
+  # opens an interpolation that closes at `}`.
+  #
+  # Returns `{:ok, segments, rest, line, col}` positioned just past the
+  # closing quote, or `{:error, diagnostic}`.
+  defp scan_string(<<"\"", rest::binary>>, line, col, lit, segs) do
+    segs = flush_lit(lit, segs)
+    {:ok, Enum.reverse(segs), rest, line, col + 1}
+  end
+
+  # A backslash directly before a line break keeps the newline in the
+  # string, exactly as the generic escape clause below would. It must also
+  # move the position to the start of the next line; treating it as a
+  # two-column escape left every later token with the wrong line and column.
+  defp scan_string(<<"\\\n", rest::binary>>, line, _col, lit, segs) do
+    scan_string(rest, line + 1, 1, ["\n" | lit], segs)
+  end
+
+  # Backslash escape: two source columns, one resulting character.
+  defp scan_string(<<"\\", c::utf8, rest::binary>>, line, col, lit, segs) do
+    scan_string(rest, line, col + 2, [unescape(c) | lit], segs)
+  end
+
+  # Interpolation: close the current literal run, then record the reference.
+  defp scan_string(<<"${", rest::binary>>, line, col, lit, segs) do
+    segs = flush_lit(lit, segs)
+
+    case scan_interp(rest, line, col + 2) do
+      {:ok, path, rest_after, new_col} ->
+        scan_string(rest_after, line, new_col, [], [{:ref, path} | segs])
+
+      {:error, _} = err ->
+        err
+    end
+  end
+
+  # An unescaped newline or end of input before the closing quote.
+  defp scan_string(<<"\n", _::binary>>, line, col, _lit, _segs) do
+    {:error, %{message: "unterminated string", line: line, column: col, got: :newline}}
+  end
+
+  defp scan_string("", line, col, _lit, _segs) do
+    {:error, %{message: "unterminated string", line: line, column: col, got: :eof}}
+  end
+
+  defp scan_string(<<c::utf8, rest::binary>>, line, col, lit, segs) do
+    scan_string(rest, line, col + 1, [<<c::utf8>> | lit], segs)
+  end
+
+  # Close the current literal run: prepend it to `segs` as one `{:lit, text}`
+  # segment, or leave `segs` alone when the run is empty.
+  defp flush_lit([], segs) do
+    segs
+  end
+
+  defp flush_lit(lit, segs) do
+    text = lit |> Enum.reverse() |> IO.iodata_to_binary()
+    [{:lit, text} | segs]
+  end
+
+  # Translate the character after a backslash. Unknown escapes yield the
+  # character itself, so `\$` is a literal `$`.
+  defp unescape(char) do
+    case char do
+      ?n -> "\n"
+      ?t -> "\t"
+      ?r -> "\r"
+      ?" -> "\""
+      ?\\ -> "\\"
+      other -> <<other::utf8>>
+    end
+  end
+
+  # An interpolation reference is a dotted path of identifiers terminated
+  # by `}`. `${session.report.ok}` -> ["session", "report", "ok"].
+  #
+  # `current` holds the characters of the segment being read, newest first;
+  # `acc` holds the finished segments, newest first. Returns
+  # `{:ok, path, rest, col}` positioned just past the `}`, or
+  # `{:error, diagnostic}`.
+  #
+  # Every segment must be non-empty. `${a..b}`, `${.a}`, and `${a.}` used to
+  # have their empty segments dropped, turning a typo into a reference to a
+  # different path; they are diagnostics now.
+  defp scan_interp(bin, line, col), do: scan_interp(bin, line, col, [], [])
+
+  defp scan_interp(<<"}", rest::binary>>, line, col, current, acc) do
+    case {current, acc} do
+      {[], []} ->
+        {:error, %{message: "empty interpolation", line: line, column: col, got: :empty_interp}}
+
+      {[], _} ->
+        # Trailing dot: `${a.}`.
+        {:error, %{message: "empty path segment in interpolation", line: line, column: col, got: "}"}}
+
+      _ ->
+        {:ok, Enum.reverse(flush_path(current, acc)), rest, col + 1}
+    end
+  end
+
+  # A dot with nothing before it: `${.a}` or `${a..b}`.
+  defp scan_interp(<<".", _rest::binary>>, line, col, [], _acc) do
+    {:error, %{message: "empty path segment in interpolation", line: line, column: col, got: "."}}
+  end
+
+  defp scan_interp(<<".", rest::binary>>, line, col, current, acc) do
+    scan_interp(rest, line, col + 1, [], flush_path(current, acc))
+  end
+
+  defp scan_interp(<<c::utf8, rest::binary>>, line, col, current, acc)
+       when c in ?a..?z or c in ?A..?Z or c in ?0..?9 or c == ?_ do
+    scan_interp(rest, line, col + 1, [<<c::utf8>> | current], acc)
+  end
+
+  defp scan_interp("", line, col, _current, _acc) do
+    {:error, %{message: "unterminated interpolation", line: line, column: col, got: :eof}}
+  end
+
+  defp scan_interp(<<c::utf8, _::binary>>, line, col, _current, _acc) do
+    {:error, %{message: "invalid character in interpolation #{inspect(<<c::utf8>>)}", line: line, column: col, got: <<c::utf8>>}}
+  end
+
+  # Close the current path segment: prepend it to `acc` as one binary, or
+  # leave `acc` alone when no characters were collected.
+  defp flush_path([], acc) do
+    acc
+  end
+
+  defp flush_path(current, acc) do
+    segment = current |> Enum.reverse() |> IO.iodata_to_binary()
+    [segment | acc]
+  end
+
+  # Read digits with at most one `.digit` fraction. Returns
+  # `{%{text: text, float?: boolean}, rest, col}`. A `.` that is not followed
+  # by a digit, or a second `.`, ends the number and stays in `rest`.
+  defp scan_number(bin, col) do
+    scan_number(bin, col, [], false)
+  end
+
+  defp scan_number(<<digit::utf8, rest::binary>>, col, acc, dot?) when digit in ?0..?9 do
+    scan_number(rest, col + 1, [<<digit::utf8>> | acc], dot?)
+  end
+
+  defp scan_number(<<".", digit::utf8, rest::binary>>, col, acc, false) when digit in ?0..?9 do
+    scan_number(rest, col + 2, [<<digit::utf8>>, "." | acc], true)
+  end
+
+  defp scan_number(rest, col, acc, dot?) do
+    digits = acc |> Enum.reverse() |> IO.iodata_to_binary()
+    {%{text: digits, float?: dot?}, rest, col}
+  end
+
+  # Turn scanned number text into a `:float` or `:int` token at the given
+  # position.
+  defp number_token(%{text: text, float?: true}, line, col) do
+    tok(:float, String.to_float(text), line, col)
+  end
+
+  defp number_token(%{text: text, float?: false}, line, col) do
+    tok(:int, String.to_integer(text), line, col)
+  end
+
+  # Read a run of ASCII letters, digits, and underscores. Returns
+  # `{word, rest, col}` with `col` advanced once per character.
+  defp scan_ident(bin, col) do
+    scan_ident(bin, col, [])
+  end
+
+  defp scan_ident(<<c::utf8, rest::binary>>, col, acc)
+       when c in ?a..?z or c in ?A..?Z or c in ?0..?9 or c == ?_ do
+    scan_ident(rest, col + 1, [<<c::utf8>> | acc])
+  end
+
+  defp scan_ident(rest, col, acc) do
+    word = acc |> Enum.reverse() |> IO.iodata_to_binary()
+    {word, rest, col}
+  end
+
+  # Build one token map; `col` is stored under `:column`.
+  defp tok(type, value, line, col) do
+    %{type: type, value: value, line: line, column: col}
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/dsl/schema.ex b/packages/symphony/elixir/lib/symphony_elixir/dsl/schema.ex
new file mode 100644
index 000000000..5d72f4bc4
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/dsl/schema.ex
@@ -0,0 +1,36 @@
+defmodule SymphonyElixir.DSL.Schema do
+  @moduledoc """
+  A single JSON-able snapshot of the vocabulary the runtime accepts:
+  engines, efforts, permission levels, placement locations, node kinds,
+  node states, effect kinds, and trigger kinds.
+
+  Every entry is read from the accessor on the module that owns that enum,
+  so the snapshot cannot drift from what a turn, a node, or the parser will
+  take. Forms and renderers are meant to build their option lists from
+  `to_map/0` instead of hard-coding literals; a value added at its owner
+  then reaches the UI without a form edit.
+  """
+
+  alias SymphonyElixir.DSL.{AST, Parser}
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.Node
+
+  @doc """
+  Gather the runtime enums into one map keyed by domain. The values come
+  straight from each accessor as atoms; `Jason.encode/1` renders them as
+  strings, so a consumer reads `"codex"`, `"high"`, `"workspace_write"`,
+  and so on.
+  """
+  @spec to_map() :: %{atom() => [atom()]}
+  def to_map do
+    Map.new(
+      engines: Envelope.engines(),
+      efforts: Envelope.efforts(),
+      permissions: Envelope.permission_levels(),
+      locations: Envelope.locations(),
+      node_kinds: Node.kinds(),
+      node_states: Node.states(),
+      effect_kinds: AST.effect_kinds(),
+      trigger_kinds: Parser.trigger_kinds()
+    )
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/engine/client.ex b/packages/symphony/elixir/lib/symphony_elixir/engine/client.ex
new file mode 100644
index 000000000..e84ca5c2d
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/engine/client.ex
@@ -0,0 +1,274 @@
+defmodule SymphonyElixir.Engine.Client do
+  @moduledoc """
+  The single door between the Elixir runtime and the room-server engine
+  host. Every engine turn the runtime issues passes through here, and
+  nothing else in `elixir/lib/` speaks the room-server wire. This is the
+  layer boundary the overhaul encodes: DSL -> IR -> Runtime ->
+  `Engine.Client` -> room-server, with `Engine.Client` the only module
+  that names the room-server's HTTP contract.
+
+  ## What it owns
+
+  - Lowering a typed `Engine.Envelope` plus a prompt and working
+    directory into the room-server's canonical `TurnRequest` JSON
+    (camelCase keys, the engine-agnostic shape from room-server's
+    `engine.rs` in the IX monorepo, mirrored by `contracts/fixtures`).
+  - Resolving the envelope's `location` to a concrete room-server base
+    URL. `:local`, `{:room, url}`, and the default config URL are
+    handled here; `:ixvm` and `{:host, name}` both resolve to the per-run
+    URL the run's `Runtime.Placement` provisioned (the run acquires its
+    own room-server before the first agent turn), looked up by `run_id`.
+    The same `run_id` lookup also serves an `:ixvm` node whose VM setup
+    failed and fell back to a host room-server, since the fallback
+    registers under the same `run_id`. A turn submitted without the
+    runtime's `run_id` context fails with a clear `{:unresolved_location,
+    _}` rather than silently routing to the default server.
+  - Speaking `POST /api/agent/turns` and parsing `AgentTurnResponse`
+    (`threadId`, `outcome`, `eventCount`, `usage`) into a runtime-facing
+    result, mapping the turn's terminal `usage` totals to the
+    `IR.Attempt.cost` shape so per-turn cost reaches the run.
+
+  The room-server runs the whole turn and returns its terminal outcome
+  plus the thread id it assigned, so the synchronous `submit_turn/2` is
+  the natural shape for a runtime that schedules one node attempt as one
+  monitored task. A streaming surface (subscribe to `EngineEvent`s,
+  answer approvals, interrupt) is a later addition behind the same module;
+  the synchronous turn is the smallest contract that drives a node to a
+  terminal state.
+
+  ## Known limitations
+
+  The room-server's `/api/agent/turns` is request/response: it blocks
+  until the turn completes. A turn that runs for an hour holds the HTTP
+  connection open for that hour, so `submit_turn/2` sets a long receive
+  timeout and the caller must run it off the runtime process (the runtime
+  already schedules each attempt in a monitored task). Approvals and
+  interrupts are not reachable through this synchronous path; an engine
+  configured for `:read_only` or `:workspace_write` that pauses for an
+  approval would stall until the timeout. Use `:danger_full_access` (or a
+  self-executing engine) for the synchronous path until the streaming
+  client lands.
+  """
+
+  alias SymphonyElixir.Engine.Envelope
+
+  @default_timeout_ms :timer.minutes(60)
+
+  @typedoc """
+  Everything a turn needs beyond the envelope: the prompt text the engine
+  runs, the working directory it runs in, the dynamic-tool specs the host
+  will execute, and the runtime correlation ids echoed on every event.
+  """
+  @type turn :: %{
+          required(:prompt) => String.t(),
+          required(:cwd) => String.t(),
+          optional(:tools) => [map()],
+          optional(:run_id) => String.t() | nil,
+          optional(:node_id) => String.t() | nil
+        }
+
+  @typedoc """
+  Result of a completed turn. `thread_id` is the engine handle the turn
+  opened, carried even on failure so the runtime can record it for a
+  later reattach probe.
+  """
+  @type result ::
+          {:ok,
+           %{
+             thread_id: String.t(),
+             event_count: non_neg_integer(),
+             cost: cost() | nil
+           }}
+          | {:error, term()}
+
+  @typedoc """
+  The turn's terminal token/cost totals, already mapped to the
+  `IR.Attempt.cost` shape so the runtime can store it without a second
+  translation. `nil` when the room-server reported no usage (an older
+  server or a turn that emitted none), so the runtime records "unknown"
+  rather than a sham zero. `:usd` is present only when the engine priced
+  the turn.
+  """
+  @type cost :: %{
+          optional(:usd) => float(),
+          optional(:tokens_in) => non_neg_integer(),
+          optional(:tokens_out) => non_neg_integer(),
+          optional(:cache_read) => non_neg_integer(),
+          optional(:cache_creation) => non_neg_integer()
+        }
+
+  @doc """
+  Run one engine turn through the room-server and return its terminal
+  outcome. The target room-server URL is resolved from the envelope's
+  location first, then the envelope and turn are lowered to a
+  `TurnRequest`, which is POSTed to `/api/agent/turns`; the response is
+  mapped to a `t:result/0`.
+
+  `opts` carries the URL resolution context and request tuning:
+
+  - `:room_server_url` - the default room-server base URL, used when the
+    envelope location is `:local`. Usually the value from `Config`.
+  - `:run_id` - the run whose provisioned room-server takes the turn.
+    Required when the envelope location is `:ixvm` or `{:host, name}`; it
+    is read from `opts`, not from `turn`, and a missing or unresolved run
+    yields `{:error, {:unresolved_location, location}}`.
+  - `:placement` - the module asked for `base_url(run_id)`. Defaults to
+    `SymphonyElixir.Runtime.Placement`; a test can pass a stub.
+  - `:req_options` - extra options merged into the `Req` request (tests
+    inject a `:plug` or `:base_url` stub here).
+  - `:timeout_ms` - receive timeout for the (long) turn. Defaults to one
+    hour.
+  """
+  @spec submit_turn(Envelope.t(), turn(), keyword()) :: result()
+  def submit_turn(%Envelope{location: location} = envelope, turn, opts \\ []) when is_map(turn) and is_list(opts) do
+    with {:ok, target_url} <- resolve_base_url(location, opts),
+         {:ok, payload} <- request_body(envelope, turn) do
+      post_turn(target_url, payload, opts)
+    end
+  end
+
+  @doc """
+  Lower a typed envelope plus a turn into the room-server's `TurnRequest`
+  JSON map (camelCase keys). Entries whose value is nil are left out, and
+  `effort` is present only when the envelope declares one.
+
+  Returns `{:error, :missing_prompt}` or `{:error, :missing_cwd}` when the
+  turn lacks a non-empty binary for that field. Public so a test can
+  assert the wire shape without a running server, and so a caller can
+  inspect what it would send.
+  """
+  @spec request_body(Envelope.t(), turn()) :: {:ok, map()} | {:error, term()}
+  def request_body(%Envelope{} = envelope, turn) when is_map(turn) do
+    with {:ok, prompt} <- fetch_prompt(turn),
+         {:ok, cwd} <- fetch_cwd(turn) do
+      wire = %{
+        "engine" => Atom.to_string(envelope.engine),
+        "model" => envelope.model,
+        "permissions" => Atom.to_string(envelope.permissions),
+        "cwd" => cwd,
+        "prompt" => prompt,
+        "tools" => Map.get(turn, :tools, []),
+        "runId" => Map.get(turn, :run_id),
+        "nodeId" => Map.get(turn, :node_id)
+      }
+
+      {:ok, wire |> put_effort(envelope.effort) |> drop_nil()}
+    end
+  end
+
+  # Add `"effort"` only when the envelope declared a budget. The original
+  # note explains that the room-server itself omits `effort` when null
+  # (serde skip_serializing_if), so the request mirrors that.
+  defp put_effort(body, nil) do
+    body
+  end
+
+  defp put_effort(body, effort) do
+    Map.put(body, "effort", Atom.to_string(effort))
+  end
+
+  # Remove every entry whose value is nil.
+  defp drop_nil(body) do
+    Map.filter(body, fn {_key, value} -> value != nil end)
+  end
+
+  # The turn's prompt, which must be a non-empty binary.
+  defp fetch_prompt(%{prompt: prompt}) when is_binary(prompt) and prompt != "" do
+    {:ok, prompt}
+  end
+
+  defp fetch_prompt(_turn) do
+    {:error, :missing_prompt}
+  end
+
+  # The turn's working directory, which must be a non-empty binary.
+  defp fetch_cwd(%{cwd: cwd}) when is_binary(cwd) and cwd != "" do
+    {:ok, cwd}
+  end
+
+  defp fetch_cwd(_turn) do
+    {:error, :missing_cwd}
+  end
+
+  # Turn an envelope location into a room-server base URL. `:local` uses the
+  # default URL from `opts`; `{:room, url}` uses the given non-empty URL;
+  # `:ixvm` and `{:host, _}` use the per-run URL looked up by `run_id`. Any
+  # other location is an explicit `{:invalid_location, _}` error rather
+  # than a silent fall-through to some server.
+  defp resolve_base_url(:local, opts) do
+    fetch_default_url(opts)
+  end
+
+  defp resolve_base_url({:room, url}, _opts) when is_binary(url) and url != "" do
+    {:ok, url}
+  end
+
+  defp resolve_base_url(:ixvm, opts) do
+    fetch_placement_url(:ixvm, opts)
+  end
+
+  defp resolve_base_url({:host, _name} = location, opts) do
+    fetch_placement_url(location, opts)
+  end
+
+  defp resolve_base_url(unknown, _opts) do
+    {:error, {:invalid_location, unknown}}
+  end
+
+  # Look up the room-server URL registered for this run. The placement
+  # module comes from `opts[:placement]` (default `Runtime.Placement`) so a
+  # test can resolve against a stub, and the run comes from
+  # `opts[:run_id]`. A missing or empty `run_id`, or a lookup that does not
+  # return `{:ok, non_empty_url}`, is an explicit `:unresolved_location`
+  # error and never falls through to the default server.
+  defp fetch_placement_url(location, opts) do
+    placement = Keyword.get(opts, :placement, SymphonyElixir.Runtime.Placement)
+
+    with run_id when is_binary(run_id) and run_id != "" <- Keyword.get(opts, :run_id),
+         {:ok, url} when is_binary(url) and url != "" <- placement.base_url(run_id) do
+      {:ok, url}
+    else
+      _ -> {:error, {:unresolved_location, location}}
+    end
+  end
+
+  # The default room-server URL from `opts[:room_server_url]`, which must be
+  # a non-empty binary.
+  defp fetch_default_url(opts) do
+    url = Keyword.get(opts, :room_server_url)
+
+    if is_binary(url) and url != "" do
+      {:ok, url}
+    else
+      {:error, :missing_room_server_url}
+    end
+  end
+
+  # POST the turn to `<base_url>/api/agent/turns`. `opts[:req_options]` is
+  # merged last, so it can override any default below. A 2xx response is
+  # parsed; any other status or a transport failure becomes a tagged error.
+  defp post_turn(base_url, body, opts) do
+    defaults = [
+      url: join(base_url, "/api/agent/turns"),
+      json: body,
+      receive_timeout: Keyword.get(opts, :timeout_ms, @default_timeout_ms),
+      connect_options: [timeout: 30_000]
+    ]
+
+    overrides = Keyword.get(opts, :req_options, [])
+
+    case Req.post(Keyword.merge(defaults, overrides)) do
+      {:ok, %{status: status, body: response}} when status in 200..299 ->
+        parse_response(response)
+
+      {:ok, %{status: status, body: response}} ->
+        {:error, {:agent_turn_status, status, response}}
+
+      {:error, reason} ->
+        {:error, {:agent_turn_failed, reason}}
+    end
+  end
+
+  # Map an `AgentTurnResponse` to a runtime result. The thread id defaults
+  # to "" when absent and is carried on the error and cancelled results
+  # too. A body without an `"outcome"` key, or an outcome of an unknown
+  # shape, is reported as unexpected.
+  defp parse_response(%{"outcome" => outcome} = response) do
+    thread_id = Map.get(response, "threadId", "")
+
+    case outcome do
+      %{"kind" => "ok"} ->
+        summary = %{
+          thread_id: thread_id,
+          event_count: Map.get(response, "eventCount", 0),
+          cost: parse_cost(Map.get(response, "usage"))
+        }
+
+        {:ok, summary}
+
+      %{"kind" => "error", "message" => message} ->
+        {:error, {:turn_error, message, thread_id}}
+
+      %{"kind" => "cancelled"} ->
+        {:error, {:turn_cancelled, thread_id}}
+
+      unknown ->
+        {:error, {:unexpected_outcome, unknown}}
+    end
+  end
+
+  defp parse_response(unexpected) do
+    {:error, {:unexpected_agent_response, unexpected}}
+  end
+
+  # Translate the room-server's camelCase `Usage` map into the cost shape
+  # the runtime stores. Token counts default to 0 when their key is absent;
+  # `costUsd` has no default, so `:usd` appears only when the response
+  # carried a price. Anything that is not a map (no `usage` in the
+  # response) yields nil, which lets the attempt record "unknown" rather
+  # than a made-up zero.
+  defp parse_cost(usage) when is_map(usage) do
+    drop_nil(%{
+      usd: Map.get(usage, "costUsd"),
+      tokens_in: Map.get(usage, "tokensIn", 0),
+      tokens_out: Map.get(usage, "tokensOut", 0),
+      cache_read: Map.get(usage, "cacheRead", 0),
+      cache_creation: Map.get(usage, "cacheCreation", 0)
+    })
+  end
+
+  defp parse_cost(_absent) do
+    nil
+  end
+
+  # Append `path` to `base_url`, first stripping any trailing slashes from
+  # the base so the result has exactly the separator `path` brings.
+  defp join(base_url, path) do
+    trimmed = String.trim_trailing(base_url, "/")
+    trimmed <> path
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/engine/envelope.ex b/packages/symphony/elixir/lib/symphony_elixir/engine/envelope.ex
new file mode 100644
index 000000000..7cd454264
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/engine/envelope.ex
@@ -0,0 +1,239 @@
+defmodule SymphonyElixir.Engine.Envelope do
+  @moduledoc """
+  The typed execution envelope for one agent node: which engine runs it,
+  with which model, at what reasoning effort, under which permissions, and
+  where the engine process lives.
+
+  This replaces the pre-overhaul magic strings, where the engine was
+  sniffed from a `codex_model` value (`opus`/`sonnet`/`haiku`/`claude*`),
+  `runtime:` meant "where Codex runs" but read like "which engine," and
+  codex-only fields (`sandbox`, `approval_policy`) were silently ignored
+  for Claude. Every axis is now explicit and validated at load.
+
+  ## Fields
+
+  - `engine` - `:codex` or `:claude`. Explicit; never inferred from the
+    model name.
+  - `model` - the model identifier passed through to the engine verbatim
+    (for example `gpt-5.3-codex` or `claude-opus-4-8`, or the `opus` /
+    `sonnet` / `haiku` aliases Claude accepts).
+  - `effort` - reasoning budget. One of `:none`, `:minimal`, `:low`,
+    `:medium`, `:high`, `:xhigh`, or `nil` to let the engine pick its
+    default.
+  - `permissions` - one engine-agnostic level: `:read_only`,
+    `:workspace_write`, or `:danger_full_access`. Each engine adapter
+    lowers this to its native shape (Codex sandbox + approval policy;
+    Claude permission mode / `--dangerously-skip-permissions`).
+  - `location` - where the engine process runs: `:local`, `:ixvm`,
+    `{:host, name}`, or `{:room, url}`. This is the deployment topology,
+    resolved by `Engine.Client` to a concrete room-server URL.
+
+  The dynamic-tool surface (`tools`) is intentionally NOT part of the
+  envelope: it is a property of the prompt/skill, not of execution.
+
+  Validation is strict and fails at load (`validate/1`): unknown keys,
+  a Claude-looking model under `engine: :codex` (or vice versa), an
+  out-of-range effort, an unknown permission level, or a malformed
+  location are all errors rather than silently-ignored fields.
+  """
+
+  @enforce_keys [:engine, :model]
+  defstruct [:engine, :model, :effort, :permissions, :location]
+
+  @engines [:codex, :claude]
+  @efforts [:none, :minimal, :low, :medium, :high, :xhigh]
+  @permissions [:read_only, :workspace_write, :danger_full_access]
+  # The placement targets a `location` can name. `:host` and `:room` carry
+  # a payload (`{:host, name}` / `{:room, url}`) so they are listed as the
+  # bare tag the form offers; the operator supplies the payload separately.
+  @locations [:local, :ixvm, :host, :room]
+
+  # The flat atom-union types are generated from the very lists the accessors
+  # and validator read, so what Dialyzer checks (`@type`) cannot drift from
+  # what the form and `validate/1` accept at runtime. Extending `@engines`,
+  # `@efforts`, or `@permissions` updates spec, accessor, and check together.
+  # ENG-1825. `location` stays hand-written below: its members carry payloads
+  # (`{:host, name}` / `{:room, url}`) that the bare-tag `@locations` list
+  # cannot express.
+  atom_union = fn [head | tail] ->
+    List.foldl(tail, head, fn member, union -> {:|, [], [union, member]} end)
+  end
+
+  @type engine :: unquote(atom_union.(@engines))
+  @type effort :: unquote(atom_union.(@efforts))
+  @type permissions :: unquote(atom_union.(@permissions))
+  @type location :: :local | :ixvm | {:host, String.t()} | {:room, String.t()}
+
+  @type t :: %__MODULE__{
+          engine: engine(),
+          model: String.t(),
+          effort: effort() | nil,
+          permissions: permissions(),
+          location: location()
+        }
+
+  @doc "Every engine an envelope may select (the `@engines` list)."
+  @spec engines() :: [engine()]
+  def engines, do: @engines
+
+  @doc "Every reasoning-effort value an envelope may declare (the `@efforts` list)."
+  @spec efforts() :: [effort()]
+  def efforts, do: @efforts
+
+  @doc "Every permission level an envelope may declare (the `@permissions` list)."
+  @spec permission_levels() :: [permissions()]
+  def permission_levels, do: @permissions
+
+  @doc "The bare placement tags a `location` may name; `:host` and `:room` additionally need a payload."
+  @spec locations() :: [atom()]
+  def locations, do: @locations
+
+  @doc """
+  Parse a plain map, as read out of a DSL node, into a validated
+  envelope. Keys may be strings or atoms. Returns `{:ok, envelope}`, or
+  `{:error, reason}` where the reason names the field that was rejected;
+  a non-map argument is `{:error, :envelope_not_map}`.
+  """
+  @spec from_map(map()) :: {:ok, t()} | {:error, term()}
+  def from_map(map) when not is_map(map), do: {:error, :envelope_not_map}
+
+  def from_map(map) do
+    # Fields are read in a fixed order and the first failure short-circuits,
+    # so the error always belongs to the earliest offending step.
+    with {:ok, fields} <- reject_unknown_keys(map),
+         {:ok, engine} <- fetch_engine(fields),
+         {:ok, model} <- fetch_model(fields),
+         {:ok, effort} <- fetch_effort(fields),
+         {:ok, permissions} <- fetch_permissions(fields),
+         {:ok, location} <- fetch_location(fields) do
+      # `permissions` / `location` may still be nil here; `validate/1`
+      # applies their defaults.
+      envelope = %__MODULE__{engine: engine, model: model, effort: effort}
+      validate(%{envelope | permissions: permissions, location: location})
+    end
+  end
+
+  @doc """
+  Validate a constructed envelope and fill in its defaults: a nil
+  `permissions` becomes `:workspace_write` and a nil `location` becomes
+  `:local`, both the conservative common case.
+  """
+  @spec validate(t()) :: {:ok, t()} | {:error, term()}
+  def validate(%__MODULE__{permissions: permissions, location: location} = envelope) do
+    env =
+      struct(envelope,
+        permissions: permissions || :workspace_write,
+        location: location || :local
+      )
+
+    with :ok <- check_engine(env.engine),
+         :ok <- check_model(env.model),
+         :ok <- check_effort(env.effort),
+         :ok <- check_permissions(env.permissions),
+         :ok <- check_location(env.location),
+         :ok <- check_engine_model_agree(env.engine, env.model) do
+      {:ok, env}
+    end
+  end
+
+  @doc """
+  Report whether `model` names a Claude model: after trimming and
+  down-casing it either starts with `claude` or is one of the `opus` /
+  `sonnet` / `haiku` aliases. Deliberately a loose prefix/alias match, not
+  an exhaustive list, so new model names need no code change.
+  """
+  @spec claude_model?(String.t()) :: boolean()
+  def claude_model?(model) when is_binary(model) do
+    name = String.downcase(String.trim(model))
+    name in ["opus", "sonnet", "haiku"] or match?("claude" <> _, name)
+  end
+
+  # String-normalize every key, then refuse the map if any key lies outside
+  # the envelope vocabulary; the offending keys are reported sorted.
+  defp reject_unknown_keys(map) do
+    fields = for {key, value} <- map, into: %{}, do: {to_string(key), value}
+
+    case Enum.sort(Map.keys(fields) -- ~w(engine model effort permissions location)) do
+      [] -> {:ok, fields}
+      unknown -> {:error, {:unknown_envelope_keys, unknown}}
+    end
+  end
+
+  # Required fields: a missing key is reported as `:missing_envelope_field`.
+  defp fetch_engine(%{"engine" => engine}), do: to_known_atom(engine, @engines, :invalid_engine)
+  defp fetch_engine(_), do: {:error, {:missing_envelope_field, "engine"}}
+
+  defp fetch_model(fields) do
+    case Map.fetch(fields, "model") do
+      :error -> {:error, {:missing_envelope_field, "model"}}
+      {:ok, model} when not is_binary(model) -> {:error, {:invalid_model, model}}
+      {:ok, model} -> trimmed_model(model, String.trim(model))
+    end
+  end
+
+  defp trimmed_model(raw, ""), do: {:error, {:invalid_model, raw}}
+  defp trimmed_model(_raw, trimmed), do: {:ok, trimmed}
+
+  # Optional fields: an absent key and an explicit nil both read as nil.
+  defp fetch_effort(fields), do: optional(fields["effort"], &to_known_atom(&1, @efforts, :invalid_effort))
+  defp fetch_permissions(fields),
+    do: optional(fields["permissions"], &to_known_atom(&1, @permissions, :invalid_permissions))
+
+  defp fetch_location(fields), do: optional(fields["location"], &parse_location/1)
+
+  defp optional(nil, _parse), do: {:ok, nil}
+  defp optional(value, parse), do: parse.(value)
+
+  # Tags may be atoms or strings; payloads come as string-keyed maps or tagged tuples.
+  defp parse_location(tag) when tag in ["local", :local], do: {:ok, :local}
+  defp parse_location(tag) when tag in ["ixvm", :ixvm], do: {:ok, :ixvm}
+  defp parse_location(%{"host" => host}) when is_binary(host) and host != "", do: {:ok, {:host, host}}
+  defp parse_location(%{"room" => room}) when is_binary(room) and room != "", do: {:ok, {:room, room}}
+  defp parse_location({tag, v} = loc) when tag in [:host, :room] and is_binary(v) and v != "", do: {:ok, loc}
+  defp parse_location(other), do: {:error, {:invalid_location, other}}
+
+  # Resolve `value` to a member of `allowed` without creating atoms: strings
+  # are trimmed and down-cased, then compared against the members' names.
+  defp to_known_atom(value, allowed, error) when is_binary(value) do
+    wanted = String.downcase(String.trim(value))
+
+    case Enum.filter(allowed, &(Atom.to_string(&1) == wanted)) do
+      [atom | _] -> {:ok, atom}
+      [] -> {:error, {error, value}}
+    end
+  end
+
+  # Atoms must already be members; every other term is rejected outright.
+  defp to_known_atom(value, allowed, error),
+    do: if(is_atom(value) and value in allowed, do: {:ok, value}, else: {:error, {error, value}})
+
+  # Each check returns :ok or `{:error, {tag, offending_value}}`.
+  defp check_engine(engine), do: one_of(engine, @engines, :invalid_engine)
+  defp check_effort(effort), do: one_of(effort, [nil | @efforts], :invalid_effort)
+  defp check_permissions(perm), do: one_of(perm, @permissions, :invalid_permissions)
+
+  defp check_model(model) do
+    if is_binary(model) and model != "", do: :ok, else: {:error, {:invalid_model, model}}
+  end
+
+  defp check_location(location) do
+    case location do
+      tag when tag in [:local, :ixvm] -> :ok
+      {tag, payload} when tag in [:host, :room] and is_binary(payload) and payload != "" -> :ok
+      other -> {:error, {:invalid_location, other}}
+    end
+  end
+
+  defp one_of(value, allowed, tag), do: if(value in allowed, do: :ok, else: {:error, {tag, value}})
+
+  # The mismatch guard the pre-overhaul code could not express: `:codex` must
+  # not carry a Claude-looking model and `:claude` must carry one. Either
+  # disagreement is a load error, never a silent mis-route.
+  defp check_engine_model_agree(engine, model) when engine in [:codex, :claude] do
+    case {engine, claude_model?(model)} do
+      {:codex, false} -> :ok
+      {:claude, true} -> :ok
+      _disagree -> {:error, {:engine_model_mismatch, engine, model}}
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/github_app.ex b/packages/symphony/elixir/lib/symphony_elixir/github_app.ex
new file mode 100644
index 000000000..d6b2b8aa0
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/github_app.ex
@@ -0,0 +1,256 @@
+defmodule SymphonyElixir.GithubApp do
+  @moduledoc """
+  Mint and cache installation access tokens for a configured GitHub App.
+
+  Why this exists:
+
+  - PRs authored under an installation token show up under the App's
+    bot identity (`<app-slug>[bot]`) at the API level. Workflow packs
+    that gate behavior on a specific bot author (e.g. auto-merge guards)
+    rely on this. PRs authored with a human PAT bypass that gate.
+  - Doing the JWT signature in Elixir via `:public_key.sign/4` keeps
+    token minting in-process with no `openssl` dependency on the host.
+  - Centralizing the mint in one process lets us cache the installation
+    token across nodes in the same run (and across runs in the same
+    hour) instead of paying the JWT + REST round-trip on every node.
+
+  Token lifecycle:
+
+  - Build a JWT signed with the App's RSA private key (RS256). `iat`
+    is 60s in the past for clock skew tolerance; `exp` is 9 minutes out
+    (GitHub caps JWT exp at 10 minutes).
+  - POST that JWT to `/app/installations/<id>/access_tokens` to receive
+    the installation token. GitHub installation tokens expire after one
+    hour.
+  - Cache the token until `expires_at - skew`. The skew must be long
+    enough for a Codex node to finish implementation and still push with
+    the token stamped into the workspace's git config.
+
+  This module is a no-op when `SYMPHONY_GITHUB_APP_ID` is unset. That is
+  the dev-laptop default; production hosts must set the App credentials.
+  Callers that require the bot identity should match on
+  `{:error, :not_configured}` and decide whether to fail or proceed
+  with the ambient `GITHUB_TOKEN`.
+  """
+
+  use GenServer
+
+  alias SymphonyElixir.Config
+
+  require Logger
+
+  @table :symphony_github_app_token
+
+  # Re-mint when the cached token has less than this much life left.
+  # GitHub installation tokens last 60 minutes. Skill nodes routinely spend
+  # 10-15 minutes before their final git push, and the token is copied into
+  # the workspace's git config only once at node startup. Keep enough
+  # headroom that a token accepted at startup is still valid at publish time.
+  @reissue_skew_seconds 30 * 60
+
+  # GitHub JWT max exp is 10 minutes from iat. Use 9 to leave a safety
+  # margin against clock skew between this host and api.github.com.
+  @jwt_lifetime_seconds 9 * 60
+  @jwt_clock_skew_seconds 60
+
+  @type token :: %{token: String.t(), expires_at: DateTime.t(), installation_id: integer()}
+
+  @doc "Start the token server as a singleton registered under the module name."
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []),
+    do: GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+
+  @doc """
+  Return a usable installation token. A cached token is served straight
+  from ETS while it has more than `@reissue_skew_seconds` of life left;
+  otherwise the GenServer is asked to mint (30s call timeout). Yields
+  `{:error, :not_configured}` when the App credentials are absent (dev
+  laptops) and `{:error, reason}` on any other mint failure.
+  """
+  @spec installation_token() :: {:ok, String.t()} | {:error, term()}
+  def installation_token do
+    # Fast path: read in the caller's process, no GenServer round-trip.
+    with [{:current, %{token: token, expires_at: expires_at}}] <- :ets.lookup(@table, :current),
+         true <- DateTime.diff(expires_at, DateTime.utc_now()) > @reissue_skew_seconds do
+      {:ok, token}
+    else
+      # Cold or stale cache: hand the mint to the server.
+      [] -> GenServer.call(__MODULE__, :mint, 30_000)
+      false -> GenServer.call(__MODULE__, :mint, 30_000)
+    end
+  end
+
+  @doc """
+  True iff `SYMPHONY_GITHUB_APP_ID` and the private key are both
+  configured, judged by `configured?/1` against the current `Config.get/0`
+  snapshot.
+  Used by the IR exec runner to decide whether to attempt token injection
+  at all.
+  """
+  @spec configured?() :: boolean()
+  def configured?, do: configured?(Config.get())
+
+  @doc """
+  Pure variant: the caller passes the config snapshot, so tests can probe
+  the decision without the Config GenServer running.
+  """
+  @spec configured?(Config.t() | map()) :: boolean()
+  def configured?(%{github_app_id: id, github_app_private_key_pem: pem})
+      when is_binary(id) and id != "" and is_binary(pem) and pem != "",
+      do: true
+
+  def configured?(_), do: false
+
+  @impl true
+  def init(_opts) do
+    # Named and public so `installation_token/0` can read the cache from
+    # whichever process calls it; the server state itself stays empty.
+    :ets.new(@table, [:named_table, :public, {:read_concurrency, true}])
+    {:ok, %{}}
+  end
+
+  @impl true
+  def handle_call(:mint, _from, state) do
+    # Calls are handled one at a time here, so look again before minting:
+    # an earlier caller may have refreshed the cache after this caller's
+    # own ETS read.
+    with [{:current, %{token: token, expires_at: expires_at}}] <- :ets.lookup(@table, :current),
+         true <- DateTime.diff(expires_at, DateTime.utc_now()) > @reissue_skew_seconds do
+      {:reply, {:ok, token}, state}
+    else
+      # Nothing cached, or the cached token is inside the re-issue window.
+      [] -> do_mint(state)
+      false -> do_mint(state)
+    end
+  end
+
+  # Mint, cache the whole entry under `:current`, reply with the token string.
+  defp do_mint(state) do
+    with {:ok, %{token: token} = entry} <- mint_token() do
+      :ets.insert(@table, {:current, entry})
+      {:reply, {:ok, token}, state}
+    else
+      {:error, reason} = failure ->
+        Logger.warning("GithubApp mint failed: #{inspect(reason)}")
+        {:reply, failure, state}
+    end
+  end
+
+  # Full mint pipeline; the first failing step's `{:error, _}` is returned as-is.
+  @spec mint_token() :: {:ok, token()} | {:error, term()}
+  defp mint_token do
+    with config = Config.get(),
+         :ok <- ensure_configured(config),
+         :ok <- ensure_owner_repo(config),
+         {:ok, private_key} <- decode_pem(config.github_app_private_key_pem),
+         {:ok, app_jwt} <- build_jwt(config.github_app_id, private_key),
+         {:ok, install_id} <- fetch_installation_id(app_jwt, config.github_app_owner_repo),
+         {:ok, payload} <- request_installation_token(app_jwt, install_id) do
+      parse_token_response(payload, install_id)
+    end
+  end
+
+  # Same rule as `configured?/1`: blank credentials count as unconfigured.
+  defp ensure_configured(%Config{github_app_id: id, github_app_private_key_pem: pem})
+       when is_binary(id) and id != "" and is_binary(pem) and pem != "",
+       do: :ok
+  defp ensure_configured(_), do: {:error, :not_configured}
+
+  # The installation lookup URL is built from this value, so it must be a non-empty binary.
+  defp ensure_owner_repo(%Config{github_app_owner_repo: <<_, _::binary>>}), do: :ok
+
+  defp ensure_owner_repo(_), do: {:error, :missing_owner_repo}
+
+  # Decode the first PEM entry into a key term. Later entries are ignored;
+  # a PEM that yields no entries at all is `:pem_empty`.
+  defp decode_pem(pem) when is_binary(pem) do
+    pem |> :public_key.pem_decode() |> List.first() |> decode_pem_entry()
+  end
+
+  defp decode_pem_entry(nil), do: {:error, :pem_empty}
+
+  defp decode_pem_entry(entry) do
+    {:ok, :public_key.pem_entry_decode(entry)}
+  rescue
+    e -> {:error, {:pem_decode_failed, Exception.message(e)}}
+  end
+
+  # Build and RS256-sign the App JWT. `iat` is backdated by
+  # `@jwt_clock_skew_seconds` and `exp` sits `@jwt_lifetime_seconds` ahead
+  # of now; a segment that fails to encode aborts with its error.
+  defp build_jwt(app_id, private_key) when is_binary(app_id) do
+    issued_at = System.system_time(:second)
+
+    claims = %{
+      "iss" => app_id,
+      "iat" => issued_at - @jwt_clock_skew_seconds,
+      "exp" => issued_at + @jwt_lifetime_seconds
+    }
+
+    with {:ok, header_b64} <- encode_segment(%{"alg" => "RS256", "typ" => "JWT"}),
+         {:ok, claims_b64} <- encode_segment(claims) do
+      unsigned = "#{header_b64}.#{claims_b64}"
+      signature = unsigned |> :public_key.sign(:sha256, private_key) |> Base.url_encode64(padding: false)
+      {:ok, unsigned <> "." <> signature}
+    end
+  end
+
+  # Serialize one JWT segment: JSON first, then unpadded URL-safe base64.
+  # A JSON failure is tagged `:json_encode_failed`.
+  defp encode_segment(segment), do: segment |> Jason.encode() |> wrap_segment()
+
+  defp wrap_segment({:ok, json}), do: {:ok, Base.url_encode64(json, padding: false)}
+  defp wrap_segment({:error, reason}), do: {:error, {:json_encode_failed, reason}}
+
+  # Look up the installation for `owner_repo`. Only a 200 whose body carries
+  # an integer "id" is a success; any other response is a lookup failure.
+  defp fetch_installation_id(jwt, owner_repo) when is_binary(owner_repo) do
+    endpoint = "https://api.github.com/repos/#{owner_repo}/installation"
+
+    with {:ok, %{status: status, body: body}} <- Req.get(endpoint, headers: gh_headers(jwt)) do
+      case body do
+        %{"id" => id} when status == 200 and is_integer(id) -> {:ok, id}
+        _ -> {:error, {:installation_lookup_failed, status, body}}
+      end
+    else
+      {:error, reason} -> {:error, {:installation_lookup_transport, reason}}
+    end
+  end
+
+  # Exchange the App JWT for an installation token; success is a 201 with a map body.
+  defp request_installation_token(jwt, installation_id) do
+    endpoint = "https://api.github.com/app/installations/#{installation_id}/access_tokens"
+
+    with {:ok, %{status: status, body: body}} <- Req.post(endpoint, headers: gh_headers(jwt), body: "") do
+      if status == 201 and is_map(body) do
+        {:ok, body}
+      else
+        {:error, {:token_mint_failed, status, body}}
+      end
+    else
+      {:error, reason} -> {:error, {:token_mint_transport, reason}}
+    end
+  end
+
+  # Build the cache entry from the token payload. Both fields must be
+  # binaries and `expires_at` must parse as ISO 8601.
+  defp parse_token_response(%{"token" => token, "expires_at" => iso}, installation_id)
+       when is_binary(token) and is_binary(iso) do
+    with {:ok, expires_at, _utc_offset} <- DateTime.from_iso8601(iso) do
+      {:ok, %{token: token, expires_at: expires_at, installation_id: installation_id}}
+    else
+      {:error, reason} -> {:error, {:invalid_expires_at, reason}}
+    end
+  end
+
+  defp parse_token_response(other, _id), do: {:error, {:malformed_token_payload, other}}
+
+  # Headers for every GitHub call made here; the JWT is sent as a Bearer credential.
+  defp gh_headers(jwt) do
+    auth = {"authorization", "Bearer " <> jwt}
+    api_version = {"x-github-api-version", "2022-11-28"}
+    agent = {"user-agent", "symphony-github-app/0.2.0"}
+
+    [{"accept", "application/vnd.github+json"}, auth, api_version, agent]
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/attempt.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/attempt.ex
new file mode 100644
index 000000000..25e465647
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/attempt.ex
@@ -0,0 +1,98 @@
+defmodule SymphonyElixir.IR.Attempt do
+  @moduledoc """
+  One execution attempt of one `IR.Node`. A node accumulates attempts as
+  it is retried or recovered after a crash, so the run record explains
+  whether a node was retried, by which engine, at what cost, and how each
+  attempt ended.
+
+  `thread_id` is the room-server thread/session handle for the attempt.
+  It is the reattach probe used on restart: a node found `:running` after
+  a BEAM restart is reconciled by asking the engine for the status of
+  this thread (see `IR.Node` and the runtime recovery path).
+
+  `events_ref` points at the streamed event log for the attempt rather
+  than inlining it, so the durable run file stays small.
+  """
+
+  @enforce_keys [:n, :engine, :state]
+  defstruct [
+    :n,
+    :engine,
+    :thread_id,
+    :state,
+    :started_at,
+    :finished_at,
+    :outcome,
+    :cost,
+    :events_ref
+  ]
+
+  @typedoc """
+  What executed the attempt. `:codex`/`:claude` are engine turns; `:exec`
+  is a pack shell script; `:subrun` is a child run. A non-agent node has
+  no engine, so its attempt records the executor kind instead of a sham
+  `:codex`.
+  """
+  @type engine :: :codex | :claude | :exec | :subrun
+  @type state :: :running | :succeeded | :failed | :timeout | :cancelled | :stranded
+
+  @typedoc """
+  Resolved outcome of a finished attempt. `:stranded` marks an attempt
+  whose owning task or BEAM died without reporting a result; the runtime
+  cannot assume it had no side effects.
+  """
+  @type outcome ::
+          :ok
+          | {:error, term()}
+          | :timeout
+          | :cancelled
+          | :stranded
+
+  @type cost :: %{
+          optional(:usd) => float(),
+          optional(:tokens_in) => non_neg_integer(),
+          optional(:tokens_out) => non_neg_integer(),
+          optional(:cache_read) => non_neg_integer(),
+          optional(:cache_creation) => non_neg_integer()
+        }
+
+  @type t :: %__MODULE__{
+          n: pos_integer(),
+          engine: engine(),
+          thread_id: String.t() | nil,
+          state: state(),
+          started_at: DateTime.t() | nil,
+          finished_at: DateTime.t() | nil,
+          outcome: outcome() | nil,
+          cost: cost() | nil,
+          events_ref: String.t() | nil
+        }
+
+  @states [:running, :succeeded, :failed, :timeout, :cancelled, :stranded]
+  @engines [:codex, :claude, :exec, :subrun]
+
+  @doc "Every state a persisted attempt may hold (the `@states` list); the source of truth for safe decode."
+  @spec states() :: [state()]
+  def states, do: @states
+
+  @doc "Every executor kind an attempt may record (the `@engines` list); the source of truth for safe decode."
+  @spec engines() :: [engine()]
+  def engines, do: @engines
+
+  @doc """
+  Open attempt number `n` for `engine`: state `:running`, `started_at` set
+  to the current UTC time, every other field nil. `n` must be a positive
+  integer and `engine` one of `engines/0`; `thread_id` is optional.
+  """
+  @spec start(pos_integer(), engine(), String.t() | nil) :: t()
+  def start(n, engine, thread_id \\ nil)
+      when is_integer(n) and n >= 1 and engine in @engines do
+    fields = [n: n, engine: engine, thread_id: thread_id, state: :running, started_at: DateTime.utc_now()]
+    struct!(__MODULE__, fields)
+  end
+
+  @doc "Close `attempt` with its final state, outcome and optional cost, stamping `finished_at` (UTC)."
+  @spec finish(t(), state(), outcome(), cost() | nil) :: t()
+  def finish(%__MODULE__{} = attempt, state, outcome, cost \\ nil),
+    do: struct!(attempt, state: state, outcome: outcome, cost: cost, finished_at: DateTime.utc_now())
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/graph.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/graph.ex
new file mode 100644
index 000000000..e3864c683
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/graph.ex
@@ -0,0 +1,210 @@
+defmodule SymphonyElixir.IR.Graph do
+  @moduledoc """
+  Pure operations over a `RunGraph`. No process state, no IO: every
+  function takes a graph (and arguments) and returns a new graph or a
+  derived value. The `Runtime` GenServer owns the side effects
+  (scheduling tasks, persisting); this module owns the graph algebra it
+  schedules against.
+
+  The two load-bearing rules:
+
+  - Dependency satisfaction is read off `IR.Node.deps`, which is itself
+    derived from `inputs` (`IR.Node.deps_from_inputs/1`). A node is ready
+    only when every dep has reached `:succeeded`.
+  - Failure propagates. When a node fails, each transitive dependent that
+    is still waiting transitions to `:upstream_failed` unless its trigger
+    rule opts to run on failure. A dependent already running or terminal
+    is left alone; the runtime reconciles those through the task path.
+
+  `ready_nodes/1` is the scheduler's input, `apply_output/3` is the
+  scheduler's commit step, and `reset_node/2` is the retry path.
+  """
+
+  alias SymphonyElixir.IR.{Node, RunGraph}
+
+  @doc """
+  Nodes that may start now: state `:pending`, `:ready`, or `:retrying`, not
+  a placeholder kind, with every dep `:succeeded` (no deps means ready at
+  once). Running and terminal nodes never appear, so a graph with live
+  tasks is never asked to reschedule an in-flight node. A `:retrying` node
+  is one a crash stranded and policy cleared for another attempt; it is
+  schedulable again with its attempt history preserved.
+
+  Sorted by id, so a deterministic replay schedules in a deterministic order.
+  """
+  @schedulable [:pending, :ready, :retrying]
+
+  # `:gate` and `:map_fanout` nodes are dynamic-expansion placeholders, not
+  # runnable work. The materializer retires a resolved one to `:skipped`
+  # before the next schedule pass; filtering the kinds here still holds if a
+  # placeholder's deps are satisfied before expansion runs, so one is never
+  # handed to an executor as if it were an agent turn.
+  @placeholder_kinds [:gate, :map_fanout]
+
+  @spec ready_nodes(RunGraph.t()) :: [Node.t()]
+  def ready_nodes(%RunGraph{nodes: nodes}) do
+    startable =
+      for {_key, node} <- nodes,
+          node.kind not in @placeholder_kinds,
+          node.state in @schedulable,
+          deps_satisfied?(node, nodes),
+          do: node
+
+    Enum.sort_by(startable, & &1.id)
+  end
+
+  @doc """
+  Whether every dependency of `node` is present in `nodes` and `:succeeded`.
+  A node with no deps is satisfied; a dep id missing from `nodes` is not.
+  """
+  @spec deps_satisfied?(Node.t(), %{String.t() => Node.t()}) :: boolean()
+  def deps_satisfied?(%Node{deps: deps}, nodes) when is_map(nodes) do
+    Enum.all?(deps, fn dep_id ->
+      match?(%Node{state: :succeeded}, Map.get(nodes, dep_id))
+    end)
+  end
+
+  @doc """
+  Commit the result of a node's attempt and re-derive dependent states.
+
+  `result` is `{:ok, output}` or `{:error, reason}`. Success moves the node
+  to `:succeeded` carrying `output`, which can unlock dependents on the next
+  `ready_nodes/1`. Failure moves it to `:failed` and propagates to
+  dependents that do not opt to run on failure (see
+  `trigger_runs_on_failure?/1`). An unknown `node_id` returns the graph
+  untouched.
+
+  Re-applying the same result yields the same node states; callers that
+  already made a node terminal via reconciliation should not re-apply.
+  """
+  @spec apply_output(RunGraph.t(), String.t(), {:ok, term()} | {:error, term()}) :: RunGraph.t()
+  def apply_output(%RunGraph{nodes: nodes} = graph, node_id, result) do
+    case nodes do
+      %{^node_id => node} -> commit_result(graph, node, result)
+      %{} -> graph
+    end
+  end
+
+  # Success: store the output on the node and bump the graph timestamp.
+  defp commit_result(%RunGraph{} = graph, %Node{} = node, {:ok, output}) do
+    store(graph, %{node | state: :succeeded, output: output, updated_at: DateTime.utc_now()})
+  end
+
+  # Failure: store the error tuple, then fail waiting dependents transitively.
+  defp commit_result(%RunGraph{} = graph, %Node{id: id} = node, {:error, _reason} = error) do
+    failed = %{node | state: :failed, output: error, updated_at: DateTime.utc_now()}
+    graph |> store(failed) |> propagate_upstream_failed(id)
+  end
+
+  defp store(graph, node),
+    do: %{graph | nodes: Map.put(graph.nodes, node.id, node), updated_at: DateTime.utc_now()}
+
+  @doc """
+  Mark every node transitively downstream of `failed_id` that is still
+  schedulable (`:pending`/`:ready`/`:retrying`) and does not run on failure
+  as `:upstream_failed`. Already-running or terminal dependents are left
+  for the runtime's task path to resolve. Re-running leaves node states
+  unchanged: nodes already `:upstream_failed` stop the walk.
+  """
+  @spec propagate_upstream_failed(RunGraph.t(), String.t()) :: RunGraph.t()
+  def propagate_upstream_failed(%RunGraph{nodes: nodes} = graph, failed_id) do
+    now = DateTime.utc_now()
+
+    updated =
+      nodes
+      |> direct_dependents(failed_id)
+      |> Enum.reduce(nodes, fn dependent, acc ->
+        if dependent.state in @schedulable and not trigger_runs_on_failure?(dependent) do
+          marked = %{dependent | state: :upstream_failed, updated_at: now}
+          acc = Map.put(acc, dependent.id, marked)
+          # Recurse so a chain a -> b -> c fails c when a fails, not just b.
+          %{nodes: deeper} = propagate_upstream_failed(%{graph | nodes: acc}, dependent.id)
+          deeper
+        else
+          acc
+        end
+      end)
+
+    %{graph | nodes: updated, updated_at: now}
+  end
+
+  # The nodes that list `dep_id` directly among their own deps (one hop
+  # only; the caller does the transitive walk).
+  defp direct_dependents(nodes, dep_id) do
+    for {_key, node} <- nodes, dep_id in node.deps, do: node
+  end
+
+  @doc """
+  The trigger rule for failure propagation. The default is conservative: a
+  node does not run once a dependency failed. A node opts in by carrying
+  `inputs["__on_failure__"]` set to exactly the `{:literal, true}` sentinel,
+  which the interpreter emits for combinators that want to observe a failed
+  upstream (error handlers, cleanup). Kept narrow on purpose; widen only
+  when a combinator needs it.
+
+  NOTE(review): `ready_nodes/1` still requires every dep to be `:succeeded`,
+  so a node spared here is not scheduled by this module; confirm the runtime does.
+  """
+  @spec trigger_runs_on_failure?(Node.t()) :: boolean()
+  def trigger_runs_on_failure?(%Node{inputs: %{"__on_failure__" => {:literal, true}}}), do: true
+  def trigger_runs_on_failure?(_node), do: false
+
+  @doc """
+  Put a node back to `:pending` for a retry: its prior output is cleared
+  and its timestamp refreshed, while every other field, including the
+  attempt history, is carried over. Retry policy is the caller's decision;
+  this is only the pure state transition. An unknown `node_id` returns the
+  graph unchanged.
+  """
+  @spec reset_node(RunGraph.t(), String.t()) :: RunGraph.t()
+  def reset_node(%RunGraph{nodes: nodes} = graph, node_id) do
+    with {:ok, node} <- Map.fetch(nodes, node_id) do
+      pending = %{node | state: :pending, output: nil, updated_at: DateTime.utc_now()}
+      %{graph | nodes: %{nodes | node_id => pending}, updated_at: DateTime.utc_now()}
+    else
+      :error -> graph
+    end
+  end
+
+  @doc "The nodes whose state is `:running`; the runtime owns the live task for each of them."
+  @spec running_nodes(RunGraph.t()) :: [Node.t()]
+  def running_nodes(%RunGraph{nodes: nodes}) do
+    for {_key, node} <- nodes, node.state == :running, do: node
+  end
+
+  @doc "True when the graph has at least one node and every node is terminal per `IR.Node.terminal?/1`."
+  @spec all_terminal?(RunGraph.t()) :: boolean()
+  def all_terminal?(%RunGraph{nodes: nodes}) do
+    map_size(nodes) > 0 and Enum.all?(nodes, fn {_key, node} -> Node.terminal?(node) end)
+  end
+
+  @doc "True when at least one node is `:failed` or, having been unable to run, `:upstream_failed`."
+  @spec any_failed?(RunGraph.t()) :: boolean()
+  def any_failed?(%RunGraph{nodes: nodes}) do
+    nodes |> Map.values() |> Enum.any?(fn %{state: state} -> state in [:failed, :upstream_failed] end)
+  end
+
+  @doc """
+  The terminal run status implied by the node states, or `:running` while
+  any node is non-terminal. Once all are terminal: any `:failed` or
+  `:upstream_failed` node gives `:failed`, otherwise any `:cancelled` node
+  gives `:cancelled`, otherwise `:succeeded`. Used by the runtime to stamp
+  the final `RunGraph.status`.
+
+  An empty node map is a no-op run and finishes `:succeeded`, the deliberate
+  counterpart to `all_terminal?/1`, which treats an empty map as non-terminal.
+  """
+  @spec finished_status(RunGraph.t()) :: RunGraph.status() | :running
+  def finished_status(%RunGraph{nodes: nodes}) when map_size(nodes) == 0, do: :succeeded
+
+  def finished_status(%RunGraph{nodes: nodes} = graph) do
+    cancelled? = Enum.any?(nodes, fn {_key, node} -> node.state == :cancelled end)
+
+    case {all_terminal?(graph), any_failed?(graph), cancelled?} do
+      {false, _, _} -> :running
+      {true, true, _} -> :failed
+      {true, false, true} -> :cancelled
+      {true, false, false} -> :succeeded
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/materializer.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/materializer.ex
new file mode 100644
index 000000000..c4cefdfa4
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/materializer.ex
@@ -0,0 +1,255 @@
+defmodule SymphonyElixir.IR.Materializer do
+  @moduledoc """
+  The seam between the DSL interpreter and the durable IR graph. It runs
+  `DSL.Interpreter.expand/3` and folds the result into a `RunGraph`: the
+  initial materialization at run start, and the dynamic re-expansion that
+  emits a gate's or fan-out's children once the gating output arrives.
+
+  Pure: every function takes a graph (or the pieces to build one) and
+  returns a new graph. The `Runtime` GenServer owns scheduling and
+  persistence; this module owns turning interpreter output into graph
+  nodes and expansion-log events.
+
+  ## Why re-expansion is a merge, not a replace
+
+  `DSL.Interpreter.expand/3` is a pure function of `(ast, known_outputs,
+  expansion_log)`. Each call re-emits every node the current
+  `known_outputs` justify, with content-derived stable ids. So the
+  materializer cannot blindly overwrite: a node already materialized and
+  possibly already `:running` or `:succeeded` must keep its live state. It
+  merges by id, adding only nodes the graph has never seen and preserving
+  the state of nodes it already has. The expansion log grows the same way:
+  the interpreter returns the prior log plus this pass's new events, so
+  the materializer takes the returned log as the new one.
+
+  This is exactly the restart-replay invariant from `IR.RunGraph`:
+  re-running the interpreter against the recorded outputs and log
+  reconstructs the same node set, so a live re-expansion and a
+  cold replay produce identical graphs.
+  """
+
+  alias SymphonyElixir.DSL.{AST, Interpreter}
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Node, RunGraph}
+
+  @doc """
+  Build the initial `RunGraph` for a run from its AST.
+
+  The AST is expanded against no known outputs and an empty expansion log,
+  the interpreter's `pending` set is folded into node deps, and every
+  agent node's envelope is lowered to a typed `Engine.Envelope`. On
+  success the graph carries the validated nodes and the first pass's
+  expansion log, and its status is set to `:running`.
+
+  Envelope validation is the load-time fail-fast: a malformed envelope
+  fails the whole run with `{:error, {:invalid_envelope, node_id, reason}}`
+  and an agent node without an envelope map fails it with
+  `{:error, {:missing_envelope, node_id}}`, rather than scheduling the node.
+  """
+  @spec materialize(String.t(), binary(), AST.workflow()) :: {:ok, RunGraph.t()} | {:error, term()}
+  def materialize(run_id, source_hash, ast) when is_binary(run_id) and is_binary(source_hash) do
+    {emitted, pending, log} = Interpreter.expand(ast, %{}, [])
+
+    case emitted |> thread_pending_deps(pending) |> validate_envelopes() do
+      {:ok, validated} ->
+        base = RunGraph.new(run_id, source_hash, ast)
+        populated = RunGraph.put_nodes(base, validated)
+        logged = put_log(populated, log)
+        {:ok, Map.put(logged, :status, :running)}
+
+      {:error, _reason} = failure ->
+        failure
+    end
+  end
+
+  @doc """
+  Re-expand the AST against the outputs of succeeded nodes and merge the
+  fresh expansion into the graph. Returns `{:ok, graph, new_node_ids}` so
+  the runtime knows which ids first appeared on this pass, or
+  `{:error, reason}` when a node to apply fails envelope validation.
+
+  The merge is by id, with state deciding what survives:
+
+  - A node the graph has never seen is added.
+  - A node the graph holds at `:pending` is replaced by the fresh
+    version, because the only thing that changes a still-pending node is
+    a dependency output it was waiting on resolving. This is what lets a
+    deferred prompt fold from `{:inline, nil}` to its real text, and a
+    skill binding fold from an unresolved node ref to the resolved value,
+    once the referenced node succeeds. The node's `created_at` and
+    `attempts` are preserved so the identity and history are unbroken.
+  - A node the graph holds in any other state (for example `:running` or
+    terminal) keeps its live state; the fresh expansion never clobbers a
+    node mid-flight.
+
+  A resolved gate retires its placeholder. A `when`/`map` placeholder the
+  interpreter emitted while its gating output was unknown is no longer
+  re-emitted once that output resolves (the interpreter emits the body
+  instead). A still-`:pending` placeholder that the fresh expansion no
+  longer produces is marked `:skipped`, so the placeholder does not sit
+  `:pending` forever and deadlock the run. This is the load-bearing pair
+  with the runtime's deadlock guard.
+
+  A newly-emitted agent node has its envelope validated and lowered the
+  same way as the initial pass; an invalid envelope on a dynamically
+  emitted child fails with `{:error, {:invalid_envelope, id, reason}}`,
+  and an agent node with no envelope map fails with
+  `{:error, {:missing_envelope, id}}`.
+
+  A graph with no `ast` (a hand-built graph in a test, or a pre-DSL run)
+  is returned unchanged as `{:ok, graph, []}`: there is nothing to
+  re-expand.
+  """
+  @spec expand_dynamic(RunGraph.t()) :: {:ok, RunGraph.t(), [String.t()]} | {:error, term()}
+  def expand_dynamic(%RunGraph{ast: %{kind: :workflow} = ast} = graph) do
+    known = known_outputs(graph)
+    {nodes, pending, log} = Interpreter.expand(ast, known, graph.expansion_log)
+    nodes = thread_pending_deps(nodes, pending)
+
+    # `to_apply` is what gets written; `emitted_ids` is everything this pass
+    # produced, including nodes left untouched because they are live.
+    {to_apply, new_ids} = mergeable(nodes, graph.nodes)
+    emitted_ids = MapSet.new(nodes, & &1.id)
+
+    with {:ok, validated} <- validate_envelopes(to_apply) do
+      updated =
+        graph
+        |> RunGraph.put_nodes(validated)
+        |> retire_resolved_placeholders(emitted_ids)
+        |> put_log(log)
+
+      {:ok, updated, new_ids}
+    end
+  end
+
+  # A graph with no AST, or an `ast` that is not a reified workflow (a
+  # hand-built graph in a test, or a pre-DSL run), has nothing to
+  # re-expand. Return it unchanged.
+  def expand_dynamic(%RunGraph{} = graph), do: {:ok, graph, []}
+
+  @placeholder_kinds [:gate, :map_fanout]
+
+  # Sweep out placeholders the fresh expansion stopped emitting. A gate or
+  # fan-out placeholder that is still `:pending` and whose id is absent from
+  # `emitted_ids` is flipped to `:skipped` so it leaves the non-terminal
+  # set. Placeholders in any other state, and all non-placeholder nodes,
+  # pass through unchanged.
+  defp retire_resolved_placeholders(%RunGraph{nodes: nodes} = graph, emitted_ids) do
+    swept =
+      for {id, node} <- nodes, into: %{} do
+        resolved? =
+          node.kind in @placeholder_kinds and node.state == :pending and
+            not MapSet.member?(emitted_ids, id)
+
+        if resolved? do
+          {id, %{node | state: :skipped, updated_at: DateTime.utc_now()}}
+        else
+          {id, node}
+        end
+      end
+
+    %{graph | nodes: swept, updated_at: DateTime.utc_now()}
+  end
+
+  @doc """
+  Map of node id to output for every node in state `:succeeded`. Nodes in
+  any other state are left out. This is the `known_outputs` argument
+  handed to the interpreter on re-expansion.
+  """
+  @spec known_outputs(RunGraph.t()) :: %{optional(String.t()) => term()}
+  def known_outputs(%RunGraph{nodes: nodes}) do
+    nodes
+    |> Enum.filter(&match?({_id, %Node{state: :succeeded}}, &1))
+    |> Map.new(fn {id, %Node{output: output}} -> {id, output} end)
+  end
+
+  # Run every node through `lower_envelope/1`, preserving input order.
+  # Returns `{:ok, lowered_nodes}` when all succeed, or the first
+  # `{:error, _}` encountered; nodes after the failing one are not visited.
+  defp validate_envelopes(nodes) do
+    outcome =
+      Enum.reduce_while(nodes, [], fn node, lowered_rev ->
+        case lower_envelope(node) do
+          {:ok, lowered} -> {:cont, [lowered | lowered_rev]}
+          {:error, _} = failure -> {:halt, failure}
+        end
+      end)
+
+    case outcome do
+      lowered_rev when is_list(lowered_rev) -> {:ok, Enum.reverse(lowered_rev)}
+      {:error, _} = failure -> failure
+    end
+  end
+
+  # Lower one node's envelope. Clause order matters: the struct clause must
+  # precede the `is_map/1` clause because a struct is also a map.
+
+  # Agent node whose envelope is already a typed `Envelope`: nothing to do.
+  defp lower_envelope(%Node{kind: :agent, envelope: %Envelope{}} = node), do: {:ok, node}
+
+  # Agent node with a raw spec map: build the typed envelope, tagging a
+  # failure with the node id.
+  defp lower_envelope(%Node{kind: :agent, envelope: spec, id: id} = node) when is_map(spec) do
+    case Envelope.from_map(spec) do
+      {:ok, envelope} -> {:ok, %{node | envelope: envelope}}
+      {:error, reason} -> {:error, {:invalid_envelope, id, reason}}
+    end
+  end
+
+  # Agent node whose envelope is neither a struct nor a map (e.g. `nil`).
+  defp lower_envelope(%Node{kind: :agent, id: id}), do: {:error, {:missing_envelope, id}}
+  # Any non-agent node passes through untouched.
+  defp lower_envelope(%Node{} = node), do: {:ok, node}
+
+  # Decide, per emitted node, what a re-expansion may write into the graph.
+  # Returns `{to_apply, new_ids}`, both in emission order: `to_apply` is
+  # the nodes to put into the graph and `new_ids` the ids the graph had
+  # never held. See `merge_emitted/3` for the per-node rule.
+  defp mergeable(emitted, existing) do
+    {apply_rev, new_rev} = Enum.reduce(emitted, {[], []}, &merge_emitted(&1, existing, &2))
+    {Enum.reverse(apply_rev), Enum.reverse(new_rev)}
+  end
+
+  # One step of the merge, by the state of the node already in the graph:
+  #
+  # - held at `:pending`: the fresh node replaces it (this is how a
+  #   deferred prompt or binding folds to its resolved value), keeping the
+  #   old `created_at` and `attempts`. Deps are the union of old and fresh:
+  #   once a ref folds to a literal the fresh pass derives no edge for it,
+  #   but the old edge is kept.
+  # - held in any other state: left untouched, so a live node is never
+  #   clobbered.
+  # - not held at all: added, and its id recorded as new.
+  defp merge_emitted(%Node{id: id} = fresh, existing, {apply_acc, new_acc}) do
+    case existing do
+      %{^id => %Node{state: :pending} = held} ->
+        carried = %{
+          fresh
+          | created_at: held.created_at,
+            attempts: held.attempts,
+            deps: Enum.uniq(held.deps ++ fresh.deps)
+        }
+
+        {[carried | apply_acc], new_acc}
+
+      %{^id => _live} ->
+        {apply_acc, new_acc}
+
+      _absent ->
+        {[fresh | apply_acc], [id | new_acc]}
+    end
+  end
+
+  # Add the interpreter's `pending` reads to node deps. Each
+  # `{:awaiting, origin, needed}` entry contributes `needed` ids to the
+  # node whose `id` equals `origin`; several entries for one origin are
+  # concatenated in order. A node with no awaited ids is returned as is;
+  # otherwise the awaited ids are appended to its deps and de-duplicated.
+  # Without this, a node whose prompt or input mixes a literal with a node
+  # read would carry no dep for that read and could run too early.
+  defp thread_pending_deps(nodes, pending) do
+    awaited_by_origin =
+      Enum.reduce(pending, %{}, fn {:awaiting, origin, needed}, by_origin ->
+        Map.update(by_origin, origin, needed, fn seen -> seen ++ needed end)
+      end)
+
+    Enum.map(nodes, fn %Node{id: id, deps: deps} = node ->
+      extra = Map.get(awaited_by_origin, id, [])
+
+      if extra == [] do
+        node
+      else
+        %{node | deps: Enum.uniq(deps ++ extra)}
+      end
+    end)
+  end
+
+  # Replace the graph's expansion log with `log` (the interpreter hands
+  # back prior events plus this pass's), making sure every event carries an
+  # `:at` timestamp.
+  defp put_log(%RunGraph{} = graph, log) do
+    stamped = for event <- log, do: normalize_event(event)
+    %{graph | expansion_log: stamped, updated_at: DateTime.utc_now()}
+  end
+
+  # An event that already has `:at` is kept verbatim; one without is
+  # stamped with the current time.
+  defp normalize_event(event) when is_map_key(event, :at), do: event
+  defp normalize_event(event), do: Map.put(event, :at, DateTime.utc_now())
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/node.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/node.ex
new file mode 100644
index 000000000..f685ebdbb
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/node.ex
@@ -0,0 +1,181 @@
+defmodule SymphonyElixir.IR.Node do
+  @moduledoc """
+  One node in the intermediate-representation graph: the durable unit the
+  runtime schedules, persists, recovers, and exposes to operators.
+
+  The IR graph is what the DSL interpreter emits. The monadic DSL surface
+  composes at the AST layer; evaluating the AST emits these plain-data
+  nodes (eval-as-emission). Nothing here is a host closure, so a node can
+  be serialized, inspected in the dashboard, retried in isolation, and
+  rebuilt deterministically after a restart.
+
+  ## Identity and origin
+
+  - `id` is stable and content-derived (a hash of `ast_origin` plus the
+    `expansion_key`), so the same logical node keeps the same id across a
+    deterministic replay of the run.
+  - `ast_origin` names the AST construct that emitted the node, so a
+    retry can re-run the right slice of the interpreter.
+  - `expansion_key` distinguishes the instances a dynamic construct emits
+    (one per fan-out element, or per `everyNth` iteration); `nil` for
+    statically-emitted nodes.
+
+  ## Edges
+
+  `deps` is DERIVED from `inputs`, never hand-written: an input that
+  references another node's output is a dependency edge. Two nodes whose
+  inputs do not reference each other have no edge and run in parallel.
+  This is how the runtime gets auto-parallelism without a `needs:` list.
+
+  ## Kinds
+
+  - `:agent` - an engine turn; carries an `envelope` and a prompt.
+  - `:exec` - a shell script under the pack; carries no envelope.
+  - `:subrun` - a first-class child run; its output is the child result.
+  - `:map_fanout` / `:gate` - dynamic-expansion placeholders that emit
+    children when their gating input resolves. They carry no envelope.
+  """
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.Attempt
+
+  @enforce_keys [:id, :ast_origin, :kind, :inputs, :deps, :state]
+  defstruct [
+    :id,
+    :ast_origin,
+    :kind,
+    :envelope,
+    :prompt_ref,
+    :inputs,
+    :deps,
+    :expansion_key,
+    :state,
+    :output,
+    :created_at,
+    :updated_at,
+    attempts: []
+  ]
+
+  @type kind :: :agent | :exec | :subrun | :map_fanout | :gate
+
+  @typedoc """
+  Node lifecycle. `:upstream_failed` is set when a dependency failed and
+  the node's trigger rule did not allow it to run; `:stranded` is set
+  when an attempt's task or BEAM died without a result. Both are distinct
+  terminal-ish states so operators can tell why a node did not run.
+  """
+  @type state ::
+          :pending
+          | :ready
+          | :running
+          | :succeeded
+          | :failed
+          | :skipped
+          | :upstream_failed
+          | :retrying
+          | :cancelled
+          | :stranded
+
+  @typedoc """
+  A reference an input resolves against. `{:node, id, path}` reads a
+  (possibly nested) field of another node's output; `{:literal, value}`
+  is a constant computed at expand-time.
+  """
+  @type input_ref ::
+          {:node, String.t(), [term()]}
+          | {:literal, term()}
+
+  @typedoc """
+  How a node's prompt is built. A `{:skill, ref, bindings}` reference is
+  rendered by `SymphonyElixir.Prompt`; `{:inline, text}` is a literal.
+  """
+  @type prompt_ref ::
+          {:skill, String.t(), map()}
+          | {:inline, String.t()}
+          | nil
+
+  @type t :: %__MODULE__{
+          id: String.t(),
+          ast_origin: term(),
+          kind: kind(),
+          envelope: Envelope.t() | nil,
+          prompt_ref: prompt_ref(),
+          inputs: %{optional(String.t()) => input_ref()},
+          deps: [String.t()],
+          expansion_key: term() | nil,
+          state: state(),
+          output: term() | nil,
+          attempts: [Attempt.t()],
+          created_at: DateTime.t() | nil,
+          updated_at: DateTime.t() | nil
+        }
+
+  @kinds [:agent, :exec, :subrun, :map_fanout, :gate]
+  @states [
+    :pending,
+    :ready,
+    :running,
+    :succeeded,
+    :failed,
+    :skipped,
+    :upstream_failed,
+    :retrying,
+    :cancelled,
+    :stranded
+  ]
+  @terminal [:succeeded, :failed, :skipped, :upstream_failed, :cancelled]
+
+  @doc "The node kinds the interpreter may emit. Source of truth for safe decode."
+  @spec kinds() :: [kind()]
+  def kinds, do: @kinds
+
+  @doc "Every node state. Source of truth for safe decode."
+  @spec states() :: [state()]
+  def states, do: @states
+
+  @doc "States after which a node will not run again without operator action."
+  @spec terminal_states() :: [state()]
+  def terminal_states, do: @terminal
+
+  @doc """
+  Whether the node's `state` is one of `terminal_states/0`. Note that
+  `:stranded` and `:retrying` are not in that list, so such nodes are
+  reported as non-terminal.
+  """
+  @spec terminal?(t()) :: boolean()
+  def terminal?(%__MODULE__{state: state}), do: state in @terminal
+
+  @doc """
+  Build a node from a keyword list. `:id`, `:ast_origin` and `:kind` are
+  required (a missing one raises `KeyError`); `:inputs` defaults to `%{}`,
+  `:state` to `:pending`, `:attempts` to `[]`, and the remaining fields to
+  `nil`. `deps` is always derived from `inputs` via `deps_from_inputs/1`,
+  so the two can never disagree; a `:deps` entry in `fields` is ignored.
+  `created_at` and `updated_at` are both set to the same current time.
+  """
+  @spec new(keyword()) :: t()
+  def new(fields) when is_list(fields) do
+    stamp = DateTime.utc_now()
+    inputs = Keyword.get(fields, :inputs, %{})
+
+    # Required keys are fetched first, in this order, so a missing key is
+    # reported before anything derived from the optional ones.
+    id = Keyword.fetch!(fields, :id)
+    ast_origin = Keyword.fetch!(fields, :ast_origin)
+    kind = Keyword.fetch!(fields, :kind)
+    envelope = Keyword.get(fields, :envelope)
+    prompt_ref = Keyword.get(fields, :prompt_ref)
+    deps = deps_from_inputs(inputs)
+
+    %__MODULE__{
+      id: id,
+      ast_origin: ast_origin,
+      kind: kind,
+      envelope: envelope,
+      prompt_ref: prompt_ref,
+      inputs: inputs,
+      deps: deps,
+      expansion_key: Keyword.get(fields, :expansion_key),
+      state: Keyword.get(fields, :state, :pending),
+      output: Keyword.get(fields, :output),
+      attempts: Keyword.get(fields, :attempts, []),
+      created_at: stamp,
+      updated_at: stamp
+    }
+  end
+
+  @doc """
+  Derive the dependency id list from an inputs map. Each `{:node, id, path}`
+  value contributes `id`; `{:literal, value}` contributes nothing. Ids are
+  de-duplicated, keeping the first occurrence. Pure; the single source of
+  edges.
+  """
+  @spec deps_from_inputs(%{optional(String.t()) => input_ref()}) :: [String.t()]
+  def deps_from_inputs(inputs) when is_map(inputs) do
+    referenced_rev =
+      inputs
+      |> Map.values()
+      |> Enum.reduce([], fn
+        {:node, id, _path}, acc -> [id | acc]
+        {:literal, _value}, acc -> acc
+      end)
+
+    referenced_rev |> Enum.reverse() |> Enum.uniq()
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/run_graph.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/run_graph.ex
new file mode 100644
index 000000000..20249c199
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/run_graph.ex
@@ -0,0 +1,136 @@
+defmodule SymphonyElixir.IR.RunGraph do
+  @moduledoc """
+  The durable state of one DSL workflow run: the reified AST it started
+  from, the IR nodes materialized so far, and the append-only expansion
+  log that makes a restart deterministic.
+
+  ## Why the expansion log exists
+
+  Dynamic constructs (`when`, `everyNth`, fan-out) expand the graph at
+  runtime based on data that arrived from engines, so the materialized
+  graph is not a pure function of the source alone. Each expansion is
+  recorded as an event ("gate G saw output X, emitted nodes [...]").
+
+  On restart the runtime does not restore a live computation. It loads
+  this record, replays `expansion_log` against `ast` to rebuild the exact
+  same materialized graph, reconciles any node left `:running`, recomputes
+  the ready set, and resumes. The interpreter is re-run, never resurrected
+  from a frozen closure. The invariant the runtime tests assert is
+  `replay(ast, expansion_log) == nodes`.
+
+  `source_hash` snapshots the `.sym` source the run started with, the same
+  way the pre-overhaul runtime snapshotted the DAG, so editing the pack
+  does not perturb runs in flight.
+  """
+
+  alias SymphonyElixir.IR.Node
+
+  @enforce_keys [:run_id, :source_hash, :status, :nodes]
+  defstruct [
+    :run_id,
+    :source_hash,
+    :ast,
+    :trigger,
+    :status,
+    :placement,
+    :created_at,
+    :updated_at,
+    nodes: %{},
+    expansion_log: [],
+    audit_log: []
+  ]
+
+  @type status :: :pending | :running | :succeeded | :failed | :cancelled
+
+  @statuses [:pending, :running, :succeeded, :failed, :cancelled]
+
+  @doc """
+  The run statuses a persisted graph may hold, i.e. every member of
+  `t:status/0`. Source of truth for safe decode.
+  """
+  @spec statuses() :: [status()]
+  def statuses, do: @statuses
+
+  @typedoc """
+  One dynamic-expansion event. `origin` is the AST construct that
+  expanded; `observed` is the gating output it reacted to; `emitted` is
+  the list of node ids it added. Replaying the log in order reconstructs
+  the materialized graph.
+  """
+  @type expansion_event :: %{
+          origin: term(),
+          observed: term(),
+          emitted: [String.t()],
+          at: DateTime.t()
+        }
+
+  @typedoc """
+  One operator action recorded for audit. `action` is the operation
+  (`:cancel`, `:retry_node`, `:rerun`, `:clear_failed`); `target` is the
+  node id it acted on or `nil` for run-wide actions; `actor` identifies
+  who requested it (an operator id, or `:system` for automatic actions);
+  `detail` carries action-specific context. The log is append-only and
+  ordered, so it reconstructs the operator history of a run.
+  """
+  @type audit_event :: %{
+          action: atom(),
+          target: String.t() | nil,
+          actor: term(),
+          detail: term(),
+          at: DateTime.t()
+        }
+
+  @type t :: %__MODULE__{
+          run_id: String.t(),
+          source_hash: binary(),
+          ast: term() | nil,
+          trigger: map() | nil,
+          status: status(),
+          placement: %{declared: term(), effective: :ixvm | :host | :local | nil} | nil,
+          nodes: %{String.t() => Node.t()},
+          expansion_log: [expansion_event()],
+          audit_log: [audit_event()],
+          created_at: DateTime.t() | nil,
+          updated_at: DateTime.t() | nil
+        }
+
+  # Start an empty graph for a run: status `:pending`, no nodes, empty
+  # expansion and audit logs, `trigger` and `placement` unset, and both
+  # timestamps set to the same current time.
+  @spec new(String.t(), binary(), term()) :: t()
+  def new(run_id, source_hash, ast) when is_binary(run_id) and is_binary(source_hash) do
+    stamp = DateTime.utc_now()
+
+    struct!(__MODULE__,
+      run_id: run_id,
+      source_hash: source_hash,
+      ast: ast,
+      status: :pending,
+      nodes: %{},
+      expansion_log: [],
+      audit_log: [],
+      created_at: stamp,
+      updated_at: stamp
+    )
+  end
+
+  @doc """
+  Add or replace nodes, keyed by node id. A node whose id is already in
+  the graph overwrites the held one; when `new_nodes` repeats an id the
+  last occurrence wins. Bumps `updated_at`.
+  """
+  @spec put_nodes(t(), [Node.t()]) :: t()
+  def put_nodes(%__MODULE__{nodes: nodes} = graph, new_nodes) when is_list(new_nodes) do
+    incoming = Map.new(new_nodes, fn %Node{id: id} = node -> {id, node} end)
+    %{graph | nodes: Map.merge(nodes, incoming), updated_at: DateTime.utc_now()}
+  end
+
+  @doc """
+  Append a dynamic-expansion event to the end of the log, stamped with the
+  current time. The order is load-bearing for replay. Bumps `updated_at`.
+  """
+  @spec append_expansion(t(), term(), term(), [String.t()]) :: t()
+  def append_expansion(%__MODULE__{expansion_log: log} = graph, origin, observed, emitted) do
+    recorded = Map.new(origin: origin, observed: observed, emitted: emitted, at: DateTime.utc_now())
+    extended = Enum.concat(log, [recorded])
+    %{graph | expansion_log: extended, updated_at: DateTime.utc_now()}
+  end
+
+  @doc """
+  Append an operator audit event to the end of the audit log, stamped with
+  the current time. The log is append-only and ordered, making it the
+  durable record of who acted on the run and how. `target` is the node id
+  for a node-scoped action or `nil` for a run-wide one. Bumps `updated_at`.
+  """
+  @spec append_audit(t(), atom(), String.t() | nil, term(), term()) :: t()
+  def append_audit(%__MODULE__{audit_log: log} = graph, action, target, actor, detail)
+      when is_atom(action) do
+    recorded =
+      Map.new(action: action, target: target, actor: actor, detail: detail, at: DateTime.utc_now())
+
+    extended = Enum.concat(log, [recorded])
+    %{graph | audit_log: extended, updated_at: DateTime.utc_now()}
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/run_notifier.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/run_notifier.ex
new file mode 100644
index 000000000..66fb499df
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/run_notifier.ex
@@ -0,0 +1,311 @@
+defmodule SymphonyElixir.IR.RunNotifier do
+  @moduledoc """
+  Posts one Slack summary to `config.slack_notify_channel` when an IR run
+  reaches a terminal state.
+
+  Best-effort: a Slack failure is logged and never changes the run outcome.
+  The notifier reinstates the post-run notification that was dropped when the
+  YAML/DAG runtime and its `RunNotifier` were deleted in the IR cutover
+  (originally #111); the `SYMPHONY_SLACK_NOTIFY_CHANNEL` knob had no consumer
+  in between, so the channel went silent.
+
+  Cron notifications follow a configurable policy so the high-frequency
+  internal dispatchers do not flood the channel while real failures and
+  selected digests stay visible. A failed cron run posts when
+  `config.slack_notify_cron_failures` is set (default true); a succeeded
+  cron run posts when its workflow name is listed in
+  `config.slack_notify_cron_workflows`, or when that list contains the
+  wildcard `"*"` to post every cron success. Set the allowlist to `"*"` to
+  turn the whole channel back on without enumerating every workflow; list
+  specific names to surface only a few. The policy reads workflow names from
+  config, never a literal in source, so `elixir/lib/` stays pack-agnostic.
+  Non-cron terminal runs always notify.
+  """
+
+  require Logger
+
+  alias SymphonyElixir.Codex.Provision
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.IR.RunGraph
+  alias SymphonyElixir.Slack.Client, as: SlackClient
+
+  @doc """
+  Post the terminal summary for `graph` to the configured Slack channel.
+  Always returns `:ok`. Nothing is posted when `notify?/2` says the run
+  should not notify, or when the bot token or notify channel is unset. A
+  failed post is logged as a warning and otherwise ignored.
+  """
+  @spec notify_finished(RunGraph.t()) :: :ok
+  def notify_finished(%RunGraph{} = graph) do
+    config = Config.get()
+
+    cond do
+      not notify?(graph, config) -> :ok
+      slack_unconfigured?(config) -> :ok
+      true -> post_summary(graph, config)
+    end
+  end
+
+  # Slack needs both a bot token and a target channel.
+  defp slack_unconfigured?(config) do
+    is_nil(config.slack_bot_token) or is_nil(config.slack_notify_channel)
+  end
+
+  # Build and send the payload; a Slack error is logged, never raised.
+  defp post_summary(%RunGraph{} = graph, config) do
+    payload = build_payload(graph, config.room.registry_url)
+
+    with {:error, reason} <- SlackClient.post_message(config.slack_notify_channel, payload) do
+      Logger.warning("RunNotifier Slack post failed for #{graph.run_id}: #{inspect(reason)}")
+      :ok
+    else
+      {:ok, _body} -> :ok
+    end
+  end
+
+  @doc """
+  Whether a finished run should produce a Slack notification. A run whose
+  status is anything other than `:succeeded` or `:failed` never notifies.
+  Otherwise a cron-triggered run defers to the cron policy in `config`,
+  and every other run notifies.
+  """
+  @spec notify?(RunGraph.t(), Config.t()) :: boolean()
+  def notify?(%RunGraph{status: status, trigger: trigger} = graph, %Config{} = config)
+      when status in [:succeeded, :failed] do
+    case trigger_kind(trigger) do
+      :cron -> cron_notify?(graph, config)
+      _other -> true
+    end
+  end
+
+  def notify?(%RunGraph{status: status}, _config) when status not in [:succeeded, :failed], do: false
+
+  # Cron policy. A failed cron run follows `slack_notify_cron_failures`.
+  # Any other cron run posts only when the allowlist
+  # `slack_notify_cron_workflows` contains the wildcard "*" or the run's
+  # workflow name, so digests (or the whole channel) can be surfaced while
+  # tight-interval dispatchers stay quiet by default (ENG-2012,
+  # indexable-inc/symphony#242).
+  defp cron_notify?(%RunGraph{status: status, run_id: run_id}, %Config{} = config) do
+    case status do
+      :failed ->
+        config.slack_notify_cron_failures
+
+      _other ->
+        allowlist = config.slack_notify_cron_workflows
+        "*" in allowlist or workflow_name(run_id) in allowlist
+    end
+  end
+
+  # Assemble the Slack message: a plain-text fallback plus Block Kit blocks
+  # (header, summary section, context line, and an actions row when there
+  # is at least one button). `room_base_url` is the central room UI origin
+  # (`config.room.registry_url`); the "Run details" button deep-links into
+  # that UI's transcript for the run, not into this dashboard.
+  @doc false
+  @spec build_payload(RunGraph.t(), String.t() | nil) :: map()
+  def build_payload(%RunGraph{status: status} = graph, room_base_url) do
+    workflow = workflow_name(graph.run_id)
+    summary_text = summary(graph, workflow)
+    title = "#{status_icon(status)} #{workflow} #{status_word(status)}"
+
+    candidate_blocks = [
+      header(title),
+      section(summary_text),
+      context(context_text(graph)),
+      actions(graph, room_base_url)
+    ]
+
+    # `actions/2` yields nil when there are no buttons; drop it.
+    present_blocks = for block <- candidate_blocks, not is_nil(block), do: block
+
+    %{
+      "text" => fallback_text(workflow, status, summary_text),
+      "unfurl_links" => false,
+      "unfurl_media" => false,
+      "blocks" => present_blocks
+    }
+  end
+
+  # run_id is "<workflow-slug>-<ms>-<unique>" (Ingress.generate_run_id/1).
+  # The display name is the id minus a trailing "-<digits>-<digits>"; when
+  # stripping would leave nothing, the full id is returned instead.
+  @doc false
+  @spec workflow_name(String.t()) :: String.t()
+  def workflow_name(run_id) when is_binary(run_id) do
+    stripped = String.replace(run_id, ~r/-\d+-\d+$/, "")
+    if stripped == "", do: run_id, else: stripped
+  end
+
+  # One-sentence mrkdwn summary. A failed run names its `:failed` node ids
+  # when there are any; every other run reports a per-state node count.
+  defp summary(%RunGraph{status: :failed} = graph, workflow) do
+    failed = failed_node_ids(graph)
+
+    if failed == [] do
+      "Run #{code(workflow)} failed."
+    else
+      "Run #{code(workflow)} failed in #{Enum.map_join(failed, ", ", &code/1)}."
+    end
+  end
+
+  defp summary(%RunGraph{} = graph, workflow) do
+    breakdown = node_breakdown(graph)
+    "Completed #{code(workflow)} (#{breakdown})."
+  end
+
+  # Ids of the nodes whose state is exactly `:failed` (`:upstream_failed`
+  # nodes are not included).
+  defp failed_node_ids(%RunGraph{nodes: nodes}) do
+    nodes
+    |> Enum.filter(fn {_id, node} -> node.state == :failed end)
+    |> Enum.map(fn {id, _node} -> id end)
+  end
+
+  # "<count> <state>" for each state present in the graph, comma-separated.
+  defp node_breakdown(%RunGraph{nodes: nodes}) do
+    counts = nodes |> Map.values() |> Enum.frequencies_by(fn node -> node.state end)
+
+    counts
+    |> Enum.map(fn {state, count} -> "#{count} #{state}" end)
+    |> Enum.join(", ")
+  end
+
+  # Context line: run id, trigger label, status and duration joined with
+  # " - ". Parts that are nil or empty (e.g. an unknown duration) are left
+  # out.
+  defp context_text(%RunGraph{} = graph) do
+    parts = [
+      code(graph.run_id),
+      trigger_label(graph.trigger),
+      Atom.to_string(graph.status),
+      duration(graph)
+    ]
+
+    shown = for part <- parts, part not in [nil, ""], do: part
+    Enum.join(shown, " - ")
+  end
+
+  # Actions row holding the Linear button (when the trigger has one)
+  # followed by the "Run details" button (when a room URL is configured).
+  # Returns nil when neither applies, so the caller can drop the block.
+  defp actions(%RunGraph{} = graph, room_base_url) do
+    # The helpers prepend, so the accumulated list is in reverse order.
+    collected_rev =
+      maybe_add_run_button(maybe_add_linear_button([], graph.trigger), graph, room_base_url)
+
+    if collected_rev == [] do
+      nil
+    else
+      %{"type" => "actions", "elements" => Enum.reverse(collected_rev)}
+    end
+  end
+
+  # Prepend a primary-styled button labelled with the trigger's identifier
+  # and linking to its url, but only when both are non-empty strings. A
+  # non-map trigger, or one missing either field, leaves `buttons` as is.
+  defp maybe_add_linear_button(buttons, trigger) when is_map(trigger) do
+    url = trigger_field(trigger, :url)
+    identifier = trigger_field(trigger, :identifier)
+
+    if is_binary(url) and url != "" and is_binary(identifier) and identifier != "" do
+      [button(identifier, url, "primary") | buttons]
+    else
+      buttons
+    end
+  end
+
+  defp maybe_add_linear_button(buttons, _trigger), do: buttons
+
+  # Prepend the "Run details" button. The run's transcript lives on the
+  # central room UI, not in this dashboard: the link is built by
+  # `room_run_url/2` from `base_url` (`config.room.registry_url`). With no
+  # usable base URL (nil, empty, or not a string) there is nothing to point
+  # at, so the button is omitted rather than emitting a dead link.
+  defp maybe_add_run_button(buttons, graph, base_url) do
+    linkable? = match?(%RunGraph{}, graph) and is_binary(base_url) and base_url != ""
+
+    if linkable? do
+      [button("Run details", room_run_url(base_url, graph), nil) | buttons]
+    else
+      buttons
+    end
+  end
+
+  # Build the room UI link for a run. The room client is a hash router:
+  # `#/s/<server_id>/t/<thread_id>` opens a thread on a backend and `/`
+  # lands on the room. `server_id` is `Provision.backend_id(run_id, "room")`.
+  # Both segments are percent-encoded down to unreserved characters so the
+  # client's decodeURIComponent parse recovers the raw ids. With no thread
+  # to point at, the link is the room root.
+  defp room_run_url(base_url, %RunGraph{run_id: run_id} = graph) do
+    root = String.trim_trailing(base_url, "/")
+    server_segment = URI.encode(Provision.backend_id(run_id, "room"), &URI.char_unreserved?/1)
+    thread_id = primary_thread_id(graph)
+
+    if is_nil(thread_id) do
+      "#{root}/"
+    else
+      thread_segment = URI.encode(thread_id, &URI.char_unreserved?/1)
+      "#{root}/#/s/#{server_segment}/t/#{thread_segment}"
+    end
+  end
+
+  # Thread id of the most recently started attempt, across all `:agent`
+  # nodes, that carries a non-empty string `thread_id`. Returns nil when no
+  # attempt has one, so the caller falls back to the room root.
+  defp primary_thread_id(%RunGraph{nodes: nodes}) do
+    threaded_attempts =
+      for node <- Map.values(nodes),
+          node.kind == :agent,
+          attempt <- node.attempts,
+          is_binary(attempt.thread_id) and attempt.thread_id != "",
+          do: attempt
+
+    # Latest `started_at` wins; on a tie the earliest-listed attempt is kept.
+    case Enum.max_by(threaded_attempts, & &1.started_at, DateTime, fn -> nil end) do
+      nil -> nil
+      %{thread_id: thread_id} -> thread_id
+    end
+  end
+
+  # Plain-text fallback. Slack flattens blocks to this text in
+  # push/desktop/sidebar previews, where mrkdwn does not render, so the
+  # summary is stripped of markup and the whole line is capped at 200.
+  defp fallback_text(workflow, status, summary) do
+    line = "Symphony: #{workflow} #{status_word(status)} - #{plain(summary)}"
+    truncate(line, 200)
+  end
+
+  # Block Kit builders. Each returns a plain string-keyed map.
+
+  # Header block: plain_text only, capped at 150 characters.
+  defp header(text) do
+    title = %{"type" => "plain_text", "text" => truncate(text, 150), "emoji" => true}
+    %{"type" => "header", "text" => title}
+  end
+
+  # Section block with an mrkdwn body.
+  defp section(text) do
+    body = %{"type" => "mrkdwn", "text" => text}
+    %{"type" => "section", "text" => body}
+  end
+
+  # Context block with a single mrkdwn element.
+  defp context(text) do
+    element = %{"type" => "mrkdwn", "text" => text}
+    %{"type" => "context", "elements" => [element]}
+  end
+
+  # Link button; `style` is added only when given.
+  defp button(text, url, style) do
+    label = %{"type" => "plain_text", "text" => text, "emoji" => true}
+    maybe_put_style(%{"type" => "button", "text" => label, "url" => url}, style)
+  end
+
+  defp maybe_put_style(button, style) do
+    if is_nil(style), do: button, else: Map.put(button, "style", style)
+  end
+
+  # The trigger's kind as an atom: an atom under `:kind` is returned as is,
+  # a string under "kind" is mapped through `kind_atom/1`, and anything
+  # else (including a nil trigger) yields nil.
+  defp trigger_kind(trigger) do
+    case trigger do
+      %{kind: kind} when is_atom(kind) -> kind
+      %{"kind" => kind} when is_binary(kind) -> kind_atom(kind)
+      _unrecognised -> nil
+    end
+  end
+
+  # Read `key` from a trigger map, trying the atom key first and falling
+  # back to its string form when the atom key is absent, nil or false.
+  defp trigger_field(trigger, key) do
+    case Map.get(trigger, key) do
+      missing when missing in [nil, false] -> Map.get(trigger, Atom.to_string(key))
+      found -> found
+    end
+  end
+
+  # Trigger maps reach us with atom keys in-process; a string "kind" only
+  # appears after a store round-trip. Match the known kinds rather than
+  # minting atoms from arbitrary input. The set mirrors the kinds
+  # `trigger_label/1` labels, so a reloaded trigger keeps its label instead
+  # of degrading to the generic one. The string forms assume the store
+  # writes the atom's name verbatim (NOTE(review): confirm against the
+  # store's encoder). Anything unrecognised maps to `:other`.
+  defp kind_atom("cron"), do: :cron
+  defp kind_atom("linear"), do: :linear
+  defp kind_atom("manual"), do: :manual
+  defp kind_atom("github_pr_label"), do: :github_pr_label
+  defp kind_atom("slack_app_mention"), do: :slack_app_mention
+  defp kind_atom("slack_huddle_completed"), do: :slack_huddle_completed
+  defp kind_atom(_other), do: :other
+
+  # Human-readable label per trigger kind; unknown or missing kinds fall
+  # back to "Symphony".
+  @trigger_labels %{
+    cron: "Cron trigger",
+    linear: "Linear trigger",
+    manual: "Manual trigger",
+    github_pr_label: "GitHub trigger",
+    slack_app_mention: "Slack mention trigger",
+    slack_huddle_completed: "Slack huddle trigger"
+  }
+
+  defp trigger_label(trigger) do
+    Map.get(@trigger_labels, trigger_kind(trigger), "Symphony")
+  end
+
+  # Elapsed time between `created_at` and `updated_at`, rendered as
+  # "<h>h <m>m", "<m>m <s>s" or "<s>s". A negative span is clamped to zero.
+  # Returns nil when either timestamp is not a `DateTime`.
+  defp duration(%RunGraph{created_at: %DateTime{} = created, updated_at: %DateTime{} = updated}) do
+    updated
+    |> DateTime.diff(created, :second)
+    |> max(0)
+    |> format_elapsed()
+  end
+
+  defp duration(_graph), do: nil
+
+  defp format_elapsed(seconds) when seconds >= 3600 do
+    "#{div(seconds, 3600)}h #{div(rem(seconds, 3600), 60)}m"
+  end
+
+  defp format_elapsed(seconds) when seconds >= 60, do: "#{div(seconds, 60)}m #{rem(seconds, 60)}s"
+  defp format_elapsed(seconds), do: "#{seconds}s"
+
+  # Verb used in the header and fallback text; statuses other than
+  # `:succeeded` and `:failed` are shown by name.
+  defp status_word(status) do
+    case status do
+      :succeeded -> "finished"
+      :failed -> "failed"
+      other -> Atom.to_string(other)
+    end
+  end
+
+  # Slack emoji shortcode shown before the header text.
+  defp status_icon(status) do
+    case status do
+      :succeeded -> ":white_check_mark:"
+      :failed -> ":x:"
+      _other -> ":information_source:"
+    end
+  end
+
+  # Strip mrkdwn markers (backtick, `*`, `_`, `~`), collapse every run of
+  # whitespace to a single space, and trim the ends.
+  defp plain(text) when is_binary(text) do
+    unmarked = String.replace(text, ~r/[`*_~]/, "")
+    collapsed = String.replace(unmarked, ~r/\s+/, " ")
+    String.trim(collapsed)
+  end
+
+  # Wrap a value in backticks so Slack renders it as inline code.
+  defp code(text), do: "`#{text}`"
+
+  # Shorten `text` to at most `limit` characters, marking a cut with a
+  # trailing "...". The three ellipsis characters are budgeted inside
+  # `limit`, so the result never exceeds it (callers pass 150 and 200; the
+  # header cap is a hard Slack limit). Length is measured in characters on
+  # both the short-circuit and the slice, so multi-byte text that already
+  # fits is returned untouched.
+  defp truncate(text, limit) do
+    if String.length(text) <= limit do
+      text
+    else
+      keep = max(limit - 3, 0)
+      text |> String.slice(0, keep) |> String.trim() |> Kernel.<>("...")
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/store.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/store.ex
new file mode 100644
index 000000000..263fab060
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/store.ex
@@ -0,0 +1,470 @@
+defmodule SymphonyElixir.IR.Store do
+  @moduledoc """
+  Durable persistence of a `RunGraph` to disk as JSON, one file per run.
+  Atomic temp-then-rename writes so a crash mid-write never leaves a
+  half-written run file, and a tolerant loader that quarantines a corrupt
+  file rather than crashing boot.
+
+  Disk layout, under `runs_dir/ir/`:
+
+      runs/
+        ir/
+          <run_id>.json       one RunGraph, full state
+          <run_id>.json.bad   a file that failed to decode, quarantined
+
+  This is plain serialization. It holds no process state; `Runtime` calls
+  `persist/1` after every transition. The directory is taken from
+  `Config.get().runs_dir` by default and can be overridden with `dir:` so
+  tests isolate to a tmp dir without booting Config.
+
+  The round-trip target is the full `RunGraph`: nodes (with envelope,
+  prompt_ref, inputs, deps, attempts, output), the run status, and the
+  append-only `expansion_log`. Recovery (`Runtime.reconcile/1`) depends on
+  that round-trip being faithful, so the encode/decode pair here is the
+  contract restart correctness rests on.
+  """
+
+  require Logger
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Attempt, Node, RunGraph}
+
+  @doc "Where IR run files live: the `dir:` option when given, else `Config.get().runs_dir/ir`."
+  @spec dir(keyword()) :: Path.t()
+  def dir(opts \\ []) do
+    # Config is consulted only when no directory was passed in.
+    with nil <- Keyword.get(opts, :dir) do
+      Path.join(Config.get().runs_dir, "ir")
+    end
+  end
+
+  @doc """
+  Read every run file in the store directory and return the graphs that
+  decoded. A file that cannot be read or decoded is moved aside as
+  `<name>.bad` with a warning, so a single corrupt run never blocks boot.
+  """
+  @spec load_all(keyword()) :: [RunGraph.t()]
+  def load_all(opts \\ []) do
+    store_dir = dir(opts)
+    File.mkdir_p!(store_dir)
+    run_files = Path.wildcard(Path.join(store_dir, "*.json"))
+
+    run_files
+    |> Enum.reduce([], fn file, loaded ->
+      case read(file) do
+        {:ok, graph} ->
+          [graph | loaded]
+
+        {:error, reason} ->
+          quarantine(file, reason)
+          loaded
+      end
+    end)
+    |> Enum.reverse()
+  end
+
+  @doc "Load one RunGraph by run id. `{:ok, graph}` or `{:error, :not_found}` / decode error."
+  @spec load(String.t(), keyword()) :: {:ok, RunGraph.t()} | {:error, term()}
+  def load(run_id, opts \\ []) when is_binary(run_id) do
+    path = run_path(dir(opts), run_id)
+
+    # Read directly rather than File.exists?/1 then read: a file removed in between stays :not_found.
+    case read(path) do
+      {:error, :enoent} -> {:error, :not_found}
+      result -> result
+    end
+  end
+
+  @doc "Atomically write a RunGraph over any prior file for the run; I/O and JSON failures return `{:error, reason}`."
+  @spec persist(RunGraph.t(), keyword()) :: :ok | {:error, term()}
+  def persist(%RunGraph{} = graph, opts \\ []) do
+    store_dir = dir(opts)
+    path = run_path(store_dir, graph.run_id)
+    tmp = path <> ".tmp"
+
+    with :ok <- File.mkdir_p(store_dir),
+         {:ok, encoded} <- Jason.encode(encode(graph), pretty: true),
+         :ok <- File.write(tmp, encoded),
+         :ok <- File.rename(tmp, path) do
+      :ok
+    end
+  end
+
+  @doc """
+  Record a dynamic-expansion event and write the result to disk in one
+  step. Wraps `RunGraph.append_expansion/4` and `persist/2` so the
+  append-only log that drives replay never changes without being persisted.
+  """
+  @spec append_expansion(RunGraph.t(), {term(), term(), [String.t()]}, keyword()) ::
+          {:ok, RunGraph.t()} | {:error, term()}
+  def append_expansion(%RunGraph{} = graph, {origin, observed, emitted}, opts \\ []) do
+    updated = RunGraph.append_expansion(graph, origin, observed, emitted)
+
+    # A persist failure is returned untouched; the updated graph is handed back only after `:ok`.
+    with :ok <- persist(updated, opts) do
+      {:ok, updated}
+    end
+  end
+
+  @doc "Remove a run's file. Always `:ok`; a file that is already missing is not an error."
+  @spec delete(String.t(), keyword()) :: :ok
+  def delete(run_id, opts \\ []) when is_binary(run_id) do
+    _ = opts |> dir() |> run_path(run_id) |> File.rm()
+    :ok
+  end
+
+  defp run_path(store_dir, run_id), do: Path.join(store_dir, run_id <> ".json")
+
+  defp read(path) do
+    with {:ok, raw} <- File.read(path),
+         {:ok, decoded} <- Jason.decode(raw),
+         {:ok, graph} <- decode(decoded) do
+      {:ok, graph}
+    end
+  rescue
+    # Any raise inside decode (an enum string outside its set, a corrupt
+    # timestamp, an undecodable term blob) becomes a quarantine reason
+    # rather than a boot crash, keeping the load_all promise that one bad
+    # file never blocks startup.
+    error -> {:error, {:decode_crashed, error}}
+  end
+
+  defp quarantine(path, reason) do
+    bad = path <> ".bad"
+    _ = File.rename(path, bad)
+    Logger.warning("IR.Store quarantined #{path} (#{inspect(reason)}) -> #{bad}")
+  end
+
+  # --- encode ---------------------------------------------------------
+
+  defp encode(%RunGraph{} = graph) do
+    %{
+      "run_id" => graph.run_id,
+      "source_hash" => Base.encode16(graph.source_hash, case: :lower),
+      "ast" => encode_term(graph.ast),
+      "trigger" => encode_term(graph.trigger),
+      "status" => Atom.to_string(graph.status),
+      "placement" => encode_placement(graph.placement),
+      "nodes" => Map.new(graph.nodes, fn {id, node} -> {id, encode_node(node)} end),
+      "expansion_log" => Enum.map(graph.expansion_log, &encode_expansion/1),
+      "audit_log" => Enum.map(graph.audit_log, &encode_audit/1),
+      "created_at" => encode_dt(graph.created_at),
+      "updated_at" => encode_dt(graph.updated_at)
+    }
+  end
+
+  defp encode_placement(nil), do: nil
+
+  defp encode_placement(%{declared: declared, effective: effective}) do
+    %{
+      "declared" => encode_placement_location(declared),
+      "effective" => if(effective, do: Atom.to_string(effective), else: nil)
+    }
+  end
+
+  # Placement declared is an Envelope location, which can be :ixvm, :local,
+  # {:host, name}, {:room, url}, or nil. Encode using the same shape as
+  # encode_location/1 in the envelope path so the wire format is consistent.
+  defp encode_placement_location(:local), do: "local"
+  defp encode_placement_location(:ixvm), do: "ixvm"
+  defp encode_placement_location({:host, name}), do: %{"host" => name}
+  defp encode_placement_location({:room, url}), do: %{"room" => url}
+  defp encode_placement_location(nil), do: nil
+
+  defp encode_node(%Node{} = node) do
+    %{
+      "id" => node.id,
+      "ast_origin" => encode_term(node.ast_origin),
+      "kind" => Atom.to_string(node.kind),
+      "envelope" => encode_envelope(node.envelope),
+      "prompt_ref" => encode_term(node.prompt_ref),
+      "inputs" => encode_inputs(node.inputs),
+      "deps" => node.deps,
+      "expansion_key" => encode_term(node.expansion_key),
+      "state" => Atom.to_string(node.state),
+      "output" => encode_term(node.output),
+      "attempts" => Enum.map(node.attempts, &encode_attempt/1),
+      "created_at" => encode_dt(node.created_at),
+      "updated_at" => encode_dt(node.updated_at)
+    }
+  end
+
+  defp encode_envelope(nil), do: nil
+
+  defp encode_envelope(%Envelope{} = env) do
+    %{
+      "engine" => Atom.to_string(env.engine),
+      "model" => env.model,
+      "effort" => env.effort && Atom.to_string(env.effort),
+      "permissions" => env.permissions && Atom.to_string(env.permissions),
+      "location" => encode_location(env.location)
+    }
+  end
+
+  defp encode_location(:local), do: "local"
+  defp encode_location(:ixvm), do: "ixvm"
+  defp encode_location({:host, name}), do: %{"host" => name}
+  defp encode_location({:room, url}), do: %{"room" => url}
+  defp encode_location(nil), do: nil
+
+  defp encode_attempt(%Attempt{} = attempt) do
+    %{
+      "n" => attempt.n,
+      "engine" => Atom.to_string(attempt.engine),
+      "thread_id" => attempt.thread_id,
+      "state" => Atom.to_string(attempt.state),
+      "started_at" => encode_dt(attempt.started_at),
+      "finished_at" => encode_dt(attempt.finished_at),
+      "outcome" => encode_term(attempt.outcome),
+      "cost" => encode_cost(attempt.cost),
+      "events_ref" => attempt.events_ref
+    }
+  end
+
+  defp encode_cost(nil), do: nil
+  defp encode_cost(cost) when is_map(cost), do: Map.new(cost, fn {k, v} -> {Atom.to_string(k), v} end)
+
+  # Inputs and AST fragments carry tuples (`{:node, id, path}`,
+  # `{:literal, value}`) that JSON cannot represent. Encode through the
+  # Erlang external term format and Base64 so the decode side reconstructs
+  # the exact term, including atoms, tuples, and nested structures. This
+  # is the same round-trip guarantee `:erlang.term_to_binary/1` gives,
+  # chosen over a bespoke tuple-to-list scheme because the AST shape is
+  # owned by the interpreter (WS-1) and must survive verbatim for replay.
+  defp encode_inputs(inputs) when is_map(inputs) do
+    Map.new(inputs, fn {key, ref} -> {key, encode_term(ref)} end)
+  end
+
+  defp encode_term(nil), do: nil
+  defp encode_term(term), do: %{"__term__" => Base.encode64(:erlang.term_to_binary(term))}
+
+  defp encode_dt(nil), do: nil
+  defp encode_dt(%DateTime{} = dt), do: DateTime.to_iso8601(dt)
+
+  # --- decode ---------------------------------------------------------
+
+  defp decode(%{"run_id" => run_id, "source_hash" => source_hash_hex, "status" => status, "nodes" => nodes} = payload) do
+    with {:ok, source_hash} <- Base.decode16(source_hash_hex, case: :lower),
+         {:ok, decoded_nodes} <- decode_nodes(nodes) do
+      {:ok,
+       %RunGraph{
+         run_id: run_id,
+         source_hash: source_hash,
+         ast: decode_term(payload["ast"]),
+         trigger: decode_term(payload["trigger"]),
+         status: known_atom(status, RunGraph.statuses(), "run status"),
+         placement: decode_placement(payload["placement"]),
+         nodes: decoded_nodes,
+         expansion_log: Enum.map(payload["expansion_log"] || [], &decode_expansion/1),
+         audit_log: Enum.map(payload["audit_log"] || [], &decode_audit/1),
+         created_at: decode_dt(payload["created_at"]),
+         updated_at: decode_dt(payload["updated_at"])
+       }}
+    else
+      :error -> {:error, :invalid_source_hash}
+      other -> other
+    end
+  end
+
+  defp decode(_), do: {:error, :invalid_run_graph_payload}
+
+  # Valid effective locations that may appear in a persisted placement.
+  # Guards against a tampered file minting atoms outside the known set.
+  # `:remote` is the effective location when an `:ixvm` run falls back to a
+  # runtime worker; omitting it quarantines every successful remote run.
+  @effective_locations [:ixvm, :host, :remote, :local]
+
+  defp decode_placement(nil), do: nil
+
+  defp decode_placement(%{"declared" => declared, "effective" => effective}) do
+    %{
+      declared: decode_placement_location(declared),
+      effective: known_atom_or_nil(effective, @effective_locations, "effective placement location")
+    }
+  end
+
+  defp decode_placement(_), do: nil
+
+  # Mirrors encode_placement_location/1; decodes the same shapes the
+  # envelope location decoder handles.
+  defp decode_placement_location("local"), do: :local
+  defp decode_placement_location("ixvm"), do: :ixvm
+  defp decode_placement_location(%{"host" => name}), do: {:host, name}
+  defp decode_placement_location(%{"room" => url}), do: {:room, url}
+  defp decode_placement_location(nil), do: nil
+
+  defp decode_nodes(nodes) when is_map(nodes) do
+    decoded =
+      Map.new(nodes, fn {id, node_payload} ->
+        {id, decode_node(node_payload)}
+      end)
+
+    {:ok, decoded}
+  rescue
+    error -> {:error, {:invalid_node, error}}
+  end
+
+  defp decode_nodes(_), do: {:error, :invalid_nodes}
+
+  defp decode_node(%{"id" => id, "kind" => kind, "state" => state} = payload) do
+    %Node{
+      id: id,
+      ast_origin: decode_term(payload["ast_origin"]),
+      kind: known_atom(kind, Node.kinds(), "node kind"),
+      envelope: decode_envelope(payload["envelope"]),
+      prompt_ref: decode_term(payload["prompt_ref"]),
+      inputs: decode_inputs(payload["inputs"]),
+      deps: payload["deps"] || [],
+      expansion_key: decode_term(payload["expansion_key"]),
+      state: known_atom(state, Node.states(), "node state"),
+      output: decode_term(payload["output"]),
+      attempts: Enum.map(payload["attempts"] || [], &decode_attempt/1),
+      created_at: decode_dt(payload["created_at"]),
+      updated_at: decode_dt(payload["updated_at"])
+    }
+  end
+
+  defp decode_envelope(nil), do: nil
+
+  defp decode_envelope(%{"engine" => engine, "model" => model} = payload) do
+    %Envelope{
+      engine: known_atom(engine, Envelope.engines(), "engine"),
+      model: model,
+      effort: known_atom_or_nil(payload["effort"], Envelope.efforts(), "effort"),
+      permissions: known_atom_or_nil(payload["permissions"], Envelope.permission_levels(), "permissions"),
+      location: decode_location(payload["location"])
+    }
+  end
+
+  defp decode_location("local"), do: :local
+  defp decode_location("ixvm"), do: :ixvm
+  defp decode_location(%{"host" => name}), do: {:host, name}
+  defp decode_location(%{"room" => url}), do: {:room, url}
+  defp decode_location(nil), do: nil
+
+  defp decode_attempt(%{"n" => n, "engine" => engine, "state" => state} = payload) do
+    %Attempt{
+      n: n,
+      engine: known_atom(engine, Attempt.engines(), "attempt engine"),
+      thread_id: payload["thread_id"],
+      state: known_atom(state, Attempt.states(), "attempt state"),
+      started_at: decode_dt(payload["started_at"]),
+      finished_at: decode_dt(payload["finished_at"]),
+      outcome: decode_term(payload["outcome"]),
+      cost: decode_cost(payload["cost"]),
+      events_ref: payload["events_ref"]
+    }
+  end
+
+  @cost_keys [:usd, :tokens_in, :tokens_out, :cache_read, :cache_creation]
+
+  defp decode_cost(nil), do: nil
+
+  defp decode_cost(cost) when is_map(cost) do
+    Map.new(cost, fn {k, v} -> {known_atom(k, @cost_keys, "cost key"), v} end)
+  end
+
+  defp decode_inputs(nil), do: %{}
+  defp decode_inputs(inputs) when is_map(inputs), do: Map.new(inputs, fn {key, ref} -> {key, decode_term(ref)} end)
+
+  # Decode an enum string against its owning module's set. An unknown value
+  # raises (caught by read/1 and quarantined) with an actionable reason,
+  # instead of String.to_existing_atom's opaque ArgumentError or accepting
+  # an unrelated-but-existing atom. Only matches against atoms that already
+  # exist as module attributes, so it cannot grow the atom table.
+  defp known_atom(value, allowed, context) when is_binary(value) do
+    case Enum.find(allowed, fn atom -> Atom.to_string(atom) == value end) do
+      nil -> raise ArgumentError, "invalid #{context} #{inspect(value)} in run graph"
+      atom -> atom
+    end
+  end
+
+  defp known_atom(value, _allowed, context) do
+    raise ArgumentError, "invalid #{context} #{inspect(value)} in run graph"
+  end
+
+  defp known_atom_or_nil(nil, _allowed, _context), do: nil
+  defp known_atom_or_nil(value, allowed, context), do: known_atom(value, allowed, context)
+
+  defp decode_term(nil), do: nil
+
+  defp decode_term(%{"__term__" => encoded}) when is_binary(encoded) do
+    encoded
+    |> Base.decode64!()
+    # These terms are symphony's own data: it wrote them with
+    # `:erlang.term_to_binary/1`, so every atom inside existed in this app at
+    # write time (AST tags, node kinds, error reasons like `:missing_cwd`).
+    # `:safe` would refuse to recreate any of those atoms that are not yet
+    # interned when a run is reloaded (e.g. a failure-path reason atom after a
+    # fresh boot), which crashed decode and quarantined otherwise-valid runs.
+    # The store is root-owned local state under /var/lib/symphony; an attacker
+    # who can rewrite it already owns the host, so `:safe`'s tamper guard buys
+    # nothing here while costing run durability.
+    |> :erlang.binary_to_term()
+  end
+
+  defp encode_expansion(%{origin: origin, observed: observed, emitted: emitted, at: at}) do
+    %{
+      "origin" => encode_term(origin),
+      "observed" => encode_term(observed),
+      "emitted" => emitted,
+      "at" => encode_dt(at)
+    }
+  end
+
+  defp decode_expansion(%{"origin" => origin, "observed" => observed, "emitted" => emitted} = payload) do
+    %{
+      origin: decode_term(origin),
+      observed: decode_term(observed),
+      emitted: emitted || [],
+      at: decode_dt(payload["at"])
+    }
+  end
+
+  # `actor` and `detail` carry arbitrary terms (operator ids, tuples), so they round-trip through
+  # the same term encoding the inputs use. `action` is normally a known operator-action atom, but
+  # decode keeps an unrecognised action as a string, so `to_string/1` lets such a graph be re-persisted.
+  defp encode_audit(%{action: action, target: target, actor: actor, detail: detail, at: at}) do
+    %{
+      "action" => to_string(action),
+      "target" => target,
+      "actor" => encode_term(actor),
+      "detail" => encode_term(detail),
+      "at" => encode_dt(at)
+    }
+  end
+
+  defp decode_audit(%{"action" => action} = payload) do
+    %{
+      action: known_audit_action(action),
+      target: payload["target"],
+      actor: decode_term(payload["actor"]),
+      detail: decode_term(payload["detail"]),
+      at: decode_dt(payload["at"])
+    }
+  end
+
+  @audit_actions ~w(cancel retry_node rerun clear_failed)a
+
+  # Map a serialized action back to a known atom. An unknown string is
+  # kept as a string rather than minting an atom, so a tampered or
+  # future-version file cannot exhaust the atom table on load.
+  defp known_audit_action(action) when is_binary(action) do
+    Enum.find(@audit_actions, action, fn a -> Atom.to_string(a) == action end)
+  end
+
+  defp decode_dt(nil), do: nil
+
+  defp decode_dt(iso) when is_binary(iso) do
+    case DateTime.from_iso8601(iso) do
+      {:ok, dt, _} ->
+        dt
+
+      # A corrupt timestamp is a decode failure (caught by read/1 and
+      # quarantined), not a silent drop of audit-trail metadata to nil.
+      _ ->
+        raise ArgumentError, "invalid ISO8601 datetime #{inspect(iso)} in run graph"
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/ir/view.ex b/packages/symphony/elixir/lib/symphony_elixir/ir/view.ex
new file mode 100644
index 000000000..4ffef44ac
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/ir/view.ex
@@ -0,0 +1,226 @@
+defmodule SymphonyElixir.IR.View do
+  @moduledoc """
+  Render a `RunGraph` as plain JSON-able facts for the API and dashboard.
+
+  This is a protocol emitter kept separate from the runtime: the runtime
+  and `IR.*` modules produce facts (typed structs), and this module turns
+  them into the canonical wire shape a consumer renders. Keeping it out of
+  the runtime means a wire-format change never touches scheduling logic,
+  and the same facts can feed an HTTP response, a LiveView, or a test
+  assertion.
+
+  The shapes are deliberately flat and string-keyed so `Jason.encode/1`
+  handles them without a custom encoder. Tuples that only the interpreter
+  understands (input refs, AST origins) are rendered as readable strings,
+  not round-tripped: this is a read view, not the durable store (that is
+  `IR.Store`, which preserves the exact terms).
+
+  Two granularities:
+
+  - `summary/1` is the list-row view: id, status, counts, cost total. Cheap
+    enough to render for every run on an index.
+  - `detail/1` is the single-run view: every node with its deps, attempts,
+    and output, plus the expansion and audit logs.
+  """
+
+  alias SymphonyElixir.IR.{Attempt, Node, RunGraph}
+
+  @doc "Compact row for a run index: status and aggregate counts/cost."
+  @spec summary(RunGraph.t()) :: map()
+  def summary(%RunGraph{} = graph) do
+    nodes = Map.values(graph.nodes)
+
+    %{
+      "run_id" => graph.run_id,
+      "status" => Atom.to_string(graph.status),
+      "trigger" => trigger_view(graph.trigger),
+      "placement" => placement_view(graph.placement),
+      "node_count" => length(nodes),
+      "states" => state_counts(nodes),
+      "cost_usd" => total_cost_usd(nodes),
+      "created_at" => iso(graph.created_at),
+      "updated_at" => iso(graph.updated_at)
+    }
+  end
+
+  @doc """
+  A human-readable label for a trigger map, shared between the summary view
+  and the LiveView form so the same string appears in both places.
+  """
+  @spec trigger_label(map() | nil) :: String.t()
+  def trigger_label(%{kind: :manual}), do: "manual"
+  def trigger_label(%{kind: :cron, schedule: schedule}), do: "cron " <> to_string(schedule)
+  def trigger_label(%{kind: :linear, label: label}), do: "linear: " <> to_string(label)
+  def trigger_label(%{kind: :slack_huddle_completed, channel: c}), do: "huddle #" <> to_string(c)
+  def trigger_label(%{kind: :slack_app_mention, channel: c}), do: "mention #" <> to_string(c)
+  def trigger_label(%{kind: :github_pr_label, label: label}), do: "github: " <> to_string(label)
+  def trigger_label(%{kind: kind}), do: to_string(kind)
+  def trigger_label(_), do: "manual"
+
+  @doc "Single-run view: the `summary/1` row plus every node (sorted by id) and both logs."
+  @spec detail(RunGraph.t()) :: map()
+  def detail(%RunGraph{} = graph) do
+    ordered_nodes = graph.nodes |> Map.values() |> Enum.sort_by(& &1.id)
+
+    Map.merge(summary(graph), %{
+      "nodes" => Enum.map(ordered_nodes, &render_node/1),
+      "expansion_log" => Enum.map(graph.expansion_log, &expansion_event/1),
+      "audit_log" => Enum.map(graph.audit_log, &audit_event/1)
+    })
+  end
+
+  @doc "One node's facts: kind, state, deps, label, envelope, attempts, output."
+  @spec render_node(Node.t()) :: map()
+  def render_node(%Node{} = node) do
+    %{
+      "id" => node.id,
+      "kind" => Atom.to_string(node.kind),
+      "state" => Atom.to_string(node.state),
+      "deps" => node.deps,
+      "label" => node_label(node),
+      "envelope" => envelope(node.envelope),
+      "attempts" => Enum.map(node.attempts, &attempt/1),
+      "output" => render_term(node.output),
+      "updated_at" => iso(node.updated_at)
+    }
+  end
+
+  # Derive a human-readable primary label for a node from its prompt_ref or
+  # inputs. Agent nodes show the skill name (or "inline" for inline prompts).
+  # Exec nodes show the script path from the resolved input literal. Other
+  # kinds fall back to their kind string. This is the label the graph and
+  # table surfaces use as the primary line; the node id is always available
+  # separately as the secondary.
+  defp node_label(%Node{kind: :agent, prompt_ref: {:skill, name, _}}), do: name
+  defp node_label(%Node{kind: :agent, prompt_ref: {:inline, _}}), do: "inline"
+  defp node_label(%Node{kind: :agent}), do: "agent"
+
+  defp node_label(%Node{kind: :exec, inputs: inputs}) do
+    case inputs["script"] do
+      {:literal, script} when is_binary(script) -> script
+      _ -> "exec"
+    end
+  end
+
+  defp node_label(%Node{kind: kind}), do: Atom.to_string(kind)
+
+  defp envelope(nil), do: nil
+
+  defp envelope(%{engine: engine, model: model} = env) do
+    %{
+      "engine" => Atom.to_string(engine),
+      "model" => model,
+      "effort" => env.effort && Atom.to_string(env.effort),
+      "permissions" => env.permissions && Atom.to_string(env.permissions),
+      "location" => location(env.location)
+    }
+  end
+
+  defp location(:local), do: "local"
+  defp location(:ixvm), do: "ixvm"
+  defp location({:host, name}), do: "host:#{name}"
+  defp location({:room, url}), do: "room:#{url}"
+  defp location(nil), do: nil
+
+  defp attempt(%Attempt{} = attempt) do
+    %{
+      "n" => attempt.n,
+      "engine" => Atom.to_string(attempt.engine),
+      "state" => Atom.to_string(attempt.state),
+      "thread_id" => attempt.thread_id,
+      "outcome" => render_term(attempt.outcome),
+      "cost" => cost(attempt.cost),
+      "started_at" => iso(attempt.started_at),
+      "finished_at" => iso(attempt.finished_at)
+    }
+  end
+
+  defp cost(nil), do: nil
+  defp cost(cost) when is_map(cost), do: Map.new(cost, fn {k, v} -> {Atom.to_string(k), v} end)
+  # `action` is an atom in-process, but `IR.Store` hands back an unrecognised action as a string.
+  defp audit_event(%{action: action} = event) do
+    %{
+      "action" => to_string(action),
+      "target" => event.target,
+      "actor" => render_term(event.actor),
+      "detail" => render_term(event.detail),
+      "at" => iso(event[:at])
+    }
+  end
+
+  defp expansion_event(%{origin: origin, emitted: emitted} = event) do
+    %{
+      "origin" => render_term(origin),
+      "observed" => render_term(event[:observed]),
+      "emitted" => emitted,
+      "at" => iso(event[:at])
+    }
+  end
+
+  defp state_counts(nodes) do
+    # Tally nodes per state, keyed by the state's string name.
+    Enum.frequencies_by(nodes, &Atom.to_string(&1.state))
+  end
+
+  # Total usd cost over every attempt of every node. Attempts without a cost map or without a
+  # numeric `:usd` are ignored; when nothing is left the result is nil, letting the consumer
+  # tell "unknown" apart from "free".
+  defp total_cost_usd(nodes) do
+    usd_amounts =
+      nodes
+      |> Enum.flat_map(& &1.attempts)
+      |> Enum.map(& &1.cost)
+      |> Enum.filter(&is_map/1)
+      |> Enum.map(& &1[:usd])
+      |> Enum.filter(&is_number/1)
+
+    case usd_amounts do
+      [] -> nil
+      _ -> Enum.sum(usd_amounts)
+    end
+  end
+
+  # Render the trigger as a plain string label for the read view. Uses the
+  # same label set as `trigger_label/1` so the API and the LiveView agree.
+  defp trigger_view(nil), do: "manual"
+  defp trigger_view(trigger), do: trigger_label(trigger)
+
+  # Render the placement map for the read view. Exposes declared and
+  # effective as strings so JSON consumers can distinguish a fallback
+  # (declared: "ixvm", effective: "host") from a clean resolve.
+  defp placement_view(nil), do: nil
+
+  defp placement_view(%{declared: declared, effective: effective}) do
+    %{
+      "declared" => placement_location_string(declared),
+      "effective" => if(effective, do: Atom.to_string(effective), else: nil)
+    }
+  end
+
+  defp placement_location_string(:local), do: "local"
+  defp placement_location_string(:ixvm), do: "ixvm"
+  defp placement_location_string({:host, name}), do: "host:#{name}"
+  defp placement_location_string({:room, url}), do: "room:#{url}"
+  defp placement_location_string(nil), do: nil
+
+  defp iso(nil), do: nil
+  defp iso(%DateTime{} = dt), do: DateTime.to_iso8601(dt)
+
+  # A read view stringifies terms the interpreter owns (tuples, atoms,
+  # nested refs) rather than round-tripping them. A plain JSON-able value
+  # passes through so a node output map stays structured.
+  defp render_term(nil), do: nil
+  defp render_term(value) when is_binary(value) or is_number(value) or is_boolean(value), do: value
+  defp render_term(value) when is_atom(value), do: Atom.to_string(value)
+
+  defp render_term(value) when is_map(value) and not is_struct(value) do
+    Map.new(value, fn {k, v} -> {render_key(k), render_term(v)} end)
+  end
+
+  defp render_term(value) when is_list(value), do: Enum.map(value, &render_term/1)
+  defp render_term(value), do: inspect(value)
+
+  defp render_key(k) when is_binary(k), do: k
+  defp render_key(k) when is_atom(k), do: Atom.to_string(k)
+  defp render_key(k), do: inspect(k)
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/linear/client.ex b/packages/symphony/elixir/lib/symphony_elixir/linear/client.ex
new file mode 100644
index 000000000..91c66a688
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/linear/client.ex
@@ -0,0 +1,126 @@
+defmodule SymphonyElixir.Linear.Client do
+  @moduledoc """
+  Thin Linear GraphQL client.
+
+  Two responsibilities:
+
+  - Polling issues with a given label, scoped to a team key.
+  - Generic `graphql/2` for the `linear_graphql` tool exposed to skills.
+
+  Auth, endpoint, and team scope come from `Config.get()` at call time.
+  No fallback: if `LINEAR_API_KEY` is missing the call returns
+  `{:error, :missing_linear_api_token}`.
+  """
+
+  require Logger
+  alias SymphonyElixir.{Config, Linear.Issue}
+
+  @issue_page_size 50
+
+  @poll_query """
+  query SymphonyPoll($teamKey: String!, $first: Int!, $after: String) {
+    issues(filter: {team: {key: {eq: $teamKey}}}, first: $first, after: $after) {
+      nodes {
+        id
+        identifier
+        title
+        url
+        state { name }
+        labels { nodes { name } }
+      }
+      pageInfo { hasNextPage endCursor }
+    }
+  }
+  """
+
+  @spec fetch_issues_with_label(String.t()) :: {:ok, [Issue.t()]} | {:error, term()}
+  def fetch_issues_with_label(label) when is_binary(label) do
+    config = Config.get()
+    # extract_labels/1 lower-cases issue labels; a mixed-case requested label would otherwise never match.
+    cond do
+      is_nil(config.linear_api_key) -> {:error, :missing_linear_api_token}
+      is_nil(config.linear_team_key) -> {:error, :missing_linear_team_key}
+      true -> do_paged_fetch(config, String.downcase(label), nil, [])
+    end
+  end
+
+  @spec graphql(String.t(), map()) :: {:ok, map()} | {:error, term()}
+  def graphql(query, variables \\ %{}) when is_binary(query) and is_map(variables) do
+    config = Config.get()
+
+    case config.linear_api_key do
+      nil ->
+        {:error, :missing_linear_api_token}
+
+      token ->
+        payload = %{"query" => query, "variables" => variables}
+
+        case Req.post(config.linear_endpoint,
+               headers: [{"Authorization", token}, {"Content-Type", "application/json"}],
+               json: payload,
+               connect_options: [timeout: 30_000]
+             ) do
+          {:ok, %{status: 200, body: body}} -> {:ok, body}
+          {:ok, %{status: status, body: body}} -> {:error, {:linear_status, status, body}}
+          {:error, reason} -> {:error, {:linear_request_failed, reason}}
+        end
+    end
+  end
+
+  defp do_paged_fetch(config, label, after_cursor, acc) do
+    variables = %{
+      teamKey: config.linear_team_key,
+      first: @issue_page_size,
+      after: after_cursor
+    }
+
+    with {:ok, body} <- graphql(@poll_query, variables) do
+      case body do
+        %{"data" => %{"issues" => %{"nodes" => nodes, "pageInfo" => page_info}}} ->
+          new_issues =
+            nodes
+            |> Enum.map(&normalize_issue/1)
+            |> Enum.reject(&is_nil/1)
+            |> Enum.filter(fn issue -> label in issue.labels end)
+
+          next_acc = acc ++ new_issues
+
+          case page_info do
+            %{"hasNextPage" => true, "endCursor" => cursor} when is_binary(cursor) ->
+              do_paged_fetch(config, label, cursor, next_acc)
+
+            _ ->
+              {:ok, next_acc}
+          end
+
+        %{"errors" => errors} ->
+          {:error, {:linear_graphql_errors, errors}}
+
+        _ ->
+          {:error, :linear_unknown_payload}
+      end
+    end
+  end
+
+  defp normalize_issue(%{"id" => id, "identifier" => identifier} = node) do
+    %Issue{
+      id: id,
+      identifier: identifier,
+      title: node["title"],
+      url: node["url"],
+      state: get_in(node, ["state", "name"]),
+      labels: extract_labels(node)
+    }
+  end
+
+  defp normalize_issue(_), do: nil
+
+  defp extract_labels(%{"labels" => %{"nodes" => nodes}}) when is_list(nodes) do
+    nodes
+    |> Enum.map(& &1["name"])
+    |> Enum.reject(&is_nil/1)
+    |> Enum.map(&String.downcase/1)
+  end
+
+  defp extract_labels(_), do: []
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/linear/issue.ex b/packages/symphony/elixir/lib/symphony_elixir/linear/issue.ex
new file mode 100644
index 000000000..a10a93c30
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/linear/issue.ex
@@ -0,0 +1,18 @@
+defmodule SymphonyElixir.Linear.Issue do
+  @moduledoc """
+  Minimal Linear issue representation used by the orchestrator.
+  Carries only what the trigger needs to enqueue and identify a run.
+  """
+
+  @enforce_keys [:id, :identifier, :labels]
+  defstruct [:id, :identifier, :title, :url, :state, :labels]
+
+  @type t :: %__MODULE__{
+          id: String.t(),
+          identifier: String.t(),
+          title: String.t() | nil,
+          url: String.t() | nil,
+          state: String.t() | nil,
+          labels: [String.t()]
+        }
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/log_file.ex b/packages/symphony/elixir/lib/symphony_elixir/log_file.ex
new file mode 100644
index 000000000..ca9f1f230
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/log_file.ex
@@ -0,0 +1,79 @@
+defmodule SymphonyElixir.LogFile do
+  @moduledoc """
+  Configures OTP's built-in rotating disk log handler for application logs.
+  """
+
+  require Logger
+
+  @handler_id :symphony_disk_log
+  @default_log_relative_path "log/symphony.log"
+  @default_max_bytes 10 * 1024 * 1024
+  @default_max_files 5
+
+  @doc "Default log file path under the current working directory."
+  @spec default_log_file() :: Path.t()
+  def default_log_file, do: default_log_file(File.cwd!())
+
+  @doc "Default log file path under the given `logs_root` directory."
+  @spec default_log_file(Path.t()) :: Path.t()
+  def default_log_file(logs_root) when is_binary(logs_root) do
+    Path.join([logs_root, @default_log_relative_path])
+  end
+
+  @spec configure() :: :ok
+  def configure do
+    # Resolve the cwd-based default lazily: File.cwd!/0 can raise and is not needed when :log_file is set.
+    log_file = Application.get_env(:symphony_elixir, :log_file) || default_log_file()
+    max_bytes = Application.get_env(:symphony_elixir, :log_file_max_bytes, @default_max_bytes)
+    max_files = Application.get_env(:symphony_elixir, :log_file_max_files, @default_max_files)
+    setup_disk_handler(log_file, max_bytes, max_files)
+  end
+
+  # Creates the log directory and (re)installs the rotating disk handler.
+  # Returns :ok even when the handler cannot be added; that is only logged.
+  defp setup_disk_handler(log_file, max_bytes, max_files) do
+    absolute_path = Path.expand(log_file)
+    :ok = absolute_path |> Path.dirname() |> File.mkdir_p()
+    :ok = remove_existing_handler()
+
+    handler_config = disk_log_handler_config(absolute_path, max_bytes, max_files)
+
+    # The :default console handler is intentionally left in place.
+    # Disk-log rotation under $SYMPHONY_LOGS_ROOT is good for long-term
+    # retention but writes a binary disk_log format that systemd cannot
+    # tail. Keeping the default handler means stdout still flows to
+    # journald, so `journalctl -u symphony.service` shows live log output
+    # and any unhandled crash from a LiveView / GenServer surfaces there.
+    # The two handlers are independent; logs land in both, including when
+    # the disk handler was added successfully.
+    case :logger.add_handler(@handler_id, :logger_disk_log_h, handler_config) do
+      {:error, reason} ->
+        Logger.warning("Failed to configure rotating log file handler: #{inspect(reason)}")
+        :ok
+
+      :ok ->
+        :ok
+    end
+  end
+
+  # Best-effort removal of a previously installed handler. A missing handler,
+  # or any other removal error, counts the same as success, so this always
+  # returns :ok.
+  defp remove_existing_handler do
+    _removal = :logger.remove_handler(@handler_id)
+    :ok
+  end
+
+  # Handler map for :logger_disk_log_h: a wrap log of at most `max_files`
+  # files of `max_bytes` each, one line per event, accepting every level.
+  defp disk_log_handler_config(path, max_bytes, max_files) do
+    wrap_log = %{
+      file: String.to_charlist(path),
+      type: :wrap,
+      max_no_bytes: max_bytes,
+      max_no_files: max_files
+    }
+
+    %{level: :all, formatter: {:logger_formatter, %{single_line: true}}, config: wrap_log}
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/path_safety.ex b/packages/symphony/elixir/lib/symphony_elixir/path_safety.ex
new file mode 100644
index 000000000..fca59887a
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/path_safety.ex
@@ -0,0 +1,50 @@
+defmodule SymphonyElixir.PathSafety do
+  @moduledoc false
+
+  # Symlink hops allowed per canonicalize/1 call; a cycle ends in :eloop.
+  @max_symlink_hops 40
+
+  # Expands `path` and resolves symlinks; a not-yet-existing suffix is kept.
+  @spec canonicalize(Path.t()) :: {:ok, Path.t()} | {:error, term()}
+  def canonicalize(path) when is_binary(path) do
+    expanded_path = Path.expand(path)
+    [root | segments] = Path.split(expanded_path)
+
+    case resolve_segments(root, segments, @max_symlink_hops) do
+      {:ok, canonical_path} ->
+        {:ok, canonical_path}
+
+      {:error, reason} ->
+        {:error, {:path_canonicalize_failed, expanded_path, reason}}
+    end
+  end
+
+  # `resolved` is the symlink-free prefix so far; `hops` is the link budget left.
+  defp resolve_segments(resolved, [], _hops), do: {:ok, resolved}
+
+  defp resolve_segments(resolved, [segment | rest], hops) do
+    candidate_path = Path.join(resolved, segment)
+
+    case File.lstat(candidate_path) do
+      {:ok, %File.Stat{type: :symlink}} when hops == 0 ->
+        {:error, :eloop}
+
+      {:ok, %File.Stat{type: :symlink}} ->
+        with {:ok, target} <- :file.read_link_all(String.to_charlist(candidate_path)) do
+          # A relative target resolves against the directory holding the link.
+          [target_root | target_segments] =
+            target |> IO.chardata_to_string() |> Path.expand(resolved) |> Path.split()
+          resolve_segments(target_root, target_segments ++ rest, hops - 1)
+        end
+
+      {:ok, _stat} ->
+        resolve_segments(candidate_path, rest, hops)
+
+      {:error, :enoent} ->
+        {:ok, Path.join([candidate_path | rest])}
+
+      {:error, reason} ->
+        {:error, reason}
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/prompt.ex b/packages/symphony/elixir/lib/symphony_elixir/prompt.ex
new file mode 100644
index 000000000..9f962a31a
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/prompt.ex
@@ -0,0 +1,178 @@
+defmodule SymphonyElixir.Prompt do
+  @moduledoc """
+  Render an agent node's prompt from its `prompt_ref` and the bindings the
+  interpreter resolved for it. This is the piece the engine client needs
+  to turn a `{:skill, name, bindings}` reference into the actual text an
+  engine runs.
+
+  Two prompt shapes flow out of the DSL (`SymphonyElixir.DSL.AST`):
+
+  - `{:inline, text}` is literal text, already interpolated at expand
+    time. `build/2` returns it verbatim.
+  - `{:skill, name, bindings}` names a markdown skill body under the
+    active pack. `build/2` loads the body through the injected resolver,
+    expands shared `{{partial:name}}` includes, and interpolates
+    `${binding}` and `${binding.path}` placeholders from `bindings`.
+
+  ## Why a resolver is injected
+
+  The body source (which pack, which directory, hot-reload vs a snapshot)
+  is owned by the catalog layer, not by prompt rendering. `build/2` takes
+  a `:resolver` function `name -> {:ok, body} | {:error, reason}` so this
+  module stays pack-agnostic and unit-testable without touching the
+  filesystem. `SymphonyElixir.Prompt.Skill` is the default resolver over a
+  pack's `skills/` directory.
+
+  ## Interpolation
+
+  A placeholder is `${path}` where `path` is a dotted key sequence into
+  the bindings map (`${ticket.id}` reads `bindings["ticket"]["id"]`). A
+  placeholder whose binding is missing is a render error rather than a
+  silently empty substitution, so a skill that references an input the
+  node never bound fails loudly. Literal `$` that is not a placeholder is
+  left untouched: only `${...}` is special.
+
+  Write `$${path}` to emit a literal `${path}` with no binding lookup.
+  Skill bodies routinely embed shell, Make, or JS-template snippets whose
+  own `${VAR}` would otherwise be read as a binding and fail the run; the
+  doubled `$$` is the escape that lets those survive. The escape consumes
+  one `$`, so `$${x}` renders `${x}`.
+  """
+
+  @typedoc "Resolver from a skill name to its raw markdown body."
+  @type resolver :: (String.t() -> {:ok, String.t()} | {:error, term()})
+
+  @typedoc "Bindings the interpreter resolved for the prompt (string keys, literal values)."
+  @type bindings :: %{optional(String.t()) => term()}
+
+  # Group 1 is an optional leading `$` that escapes the match to a literal
+  # `${...}`; group 2 is the binding path. Both forms match in one pass so
+  # an escaped `$${x}` cannot also match as the placeholder `${x}` at the
+  # next offset.
+  @placeholder ~r/(\$?)\$\{([A-Za-z0-9_.]+)\}/
+
+  @doc """
+  Turn a `prompt_ref` into prompt text. An `{:inline, text}` ref is returned
+  as-is; a `{:skill, name, bindings}` ref needs a `:resolver` in `opts` and
+  honors an optional `:partial_resolver` for `{{partial:name}}` includes.
+  """
+  @spec build(SymphonyElixir.IR.Node.prompt_ref(), keyword()) :: {:ok, String.t()} | {:error, term()}
+  def build(prompt_ref, opts \\ [])
+
+  def build({:inline, nil}, _opts), do: {:error, :unresolved_inline_prompt}
+  def build({:inline, literal}, _opts) when is_binary(literal), do: {:ok, literal}
+  def build(nil, _opts), do: {:error, :missing_prompt_ref}
+
+  def build({:skill, skill_name, bindings}, opts) when is_binary(skill_name) and is_map(bindings) do
+    with {:ok, load_body} <- fetch_resolver(opts),
+         {:ok, raw_body} <- load_body.(skill_name),
+         {:ok, with_partials} <- expand_partials(raw_body, opts) do
+      render(with_partials, bindings)
+    end
+  end
+
+  def build(invalid, _opts), do: {:error, {:invalid_prompt_ref, invalid}}
+
+  @doc """
+  Interpolate `${path}` placeholders in `body` from `bindings`. Pure: the core
+  of `build/2`, exposed so callers can render an already-loaded body and tests
+  can assert interpolation without a resolver. An unbound placeholder returns
+  `{:error, {:unbound_placeholder, path}}`; one bound to a value with no text
+  form (a map, a tuple) returns `{:error, {:unrenderable_binding, path}}`. An
+  escaped `$${path}` collapses to a literal `${path}` and is never looked up.
+  """
+  @spec render(String.t(), bindings()) :: {:ok, String.t()} | {:error, term()}
+  def render(body, bindings) when is_binary(body) and is_map(bindings) do
+    # Only the unescaped matches (empty group 1) are real placeholders, so
+    # an escaped `$${x}` neither needs a binding nor reports one missing.
+    paths = for ["", path] <- Regex.scan(@placeholder, body, capture: :all_but_first), do: path
+
+    with nil <- Enum.find(paths, &(resolve_binding(bindings, &1) == :missing)),
+         %{} = texts <- Enum.reduce_while(paths, %{}, &put_text(&1, &2, bindings)) do
+      rendered =
+        Regex.replace(@placeholder, body, fn
+          _full, "", path -> Map.fetch!(texts, path)
+          _full, _escape, path -> "${" <> path <> "}"
+        end)
+      {:ok, rendered}
+    else
+      {:error, _reason} = unrenderable -> unrenderable
+      path -> {:error, {:unbound_placeholder, path}}
+    end
+  end
+
+  # Converts one binding to text up front, so the replace callback cannot raise.
+  defp put_text(path, texts, bindings) do
+    {:cont, Map.put(texts, path, to_text(fetch_binding(bindings, path)))}
+  rescue
+    _error in [Protocol.UndefinedError, ArgumentError] -> {:halt, {:error, {:unrenderable_binding, path}}}
+  end
+
+  # The `:resolver` option must be an arity-1 function; anything else,
+  # including its absence, is reported as a missing resolver.
+  defp fetch_resolver(opts) do
+    resolver = Keyword.get(opts, :resolver)
+    if is_function(resolver, 1), do: {:ok, resolver}, else: {:error, :missing_skill_resolver}
+  end
+
+  # `{{partial:name}}` includes reuse the catalog's partial convention.
+  # A body without any partial token passes through untouched, resolver or
+  # not. A body that does reference a partial needs an arity-1
+  # `:partial_resolver`; without one the render fails, so a half-rendered
+  # prompt never reaches an engine.
+  @partial ~r/\{\{partial:([A-Za-z0-9_-]+)\}\}/
+
+  # Returns {:ok, body_with_partials} or an error naming what was missing.
+  defp expand_partials(body, opts) do
+    referenced = @partial |> Regex.scan(body, capture: :all_but_first) |> Enum.concat() |> Enum.uniq()
+    partial_resolver = Keyword.get(opts, :partial_resolver)
+
+    cond do
+      referenced == [] -> {:ok, body}
+      is_function(partial_resolver, 1) -> substitute_partials(body, referenced, partial_resolver)
+      true -> {:error, {:missing_partial_resolver, referenced}}
+    end
+  end
+
+  # Loads every referenced partial, then splices the bodies into `body`.
+  defp substitute_partials(body, names, resolver) do
+    with {:ok, partials} <- load_partials(names, resolver) do
+      {:ok, Regex.replace(@partial, body, fn _match, name -> Map.fetch!(partials, name) end)}
+    end
+  end
+
+  # Resolves each name in order into a name => body map; stops at the first failure.
+  defp load_partials(names, resolver) do
+    Enum.reduce_while(names, {:ok, %{}}, fn name, {:ok, loaded} ->
+      case resolver.(name) do
+        {:error, reason} -> {:halt, {:error, {:missing_partial, name, reason}}}
+        {:ok, body} when is_binary(body) -> {:cont, {:ok, Map.put(loaded, name, body)}}
+      end
+    end)
+  end
+
+  # Presence check for a dotted `path`: reports :missing or :present without
+  # handing the bound value back.
+  defp resolve_binding(bindings, path) do
+    looked_up = fetch_binding(bindings, path)
+    if looked_up == :missing, do: :missing, else: :present
+  end
+
+  # Walks the dotted `path` through nested maps; :missing when any key is absent.
+  defp fetch_binding(bindings, path) do
+    dig(bindings, String.split(path, "."))
+  end
+
+  # Follows `keys` one map level at a time. Running out of keys yields the
+  # value reached so far.
+  defp dig(value, []), do: value
+
+  defp dig(%{} = level, [key | deeper]) when is_map_key(level, key) do
+    dig(Map.fetch!(level, key), deeper)
+  end
+
+  # A non-map value or an absent key ends the walk.
+  defp dig(_value, _keys), do: :missing
+
+  # Binaries pass through untouched; everything else goes through to_string/1.
+  defp to_text(value), do: if(is_binary(value), do: value, else: to_string(value))
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/repository_catalog.ex b/packages/symphony/elixir/lib/symphony_elixir/repository_catalog.ex
new file mode 100644
index 000000000..7d9d8022c
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/repository_catalog.ex
@@ -0,0 +1,65 @@
+defmodule SymphonyElixir.RepositoryCatalog do
+  @moduledoc """
+  The repositories each Symphony skill workspace receives.
+
+  Repository membership lives in the selected workflow pack's
+  `repositories.yaml`. Every entry is cloned for each skill run, with writable
+  refs and a run-scoped branch, so agents can open PRs in any listed repository
+  when the skill asks them to.
+  """
+
+  alias SymphonyElixir.Config
+
+  defstruct [:name, :owner_repo, :default_branch, :primary?]
+
+  @type t :: %__MODULE__{
+          name: String.t(),
+          owner_repo: String.t(),
+          default_branch: String.t(),
+          primary?: boolean()
+        }
+
+  @doc "Every repository listed under `repositories` in the configured YAML file."
+  @spec all(Config.t()) :: [t()]
+  def all(%Config{} = config) do
+    entries = config.repositories_file |> read_yaml!() |> Map.fetch!("repositories")
+
+    for entry <- entries, do: repo_from_map!(entry)
+  end
+
+  @doc """
+  The single repository flagged primary; raises when there is none or more than one.
+  """
+  @spec primary(Config.t()) :: t()
+  def primary(%Config{} = config) do
+    case Enum.filter(all(config), & &1.primary?) do
+      [only] -> only
+      [] -> raise "RepositoryCatalog must define one primary repo"
+      [_, _ | _] -> raise "RepositoryCatalog must define exactly one primary repo"
+    end
+  end
+
+  # Builds one catalog entry; the three string fields are required and
+  # `primary` counts only when it is literally `true`.
+  defp repo_from_map!(%{} = entry) do
+    [name, owner_repo, default_branch] = Enum.map(~w(name owner_repo default_branch), &fetch_string!(entry, &1))
+    primary? = Map.get(entry, "primary", false) == true
+
+    %__MODULE__{name: name, owner_repo: owner_repo, default_branch: default_branch, primary?: primary?}
+  end
+
+  defp fetch_string!(map, key) do
+    value = Map.fetch!(map, key)
+    valid? = is_binary(value) and value != ""
+    if not valid?, do: raise("repositories.yaml field #{key} must be a non-empty string, got #{inspect(value)}")
+    value
+  end
+
+  defp read_yaml!(path) do
+    case YamlElixir.read_from_string(File.read!(path)) do
+      {:error, reason} -> raise "failed to read repositories.yaml: #{inspect(reason)}"
+      {:ok, %{} = decoded} -> decoded
+      {:ok, other} -> raise "repositories.yaml must decode to a map, got #{inspect(other)}"
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime.ex
new file mode 100644
index 000000000..201653bf5
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime.ex
@@ -0,0 +1,816 @@
+defmodule SymphonyElixir.Runtime do
+  @moduledoc """
+  One GenServer per active IR run. It schedules ready `IR.Node`s as
+  monitored BEAM tasks, commits each result into the durable `RunGraph`
+  through `IR.Store`, and resolves the run when every node is terminal.
+
+  It runs under `Runtime.Supervisor` in the live tree, resumes persisted
+  runs at boot, and backs the `/api/v1/ir/runs` operator surface. The
+  engine is injected (`Runtime.RoomEngineClient` in production), so tests
+  drive it against a fake `EngineClient` with no room-server.
+
+  ## Crash recovery (issue #90)
+
+  Two failure modes are handled, with the same conservative bias:
+
+  1. Executor crash. Every executor task is monitored. A `:DOWN` that
+     arrives without a prior `{:node_done, id, result, thread_id}` means
+     the task died mid-attempt. The runtime cannot assume it had no side
+     effect (an agent turn may have pushed a commit), so it marks the
+     attempt `:stranded` and routes the node by the non-idempotent retry
+     policy in `Runtime.Recovery`: auto-retry only when the node opted in
+     and showed no observed side effect, otherwise leave it `:stranded`
+     for human review.
+
+  2. BEAM restart. A node persisted `:running` is reconciled by
+     `Runtime.Recovery.reconcile/2` at boot (reattach via
+     `EngineClient.status/1`, else strand by policy), then the run resumes
+     from the recomputed ready set. The runtime calls `reconcile/2` from
+     `init/1`, before the first scheduling pass, when started with `recover: true`.
+
+  ## Deadlock guard
+
+  If a scheduling pass finds no ready nodes, no live tasks, and a
+  non-terminal run, the run cannot make progress and would otherwise hang
+  forever. The guard fails the run with `:deadlock` and a clear reason
+  rather than leaving it stuck. This is the safety net behind the
+  upstream-failed propagation: a graph whose only remaining nodes are
+  blocked resolves instead of stalling.
+
+  ## Operator hooks
+
+  `cancel/1`, `retry_node/2`, `rerun/1`, and `clear_failed/1` (each with an
+  optional `actor`) are the operator surface, as plain functions the HTTP layer
+  can call. They manipulate the graph and reschedule, whatever the transport.
+  """
+
+  use GenServer, restart: :transient
+  require Logger
+
+  alias SymphonyElixir.GithubApp
+  alias SymphonyElixir.IR.{Attempt, Graph, Materializer, Node, RunGraph}
+  alias SymphonyElixir.Runtime.{Events, ExecRunner, Placement, Recovery, SubrunRunner}
+
+  @registry SymphonyElixir.Runtime.Registry
+
+  @typedoc """
+  Runtime process state. `graph` is the live `RunGraph`; `tasks` maps a
+  monitor ref to the node id it is executing, so a `:DOWN` resolves to the
+  right node; `node_refs` is the reverse map for cancellation. `opts`
+  carries the injected `EngineClient` and `IR.Store` dir so tests isolate.
+  `subrun_depth` is how many subrun levels sit above this run (0 for a
+  top-level run); `subrun_ancestors` is the workflow-name chain open above
+  it. Both are threaded into a `:subrun` node's executor so a child run
+  guards against a cycle and an over-deep chain.
+  """
+  @type state :: %{
+          graph: RunGraph.t(),
+          tasks: %{reference() => String.t()},
+          node_refs: %{String.t() => reference()},
+          engine: module(),
+          store_opts: keyword(),
+          subrun_depth: non_neg_integer(),
+          subrun_ancestors: [String.t()],
+          placement: module(),
+          placement_acquired?: boolean()
+        }
+
+  @spec start_link(RunGraph.t(), keyword()) :: GenServer.on_start()
+  def start_link(%RunGraph{run_id: run_id} = graph, opts \\ []) do
+    GenServer.start_link(__MODULE__, {graph, opts}, name: via(run_id))
+  end
+
+  # Child spec for one run, keyed by its run id so several runs can sit under
+  # the same supervisor. The restart strategy is :transient, matching the
+  # `use GenServer` option above.
+  @spec child_spec({RunGraph.t(), keyword()}) :: Supervisor.child_spec()
+  def child_spec({%RunGraph{run_id: run_id} = graph, opts}) do
+    start_mfa = {__MODULE__, :start_link, [graph, opts]}
+
+    %{id: {__MODULE__, run_id}, start: start_mfa, restart: :transient, type: :worker}
+  end
+
+  defp via(run_id), do: {:via, Registry, {@registry, run_id}}
+
+  @doc "Read the current `RunGraph` snapshot by pid or run id. Used by tests and the operator surface."
+  @spec graph(pid() | String.t()) :: RunGraph.t()
+  def graph(pid) when is_pid(pid), do: GenServer.call(pid, :graph)
+  def graph(run_id) when is_binary(run_id), do: GenServer.call(via(run_id), :graph)
+
+  @typedoc "Who requested an operator action, recorded in the audit log."
+  @type actor :: term()
+
+  @doc """
+  Cancel the run: every non-terminal node is marked `:cancelled` and the run
+  stops. NOTE(review): the handler only demonitors in-flight tasks, it does not
+  kill them; confirm. `actor` goes to the audit log (default `:operator`).
+  """
+  @spec cancel(pid() | String.t(), actor()) :: :ok
+  def cancel(target, actor \\ :operator)
+  def cancel(pid, actor) when is_pid(pid), do: GenServer.call(pid, {:cancel, actor})
+  def cancel(run_id, actor) when is_binary(run_id), do: GenServer.call(via(run_id), {:cancel, actor})
+
+  @doc """
+  Retry a single node: it goes back to `:pending` and the run reschedules.
+  This is the operator's explicit override of the conservative auto-retry
+  default, so `__retry__` is not consulted; the operator vouches that the
+  retry is safe. `actor` is recorded in the audit log. An operator hook.
+  """
+  @spec retry_node(pid() | String.t(), String.t(), actor()) :: :ok
+  def retry_node(target, node_id, actor \\ :operator)
+  def retry_node(target, node_id, actor) when is_pid(target) or is_binary(target) do
+    server = if is_pid(target), do: target, else: via(target)
+    GenServer.call(server, {:retry_node, node_id, actor})
+  end
+
+  @doc """
+  Run the whole graph again from scratch: every node goes back to
+  `:pending` and the run reschedules, keeping the AST and expansion log.
+  `actor` is recorded in the audit log. An operator hook.
+  """
+  @spec rerun(pid() | String.t(), actor()) :: :ok
+  def rerun(target, actor \\ :operator)
+  def rerun(run_id, actor) when is_binary(run_id), do: run_id |> via() |> GenServer.call({:rerun, actor})
+  def rerun(pid, actor) when is_pid(pid), do: GenServer.call(pid, {:rerun, actor})
+
+  @doc """
+  Reset only the nodes that did not succeed: every `:failed`,
+  `:upstream_failed`, and `:stranded` node goes back to `:pending` and the
+  run reschedules, while succeeded nodes are left intact. Operators reach
+  for this after fixing the cause of a failure, instead of re-running the
+  whole graph. `actor` is recorded in the audit log. An operator hook.
+  """
+  @spec clear_failed(pid() | String.t(), actor()) :: :ok
+  def clear_failed(target, actor \\ :operator)
+  def clear_failed(run_id, actor) when is_binary(run_id), do: run_id |> via() |> GenServer.call({:clear_failed, actor})
+  def clear_failed(pid, actor) when is_pid(pid), do: GenServer.call(pid, {:clear_failed, actor})
+
+  @impl true
+  def init({%RunGraph{} = graph, opts}) do
+    state = %{
+      graph: graph,
+      tasks: %{},
+      node_refs: %{},
+      engine: Keyword.fetch!(opts, :engine),
+      store_opts: Keyword.get(opts, :store_opts, []),
+      subrun_depth: Keyword.get(opts, :subrun_depth, 0),
+      subrun_ancestors: Keyword.get(opts, :subrun_ancestors, []),
+      placement: Keyword.get(opts, :placement, Placement),
+      placement_acquired?: false
+    }
+
+    # A graph reloaded from disk may carry orphaned :running nodes. With
+    # `recover: true` they are reconciled here, inside init/1 and before the
+    # first scheduling pass (the BEAM-restart half of #90).
+    state =
+      if Keyword.get(opts, :recover, false) do
+        recovered = Recovery.reconcile(graph, fn thread_id -> state.engine.status(thread_id) end)
+        %{state | graph: recovered}
+      else
+        state
+      end
+
+    # Reconcile may have harvested outputs that resolve a gate, so re-expand
+    # before the first scheduling pass. Idempotent and a no-op for a graph
+    # with no AST, so it is safe on both the fresh-start and restart paths.
+    # An invalid dynamically-emitted envelope fails the run rather than
+    # crashing init, so a bad child surfaces as a failed run, not a
+    # supervisor restart loop.
+    case Materializer.expand_dynamic(state.graph) do
+      {:ok, expanded, _new_ids} ->
+        state = %{state | graph: expanded}
+        # Persist before the first scheduling pass so a producer that
+        # navigates to /ir/:run_id the moment start_run returns finds the
+        # run on disk, even while a slow placement acquire is still in
+        # flight. The run shows :running with :pending nodes; the broadcast
+        # also lands so the index row appears without a navigation.
+        persist(expanded, state)
+        {:ok, state, {:continue, :advance}}
+
+      {:error, reason} ->
+        {:ok, %{state | graph: fail_run(state.graph, reason, state.store_opts)}, {:continue, :advance}}
+    end
+  end
+
+  @impl true
+  def handle_continue(:advance, state), do: advance(state)
+
+  @impl true
+  def handle_call(:graph, _from, state), do: {:reply, state.graph, state}
+
+  @impl true
+  def handle_call({:cancel, actor}, _from, state) do
+    # Stop listening for task exits. This drops the monitors (and any queued
+    # :DOWN) but does not terminate the task processes themselves.
+    for {ref, _node_id} <- state.tasks, do: Process.demonitor(ref, [:flush])
+
+    # Terminal nodes keep their state; everything else becomes :cancelled.
+    live_ids = for {id, node} <- state.graph.nodes, not Node.terminal?(node), do: id
+    cancelled = Enum.reduce(live_ids, state.graph, &transition(&2, &1, :cancelled))
+    finished = RunGraph.append_audit(%{cancelled | status: :cancelled}, :cancel, nil, actor, %{})
+
+    persist(finished, state)
+    release_placement(state)
+
+    # Reply :ok and stop normally with an empty task table.
+    {:stop, :normal, :ok, %{state | graph: finished, tasks: %{}, node_refs: %{}}}
+  end
+
+  @impl true
+  def handle_call({:retry_node, node_id, actor}, _from, state) do
+    # Reopen the run like rerun/clear_failed do, so a retry issued against a
+    # failed run is not persisted as :failed while its node is running again.
+    graph =
+      %{Graph.reset_node(state.graph, node_id) | status: :running}
+      |> RunGraph.append_audit(:retry_node, node_id, actor, %{})
+    persist(graph, state)
+    advance_reply(%{state | graph: graph})
+  end
+
+  @impl true
+  def handle_call({:rerun, actor}, _from, state) do
+    # NOTE(review): in-flight tasks are not stopped before the reset; confirm.
+    graph =
+      state.graph.nodes
+      |> Map.keys()
+      |> Enum.reduce(state.graph, &Graph.reset_node(&2, &1))
+      |> Map.put(:status, :running)
+      |> RunGraph.append_audit(:rerun, nil, actor, %{})
+    persist(graph, state)
+    advance_reply(%{state | graph: graph})
+  end
+
+  @impl true
+  def handle_call({:clear_failed, actor}, _from, state) do
+    # Only failed-like nodes are reset; the audit entry lists which ones.
+    cleared_ids =
+      state.graph.nodes
+      |> Enum.filter(fn {_id, node} -> node.state in [:failed, :upstream_failed, :stranded] end)
+      |> Enum.map(fn {id, _node} -> id end)
+
+    reset = Enum.reduce(cleared_ids, state.graph, &Graph.reset_node(&2, &1))
+    graph = RunGraph.append_audit(%{reset | status: :running}, :clear_failed, nil, actor, %{cleared: cleared_ids})
+
+    persist(graph, state)
+    advance_reply(%{state | graph: graph})
+  end
+
+  @impl true
+  def handle_info({:node_done, node_id, result, thread_id}, state) do
+    state = drop_task_for(state, node_id)
+    # Record the attempt, apply the output, then re-expand: a success may have
+    # unlocked a gate or fan-out (expand_on_success/3 skips failed results).
+    graph =
+      state.graph
+      |> record_finished_attempt(node_id, result, thread_id)
+      |> Graph.apply_output(node_id, result)
+      |> expand_on_success(result, state.store_opts)
+
+    persist(graph, state)
+    advance(%{state | graph: graph})
+  end
+
+  @impl true
+  def handle_info({:DOWN, ref, :process, _pid, reason}, state) do
+    case Map.pop(state.tasks, ref) do
+      {nil, _tasks} ->
+        # A monitor we already flushed, or an unrelated process. Ignore.
+        {:noreply, state}
+
+      {node_id, remaining_tasks} ->
+        # The ref is still tracked, so the task died without reporting a
+        # result. (A clean finish removes the monitor before this arrives
+        # via `drop_task_for/2`.) Strand the attempt and route by the
+        # non-idempotent retry policy.
+        Logger.warning("Runtime #{state.graph.run_id} node #{node_id} task down: #{inspect(reason)}")
+        graph = strand_node(state.graph, node_id)
+        state = %{state | tasks: remaining_tasks, node_refs: Map.delete(state.node_refs, node_id)}
+        persist(graph, state)
+        advance(%{state | graph: graph})
+    end
+  end
+
+  # Re-expands the AST after a node finishes so a resolved gate or fan-out
+  # emits its children. Expansion is attempted only for an `{:ok, _}`
+  # result; any other result leaves the graph untouched, since a failure
+  # produces no output a gate can read. An expansion error (an invalid
+  # envelope on a dynamically-emitted child) fails the run.
+  defp expand_on_success(%RunGraph{} = graph, result, store_opts) do
+    expansion = if match?({:ok, _output}, result), do: Materializer.expand_dynamic(graph), else: :unchanged
+
+    case expansion do
+      :unchanged -> graph
+      {:ok, expanded, _new_ids} -> expanded
+      {:error, reason} -> fail_run(graph, reason, store_opts)
+    end
+  end
+
+  # Fails the run for a load-time error (an invalid envelope on a
+  # dynamically-emitted node). Every non-terminal node is moved to
+  # :upstream_failed so the run resolves instead of stalling on a child
+  # that can never be scheduled; the failed graph is persisted and returned.
+  defp fail_run(%RunGraph{} = graph, reason, store_opts) do
+    Logger.error("Runtime #{graph.run_id} expansion failed: #{inspect(reason)}")
+    blocked_ids = for {id, node} <- graph.nodes, not Node.terminal?(node), do: id
+
+    failed =
+      blocked_ids
+      |> Enum.reduce(graph, &transition(&2, &1, :upstream_failed))
+      |> Map.put(:status, :failed)
+
+    persist(failed, %{store_opts: store_opts})
+    failed
+  end
+
+  # --- scheduling -----------------------------------------------------
+
+  # Scheduling pass for callbacks that do not reply: a {:noreply, state}
+  # result passes through untouched, a {:stop, state} result becomes a
+  # normal stop.
+  defp advance(state) do
+    with {:stop, next} <- advance_step(state), do: {:stop, :normal, next}
+  end
+
+  # Scheduling pass for handle_call clauses: always replies :ok, and stops
+  # normally when the pass asked to stop.
+  defp advance_reply(state) do
+    {outcome, next} = advance_step(state)
+    if outcome == :stop, do: {:stop, :normal, :ok, next}, else: {:reply, :ok, next}
+  end
+
+  # One scheduling pass. Returns {:noreply, state} to keep the process alive
+  # or {:stop, state} to end it; advance/1 and advance_reply/1 wrap the
+  # result for their callback.
+  defp advance_step(state) do
+    if Graph.all_terminal?(state.graph) do
+      # A failed run stays alive and idle so the operator surface
+      # (clear_failed, retry_node, rerun) can reach a live process. A
+      # succeeded or cancelled run has nothing left to operate on, so it
+      # stops and frees the process. The supervisor can still resume a
+      # failed run from the store after a restart.
+      finished = finish(state)
+
+      case finished.graph.status do
+        :failed -> {:noreply, finished}
+        _other -> {:stop, finished}
+      end
+    else
+      schedule(state, Graph.ready_nodes(state.graph))
+    end
+  end
+
+  # Nothing is ready to start. Either wait for in-flight work, finish a run
+  # with no work left, or trip the deadlock guard.
+  defp schedule(%{tasks: tasks} = state, []) when map_size(tasks) > 0 do
+    # Work is in flight; wait for a :node_done or :DOWN to wake us.
+    {:noreply, state}
+  end
+
+  defp schedule(state, []) do
+    if no_nonterminal_nodes?(state.graph) do
+      # No ready nodes, no live tasks, and nothing non-terminal left. This
+      # is a completed run, not a deadlock: it covers a gate that resolved
+      # every body off (`when` falsy, `every n` that did not fire this
+      # tick) so the graph materialized to zero schedulable work.
+      # `Graph.all_terminal?/1` treats an empty node map as not-terminal so
+      # a run is never declared done before its first materialization; here
+      # the run is already :running, so an empty or all-terminal node set
+      # is a real no-op completion and goes through the normal finish path.
+      finished = finish(state)
+      if finished.graph.status == :failed, do: {:noreply, finished}, else: {:stop, finished}
+    else
+      # No ready nodes, no live tasks, but a non-terminal node remains: the
+      # remaining nodes are permanently blocked. Fail rather than hang.
+      # This is the #90 deadlock guard.
+      {:stop, deadlock(state)}
+    end
+  end
+
+  # At least one node is ready: start them all and wait for their results.
+  defp schedule(state, ready) do
+    {:noreply, Enum.reduce(ready, state, fn node, acc -> start_node(acc, node) end)}
+  end
+
+  # True when no node in the graph is still non-terminal. An empty node map
+  # (a fully-gated-off materialization) counts as true: there is no work
+  # left, so the run completes as a no-op rather than deadlocking.
+  defp no_nonterminal_nodes?(%RunGraph{nodes: nodes}) do
+    Enum.all?(nodes, fn {_id, node} -> Node.terminal?(node) end)
+  end
+
+  defp start_node(state, %Node{} = node) do
+    attempt_n = length(node.attempts) + 1
+    # Mark and persist the attempt as running before provisioning, so the
+    # node is observable during a slow placement acquire. The turn task is
+    # spawned only after placement resolves (it reads the per-run base_url).
+    running_graph = mark_running(state.graph, node, attempt_n)
+    persist(running_graph, state)
+    state = ensure_placement(%{state | graph: running_graph}, node)
+    engine = state.engine
+    owner = self()
+    attempt_opts = run_opts(state, node, attempt_n)
+
+    # Fire-and-forget the task, then monitor the spawned pid. The task
+    # reports its result through an explicit `{:node_done, ...}` message;
+    # the monitor's `:DOWN` is the crash signal. Owning the monitor ref
+    # ourselves (rather than `async_nolink`) keeps the `:DOWN` the only
+    # task-lifecycle message the GenServer ever sees, so a clean exit and a
+    # crash are told apart purely by whether `:node_done` arrived first.
+    {:ok, pid} =
+      Task.Supervisor.start_child(SymphonyElixir.TaskSupervisor, fn ->
+        case run_attempt(node, engine, attempt_opts) do
+          {tag, payload, thread_id} when tag in [:ok, :error] ->
+            send(owner, {:node_done, node.id, {tag, payload}, thread_id})
+        end
+      end)
+
+    ref = Process.monitor(pid)
+
+    # Track the task in both directions: ref => node id for :DOWN, and
+    # node id => ref for the reverse lookup.
+    %{
+      state
+      | tasks: Map.put(state.tasks, ref, node.id),
+        node_refs: Map.put(state.node_refs, node.id, ref)
+    }
+  end
+
+  # Build the per-attempt context map an executor receives. `run_id` and
+  # `attempt` are always present; the node kind decides what else rides
+  # along.
+  #
+  # A `:subrun` node launches a child run from inside its task, where it
+  # must guard recursion and select its workflow, so it also gets the
+  # engine, the store opts, its place in the subrun depth/ancestor chain,
+  # and its inputs resolved against upstream outputs.
+  defp run_opts(state, %Node{kind: :subrun} = node, attempt_n) do
+    common = %{run_id: state.graph.run_id, attempt: attempt_n}
+
+    Map.merge(common, %{
+      engine: state.engine,
+      store_opts: state.store_opts,
+      subrun_depth: state.subrun_depth,
+      subrun_ancestors: state.subrun_ancestors,
+      resolved_inputs: resolve_inputs(state.graph, node)
+    })
+  end
+
+  # An `:agent` node gets the placement module so `Engine.Client` can
+  # resolve an `:ixvm` envelope to the run's own provisioned room-server by
+  # `run_id`; `ensure_placement/2` has already run by the time a node is
+  # scheduled, so the registry entry exists for an `:ixvm`/`:host` location.
+  #
+  # The turn runs from the run's primary-repo checkout, so `:cwd` is read
+  # back from the resolved placement (`:host` and `:ixvm` clone to different
+  # roots). With no acquired placement (`:local`/`:room`) there is no
+  # checkout to name and `:cwd` is left out; the engine client then fails
+  # loudly with `:missing_cwd` instead of running in an unknown directory.
+  defp run_opts(state, %Node{kind: :agent}, attempt_n) do
+    run_id = state.graph.run_id
+
+    opts = %{
+      run_id: run_id,
+      attempt: attempt_n,
+      placement: state.placement,
+      trigger: state.graph.trigger
+    }
+
+    cwd_lookup = state.placement.workspace_cwd(run_id, placement_opts(state))
+
+    case cwd_lookup do
+      {:ok, cwd} -> Map.put(opts, :cwd, cwd)
+      :error -> opts
+    end
+  end
+
+  # Every other kind needs only the run id and the attempt number.
+  defp run_opts(state, %Node{}, attempt_n) do
+    run_id = state.graph.run_id
+    %{run_id: run_id, attempt: attempt_n}
+  end
+
+  # Make sure the run has its own room-server before the first agent turn
+  # that needs one (`:ixvm` or `{:host, _}`). Acquisition is run-scoped: the
+  # first such agent node provisions and flips `placement_acquired?`, every
+  # later node short-circuits on that flag and reuses the same server.
+  # `:local` and `{:room, _}` resolve to a fixed URL in the client, so they
+  # fall through to the no-op clause. The `ixvm -> host` fallback (target
+  # from `Config.placement_fallback`) lives inside `Placement.acquire`; when
+  # that fallback lands on `:local` it answers
+  # `{:error, {:no_placement_needed, :local}}`, which is a resolved outcome
+  # (the client uses the default URL) and not an acquire failure. Teardown
+  # at run end releases whatever was acquired.
+  defp ensure_placement(%{placement_acquired?: true} = state, _node), do: state
+
+  defp ensure_placement(state, %Node{kind: :agent, envelope: %{location: location}})
+       when location == :ixvm or (is_tuple(location) and elem(location, 0) == :host) do
+    run_id = state.graph.run_id
+    outcome = state.placement.acquire(run_id, location, acquire_opts(state))
+
+    case outcome do
+      {:ok, _base_url} ->
+        stamped = stamp_placement(state.graph, state.placement, location)
+        %{state | graph: stamped, placement_acquired?: true}
+
+      # Fallback picked `:local`: there is no per-run server and the turn
+      # resolves to the default URL. Still flagged as acquired so later
+      # agent nodes do not try again.
+      {:error, {:no_placement_needed, :local}} ->
+        local_graph = %{state.graph | placement: %{declared: location, effective: :local}}
+        %{state | graph: local_graph, placement_acquired?: true}
+
+      {:error, reason} ->
+        # Setup and any configured fallback both failed. Log it and let the
+        # engine turn fail against the missing placement; flagging it as
+        # acquired stops a per-node retry from re-provisioning what just
+        # failed.
+        Logger.warning("Runtime #{state.graph.run_id} placement acquire failed: #{inspect(reason)}")
+        %{state | placement_acquired?: true}
+    end
+  end
+
+  defp ensure_placement(state, _node), do: state
+
+  # Record on the graph both the declared location and the effective one
+  # reported by the placement registry (which reflects any ixvm -> host
+  # fallback), so the read view can show "ixvm (fallback host)" without
+  # querying ETS on every read. A missing registry entry stamps `nil`.
+  defp stamp_placement(%RunGraph{} = graph, placement_mod, declared) do
+    resolved = placement_mod.resolved(graph.run_id)
+
+    effective =
+      case resolved do
+        :error -> nil
+        {:ok, %{location: location}} -> location
+      end
+
+    stamp = %{declared: declared, effective: effective}
+    %{graph | placement: stamp}
+  end
+
+  # Placement options ride inside `store_opts`; an empty list when unset.
+  defp placement_opts(state) do
+    Keyword.get(state.store_opts, :placement_opts, [])
+  end
+
+  # Options for `Placement.acquire`. Acquiring clones the run's repos and
+  # boots the room-server the agent turn runs against. With a GitHub App
+  # configured, a freshly minted installation token is added as `:bot_token`
+  # so the clone auth header and the room-server `GITHUB_TOKEN`/`GH_TOKEN`
+  # author agent PRs under the App's bot identity. Without it the placement
+  # falls back to the static host `config.github_token`, and `gh pr create`
+  # authors PRs as that human account (ENG-2012,
+  # indexable-inc/symphony#242). A `:bot_token` already present in
+  # `placement_opts` (tests) wins and is left untouched.
+  defp acquire_opts(state) do
+    opts = placement_opts(state)
+
+    with false <- Keyword.has_key?(opts, :bot_token),
+         {:ok, token} <- bot_token() do
+      Keyword.put(opts, :bot_token, token)
+    else
+      true -> opts
+      :none -> opts
+    end
+  end
+
+  # Best-effort, mirroring `Runtime.ExecRunner`: a missing or unconfigured
+  # GitHub App (dev laptops, tests) yields no token and the placement keeps
+  # the inherited env rather than crashing the run.
+  #
+  # Returns `{:ok, token}` or `:none`. Both failure channels are covered:
+  # `rescue` handles raised exceptions, `catch :exit` handles exits. The
+  # latter matters if `GithubApp` is process-backed (not visible from here):
+  # a call to a missing or timed-out process exits rather than raises, and
+  # `rescue` alone would let that exit take the runtime down.
+  defp bot_token do
+    if GithubApp.configured?() do
+      case GithubApp.installation_token() do
+        {:ok, token} ->
+          {:ok, token}
+
+        {:error, reason} ->
+          Logger.warning("Runtime: GitHub App token mint failed (#{inspect(reason)}); agent placement uses the static host token")
+          :none
+      end
+    else
+      :none
+    end
+  rescue
+    error ->
+      Logger.warning("Runtime: bot identity unavailable (#{inspect(error)}); agent placement uses the static host token")
+      :none
+  catch
+    :exit, reason ->
+      Logger.warning("Runtime: bot identity unavailable (exit: #{inspect(reason)}); agent placement uses the static host token")
+      :none
+  end
+
+  # Turn a node's declared inputs into a `name => value` map using the
+  # outputs of its already-succeeded dependencies. `{:literal, v}` is the
+  # value itself; `{:node, id, path}` reads the dependency's output at
+  # `path`. A subrun node is only scheduled after every dep succeeded, so
+  # node refs normally all resolve; one that does not is left out of the
+  # map rather than guessed.
+  defp resolve_inputs(%RunGraph{nodes: nodes}, %Node{inputs: inputs}) do
+    inputs
+    |> Enum.flat_map(fn {name, ref} ->
+      case resolve_input_ref(ref, nodes) do
+        {:ok, value} -> [{name, value}]
+        :skip -> []
+      end
+    end)
+    |> Map.new()
+  end
+
+  # Resolve one input ref to `{:ok, value}` or `:skip`. A literal always
+  # resolves; a node ref resolves only when the referenced node exists and
+  # has succeeded; any other ref shape is skipped.
+  defp resolve_input_ref({:literal, literal}, _nodes) do
+    {:ok, literal}
+  end
+
+  defp resolve_input_ref({:node, id, path}, nodes) do
+    case Map.get(nodes, id) do
+      %Node{state: :succeeded, output: output} -> {:ok, dig(output, path)}
+      _missing_or_unfinished -> :skip
+    end
+  end
+
+  defp resolve_input_ref(_other, _nodes) do
+    :skip
+  end
+
+  # Walk `path` (a list of keys) into nested maps and return what is found
+  # there, or nil as soon as the current value is not a map. Each key is
+  # tried as given and then in its string form, so an atom path also reads
+  # string-keyed output.
+  defp dig(value, []), do: value
+
+  defp dig(value, [key | rest]) when is_map(value) do
+    # Fall back to the string key only when the first lookup yields nil.
+    # Using `||` here would also fall back on `false` and hand downstream
+    # nodes nil for an output that was explicitly `false`.
+    found =
+      case Map.get(value, key) do
+        nil -> Map.get(value, to_string(key))
+        present -> present
+      end
+
+    dig(found, rest)
+  end
+
+  defp dig(_value, _path), do: nil
+
+  # --- graph transitions ----------------------------------------------
+
+  # Append a freshly started attempt to the node, flip the node to
+  # `:running`, and store it back on the graph with refreshed timestamps.
+  defp mark_running(%RunGraph{} = graph, %Node{} = node, attempt_n) do
+    engine = attempt_engine(node)
+    history = node.attempts ++ [Attempt.start(attempt_n, engine)]
+    running = %{node | state: :running, attempts: history, updated_at: DateTime.utc_now()}
+    nodes = Map.put(graph.nodes, node.id, running)
+    %{graph | nodes: nodes, updated_at: DateTime.utc_now()}
+  end
+
+  # Write the outcome of a finished attempt onto its node. A node with no
+  # recorded attempt gets a seeded one that is started and finished in one
+  # go; otherwise the highest-numbered attempt is closed. An unknown node id
+  # leaves the graph untouched.
+  defp record_finished_attempt(%RunGraph{} = graph, node_id, result, thread_id) do
+    case Map.fetch(graph.nodes, node_id) do
+      :error ->
+        graph
+
+      {:ok, %Node{attempts: []} = node} ->
+        seeded = Attempt.start(attempt_n_seed(), attempt_engine(node), thread_id)
+        closed = Attempt.finish(seeded, attempt_state_for(result), outcome_for(result), cost_for(result))
+        put_node(graph, %{node | attempts: [closed]})
+
+      {:ok, node} ->
+        history = finish_current_attempt(node.attempts, result, thread_id)
+        put_node(graph, %{node | attempts: history})
+    end
+  end
+
+  # Close the highest-numbered attempt with the result's state, outcome and
+  # cost, stamp `thread_id` on it, and return the attempt list with that
+  # entry swapped in.
+  defp finish_current_attempt(attempts, result, thread_id) do
+    latest = Enum.max_by(attempts, fn attempt -> attempt.n end)
+
+    closed =
+      latest
+      |> Attempt.finish(attempt_state_for(result), outcome_for(result), cost_for(result))
+      |> Map.replace!(:thread_id, thread_id)
+
+    for attempt <- attempts do
+      if attempt.n == latest.n, do: closed, else: attempt
+    end
+  end
+
+  # Record a stranded attempt on the node, then either queue it for another
+  # try or park it as `:stranded`. An unknown node id leaves the graph
+  # untouched.
+  defp strand_node(%RunGraph{} = graph, node_id) do
+    case Map.fetch(graph.nodes, node_id) do
+      :error ->
+        graph
+
+      {:ok, node} ->
+        stranded = mark_attempt_stranded(graph, node)
+        refreshed = stranded.nodes[node_id]
+
+        # `:retrying` is schedulable (`Graph.ready_nodes/1` picks it up on
+        # the next pass). The attempt history, stranded attempt included,
+        # stays on the node so the retry budget and audit trail survive.
+        next_state = if Recovery.auto_retryable?(refreshed), do: :retrying, else: :stranded
+        transition(stranded, node_id, next_state)
+    end
+  end
+
+  # Mark the node's current attempt as stranded. A node with no attempts
+  # gets a first attempt that is opened and immediately closed as stranded;
+  # otherwise the highest-numbered attempt is the one closed.
+  defp mark_attempt_stranded(%RunGraph{} = graph, %Node{attempts: []} = node) do
+    opened = Attempt.start(1, attempt_engine(node))
+    closed = Attempt.finish(opened, :stranded, :stranded)
+    put_node(graph, %{node | attempts: [closed]})
+  end
+
+  defp mark_attempt_stranded(%RunGraph{} = graph, %Node{attempts: attempts} = node) do
+    latest = Enum.max_by(attempts, fn attempt -> attempt.n end)
+    closed = Attempt.finish(latest, :stranded, :stranded)
+
+    history =
+      for attempt <- attempts do
+        if attempt.n == latest.n, do: closed, else: attempt
+      end
+
+    put_node(graph, %{node | attempts: history})
+  end
+
+  # Set a node's state and store it back on the graph; an unknown node id
+  # is a no-op.
+  defp transition(%RunGraph{} = graph, node_id, state) do
+    if Map.has_key?(graph.nodes, node_id) do
+      node = Map.fetch!(graph.nodes, node_id)
+      put_node(graph, %{node | state: state})
+    else
+      graph
+    end
+  end
+
+  # Store `node` on the graph under its id, refreshing `updated_at` on both
+  # the node and the graph.
+  defp put_node(%RunGraph{} = graph, %Node{} = node) do
+    stamped = %{node | updated_at: DateTime.utc_now()}
+    nodes = Map.put(graph.nodes, stamped.id, stamped)
+    %{graph | nodes: nodes, updated_at: DateTime.utc_now()}
+  end
+
+  # Forget the task tracked for `node_id`: drop its monitor (flushing any
+  # `:DOWN` already queued) and remove it from both lookup maps. A node with
+  # no tracked task leaves the state as is.
+  defp drop_task_for(state, node_id) do
+    case Map.fetch(state.node_refs, node_id) do
+      :error ->
+        state
+
+      {:ok, ref} ->
+        Process.demonitor(ref, [:flush])
+        remaining_tasks = Map.delete(state.tasks, ref)
+        remaining_refs = Map.delete(state.node_refs, node_id)
+        %{state | tasks: remaining_tasks, node_refs: remaining_refs}
+    end
+  end
+
+  # --- run resolution -------------------------------------------------
+
+  # Resolve the run: take the terminal status from `Graph.finished_status/1`,
+  # persist the graph with it, log and notify, and release the placement
+  # unless the run failed. Returns the state carrying the resolved graph.
+  defp finish(state) do
+    status = Graph.finished_status(state.graph)
+    graph = %{state.graph | status: status}
+    # Persist before notifying so the durable record lands first.
+    persist(graph, state)
+    Logger.info("Runtime #{graph.run_id} finished with status=#{status}")
+    notify_finished(graph)
+    finished = %{state | graph: graph}
+
+    # A succeeded run is done and its process stops, so release the per-run
+    # room-server now. A failed run stays alive for the operator surface
+    # (clear_failed/retry/rerun may schedule more agent turns against the
+    # same placement), so keep it until the run truly ends through cancel
+    # or a later success.
+    unless status == :failed, do: release_placement(finished)
+    finished
+  end
+
+  # Fail a run that can make no further progress: log it, persist the graph
+  # as `:failed`, send the terminal notification, and release the placement.
+  # Returns the state carrying the failed graph.
+  defp deadlock(state) do
+    run_id = state.graph.run_id
+    Logger.error("Runtime #{run_id} deadlocked: no ready nodes, no live tasks, run not terminal")
+
+    failed_graph = %{state.graph | status: :failed}
+    persist(failed_graph, state)
+    notify_finished(failed_graph)
+
+    failed_state = %{state | graph: failed_graph}
+    release_placement(failed_state)
+    failed_state
+  end
+
+  # Send the terminal Slack summary from a supervised task instead of the
+  # runtime process, so a slow Slack round-trip cannot stall run resolution.
+  # Best-effort: the notifier swallows its own failures and the
+  # channel/token may be unset. Always returns `:ok`.
+  defp notify_finished(%RunGraph{} = graph) do
+    summarize = fn -> SymphonyElixir.IR.RunNotifier.notify_finished(graph) end
+    _started = Task.Supervisor.start_child(SymphonyElixir.TaskSupervisor, summarize)
+    :ok
+  end
+
+  # Release the run's per-run room-server if one was acquired. Run-scoped
+  # and idempotent: a `:local`/`:room` run never acquired a placement, so
+  # the call is a no-op for it. An exception raised during teardown (a slow
+  # `ix rm`, an unreachable VM) is logged and swallowed so it cannot keep
+  # the run from resolving. The module comes from state, which is how a
+  # test injects a fake. Always returns `:ok`.
+  defp release_placement(%{placement: placement_mod, graph: %RunGraph{} = graph}) do
+    _released = placement_mod.release(graph.run_id)
+    :ok
+  rescue
+    failure ->
+      Logger.warning("Runtime #{graph.run_id} placement release failed: #{inspect(failure)}")
+      :ok
+  end
+
+  defp release_placement(_state), do: :ok
+
+  # Persist then announce. The store write is the durable record; the
+  # PubSub broadcast is the live notification the dashboard subscribes to,
+  # so the operator sees a transition without polling. Announcing only
+  # after a successful persist keeps a subscriber's refresh-from-store path
+  # consistent with the event. Neither a failed persist nor a failed
+  # broadcast blocks the run: both are logged and the call returns `:ok`.
+  defp persist(%RunGraph{} = graph, state) do
+    case SymphonyElixir.IR.Store.persist(graph, state.store_opts) do
+      :ok ->
+        broadcast_best_effort(graph)
+
+      {:error, reason} ->
+        Logger.warning("Runtime #{graph.run_id} persist failed: #{inspect(reason)}")
+        :ok
+    end
+  end
+
+  # Announce a persisted graph without letting the announcement take the
+  # runtime down. An exception raised while building or delivering the event
+  # (for example when the PubSub server is not running) is logged and
+  # dropped: the durable state already landed, and a subscriber can still
+  # refresh from the store.
+  defp broadcast_best_effort(%RunGraph{} = graph) do
+    Events.broadcast(graph)
+    :ok
+  rescue
+    error ->
+      Logger.warning("Runtime #{graph.run_id} broadcast failed: #{inspect(error)}")
+      :ok
+  end
+
+  # --- helpers --------------------------------------------------------
+
+  # Attempt number given to an attempt seeded for a node that reports a
+  # result with no attempt on record.
+  defp attempt_n_seed do
+    1
+  end
+
+  # Run one attempt, dispatching on the node kind. `:agent` is the only
+  # engine turn and goes through the injected engine client; `:exec` runs a
+  # pack script locally; `:subrun` launches a nested run through
+  # `SubrunRunner`, which maps its terminal state back to one result triple.
+  # Placeholder kinds never get here because `Graph.ready_nodes/1` leaves
+  # them out.
+  defp run_attempt(%Node{kind: :agent} = node, engine, run_opts) do
+    engine.run_node(node, run_opts)
+  end
+
+  defp run_attempt(%Node{kind: :exec} = node, _engine, run_opts) do
+    ExecRunner.run(node, run_opts)
+  end
+
+  defp run_attempt(%Node{kind: :subrun} = node, _engine, run_opts) do
+    SubrunRunner.run(node, run_opts)
+  end
+
+  # What an attempt records as its executor. An agent attempt carries its
+  # envelope's engine (`:codex` or `:claude`); exec and subrun attempts
+  # carry their own kind, so the run record stays honest about a node that
+  # never touched an engine. Anything else is recorded as `:codex`.
+  defp attempt_engine(%Node{kind: :agent, envelope: %{engine: engine}})
+       when engine == :codex or engine == :claude do
+    engine
+  end
+
+  defp attempt_engine(%Node{kind: :exec}) do
+    :exec
+  end
+
+  defp attempt_engine(%Node{kind: :subrun}) do
+    :subrun
+  end
+
+  defp attempt_engine(_other) do
+    :codex
+  end
+
+  # Attempt state implied by a result: success or failure.
+  defp attempt_state_for({:ok, _output}) do
+    :succeeded
+  end
+
+  defp attempt_state_for({:error, _reason}) do
+    :failed
+  end
+
+  # Outcome recorded on the attempt: `:ok`, or the error tuple unchanged.
+  defp outcome_for({:ok, _output}) do
+    :ok
+  end
+
+  defp outcome_for({:error, _reason} = failure) do
+    failure
+  end
+
+  # Per-turn cost, when the result carries one. It rides on a successful
+  # result's output map under `:cost` (the engine client lowers the
+  # room-server `usage` totals to the `Attempt.cost` shape there). Anything
+  # else is nil: a failure carries only the error reason on the synchronous
+  # path, and an exec/subrun output has no map-valued `:cost`.
+  defp cost_for({:ok, %{cost: cost}}) when is_map(cost), do: cost
+  defp cost_for(_result), do: nil
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/engine_client.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/engine_client.ex
new file mode 100644
index 000000000..b2574322e
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/engine_client.ex
@@ -0,0 +1,61 @@
+defmodule SymphonyElixir.Runtime.EngineClient do
+  @moduledoc """
+  The seam between the IR runtime and the engine host. The runtime never
+  speaks to the room-server directly: it schedules a node by calling
+  `run_node/2` through this behaviour, which a later workstream (WS-4)
+  implements against the room-server `/api/agent/*` routes. This
+  workstream depends only on the behaviour, so its tests use an in-process
+  fake and never need a running room-server.
+
+  Two callbacks, matching the two questions the runtime asks:
+
+  - `run_node/2` executes one attempt of a node and returns its terminal
+    result. It runs inside a monitored BEAM `Task`; if it raises or the
+    BEAM dies, the runtime treats the missing result as a strand (see
+    issue #90), so an implementation must return a value rather than
+    leaning on the caller to interpret a crash.
+  - `status/1` is the restart reattach probe. Given an attempt's
+    `thread_id`, it reports whether the engine turn is still alive,
+    already finished, or unknown. Recovery uses it to decide whether a
+    node found `:running` after a BEAM restart can be harvested or must be
+    stranded.
+
+  The node itself is the first argument of `run_node/2`. The `run_opts`
+  map carries the rest of the runtime's per-attempt context: the run id
+  and the attempt number are always present, and further keys are
+  optional. Together they give an implementation what it needs without
+  reaching back into runtime state.
+  """
+
+  alias SymphonyElixir.IR.Node
+
+  @typedoc "Per-attempt context handed to `run_node/2`."
+  @type run_opts :: %{
+          required(:run_id) => String.t(),
+          required(:attempt) => pos_integer(),
+          optional(atom()) => term()
+        }
+
+  @typedoc """
+  Result of one attempt. `{:ok, output}` succeeds the node; `{:error,
+  reason}` fails it. `thread_id` is the engine handle the attempt opened,
+  carried so the runtime can record it on the `Attempt` for a later
+  reattach probe even when the attempt then fails.
+  """
+  @type result ::
+          {:ok, output :: term(), thread_id :: String.t() | nil}
+          | {:error, reason :: term(), thread_id :: String.t() | nil}
+
+  @typedoc """
+  Liveness of a previously-started engine turn. `:running` means the turn
+  is still in flight and may be reattached; `{:finished, result}` means
+  the engine already has a terminal result to harvest; `:unknown` means
+  the engine cannot account for the thread (the conservative case, which
+  recovery treats as a strand).
+  """
+  @type turn_status ::
+          :running
+          | {:finished, {:ok, term()} | {:error, term()}}
+          | :unknown
+
+  @doc "Execute one attempt of the node and return its terminal result triple."
+  @callback run_node(Node.t(), run_opts()) :: result()
+
+  @doc "Report the liveness of the engine turn behind `thread_id` (which may be nil)."
+  @callback status(thread_id :: String.t() | nil) :: turn_status()
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/events.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/events.ex
new file mode 100644
index 000000000..f98f01f57
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/events.ex
@@ -0,0 +1,62 @@
+defmodule SymphonyElixir.Runtime.Events do
+  @moduledoc """
+  Single owner of IR-run PubSub: the topic names, the message shape, and
+  the subscribe helpers all live here.
+
+  `Runtime` calls `broadcast/1` after each persisted transition, which is
+  what lets the operator dashboard (`IRRunsLive`) update without polling.
+  The payload is an `IR.View.summary/1` map (string-keyed, JSON-able): an
+  index row can be refreshed from the event alone, while the detail view
+  re-reads `IR.Store` when the open run changes.
+
+  There are two topics, one per dashboard granularity:
+
+  - `"ir_runs"`, the index fan-out. Every run transition is published here
+    so the index page can refresh its table.
+  - `"ir_run:<run_id>"`, the per-run topic. A detail page subscribes only to
+    the run it is showing and ignores the rest of the fleet.
+
+  Both deliver the same `{:ir_run_event, run_id, summary}` message, so a
+  subscriber matches one shape whichever topic it arrived on.
+  """
+
+  alias SymphonyElixir.IR.{RunGraph, View}
+
+  @pubsub SymphonyElixir.PubSub
+  @index_topic "ir_runs"
+  @run_topic_prefix "ir_run:"
+
+  @typedoc "The PubSub message every IR-run topic delivers."
+  @type event :: {:ir_run_event, run_id :: String.t(), summary :: map()}
+
+  @doc "Name of the index topic that every run transition is published to."
+  @spec index_topic() :: String.t()
+  def index_topic do
+    @index_topic
+  end
+
+  @doc "Name of the per-run topic for `run_id`, the one a detail page subscribes to."
+  @spec run_topic(String.t()) :: String.t()
+  def run_topic(run_id) when is_binary(run_id) do
+    @run_topic_prefix <> run_id
+  end
+
+  @doc "Subscribe the calling process to the index topic."
+  @spec subscribe_index() :: :ok | {:error, term()}
+  def subscribe_index do
+    Phoenix.PubSub.subscribe(@pubsub, @index_topic)
+  end
+
+  @doc "Subscribe the calling process to the topic of a single run."
+  @spec subscribe_run(String.t()) :: :ok | {:error, term()}
+  def subscribe_run(run_id) when is_binary(run_id) do
+    Phoenix.PubSub.subscribe(@pubsub, run_topic(run_id))
+  end
+
+  @doc """
+  Publish a run transition on the index topic and then on the run's own
+  topic. The payload is the run's `IR.View.summary/1`, so a subscriber can
+  refresh from the event without a store read. Persistence is not handled
+  here: the caller has already written the graph before announcing it.
+  """
+  @spec broadcast(RunGraph.t()) :: :ok
+  def broadcast(%RunGraph{} = graph) do
+    run_id = graph.run_id
+    event = {:ir_run_event, run_id, View.summary(graph)}
+
+    Phoenix.PubSub.broadcast(@pubsub, index_topic(), event)
+    Phoenix.PubSub.broadcast(@pubsub, run_topic(run_id), event)
+
+    :ok
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/exec_runner.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/exec_runner.ex
new file mode 100644
index 000000000..6d5ebf8da
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/exec_runner.ex
@@ -0,0 +1,192 @@
+defmodule SymphonyElixir.Runtime.ExecRunner do
+  @moduledoc """
+  Executor for `:exec` IR nodes: one pack shell script, run in the pack
+  directory. It lives outside the engine path because an exec node is not
+  an engine turn.
+
+  The node carries its script path and optional timeout as literal inputs
+  (`inputs["script"]`, `inputs["timeout"]`), set by the interpreter from
+  `exec "<path>" [timeout <seconds>]`. The path is resolved relative to
+  the active pack directory so a pack references its own scripts without
+  carrying absolute deployment paths.
+
+  The return shape matches `Runtime.EngineClient.run_node/2`
+  (`{:ok, output, thread_id}` / `{:error, reason, thread_id}`) so the
+  runtime treats every node kind through one result path; an exec has no
+  engine thread, so `thread_id` is always `nil`.
+
+  Bot identity: when a GitHub App is configured, a fresh installation
+  token is injected as `GH_TOKEN` so `gh`/`git` inside the script author
+  as the bot. A missing or unconfigured `GithubApp`/`Config` is not fatal:
+  the script still runs with the inherited environment. This mirrors the
+  conservative stance of the pre-overhaul exec path.
+  """
+
+  require Logger
+
+  alias SymphonyElixir.{Config, GithubApp}
+  alias SymphonyElixir.IR.Node
+
+  # Keep the last 64 KB of combined stdout/stderr on the result: enough to
+  # fingerprint a failure, small enough to keep the run file cheap.
+  @output_tail_bytes 64 * 1024
+  @default_timeout_seconds 300
+
+  @type result :: {:ok, map(), nil} | {:error, term(), nil}
+
+  @doc """
+  Run the script named by an `:exec` node and wait for it to finish.
+
+  Returns `{:ok, %{kind: :exec, exit_code: 0, output: tail}, nil}` on exit
+  status 0. Errors are `{:error, reason, nil}` with `reason` one of
+  `:missing_exec_script`, `{:exec_not_found, path}`,
+  `{:exec_not_executable, path}`, `{:exec_failed, status, tail}`, or
+  `{:exec_timeout, seconds, tail}`. `tail` is at most the last 64 KB of
+  combined stdout/stderr.
+
+  `run_opts` may carry `:pack_dir` (falls back to `Config.get().pack_dir`)
+  and `:run_id` (used only in log lines).
+  """
+  @spec run(Node.t(), map()) :: result()
+  def run(%Node{kind: :exec, inputs: inputs, id: node_id}, run_opts) when is_map(run_opts) do
+    with {:ok, rel_path} <- fetch_script(inputs),
+         pack_dir = pack_dir(run_opts),
+         absolute = Path.expand(rel_path, pack_dir),
+         :ok <- check_exists(absolute, rel_path),
+         :ok <- check_executable(absolute, rel_path) do
+      run_id = Map.get(run_opts, :run_id)
+      timeout_seconds = fetch_timeout(inputs)
+      Logger.info("ExecRunner run=#{run_id} node=#{node_id} cmd=#{rel_path} timeout=#{timeout_seconds}s")
+
+      port =
+        Port.open({:spawn_executable, absolute}, [
+          :exit_status,
+          :binary,
+          :stderr_to_stdout,
+          {:cd, pack_dir},
+          {:env, exec_env_with_bot_identity()}
+        ])
+
+      # One absolute deadline on the monotonic clock, so the time spent
+      # handling output chunks counts against the timeout.
+      deadline = System.monotonic_time(:millisecond) + timeout_seconds * 1_000
+      collect(port, [], 0, deadline, run_id, node_id, timeout_seconds)
+    else
+      {:error, reason} -> {:error, reason, nil}
+    end
+  end
+
+  # The script path must be a non-empty literal string input.
+  defp fetch_script(inputs) do
+    case Map.get(inputs, "script") do
+      {:literal, path} when is_binary(path) and path != "" -> {:ok, path}
+      _ -> {:error, :missing_exec_script}
+    end
+  end
+
+  # An exec timeout is optional in the surface; default to a finite bound
+  # so a runaway script eventually fails the run rather than hanging.
+  defp fetch_timeout(inputs) do
+    case Map.get(inputs, "timeout") do
+      {:literal, n} when is_integer(n) and n > 0 -> n
+      _ -> @default_timeout_seconds
+    end
+  end
+
+  # An explicit `:pack_dir` in `run_opts` wins over the configured one.
+  defp pack_dir(run_opts) do
+    case Map.get(run_opts, :pack_dir) do
+      dir when is_binary(dir) and dir != "" -> dir
+      _ -> Config.get().pack_dir
+    end
+  end
+
+  defp check_exists(absolute, rel_path) do
+    if File.exists?(absolute), do: :ok, else: {:error, {:exec_not_found, rel_path}}
+  end
+
+  # POSIX execute bit on owner/group/other. Surfacing a clear error beats
+  # letting Port.open crash with EACCES.
+  defp check_executable(absolute, rel_path) do
+    case File.stat(absolute) do
+      {:ok, %File.Stat{mode: mode}} ->
+        if Bitwise.band(mode, 0o111) != 0, do: :ok, else: {:error, {:exec_not_executable, rel_path}}
+
+      _ ->
+        {:error, {:exec_not_executable, rel_path}}
+    end
+  end
+
+  # Receive loop over the port's messages until the script exits or the
+  # deadline passes. `acc`/`acc_bytes` hold the output tail kept so far.
+  defp collect(port, acc, acc_bytes, deadline, run_id, node_id, timeout_seconds) do
+    remaining = max(deadline - System.monotonic_time(:millisecond), 0)
+
+    receive do
+      {^port, {:data, chunk}} when is_binary(chunk) ->
+        Logger.info("[exec #{run_id}/#{node_id}] " <> String.trim_trailing(chunk))
+        {next_acc, next_bytes} = append_with_tail(acc, acc_bytes, chunk)
+        collect(port, next_acc, next_bytes, deadline, run_id, node_id, timeout_seconds)
+
+      {^port, {:exit_status, 0}} ->
+        {:ok, %{kind: :exec, exit_code: 0, output: IO.iodata_to_binary(acc)}, nil}
+
+      {^port, {:exit_status, status}} ->
+        {:error, {:exec_failed, status, IO.iodata_to_binary(acc)}, nil}
+    after
+      remaining ->
+        kill_and_close(port, run_id, node_id, timeout_seconds)
+        {:error, {:exec_timeout, timeout_seconds, IO.iodata_to_binary(acc)}, nil}
+    end
+  end
+
+  # :spawn_executable does not die on Port.close, so kill the OS process
+  # explicitly, then close the port and drain whatever it already delivered
+  # so the caller's mailbox stays clean.
+  defp kill_and_close(port, run_id, node_id, timeout_seconds) do
+    case Port.info(port, :os_pid) do
+      {:os_pid, os_pid} ->
+        Logger.warning("ExecRunner timeout run=#{run_id} node=#{node_id} after #{timeout_seconds}s; killing pid=#{os_pid}")
+        System.cmd("kill", ["-KILL", Integer.to_string(os_pid)], stderr_to_stdout: true)
+
+      _ ->
+        :ok
+    end
+
+    close_port(port)
+    drain(port)
+  end
+
+  # The port closes itself once the OS process is gone, which can happen
+  # between the timeout firing and this call (the script exits on its own,
+  # or the kill above lands first). `Port.close/1` raises ArgumentError on
+  # an already-closed port; that is the desired end state, not a failure,
+  # and must not turn a timeout result into a crashed task.
+  defp close_port(port) do
+    Port.close(port)
+    :ok
+  rescue
+    ArgumentError -> :ok
+  end
+
+  # Discard every message from this port that is already queued.
+  defp drain(port) do
+    receive do
+      {^port, _message} -> drain(port)
+    after
+      0 -> :ok
+    end
+  end
+
+  # iodata accumulator with a byte budget: keep the tail, drop the head.
+  defp append_with_tail(acc, acc_bytes, chunk) do
+    chunk_size = byte_size(chunk)
+    combined = acc_bytes + chunk_size
+
+    cond do
+      combined <= @output_tail_bytes ->
+        {[acc, chunk], combined}
+
+      chunk_size >= @output_tail_bytes ->
+        {binary_part(chunk, chunk_size - @output_tail_bytes, @output_tail_bytes), @output_tail_bytes}
+
+      true ->
+        joined = IO.iodata_to_binary([acc, chunk])
+        drop = byte_size(joined) - @output_tail_bytes
+        {binary_part(joined, drop, @output_tail_bytes), @output_tail_bytes}
+    end
+  end
+
+  # Inherit the BEAM env (PATH for gh/jq/git, secrets from the unit's
+  # EnvironmentFile), then append a fresh GitHub App token as GH_TOKEN when
+  # one is configured. gh prefers GH_TOKEN over GITHUB_TOKEN, so appending
+  # is enough; the inherited PAT need not be scrubbed.
+  defp exec_env_with_bot_identity do
+    base = inherited_env()
+
+    case bot_token() do
+      {:ok, token} -> base ++ [{~c"GH_TOKEN", String.to_charlist(token)}]
+      :none -> base
+    end
+  end
+
+  # The port `:env` option takes charlist pairs, not binaries.
+  defp inherited_env do
+    System.get_env()
+    |> Enum.map(fn {k, v} -> {String.to_charlist(k), String.to_charlist(v)} end)
+  end
+
+  # Best-effort: a missing Config/GithubApp process (tests, dev) yields no
+  # token rather than crashing the script run. A call to a missing or
+  # timed-out process exits instead of raising, so exits are caught as well
+  # as exceptions; `rescue` alone would not cover that case.
+  defp bot_token do
+    if GithubApp.configured?() do
+      case GithubApp.installation_token() do
+        {:ok, token} ->
+          {:ok, token}
+
+        {:error, reason} ->
+          Logger.warning("ExecRunner: GitHub App token mint failed (#{inspect(reason)}); script runs with inherited env only")
+          :none
+      end
+    else
+      :none
+    end
+  rescue
+    error ->
+      Logger.warning("ExecRunner: bot identity unavailable (#{inspect(error)}); script runs with inherited env only")
+      :none
+  catch
+    :exit, reason ->
+      Logger.warning("ExecRunner: bot identity unavailable (exit: #{inspect(reason)}); script runs with inherited env only")
+      :none
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/host_runtime.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/host_runtime.ex
new file mode 100644
index 000000000..6a05589d3
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/host_runtime.ex
@@ -0,0 +1,328 @@
+defmodule SymphonyElixir.Runtime.HostRuntime do
+  @moduledoc """
+  Spawns and tears down a per-run room-server on *this* host.
+
+  The mechanics of a host placement - clone a run-scoped workspace, start a
+  privilege-dropped `systemd-run` unit bound to `room_host:port`, health-poll
+  it, and clean it up on teardown - live here as one implementation, used two
+  ways:
+
+    * in-process by `Runtime.Placement` for a local `:host` placement, where
+      the room-server binds loopback (`room_host` = `"127.0.0.1"`); and
+    * inside a `Runtime.WorkerClient` that provisions on its own host on behalf
+      of a remote control plane, where the room-server binds the worker's
+      reachable address (`room_host` = the worker's advertised host) so the
+      control plane can reach it over the engine wire.
+
+  It owns no registry. The caller records the returned `handle`: the control
+  plane in its ETS table and on `room.ix.dev`, the worker in its channel reply.
+  The low-level host ops go through the same injectable driver seam as
+  `Runtime.Placement` (`host_passwd`, `systemd_run`, `systemctl_stop`,
+  `pick_port`, `wait_for_room`, ...), so tests exercise the lifecycle without
+  `systemd-run`. The unit names share the `symphony-host-` prefix the polkit
+  grant in `modules/services/symphony` scopes to.
+  """
+
+  alias SymphonyElixir.{Command, Config}
+  alias SymphonyElixir.Codex.Provision
+
+  require Logger
+
+  @default_setup_timeout_ms 10 * 60 * 1000
+  @default_start_timeout_ms 30 * 1000
+  @default_stop_timeout_ms 60 * 1000
+  @default_health_timeout_ms 60 * 1000
+
+  # The active per-run room units, by bare unit name. Matches only the
+  # "symphony-host-<hash>.service" room units, not the "-setup"/"-clean" sync
+  # units (those are oneshot and gone).
+  @host_room_unit ~r/^symphony-host-[0-9a-f]+\.service$/
+
+  @typedoc """
+  A provisioned host room-server: the `base_url` the engine wire targets, the
+  `systemd-run` `unit`, the dropped-to `user`/`home`, and the `run_root` to
+  remove on teardown.
+  """
+  @type handle :: %{
+          base_url: String.t(),
+          unit: String.t(),
+          user: String.t(),
+          home: String.t(),
+          run_root: String.t(),
+          primary_workspace: String.t()
+        }
+
+  @typedoc """
+  The subset of a provisioned handle `teardown/2` consumes: the `unit` to stop
+  and the `user`/`home`/`run_root` to reap. An open map so both a full
+  `handle()` (WorkerClient) and the smaller record `Runtime.Placement`
+  reconstructs (no `primary_workspace`) satisfy the contract.
+  """
+  @type teardown_handle :: %{
+          :unit => String.t(),
+          :user => String.t(),
+          :home => String.t(),
+          :run_root => String.t(),
+          optional(any()) => any()
+        }
+
+  @doc """
+  Provision the run's room-server on this host bound to `room_host`
+  (`opts[:room_host]`, default `"127.0.0.1"`). Returns `{:ok, handle}` or a
+  bare `{:error, reason}`; the caller wraps the reason in its own contract
+  (`Placement` as `{:host_setup_failed, reason}`).
+  """
+  @spec provision(String.t(), keyword()) :: {:ok, handle()} | {:error, term()}
+  def provision(run_id, opts \\ []) when is_binary(run_id) and is_list(opts) do
+    cfg = config(opts)
+    drv = driver(opts)
+    bind_host = room_host(opts)
+
+    # An identity failure leaves this outer `with` as a bare
+    # `{:error, reason}`: nothing has been started at that point, so there
+    # is nothing to stop.
+    with {:ok, user} <- host_user(cfg),
+         {:ok, home} <- host_home(cfg, drv, user) do
+      run_root = Provision.host_run_root(cfg, home, run_id)
+      state_dir = Provision.host_room_state_dir(home, run_id)
+      unit_base = Provision.host_unit_base(run_id, "room")
+      unit = unit_base <> ".service"
+      port = drv.pick_port.()
+      url = "http://#{bind_host}:#{port}"
+
+      Logger.info("HostRuntime: creating unit=#{unit} url=#{url} user=#{user} run=#{run_id}")
+
+      # Setup and start both need the same resolved identity (config, driver
+      # seam, dropped-to user, that user's home); bundling it into one map
+      # keeps each helper under the credo arity ceiling.
+      host = %{config: cfg, driver: drv, user: user, home: home}
+
+      # The room-server unit is started only after the workspace setup unit
+      # returned `:ok`; whichever step fails first short-circuits into the
+      # `else` below.
+      with :ok <- setup_workspace(host, run_root, state_dir, unit_base, run_id, opts),
+           :ok <- start_room_server(host, bind_host, state_dir, unit, port, url, opts) do
+        Logger.info("HostRuntime: ready unit=#{unit} url=#{url} run=#{run_id}")
+
+        repositories = Keyword.get(opts, :repositories)
+        primary_workspace = Provision.host_primary_workspace(cfg, run_root, run_id, repositories)
+        handle = %{base_url: url, unit: unit, user: user, home: home, run_root: run_root}
+
+        {:ok, Map.put(handle, :primary_workspace, primary_workspace)}
+      else
+        {:error, reason} ->
+          # Either step may be the one that failed, so the unit is stopped
+          # unconditionally: a failed provision must not leave a room-server
+          # bound to the port.
+          drv.systemctl_stop.(unit)
+          {:error, reason}
+      end
+    end
+  end
+
+  @doc """
+  Tear down a previously provisioned `handle`: stop the unit and remove its
+  checkout. A no-op-safe `keep?` (default `config.host_keep?`) leaves the unit
+  up for inspection. Idempotent.
+  """
+  @spec teardown(teardown_handle(), keyword()) :: :ok
+  def teardown(%{} = handle, opts \\ []) when is_list(opts) do
+    cfg = config(opts)
+    drv = driver(opts)
+
+    # An explicit `opts[:keep?]` wins over the configured `host_keep?`.
+    case Keyword.get(opts, :keep?, cfg.host_keep?) do
+      keep when keep in [nil, false] ->
+        drv.systemctl_stop.(handle.unit)
+
+        # `cleanup_workspace/3` takes the placement-record field names.
+        placement = %{host_unit: handle.unit, host_user: handle.user, host_home: handle.home, host_run_root: handle.run_root}
+        cleanup_workspace(cfg, drv, placement)
+
+      _keep ->
+        Logger.info("HostRuntime: keeping unit=#{handle.unit} for inspection")
+    end
+
+    :ok
+  end
+
+  @doc """
+  Remove a run's checkout via a `systemd-run` cleanup unit under the same
+  `symphony-host-` prefix the polkit grant authorizes. Used by teardown and by
+  reconcile's reaping path.
+  """
+  @spec cleanup_workspace(Config.t(), map(), %{
+          host_unit: String.t(),
+          host_user: String.t(),
+          host_home: String.t(),
+          host_run_root: String.t()
+        }) :: :ok
+  def cleanup_workspace(%Config{} = config, driver, placement) do
+    # The cleanup unit reuses the room unit's base name with a "-clean" suffix.
+    clean_unit = String.replace_suffix(placement.host_unit, ".service", "") <> "-clean.service"
+
+    # The removal script is handed to bash via `-lc` inside the cleanup unit.
+    command = [bash_executable(), "-lc", Provision.host_cleanup_script(placement.host_run_root)]
+    args = Provision.host_run_sync_args(config, placement.host_user, placement.host_home, clean_unit, [], command)
+
+    # Best-effort: a failed cleanup is logged, never surfaced to the caller.
+    case driver.systemd_run.(config, args, @default_stop_timeout_ms) do
+      :ok ->
+        :ok
+
+      {:error, reason} ->
+        Logger.warning("HostRuntime: cleanup failed unit=#{clean_unit}: #{inspect(reason)}")
+    end
+
+    :ok
+  end
+
+  @doc "The configured host user, or `{:error, :host_user_not_configured}`."
+  @spec host_user(Config.t()) :: {:ok, String.t()} | {:error, term()}
+  def host_user(%Config{host_user: <<_::8, _::binary>> = user}), do: {:ok, user}
+  def host_user(%Config{}), do: {:error, :host_user_not_configured}
+
+  @doc "Resolve the target user's home from `getent passwd` via the driver."
+  @spec host_home(Config.t(), map(), String.t()) :: {:ok, Path.t()} | {:error, term()}
+  def host_home(%Config{} = config, driver, user) do
+    case driver.host_passwd.(config, user) do
+      {:error, why} -> {:error, {:host_user_lookup_failed, user, why}}
+      {:ok, passwd_output} -> Provision.parse_passwd_home(passwd_output, user)
+    end
+  end
+
+  @doc """
+  The default host portion of the placement driver: the real `systemd-run`,
+  `getent`, `systemctl`, room-health, and free-port implementations. Merged
+  into `Runtime.Placement`'s driver and used as this module's default.
+  """
+  @spec default_driver() :: map()
+  def default_driver do
+    Map.new(
+      pick_port: &real_pick_port/0,
+      wait_for_room: &Provision.wait_for_room/2,
+      host_passwd: &real_host_passwd/2,
+      systemd_run: &real_systemd_run/3,
+      systemctl_stop: &real_systemctl_stop/1,
+      systemctl_list_host_units: &real_systemctl_list_host_units/0,
+      systemctl_show_exec_start: &real_systemctl_show_exec_start/1
+    )
+  end
+
+  # --- internals ------------------------------------------------------
+
+  defp setup_workspace(%{config: config, driver: driver, user: user, home: home}, run_root, state_dir, base, run_id, opts) do
+    # An explicit per-call `opts[:bot_token]` takes precedence over the configured token.
+    github_token = Keyword.get(opts, :bot_token) || config.github_token
+    script = Provision.host_workspace_script(config, run_root, state_dir, run_id, github_token, Keyword.get(opts, :repositories))
+    sync_args = Provision.host_run_sync_args(config, user, home, base <> "-setup.service", [], [bash_executable(), "-lc", script])
+    driver.systemd_run.(config, sync_args, @default_setup_timeout_ms)
+  end
+
+  defp start_room_server(%{config: config, driver: driver, user: user, home: home}, bind_host, state_dir, unit, port, url, opts) do
+    # A remote worker holds no secrets itself: the control plane sends the
+    # run's env already resolved, so an explicit `opts[:env]` takes the place
+    # of the local `Provision.runtime_env` resolution.
+    env = Keyword.get(opts, :env) || Provision.runtime_env(config, opts)
+    command = Provision.host_room_server_command(config, bind_host, port, state_dir)
+    unit_args = Provision.host_run_unit_args(config, user, home, unit, env, command)
+
+    # Start the unit, then health-poll `url` only if the start succeeded. A
+    # failure at either step is reported as `:room_start_failed`; any other
+    # result shape is not handled by the `case` below.
+    started = driver.systemd_run.(config, unit_args, @default_start_timeout_ms)
+    outcome = if started == :ok, do: driver.wait_for_room.(url, @default_health_timeout_ms), else: started
+
+    case outcome do
+      :ok -> :ok
+      {:error, reason} -> {:error, {:room_start_failed, reason}}
+    end
+  end
+
+  defp room_host(opts), do: Keyword.get(opts, :room_host, "127.0.0.1")
+
+  defp config(opts), do: Keyword.get_lazy(opts, :config, &Config.get/0)
+
+  defp driver(opts), do: Map.merge(default_driver(), Keyword.get(opts, :driver, %{}))
+
+  # --- host driver ----------------------------------------------------
+
+  defp real_host_passwd(%Config{}, user) do
+    case Command.run(getent_executable(), ["passwd", user], 5_000) do
+      {:error, why} -> {:error, why}
+      {:ok, passwd_output} -> {:ok, passwd_output}
+    end
+  end
+
+  defp real_systemd_run(%Config{} = config, args, timeout_ms) do
+    case Command.run(systemd_run_executable(config), args, timeout_ms) do
+      {:error, {:start_failed, why}} -> {:error, {:systemd_run_error, Provision.sanitize_setenv_args(args), why}}
+      {:error, {:timeout, ms, out}} -> {:error, {:systemd_run_timeout, Provision.sanitize_setenv_args(args), ms, String.trim(out)}}
+      {:error, {:exit, code, out}} -> {:error, {:systemd_run_failed, Provision.sanitize_setenv_args(args), code, String.trim(out)}}
+      {:ok, _stdout} -> :ok
+    end
+  end
+
+  defp real_systemctl_stop(nil), do: :ok
+
+  defp real_systemctl_stop(unit) when is_binary(unit) do
+    case Command.run(systemctl_executable(), ["stop", unit], @default_stop_timeout_ms) do
+      {:error, why} -> Logger.warning("HostRuntime: failed to stop unit=#{unit}: #{inspect(why)}")
+      {:ok, _stdout} -> Logger.info("HostRuntime: stopped unit=#{unit}")
+    end
+
+    :ok
+  end
+
+  defp real_systemctl_list_host_units do
+    list_args = ["list-units", "--type=service", "--all", "--plain", "--no-legend", "symphony-host-*.service"]
+
+    case Command.run(systemctl_executable(), list_args, @default_stop_timeout_ms) do
+      {:error, why} ->
+        Logger.warning("HostRuntime: failed to list host units: #{inspect(why)}")
+        []
+
+      {:ok, listing} ->
+        listing
+        |> String.split("\n", trim: true)
+        |> Enum.flat_map(&(&1 |> String.trim() |> String.split(~r/\s+/, trim: true) |> Enum.take(1)))
+        |> Enum.filter(&Regex.match?(@host_room_unit, &1))
+    end
+  end
+
+  defp real_systemctl_show_exec_start(unit) when is_binary(unit) do
+    case Command.run(systemctl_executable(), ["show", unit, "--property=ExecStart", "--value"], @default_stop_timeout_ms) do
+      {:error, why} -> {:error, why}
+      {:ok, raw_exec_start} -> {:ok, String.trim(raw_exec_start)}
+    end
+  end
+
+  # Ask the OS for a free port by listening on port 0 (loopback), read the
+  # assigned number, and close the probe again. Between that close and the
+  # unit's own bind there is a small TOCTOU race; acceptable because the port
+  # space is large and one run provisions one server.
+  defp real_pick_port do
+    {:ok, probe} = :gen_tcp.listen(0, [:binary, ip: {127, 0, 0, 1}, reuseaddr: true])
+    {:ok, assigned} = :inet.port(probe)
+    :gen_tcp.close(probe)
+    assigned
+  end
+
+  defp systemd_run_executable(%Config{host_systemd_run_command: command}) do
+    System.find_executable(command) || command
+  end
+
+  defp systemctl_executable do
+    System.find_executable("systemctl") || "systemctl"
+  end
+
+  defp getent_executable do
+    System.find_executable("getent") || "getent"
+  end
+
+  # Resolve bash to an absolute path: a transient unit's default PATH does not
+  # include the Nix store, so a bare "bash" would fail to exec on NixOS.
+  defp bash_executable do
+    System.find_executable("bash") || "bash"
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/ingress.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/ingress.ex
new file mode 100644
index 000000000..69c6697a3
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/ingress.ex
@@ -0,0 +1,135 @@
+defmodule SymphonyElixir.Runtime.Ingress do
+  @moduledoc """
+  The single door that turns a workflow plus a trigger event into a live IR
+  run. A producer (cron, a webhook, the enqueue UI) resolves an event to a
+  `WorkflowCatalog` entry, then calls here.
+
+  `start_workflow/3` materializes the workflow's AST into a `RunGraph`
+  (validating envelopes at load), stamps the trigger event onto the graph
+  so a node can read it as `<input>` context, and starts the run under
+  `Runtime.Supervisor`. The source hash recorded on the run is the
+  catalog's hash of the `.sym` bytes, so editing the pack never perturbs a
+  run already in flight.
+
+  The engine and store options pass straight through to the supervisor, so
+  a test injects a fake engine and an isolated store dir the same way the
+  runtime tests do.
+  """
+
+  alias SymphonyElixir.IR.{Materializer, RunGraph, Store}
+  alias SymphonyElixir.Runtime
+  alias SymphonyElixir.Runtime.Trigger
+  alias SymphonyElixir.WorkflowCatalog
+
+  @typedoc "A started run: its generated id and the supervised runtime pid."
+  @type started :: %{run_id: String.t(), pid: pid()}
+
+  @doc """
+  Materialize a catalog entry and start it. `trigger_context` is the event
+  payload (`nil` for an operator-started run); `opts` forwards `:engine`,
+  `:store_opts`, and an optional `:run_id` to the supervisor.
+  """
+  @spec start_workflow(WorkflowCatalog.entry(), map() | nil, keyword()) :: {:ok, started()} | {:error, term()}
+  def start_workflow(entry, trigger_context \\ nil, opts \\ [])
+
+  def start_workflow(%{ast: ast, hash: hash} = entry, trigger_context, opts) do
+    # `:run_id` is consumed here (generated when absent); every other option
+    # is forwarded to the supervisor untouched.
+    {run_id, supervisor_opts} = Keyword.pop_lazy(opts, :run_id, fn -> generate_run_id(entry) end)
+
+    # A materialize failure falls out of the `with` as-is.
+    with {:ok, graph} <- Materializer.materialize(run_id, hash, ast) do
+      case Runtime.Supervisor.start_run(%{graph | trigger: trigger_context}, supervisor_opts) do
+        {:error, _reason} = failure -> failure
+        {:ok, pid} -> {:ok, %{run_id: run_id, pid: pid}}
+      end
+    end
+  end
+
+  @doc """
+  Resolve every `.sym` workflow that declared interest in this trigger
+  event and start one IR run per match, carrying the event as the run's
+  trigger context.
+
+  This is the one ingress door for every event-driven producer (cron, the
+  webhooks, the Slack poller, the HTTP API). The producer owns event
+  extraction, signature verification, and dedup; this owns resolution and
+  start. Candidates come from `WorkflowCatalog.for_trigger_kind/1` (the
+  cheap kind filter) and are narrowed by the shared `Runtime.Trigger`
+  matcher, so the selector vocabulary lives in one module rather than
+  re-implemented per producer.
+
+  Returns `{:ok, [started()]}` with one entry per started run (an empty
+  list when no workflow matched, which is not an error: an event with no
+  interested workflow is a no-op). Returns `{:error, {:partial, started,
+  failures}}` if any matched workflow failed to start, after starting the
+  ones that could, so a single bad workflow does not silence the rest.
+
+  `opts` forwards `:engine` and `:store_opts` to the supervisor; in
+  production both default (the room-server client and the configured runs
+  dir), so a producer calls `start_by_trigger(event)` with no opts.
+  """
+  @spec start_by_trigger(map(), keyword()) :: {:ok, [started()]} | {:error, term()}
+  def start_by_trigger(%{kind: kind} = event, opts \\ []) when is_atom(kind) do
+    interested = Enum.filter(WorkflowCatalog.for_trigger_kind(kind), &Trigger.matches?(&1.trigger, event))
+    outcomes =
+      Enum.map(interested, fn entry ->
+        case start_workflow(entry, event, opts) do
+          {:ok, run} -> {:started, run}
+          {:error, reason} -> {:failed, {entry.name, reason}}
+        end
+      end)
+
+    case {Keyword.get_values(outcomes, :started), Keyword.get_values(outcomes, :failed)} do
+      {started, []} -> {:ok, started}
+      {started, failures} -> {:error, {:partial, started, failures}}
+    end
+  end
+
+  @doc "Resolve a workflow by catalog name, then start it. Convenience for the manual/enqueue path."
+  @spec start_by_name(String.t(), map() | nil, keyword()) :: {:ok, started()} | {:error, term()}
+  def start_by_name(name, trigger_context \\ nil, opts \\ []) when is_binary(name) do
+    case WorkflowCatalog.workflow(name) do
+      {:error, :not_found} -> {:error, {:workflow_not_found, name}}
+      {:ok, catalog_entry} -> start_workflow(catalog_entry, trigger_context, opts)
+    end
+  end
+
+  @doc """
+  Has any IR run already been started for `trigger` events that satisfy
+  `match_fun`? The dedup read every event-driven producer shares.
+
+  A producer keeps its own field-level predicate (a GitHub run dedups on
+  `repo`/`pr_number`, a Slack huddle on `message_ts`), and this owns the
+  one shared capability: where the run history lives. Runs are
+  `RunGraph`s, so the history is `IR.Store`. `match_fun` receives
+  `{status, trigger}` for every persisted IR run, so a caller can scope to
+  active runs (`status in [:pending, :running]`) or to any run.
+
+  `opts` forwards `:store_opts` so a test points the read at an isolated
+  store dir.
+  """
+  @spec seen_trigger?(({RunGraph.status(), map() | nil} -> boolean()), keyword()) :: boolean()
+  def seen_trigger?(match_fun, opts \\ []) when is_function(match_fun, 1) do
+    # Every persisted run is offered to `match_fun`; narrowing (for example
+    # to active statuses) is the predicate's job.
+    persisted_runs = Store.load_all(Keyword.get(opts, :store_opts, []))
+
+    Enum.any?(persisted_runs, &match_fun.({&1.status, &1.trigger}))
+  end
+
+  # A readable, collision-resistant run id of the form
+  # "<slug>-<wall clock ms>-<counter>". The slug is the workflow name
+  # lowercased, with every run of characters outside [a-z0-9] collapsed to
+  # "-" and the edge dashes trimmed; a name that slugs to nothing becomes
+  # "workflow". Ids are opaque to the store; the slug is only there to make
+  # a runs listing scannable.
+  defp generate_run_id(%{name: name}) do
+    slug = name |> to_string() |> String.downcase() |> String.replace(~r/[^a-z0-9]+/, "-") |> String.trim("-")
+    prefix = if slug == "", do: "workflow", else: slug
+    wall_clock_ms = System.system_time(:millisecond)
+    counter = System.unique_integer([:positive, :monotonic])
+
+    "#{prefix}-#{wall_clock_ms}-#{counter}"
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/placement.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/placement.ex
new file mode 100644
index 000000000..7e96e1aaa
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/placement.ex
@@ -0,0 +1,788 @@
+defmodule SymphonyElixir.Runtime.Placement do
+  @moduledoc """
+  Owns the per-run room-server lifecycle for the IR engine path.
+
+  A run whose agent nodes declare `location: :ixvm` gets its own
+  room-server process living in a short-lived iXVM (its own cgroup/PID per
+  the PRD), provisioned once before the run's first agent turn and torn
+  down when the run ends. `Engine.Client.resolve_base_url/2` reads the
+  resolved per-run URL back from here, so a turn routes to the run's own
+  server rather than the shared `SYMPHONY_ROOM_SERVER_URL`.
+
+  This is the IR successor to the lifecycle the legacy `Codex.IxVm` ran
+  per node turn. The load-bearing shell construction (the `ix new`/`shell`
+  argv, the clone and room-start scripts, the port-forward mapping, the
+  secret redaction) is reused from `Codex.Provision` so this path and the
+  legacy path build the same commands and redact the same way. The
+  difference is the unit of work: one room-server serves the whole run and
+  speaks the engine wire (`/api/agent/turns`), rather than one VM per node
+  driving the old `/api/workflow/turns` poll loop.
+
+  ## Registry
+
+  Resolved placements live in a public named ETS table keyed by `run_id`,
+  so the `Engine.Client` (which runs inside a monitored attempt task, off
+  the runtime process) can read the URL without a GenServer round-trip.
+  The table is owned by this process so it is reclaimed if the supervisor
+  restarts the placement registry.
+
+  ## Driver seam (no real VMs in tests)
+
+  Every `ix` invocation, the room-health poll, and the port-forward tunnel
+  go through an injectable driver (`opts[:driver]`), defaulting to the
+  real implementation. Tests pass a stub driver so the lifecycle logic is
+  exercised without spawning a microVM or shelling out to `ix`.
+
+  ## `host` placement and the `ixvm -> host` fallback
+
+  A run whose agent nodes declare `location: {:host, _}` gets its per-run
+  room-server as a privilege-dropped `systemd-run` unit on this host (its
+  own cgroup/PID, no VM), the IR successor to the per-node lifecycle in
+  `Codex.Host`. The unit names share the `symphony-host-` prefix the polkit
+  grant in `modules/services/symphony` scopes to, so the non-root Symphony
+  service is authorized to manage them.
+
+  When `:ixvm` provisioning fails before the first turn, `acquire/3` retries
+  on the fallback placement read from `Config.placement_fallback` (default
+  `:host`). The fallback URL is registered under the same `run_id`, so a
+  turn carrying an `:ixvm` envelope resolves to the host room-server without
+  the node knowing it fell back. `:local` stays the dev convenience (drop to
+  the in-process server); `:none` disables the fallback and the run fails
+  against the missing placement.
+
+  ## Known limitations
+
+  Setup is synchronous and can take minutes (`ix new` plus a clone, or the
+  host clone unit). It runs on the runtime's behalf before the first turn,
+  so a run blocks on provisioning. A setup failure with no usable fallback
+  surfaces as `{:error, {:ixvm_setup_failed, reason}}` /
+  `{:error, {:host_setup_failed, reason}}`.
+  """
+
+  use GenServer
+
+  alias SymphonyElixir.{Command, Config, RepositoryCatalog}
+  alias SymphonyElixir.Codex.{Provision, RoomRegistry}
+  alias SymphonyElixir.Runtime.{HostRuntime, RuntimeRegistry, WorkerDispatch}
+
+  require Logger
+
+  @table :symphony_placement
+  @default_setup_timeout_ms 10 * 60 * 1000
+  @default_health_timeout_ms 60 * 1000
+  # A remote provision covers a worker-side clone + room-server start, so it
+  # shares the generous setup budget rather than a short RPC default.
+  @default_remote_timeout_ms 10 * 60 * 1000
+
+  @typedoc """
+  A resolved per-run placement: the base URL the engine wire targets, the
+  location tag the room-server actually runs on (the effective placement
+  after any `ixvm -> host`/`ixvm -> remote` fallback, not the node's declared
+  location), and the teardown handles for that placement.
+
+  iXVM placements carry `vm_name` and the port-forward `Port`; host placements
+  carry the `systemd-run` `unit`, the `user`/`home` the unit runs as, and the
+  `run_root` to remove on teardown; remote placements carry the `worker_id` to
+  dispatch teardown to and the worker-side `remote_cwd` the engine turn runs in.
+  Each path leaves the other paths' handles `nil`.
+  """
+  @type placement :: %{
+          base_url: String.t(),
+          location: :ixvm | :host | :remote,
+          vm_name: String.t() | nil,
+          port_forward: port() | nil,
+          backend_id: String.t() | nil,
+          host_unit: String.t() | nil,
+          host_user: String.t() | nil,
+          host_home: String.t() | nil,
+          host_run_root: String.t() | nil,
+          worker_id: String.t() | nil,
+          remote_cwd: String.t() | nil
+        }
+
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []) do
+    GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+  end
+
+  @impl true
+  def init(_opts) do
+    :ets.new(@table, [:named_table, :public, :set, read_concurrency: true])
+    {:ok, %{}}
+  end
+
+  @doc """
+  Resolve a per-run base URL for `location`, provisioning the run's
+  room-server if `location` needs one. Idempotent per run: a second call
+  for an already-resolved `run_id` returns the same URL without
+  re-provisioning, so the runtime can acquire lazily before any agent
+  turn without tracking whether it already did.
+
+  Returns `{:ok, base_url}` or `{:error, reason}`. `opts` carries
+  `:config` (defaults to the boot snapshot) and an injectable `:driver`
+  for tests.
+  """
+  @spec acquire(String.t(), SymphonyElixir.Engine.Envelope.location(), keyword()) ::
+          {:ok, String.t()} | {:error, term()}
+  def acquire(run_id, location, opts \\ []) when is_binary(run_id) and is_list(opts) do
+    case lookup(run_id) do
+      :error -> provision(run_id, location, opts)
+      {:ok, %{base_url: already_resolved}} -> {:ok, already_resolved}
+    end
+  end
+
+  @doc """
+  The per-run base URL the engine wire should target, or `:error` if no
+  placement was acquired for this run. Read by `Engine.Client` when an
+  envelope's location is `:ixvm`.
+  """
+  @spec base_url(String.t()) :: {:ok, String.t()} | :error
+  def base_url(run_id) when is_binary(run_id) do
+    case lookup(run_id) do
+      :error -> :error
+      {:ok, %{base_url: url}} -> {:ok, url}
+    end
+  end
+
+  @doc "The resolved placement for a run (effective location after fallback), or :error."
+  @spec resolved(String.t()) :: {:ok, %{location: :ixvm | :host | :remote, base_url: String.t()}} | :error
+  def resolved(run_id) when is_binary(run_id) do
+    case lookup(run_id) do
+      :error -> :error
+      {:ok, %{location: _, base_url: _} = placement} -> {:ok, Map.take(placement, [:location, :base_url])}
+    end
+  end
+
+  @doc """
+  The working directory an agent turn runs in: the run's primary-repo
+  checkout for the resolved placement. The clone landed there during
+  acquire, so the engine turn must run from the same path the room-server
+  can see. `:host` checks out under the target user's home and `:ixvm` at
+  the VM-internal workspace root, which differ by placement; reading the
+  path back from the stored record keeps the cwd consistent with where the
+  clone actually went after any `ixvm -> host` fallback.
+
+  Returns `:error` when no placement was acquired (a `:local`/`:room` run),
+  so the caller can decide what an agent turn with no resolved checkout
+  means rather than this module inventing a path.
+  """
+  @spec workspace_cwd(String.t(), keyword()) :: {:ok, String.t()} | :error
+  def workspace_cwd(run_id, opts \\ []) when is_binary(run_id) do
+    case lookup(run_id) do
+      {:ok, %{location: :remote, remote_cwd: worker_cwd}} when is_binary(worker_cwd) ->
+        {:ok, worker_cwd}
+
+      {:ok, %{location: :ixvm}} ->
+        {:ok, Provision.ix_primary_workspace(config(opts), run_id)}
+
+      {:ok, %{location: :host, host_run_root: root}} when is_binary(root) ->
+        {:ok, Provision.host_primary_workspace(config(opts), root, run_id)}
+
+      _no_checkout ->
+        :error
+    end
+  end
+
+  @doc """
+  Tear down a run's placement: stop the port-forward, unregister the room
+  backend, remove the VM, and drop the registry entry. Idempotent and a
+  no-op for a run that never acquired one (a `:local`/`:room` run), so the
+  runtime can call it unconditionally at run end.
+  """
+  @spec release(String.t(), keyword()) :: :ok
+  def release(run_id, opts \\ []) when is_binary(run_id) and is_list(opts) do
+    case lookup(run_id) do
+      :error ->
+        :ok
+
+      {:ok, acquired} ->
+        teardown(run_id, acquired, config(opts), driver(opts))
+        :ets.delete(table(), run_id)
+        :ok
+    end
+  end
+
+  @doc """
+  Reap host room-server units left orphaned by a BEAM restart, and
+  re-attach the ones whose run is still live.
+
+  The placement registry is in-memory ETS, so a restart loses every
+  resolved placement: units started before the restart can no longer be
+  found by `release/2`, and a resumed run that re-`acquire`s would collide
+  on the deterministic `symphony-host-<hash>` unit name. `reconcile/2`
+  rebuilds that state from the host. For each live `symphony-host-*.service`
+  room unit it recovers the `run_id` from the `--state-dir` in the unit's
+  `ExecStart`, then:
+
+    * if the run is non-terminal (`:pending`/`:running` - the same set
+      `Supervisor.resume_pending/1` resumes), re-inserts the placement into
+      the registry so the resumed run re-attaches to the existing server
+      instead of provisioning a duplicate;
+    * otherwise stops the unit, removes its checkout, and unregisters its
+      room backend so a terminal run's server and its room.ix.dev entry do
+      not linger.
+
+  `graphs` is the full run set from `IR.Store.load_all/0`; the caller loads
+  it once and shares it with `resume_pending/1`. Host placements only -
+  iXVM reaping is not handled here. Idempotent and a no-op when no host
+  units exist or the host user is unconfigured.
+  """
+  @spec reconcile([SymphonyElixir.IR.RunGraph.t()], keyword()) :: :ok
+  def reconcile(graphs, opts \\ []) when is_list(graphs) and is_list(opts) do
+    config = config(opts)
+    driver = driver(opts)
+
+    # Ids of the non-terminal runs; a unit is re-attached only when its run
+    # id is in this set. Entries without `run_id`/`status` are ignored.
+    live =
+      graphs
+      |> Enum.filter(&match?(%{run_id: _, status: status} when status in [:pending, :running], &1))
+      |> MapSet.new(& &1.run_id)
+
+    # Without a resolvable host user/home nothing is listed or touched.
+    with {:ok, user} <- HostRuntime.host_user(config),
+         {:ok, home} <- HostRuntime.host_home(config, driver, user) do
+      host = %{config: config, driver: driver, user: user, home: home}
+      Enum.each(driver.systemctl_list_host_units.(), &reconcile_unit(&1, host, live))
+    else
+      {:error, reason} ->
+        Logger.warning("Placement: reconcile skipped, host identity unresolved: #{inspect(reason)}")
+    end
+
+    :ok
+  end
+
+  defp reconcile_unit(unit, %{driver: driver} = host, live) when is_binary(unit) do
+    case unit_run(driver, unit) do
+      :error ->
+        Logger.warning("Placement: reconcile leaving #{unit}; could not recover its run from ExecStart")
+
+      {:ok, run_id, port, state_dir} ->
+        if run_id in live do
+          reattach_unit(host, unit, run_id, port)
+        else
+          reap_unit(host, unit, run_id, state_dir)
+        end
+    end
+  end
+
+  # A live non-terminal run owns this unit: register the existing server so
+  # the resumed run's `acquire` short-circuits to it rather than colliding
+  # on the deterministic unit name.
+  defp reattach_unit(%{config: config, user: user, home: home}, unit, run_id, port) do
+    # Handles that belong to the iXVM and remote paths stay `nil` on a host placement.
+    other_paths = %{vm_name: nil, port_forward: nil, worker_id: nil, remote_cwd: nil}
+
+    placement =
+      Map.merge(other_paths, %{
+        base_url: "http://127.0.0.1:#{port}",
+        location: :host,
+        backend_id: Provision.backend_id(run_id, "room"),
+        host_unit: unit,
+        host_user: user,
+        host_home: home,
+        host_run_root: Provision.host_run_root(config, home, run_id)
+      })
+
+    :ets.insert(table(), {run_id, placement})
+    Logger.info("Placement: reconcile re-attached host unit=#{unit} run=#{run_id}")
+  end
+
+  # No live run owns this unit, so it is an orphan: stop the server,
+  # unregister its room.ix.dev backend, and hand the checkout to
+  # `HostRuntime.cleanup_workspace/3`. The recovered state dir is accepted for
+  # call-site symmetry but not used; the run root is derived from the run id.
+  defp reap_unit(%{config: config, driver: driver, user: user, home: home}, unit, run_id, _state_dir) do
+    Logger.info("Placement: reconcile reaping orphaned host unit=#{unit} run=#{run_id}")
+    driver.systemctl_stop.(unit)
+
+    backend_id = Provision.backend_id(run_id, "room")
+    RoomRegistry.unregister(config, backend_id)
+
+    orphan = %{
+      host_unit: unit,
+      host_user: user,
+      host_home: home,
+      host_run_root: Provision.host_run_root(config, home, run_id)
+    }
+
+    HostRuntime.cleanup_workspace(config, driver, orphan)
+  end
+
+  # Recover `{:ok, run_id, port, state_dir}` for a unit from its `ExecStart`,
+  # which carries the bind port and the per-run state dir whose basename is
+  # the run id. The unit name is a non-reversible hash, so the run has to come
+  # from the state dir rather than the name. Any driver error collapses to
+  # `:error`.
+  defp unit_run(driver, unit) do
+    unit
+    |> driver.systemctl_show_exec_start.()
+    |> case do
+      {:error, _reason} -> :error
+      {:ok, exec_start} -> parse_room_exec_start(exec_start)
+    end
+  end
+
+  # Pull the run id, port, and state dir out of an `ExecStart` string. The
+  # string is split on whitespace and both `--state-dir <dir>` and
+  # `--port <int>` must be present; the port must parse as a whole integer and
+  # the state dir must have a non-empty basename (the run id). Anything else
+  # yields `:error`.
+  defp parse_room_exec_start(exec_start) when is_binary(exec_start) do
+    tokens = String.split(exec_start, ~r/\s+/, trim: true)
+
+    case {exec_flag(tokens, "--state-dir"), exec_flag(tokens, "--port")} do
+      {{:ok, state_dir}, {:ok, raw_port}} ->
+        case {Integer.parse(raw_port), Path.basename(state_dir)} do
+          {{port, ""}, run_id} when run_id != "" -> {:ok, run_id, port, state_dir}
+          _ -> :error
+        end
+
+      _ ->
+        :error
+    end
+  end
+
+  # Return `{:ok, value}` for the token that directly follows the first
+  # occurrence of `flag` in `args`, or `:error` when the flag is absent or is
+  # the last token.
+  defp exec_flag(args, flag) do
+    args
+    |> Enum.drop_while(fn arg -> arg != flag end)
+    |> case do
+      [^flag, value | _rest] -> {:ok, value}
+      _ -> :error
+    end
+  end
+
+  # --- provisioning ---------------------------------------------------
+
+  # Only :ixvm and host placements run a provisioned per-run server today.
+  # :local and {:room, _} resolve to a fixed URL in the client and never
+  # acquire a placement, so there is nothing to provision and nothing to
+  # release: a call here for one of them returns the tagged tuple
+  # `{:error, {:no_placement_needed, kind}}`.
+  # NOTE(review): the caller presumably treats that tuple as a benign no-op
+  # rather than a failure; confirm at the call site.
+  defp provision(_run_id, :local, _opts), do: {:error, {:no_placement_needed, :local}}
+  defp provision(_run_id, {:room, _}, _opts), do: {:error, {:no_placement_needed, :room}}
+
+  # An :ixvm placement tries the microVM first. Only an
+  # `{:ixvm_setup_failed, _}` error is handed to `fallback/4`, with the target
+  # read from `config.placement_fallback`.
+  defp provision(run_id, :ixvm, opts) do
+    case provision_ixvm(run_id, opts) do
+      {:error, {:ixvm_setup_failed, _reason}} = failure ->
+        target = config(opts).placement_fallback
+        fallback(run_id, target, failure, opts)
+
+      {:ok, url} ->
+        {:ok, url}
+    end
+  end
+
+  # An explicit {:host, _} node placement provisions a host room-server
+  # directly. The host string carries no payload here: the per-run room-server
+  # is named by `run_id`, not by the location's host string (which named a
+  # box in the legacy topology, not a per-run server).
+  defp provision(run_id, {:host, _}, opts), do: provision_host(run_id, opts)
+  defp provision(run_id, :host, opts), do: provision_host(run_id, opts)
+
+  # Any other location cannot be resolved to a placement.
+  defp provision(_run_id, location, _opts), do: {:error, {:unresolvable_location, location}}
+
+  # Provision the run's room-server inside a fresh iXVM microVM: create the
+  # VM, set up the workspace, start the room-server, and resolve a URL for it.
+  # On success the backend is registered and the placement is written to the
+  # registry table. Any `{:error, reason}` from those steps triggers a
+  # best-effort VM removal and comes back as
+  # `{:error, {:ixvm_setup_failed, reason}}`.
+  defp provision_ixvm(run_id, opts) do
+    config = config(opts)
+    driver = driver(opts)
+    vm_name = Provision.vm_name(run_id, "room")
+
+    Logger.info("Placement: creating ixvm vm=#{vm_name} image=#{config.ix_image} run=#{run_id}")
+    env = Provision.runtime_env(config, opts)
+
+    with {:ok, created_vm} <- create_vm(config, driver, vm_name, env),
+         :ok <- setup_workspace(config, driver, vm_name, run_id, opts),
+         :ok <- start_room_server(config, driver, vm_name, run_id, opts),
+         {:ok, url, tunnel} <- room_url(config, driver, created_vm) do
+      registered_id = register_backend(config, run_id, url, vm_name, "ixvm")
+
+      ixvm_placement = %{
+        location: :ixvm,
+        base_url: url,
+        vm_name: vm_name,
+        port_forward: tunnel,
+        backend_id: registered_id,
+        host_unit: nil,
+        host_user: nil,
+        host_home: nil,
+        host_run_root: nil,
+        worker_id: nil,
+        remote_cwd: nil
+      }
+
+      :ets.insert(table(), {run_id, ixvm_placement})
+      Logger.info("Placement: ixvm ready vm=#{vm_name} url=#{url} run=#{run_id}")
+      {:ok, url}
+    else
+      {:error, reason} ->
+        # Best-effort removal of a half-created VM, result ignored, so a
+        # failed acquire does not leak a microVM before the fallback runs.
+        rm_args = Provision.rm_vm_args(vm_name)
+        driver.ix_cmd.(config, rm_args, @default_setup_timeout_ms)
+        {:error, {:ixvm_setup_failed, reason}}
+    end
+  end
+
+  # The `ixvm -> fallback` retry, target read from Config (never a .sym
+  # literal):
+  #
+  #   * :none leaves the original ixvm failure standing;
+  #   * :local has no placement to acquire (the client resolves the in-process
+  #     default URL), so it returns `{:error, {:no_placement_needed, :local}}`;
+  #   * :host reprovisions the per-run room-server on this host;
+  #   * :remote reprovisions on a registered remote worker.
+  defp fallback(_run_id, :none, ixvm_error, _opts), do: ixvm_error
+  defp fallback(_run_id, :local, _ixvm_error, _opts), do: {:error, {:no_placement_needed, :local}}
+
+  defp fallback(run_id, :host, _ixvm_error, opts) do
+    Logger.warning("Placement: ixvm setup failed for run=#{run_id}; falling back to host")
+    provision_host(run_id, opts)
+  end
+
+  defp fallback(run_id, :remote, ixvm_error, opts) do
+    Logger.warning("Placement: ixvm setup failed for run=#{run_id}; falling back to remote worker")
+
+    case provision_remote(run_id, opts) do
+      # No worker is connected: surface the original ixvm failure rather than
+      # a confusing "no worker" so the operator sees the real cause.
+      {:error, {:remote_setup_failed, :no_worker}} -> ixvm_error
+      {:error, _reason} = remote_error -> remote_error
+      {:ok, url} -> {:ok, url}
+    end
+  end
+
+  # Provision the run's room-server on a registered remote worker: pick a
+  # worker, dispatch the per-run env + clone token to it, and record the
+  # worker-bound base_url + worker-side cwd in the registry. HostRuntime runs
+  # inside the worker; here we only select, dispatch, and bookkeep. Every
+  # `{:error, reason}` from selection or dispatch is returned as
+  # `{:error, {:remote_setup_failed, reason}}`.
+  defp provision_remote(run_id, opts) do
+    config = config(opts)
+    driver = driver(opts)
+
+    with {:ok, worker} <- driver.worker_select.(config.worker_select_label),
+         spec = %{
+           env: Provision.runtime_env(config, opts),
+           bot_token: Keyword.get(opts, :bot_token) || config.github_token,
+           # The control plane owns the bot identity: it mints the App token
+           # above, so it must also ship the matching commit user.name/
+           # user.email. A worker holds no bot config of its own, so without
+           # these the worker clone keeps its host's personal git identity and
+           # the babysit skill's identity guard refuses to push.
+           bot_username: config.github_app_bot_username,
+           bot_email: config.github_app_bot_email,
+           repositories: RepositoryCatalog.all(config)
+         },
+         {:ok, remote} <- driver.worker_provision.(worker, run_id, spec, @default_remote_timeout_ms) do
+      url = remote.base_url
+      registered_id = register_backend(config, run_id, url, nil, "remote")
+
+      remote_placement = %{
+        location: :remote,
+        base_url: url,
+        backend_id: registered_id,
+        worker_id: worker.worker_id,
+        remote_cwd: Map.get(remote, :primary_workspace),
+        vm_name: nil,
+        port_forward: nil,
+        host_unit: nil,
+        host_user: nil,
+        host_home: nil,
+        host_run_root: nil
+      }
+
+      :ets.insert(table(), {run_id, remote_placement})
+      Logger.info("Placement: remote ready worker=#{worker.worker_id} url=#{remote.base_url} run=#{run_id}")
+      {:ok, url}
+    else
+      # Covers :no_worker as well; the caller matches on that wrapped reason.
+      {:error, reason} -> {:error, {:remote_setup_failed, reason}}
+    end
+  end
+
+  # Create the VM through the `ix` CLI, then read it back by name. The
+  # returned VM map has its "id" key set to `vm_name`. An error from either
+  # step is returned unchanged.
+  defp create_vm(%Config{} = config, driver, vm_name, env) do
+    create_args = Provision.create_vm_args(config, vm_name, env)
+
+    with :ok <- driver.ix_cmd.(config, create_args, config.ix_create_timeout_ms),
+         {:ok, vm} <- driver.ix_vm_by_name.(config, vm_name) do
+      {:ok, Map.put(vm, "id", vm_name)}
+    else
+      {:error, reason} -> {:error, reason}
+    end
+  end
+
+  # Run the workspace setup script inside the VM through the `ix` CLI and
+  # return the driver's result as-is.
+  defp setup_workspace(%Config{} = config, driver, vm_name, run_id, opts) do
+    script = Provision.ix_workspace_script(config, run_id, opts)
+    shell_args = Provision.shell_args(vm_name, script)
+
+    driver.ix_cmd.(config, shell_args, @default_setup_timeout_ms)
+  end
+
+  # Run the room-server start script inside the VM through the `ix` CLI and
+  # return the driver's result as-is.
+  defp start_room_server(%Config{} = config, driver, vm_name, run_id, opts) do
+    script = Provision.ix_room_start_script(config, run_id, opts)
+    shell_args = Provision.shell_args(vm_name, script)
+
+    driver.ix_cmd.(config, shell_args, @default_setup_timeout_ms)
+  end
+
+  # Resolve a URL for the VM's room-server and wait until it is healthy.
+  # Returns `{:ok, url, port_forward}`, where `port_forward` is the tunnel
+  # handle in "port_forward" mode and nil for a direct connection.
+  #
+  # "port_forward" mode: open the tunnel, then health-poll through it. A
+  # tunnel that opened but never became healthy is stopped before the error
+  # is returned.
+  defp room_url(%Config{ix_room_connect: "port_forward"} = config, driver, %{"name" => vm_name}) do
+    {mapping, url} = Provision.port_forward_mapping(config, vm_name)
+
+    case driver.port_forward.(config, vm_name, mapping) do
+      {:error, reason} ->
+        {:error, {:room_port_forward_failed, reason}}
+
+      {:ok, tunnel} ->
+        case driver.wait_for_room.(url, @default_health_timeout_ms) do
+          {:error, reason} ->
+            driver.stop_port_forward.(tunnel)
+            {:error, {:room_port_forward_failed, reason}}
+
+          :ok ->
+            {:ok, url, tunnel}
+        end
+    end
+  end
+
+  # Every other mode connects straight to the VM's address.
+  defp room_url(%Config{} = config, driver, %{"name" => vm_name} = vm) do
+    case vm_address(config, vm) do
+      {:error, reason} ->
+        {:error, {:room_direct_connect_failed, vm_name, reason}}
+
+      {:ok, address} ->
+        url = direct_room_url(address, config.ix_room_port)
+
+        case driver.wait_for_room.(url, @default_health_timeout_ms) do
+          :ok -> {:ok, url, nil}
+          {:error, reason} -> {:error, {:room_direct_connect_failed, vm_name, reason}}
+        end
+    end
+  end
+
+  # Choose the address used to reach the VM directly. In "direct_ipv4" mode a
+  # non-empty IPv4 address wins; otherwise IPv6 is preferred and IPv4 is the
+  # last resort. A VM with neither yields `{:error, {:vm_has_no_address, name}}`.
+  defp vm_address(%Config{} = config, vm) do
+    ipv4 = Map.get(vm, "ipv4")
+    ipv6 = Map.get(vm, "ipv6")
+    has_ipv4? = is_binary(ipv4) and ipv4 != ""
+    has_ipv6? = is_binary(ipv6) and ipv6 != ""
+
+    cond do
+      config.ix_room_connect == "direct_ipv4" and has_ipv4? -> {:ok, {:ipv4, ipv4}}
+      has_ipv6? -> {:ok, {:ipv6, ipv6}}
+      has_ipv4? -> {:ok, {:ipv4, ipv4}}
+      true -> {:error, {:vm_has_no_address, Map.get(vm, "name")}}
+    end
+  end
+
+  # Build the room-server URL for a tagged address; an IPv6 literal is
+  # wrapped in square brackets.
+  defp direct_room_url({family, address}, port) do
+    case family do
+      :ipv4 -> "http://#{address}:#{port}"
+      :ipv6 -> "http://[#{address}]:#{port}"
+    end
+  end
+
+  # --- host provisioning ----------------------------------------------
+
+  # Provision the run's room-server on this host via HostRuntime (clone,
+  # privilege-dropped systemd-run, health-poll), then record the placement in
+  # the registry and on room.ix.dev. HostRuntime owns the host mechanics;
+  # Placement owns the registry. room_host stays loopback for a local host
+  # placement unless an advertised host is configured. A HostRuntime failure
+  # is returned as `{:error, {:host_setup_failed, reason}}`.
+  defp provision_host(run_id, opts) do
+    config = config(opts)
+    resolved_driver = driver(opts)
+    host_opts = maybe_put_room_host(Keyword.put(opts, :driver, resolved_driver), config)
+
+    case HostRuntime.provision(run_id, host_opts) do
+      {:error, reason} ->
+        {:error, {:host_setup_failed, reason}}
+
+      {:ok, host} ->
+        registered_id = register_backend(config, run_id, host.base_url, nil, "host")
+
+        host_placement = %{
+          location: :host,
+          base_url: host.base_url,
+          backend_id: registered_id,
+          host_unit: host.unit,
+          host_user: host.user,
+          host_home: host.home,
+          host_run_root: host.run_root,
+          vm_name: nil,
+          port_forward: nil,
+          worker_id: nil,
+          remote_cwd: nil
+        }
+
+        :ets.insert(table(), {run_id, host_placement})
+        Logger.info("Placement: host ready unit=#{host.unit} url=#{host.base_url} run=#{run_id}")
+        {:ok, host.base_url}
+    end
+  end
+
+  # Bind the per-run room-server to the configured advertised host instead of
+  # loopback so the central room.ix.dev can reach it to proxy the run's
+  # transcript. HostRuntime uses room_host for both the bind and the registered
+  # base_url, so a reachable host here is what gets registered. An explicit
+  # room_host already in opts (tests, or a worker's own address) wins, and
+  # opts pass through untouched when no non-empty advertised host is set.
+  defp maybe_put_room_host(opts, config) do
+    case config do
+      %Config{room: %{advertise_host: host}} when is_binary(host) and host != "" ->
+        Keyword.put_new(opts, :room_host, host)
+
+      _ ->
+        opts
+    end
+  end
+
+  # Register the run's room-server as an "active" backend with RoomRegistry
+  # and return its backend id. The registry's own return value is not
+  # inspected here.
+  defp register_backend(%Config{} = config, run_id, base_url, vm_name, runtime) do
+    backend_id = Provision.backend_id(run_id, "room")
+
+    backend = %{
+      id: backend_id,
+      name: Provision.backend_name(%{}, run_id, "room"),
+      url: base_url,
+      source: "symphony",
+      runtime: runtime,
+      run_id: run_id,
+      node_id: "room",
+      vm_name: vm_name,
+      status: "active"
+    }
+
+    RoomRegistry.register(config, backend)
+    backend_id
+  end
+
+  # --- teardown -------------------------------------------------------
+
+  # Release an :ixvm placement: stop its port-forward, unregister the backend
+  # when one was recorded, then remove the VM unless `ix_keep_vm?` asks to
+  # keep it for inspection. A failed removal is logged, never raised.
+  defp teardown(_run_id, %{location: :ixvm} = placement, %Config{} = config, driver) do
+    driver.stop_port_forward.(placement.port_forward)
+
+    if placement.backend_id do
+      RoomRegistry.unregister(config, placement.backend_id)
+    end
+
+    if config.ix_keep_vm? do
+      Logger.info("Placement: keeping ixvm vm=#{placement.vm_name} for inspection")
+    else
+      rm_result = driver.ix_cmd.(config, Provision.rm_vm_args(placement.vm_name), @default_setup_timeout_ms)
+
+      case rm_result do
+        {:error, reason} -> Logger.warning("Placement: failed to remove vm=#{placement.vm_name}: #{inspect(reason)}")
+        :ok -> Logger.info("Placement: removed ixvm vm=#{placement.vm_name}")
+      end
+    end
+
+    :ok
+  end
+
+  # Release a :host placement: unregister the backend when one was recorded,
+  # then hand the unit, user, home, and run root to HostRuntime to tear down.
+  defp teardown(_run_id, %{location: :host} = placement, %Config{} = config, driver) do
+    if placement.backend_id do
+      RoomRegistry.unregister(config, placement.backend_id)
+    end
+
+    host = %{
+      base_url: placement.base_url,
+      unit: placement.host_unit,
+      user: placement.host_user,
+      home: placement.host_home,
+      run_root: placement.host_run_root
+    }
+
+    HostRuntime.teardown(host, config: config, driver: driver)
+
+    :ok
+  end
+
+  # Remote teardown is best-effort: unregister the room backend, then ask the
+  # worker (if still connected) to stop the run's room-server. A disconnected
+  # worker reaps its own orphaned units, so a missing worker is not an error.
+  defp teardown(run_id, %{location: :remote} = placement, %Config{} = config, driver) do
+    if placement.backend_id do
+      RoomRegistry.unregister(config, placement.backend_id)
+    end
+
+    worker_lookup = if placement.worker_id, do: driver.worker_get.(placement.worker_id)
+
+    case worker_lookup do
+      {:ok, worker} ->
+        driver.worker_teardown.(worker, run_id, @default_remote_timeout_ms)
+
+      _ ->
+        Logger.info("Placement: remote teardown skipped, worker=#{inspect(placement.worker_id)} not connected run=#{run_id}")
+    end
+
+    :ok
+  end
+
+  # Any other placement shape has nothing to release.
+  defp teardown(_run_id, _placement, _config, _driver), do: :ok
+
+  # --- registry -------------------------------------------------------
+
+  # Fetch the placement recorded for `run_id`. Returns `:error` when the
+  # registry table does not exist yet or holds no entry for the run.
+  defp lookup(run_id) do
+    with tid when tid != :undefined <- :ets.whereis(@table),
+         [{^run_id, placement}] <- :ets.lookup(@table, run_id) do
+      {:ok, placement}
+    else
+      :undefined -> :error
+      [] -> :error
+    end
+  end
+
+  # The registry table is created in `init/1`. Tests that exercise the
+  # lifecycle without the supervised process create it on first write, so
+  # this returns the existing table or creates it as a public named set.
+  defp table do
+    if :ets.whereis(@table) == :undefined do
+      :ets.new(@table, [:named_table, :public, :set, read_concurrency: true])
+    else
+      @table
+    end
+  end
+
+  # --- driver ---------------------------------------------------------
+
+  # The config for this call: `opts[:config]` when the key is present,
+  # otherwise the result of `Config.get/0`.
+  defp config(opts) do
+    case Keyword.fetch(opts, :config) do
+      {:ok, config} -> config
+      :error -> Config.get()
+    end
+  end
+
+  # The real driver: every `ix` call, the health poll, and the
+  # port-forward tunnel. Tests override `opts[:driver]` with stubs so no
+  # real VM is created. The driver is a plain map of named functions so a
+  # test can replace exactly the calls it cares about; overrides are merged
+  # over the defaults.
+  defp driver(opts) do
+    overrides = Keyword.get(opts, :driver, %{})
+    Map.merge(default_driver(), overrides)
+  end
+
+  # The iXVM half of the driver lives here; the host half (systemd-run,
+  # getent, systemctl, room-health, free-port) is owned by HostRuntime and
+  # merged in, so both the local :host path and a remote worker share one
+  # implementation. On a key clash the HostRuntime entry wins.
+  defp default_driver do
+    ixvm_and_remote = %{
+      ix_cmd: &real_ix_cmd/3,
+      ix_vm_by_name: &real_ix_vm_by_name/2,
+      port_forward: &real_port_forward/3,
+      stop_port_forward: &real_stop_port_forward/1,
+      # The remote half: pick a worker, look one up, and dispatch
+      # provision/teardown to it. Tests override these to avoid a real
+      # registry or channel.
+      worker_select: &RuntimeRegistry.select/1,
+      worker_get: &RuntimeRegistry.get/1,
+      worker_provision: &WorkerDispatch.provision/4,
+      worker_teardown: &WorkerDispatch.teardown/3
+    }
+
+    Map.merge(ixvm_and_remote, HostRuntime.default_driver())
+  end
+
+  # Run an `ix` CLI command for its effect only: success is a bare `:ok` and
+  # the captured output is discarded. The command execution and the mapping
+  # of exit/timeout/start failures to `{:error, _}` tuples are delegated to
+  # `real_ix_cmd_output/3`, so both entry points report failures identically
+  # and the mapping lives in one place.
+  defp real_ix_cmd(%Config{} = config, args, timeout_ms) do
+    case real_ix_cmd_output(config, args, timeout_ms) do
+      {:ok, _output} -> :ok
+      {:error, _reason} = error -> error
+    end
+  end
+
+  # List the VMs through the `ix` CLI and return the one whose "name" equals
+  # `vm_name`, or `{:error, {:ix_vm_not_found, vm_name}}`. CLI and decode
+  # errors are passed through unchanged.
+  defp real_ix_vm_by_name(%Config{} = config, vm_name) do
+    with {:ok, output} <- real_ix_cmd_output(config, Provision.list_vms_args(), 30_000),
+         {:ok, vms} <- decode_ix_json(output) do
+      vms
+      |> Enum.find(fn vm -> Map.get(vm, "name") == vm_name end)
+      |> case do
+        nil -> {:error, {:ix_vm_not_found, vm_name}}
+        %{} = found -> {:ok, found}
+      end
+    end
+  end
+
+  # Run an `ix` CLI command and return `{:ok, output}`. A non-zero exit, a
+  # timeout, and a failure to start each map to a distinct `{:error, _}`
+  # tuple; the args placed in the error go through
+  # `Provision.sanitize_ix_args/1` and captured output is trimmed.
+  defp real_ix_cmd_output(%Config{} = config, args, timeout_ms) do
+    config
+    |> ix_executable()
+    |> Command.run(args, timeout_ms)
+    |> case do
+      {:error, {:start_failed, reason}} -> {:error, {:ix_cli_error, Provision.sanitize_ix_args(args), reason}}
+      {:error, {:timeout, ms, output}} -> {:error, {:ix_cli_timeout, Provision.sanitize_ix_args(args), ms, String.trim(output)}}
+      {:error, {:exit, status, output}} -> {:error, {:ix_cli_failed, Provision.sanitize_ix_args(args), status, String.trim(output)}}
+      {:ok, output} -> {:ok, output}
+    end
+  end
+
+  # Decode `ix` CLI output that is expected to be a JSON list. Valid JSON of
+  # any other shape and undecodable output are reported as separate errors;
+  # the latter carries the trimmed output for diagnosis.
+  defp decode_ix_json(output) do
+    trimmed = String.trim(output)
+
+    case Jason.decode(trimmed) do
+      {:ok, vms} when is_list(vms) -> {:ok, vms}
+      {:ok, other} -> {:error, {:invalid_ix_cli_payload, other}}
+      {:error, reason} -> {:error, {:invalid_ix_cli_json, trimmed, reason}}
+    end
+  end
+
+  # Start the `ix` port-forward as an OS process attached to an Erlang port
+  # and return `{:ok, port}`. Any exception raised while resolving the
+  # executable, building the args, or opening the port is converted into
+  # `{:error, {:port_forward_start_failed, message}}`.
+  defp real_port_forward(%Config{} = config, vm_name, mapping) do
+    ix = ix_executable(config)
+    forward_args = Provision.port_forward_args(vm_name, mapping)
+    tunnel = Port.open({:spawn_executable, ix}, [:binary, :exit_status, {:args, forward_args}])
+
+    {:ok, tunnel}
+  rescue
+    failure -> {:error, {:port_forward_start_failed, Exception.message(failure)}}
+  end
+
+  # Stop a port-forward tunnel. Best-effort: always returns `:ok` and never
+  # raises. `nil` means no tunnel was opened (direct connection).
+  defp real_stop_port_forward(nil), do: :ok
+
+  defp real_stop_port_forward(port) when is_port(port) do
+    # Step 1: ask the OS process to terminate. This is guarded on its own so
+    # that a failure here (no `kill` executable, port already gone) cannot
+    # skip the close below and leak the port.
+    try do
+      case Port.info(port, :os_pid) do
+        {:os_pid, os_pid} when is_integer(os_pid) ->
+          System.cmd("kill", ["-TERM", Integer.to_string(os_pid)], stderr_to_stdout: true)
+
+        # nil (port already closed) or an os_pid that is not an integer.
+        _ ->
+          :ok
+      end
+    rescue
+      _ -> :ok
+    end
+
+    # Step 2: close the port if it is still open. It may close between the
+    # check and the call, which raises; that is treated as already stopped.
+    try do
+      if Port.info(port) != nil, do: Port.close(port)
+    rescue
+      _ -> :ok
+    end
+
+    :ok
+  end
+
+  # Resolve the configured `ix` command to an absolute path when it can be
+  # found on PATH; otherwise return the command unchanged.
+  defp ix_executable(%Config{ix_command: command}) do
+    case System.find_executable(command) do
+      nil -> command
+      resolved -> resolved
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/recovery.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/recovery.ex
new file mode 100644
index 000000000..1f2ebd27a
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/recovery.ex
@@ -0,0 +1,217 @@
+defmodule SymphonyElixir.Runtime.Recovery do
+  @moduledoc """
+  Restart reconciliation for the IR runtime, the correctness core of
+  issue #90.
+
+  When the BEAM restarts, the live runtime processes and their monitored
+  tasks are gone, but the `RunGraph` persisted by `IR.Store` survives. Two
+  facts must be rebuilt from that record:
+
+  1. The materialized graph. The graph is not a pure function of the
+     source: dynamic constructs (`when`, `everyNth`, fan-out) expanded it
+     based on data that arrived at runtime. Each expansion was recorded in
+     the append-only `expansion_log`. `replay/2` re-runs the interpreter's
+     expansion against the AST in log order, reproducing the identical
+     node set. The invariant the tests assert is
+     `replay(ast, log) == live graph`.
+
+  2. The orphaned `:running` nodes. A node persisted `:running` had a live
+     task that the restart killed. Its owning task is provably gone, so
+     the runtime cannot assume the attempt succeeded or even that it had
+     no side effects. `reconcile/2` resolves each such node by policy.
+
+  ## The non-idempotent retry safety rule
+
+  Agent turns are not idempotent: a turn may have pushed a commit before
+  the BEAM died. Blindly auto-retrying a stranded agent node could push a
+  second commit, double-open a PR, or repeat any other side effect. So the
+  default policy is conservative and matches the plan's locked decision:
+
+  - Retry is opt-in per node (`node.inputs["__retry__"]` carries
+    `{:literal, true}`). A node that did not opt in is never auto-retried.
+  - Even an opt-in node is only auto-retried when its attempt had no
+    observed side effect. An attempt that recorded a `thread_id` is
+    treated as having possibly acted, so it routes to a human-review
+    `:stranded` state instead of a blind retry.
+
+  Recovery first tries to reattach: if `EngineClient.status/1` reports the
+  thread `:running` it is left `:running` for the live runtime to keep
+  monitoring (a future workstream re-subscribes); if it reports
+  `{:finished, result}` the result is harvested through `IR.Graph`. Only an
+  `:unknown` thread falls through to the strand/retry policy.
+  """
+
+  alias SymphonyElixir.IR.{Attempt, Graph, Node, RunGraph}
+
+  @doc """
+  Rebuild a materialized graph by replaying the graph's `expansion_log` in
+  order through `expand_fun`. For each logged event `expand_fun` receives
+  the event's recorded `origin`, its `observed` gating output, and the
+  node map accumulated so far, and returns the nodes that expansion emits;
+  those are merged in with `RunGraph.put_nodes/2`. Replaying the same log
+  with the same `expand_fun` is deterministic, so two replays produce the
+  same node set.
+
+  `expand_fun` defaults to a stub that emits nothing, which is correct for
+  a statically-materialized graph (no dynamic expansion). WS-5 wires the
+  real interpreter in.
+  """
+  @spec replay(RunGraph.t(), (term(), term(), %{String.t() => Node.t()} -> [Node.t()])) ::
+          RunGraph.t()
+  def replay(%RunGraph{} = graph, expand_fun \\ &default_expand/3) when is_function(expand_fun, 3) do
+    graph.expansion_log
+    |> Enum.reduce(graph, fn event, acc ->
+      emitted = expand_fun.(event.origin, event.observed, acc.nodes)
+      RunGraph.put_nodes(acc, emitted)
+    end)
+  end
+
+  defp default_expand(_origin, _observed, _nodes), do: []
+
+  @doc """
+  Reconcile a reloaded graph after a restart. For every node left
+  `:running`, probe the engine and apply policy, then recompute nothing
+  else: the ready set falls out of `IR.Graph.ready_nodes/1` on the
+  returned graph. Pure except for the `status_fun` probe, which a test
+  supplies as a fake.
+
+  `status_fun` is `EngineClient.status/1` (probe by `thread_id`, which is
+  `nil` for a node with no recorded attempt). In the returned graph a node
+  whose thread the engine still reports `:running` stays `:running`; a
+  `{:finished, result}` node has its result applied through
+  `IR.Graph.apply_output/3`; an `:unknown` node moves to `:retrying` or
+  `:stranded` by the rules in the moduledoc.
+  """
+  @spec reconcile(RunGraph.t(), (String.t() | nil -> term())) :: RunGraph.t()
+  def reconcile(%RunGraph{} = graph, status_fun) when is_function(status_fun, 1) do
+    graph
+    |> Graph.running_nodes()
+    |> Enum.reduce(graph, fn node, acc -> reconcile_node(acc, node, status_fun) end)
+  end
+
+  defp reconcile_node(%RunGraph{} = graph, %Node{} = node, status_fun) do
+    case status_fun.(current_thread_id(node)) do
+      :running ->
+        # The engine still owns the turn. Leave it :running; the live
+        # runtime keeps monitoring (re-subscription lands in a later
+        # workstream). Recovery does not strand a turn the engine can
+        # still account for.
+        graph
+
+      {:finished, result} ->
+        graph
+        |> mark_attempt(node.id, attempt_state_for(result), result)
+        |> Graph.apply_output(node.id, result)
+
+      :unknown ->
+        strand_or_retry(graph, node)
+    end
+  end
+
+  # The thread is gone. The owning task died without a result, so the
+  # attempt is stranded. Whether we auto-retry depends on the
+  # non-idempotent safety rule, which is evaluated on the node as it was
+  # before the attempt was marked.
+  defp strand_or_retry(%RunGraph{} = graph, %Node{} = node) do
+    graph = mark_attempt(graph, node.id, :stranded, :stranded)
+
+    if auto_retryable?(node) do
+      transition(graph, node.id, :retrying)
+    else
+      transition(graph, node.id, :stranded)
+    end
+  end
+
+  # A bounded retry budget so a node that crashes deterministically does
+  # not strand-retry forever. Conservative: a few attempts then human
+  # review. The interpreter can carry a per-node override later; this is
+  # the safe default.
+  @max_attempts 3
+
+  @doc """
+  Whether a stranded node may be auto-retried. Conservative by default:
+  the node must opt in (`inputs["__retry__"] == {:literal, true}`), its
+  current attempt must show no observed side effect (no `thread_id`
+  recorded), and it must be under the retry budget (`#{@max_attempts}`
+  attempts). An attempt that opened an engine thread is assumed to have
+  possibly acted and routes to human review instead.
+  """
+  @spec auto_retryable?(Node.t()) :: boolean()
+  def auto_retryable?(%Node{} = node) do
+    opted_in?(node) and not observed_side_effect?(node) and under_budget?(node)
+  end
+
+  defp under_budget?(%Node{attempts: attempts}), do: length(attempts) < @max_attempts
+
+  defp opted_in?(%Node{inputs: inputs}) when is_map(inputs) do
+    Map.get(inputs, "__retry__") == {:literal, true}
+  end
+
+  defp opted_in?(_), do: false
+
+  # A recorded thread_id means an engine turn started, which may have
+  # pushed a commit. That is the side effect the safety rule guards
+  # against, so its presence blocks auto-retry.
+  defp observed_side_effect?(%Node{} = node) do
+    case current_attempt(node) do
+      %Attempt{thread_id: thread_id} when is_binary(thread_id) and thread_id != "" -> true
+      _ -> false
+    end
+  end
+
+  # The current attempt is the one with the highest attempt number `n`.
+  defp current_attempt(%Node{attempts: []}), do: nil
+  defp current_attempt(%Node{attempts: attempts}), do: Enum.max_by(attempts, & &1.n)
+
+  defp current_thread_id(%Node{} = node) do
+    case current_attempt(node) do
+      %Attempt{thread_id: thread_id} -> thread_id
+      nil -> nil
+    end
+  end
+
+  # Move a node to `state`. The node and the graph are stamped with the same
+  # timestamp so their `updated_at` values agree. Unknown node ids are a no-op.
+  defp transition(%RunGraph{} = graph, node_id, state) do
+    case Map.fetch(graph.nodes, node_id) do
+      {:ok, node} ->
+        now = DateTime.utc_now()
+        updated = %{node | state: state, updated_at: now}
+        %{graph | nodes: Map.put(graph.nodes, node_id, updated), updated_at: now}
+
+      :error ->
+        graph
+    end
+  end
+
+  # Finish the node's current attempt with `attempt_state` and the outcome
+  # derived from `outcome`. Unknown node ids are a no-op.
+  defp mark_attempt(%RunGraph{} = graph, node_id, attempt_state, outcome) do
+    case Map.fetch(graph.nodes, node_id) do
+      {:ok, %Node{attempts: []} = node} ->
+        # No attempt was ever recorded (persisted :running before the
+        # attempt struct was appended). Synthesize one so the run record
+        # still explains what happened, finished with the state and outcome
+        # the caller passed: a harvested `{:finished, result}` must not be
+        # recorded as stranded.
+        attempt =
+          1
+          |> Attempt.start(attempt_engine(node))
+          |> Attempt.finish(attempt_state, finish_outcome(outcome))
+
+        put_attempts(graph, node, [attempt])
+
+      {:ok, node} ->
+        attempts = update_current_attempt(node.attempts, attempt_state, finish_outcome(outcome))
+        put_attempts(graph, node, attempts)
+
+      :error ->
+        graph
+    end
+  end
+
+  # Replace the node's attempts, stamping node and graph with one timestamp.
+  defp put_attempts(%RunGraph{} = graph, %Node{} = node, attempts) do
+    now = DateTime.utc_now()
+    updated = %{node | attempts: attempts, updated_at: now}
+    %{graph | nodes: Map.put(graph.nodes, node.id, updated), updated_at: now}
+  end
+
+  # Finish the attempt with the highest `n`; every other attempt is kept
+  # as-is. Callers only pass a non-empty list.
+  defp update_current_attempt(attempts, state, outcome) do
+    current = Enum.max_by(attempts, & &1.n)
+    finished = Attempt.finish(current, state, outcome)
+    Enum.map(attempts, fn a -> if a.n == current.n, do: finished, else: a end)
+  end
+
+  # Engine for a synthesized attempt: the node envelope's engine when it is a
+  # known one, otherwise :codex.
+  defp attempt_engine(%Node{envelope: %{engine: engine}}) when engine in [:codex, :claude], do: engine
+  defp attempt_engine(_node), do: :codex
+
+  # The Attempt state for a harvested result is one of :succeeded | :failed;
+  # pick from the result.
+  # NOTE(review): only two-element `{:ok, _}` / `{:error, _}` results are
+  # accepted here and in `finish_outcome/1`; confirm `status/1` never reports
+  # a longer tuple (for example one that also carries a thread_id).
+  defp attempt_state_for({:ok, _}), do: :succeeded
+  defp attempt_state_for({:error, _}), do: :failed
+
+  # The outcome stored on the attempt: the :stranded marker, :ok for a
+  # success (the payload is dropped), or the error tuple unchanged.
+  defp finish_outcome(:stranded), do: :stranded
+  defp finish_outcome({:ok, _}), do: :ok
+  defp finish_outcome({:error, reason}), do: {:error, reason}
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/room_engine_client.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/room_engine_client.ex
new file mode 100644
index 000000000..adc193e20
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/room_engine_client.ex
@@ -0,0 +1,151 @@
+defmodule SymphonyElixir.Runtime.RoomEngineClient do
+  @moduledoc """
+  The production `Runtime.EngineClient`: it runs a node's attempt by
+  lowering the node to an engine turn and submitting it through
+  `Engine.Client` to the room-server. This is the WS-4 implementation of
+  the behaviour the IR runtime depends on; tests still inject an
+  in-process fake, so the runtime never requires a live room-server.
+
+  The runtime hands this module an `IR.Node` and per-attempt context
+  (`run_id`, `attempt`, and the resolved working directory and
+  room-server URL). The module turns the node's `envelope` and
+  `prompt_ref` into the `Engine.Client` turn shape, submits it, and maps
+  the room-server outcome back to the behaviour's `result()` triple
+  (carrying the engine's `thread_id` even on failure so the runtime can
+  record it for a later reattach probe).
+
+  ## Prompt resolution
+
+  A node's `prompt_ref` is either `{:inline, text}` or
+  `{:skill, ref, bindings}`. Both are rendered through
+  `SymphonyElixir.Prompt`: inline text passes through, and a skill ref is
+  rendered from the active pack's skill body interpolated with the
+  bindings the interpreter resolved. The skill-body resolver is injectable
+  through `run_opts[:skill_resolver]` for tests; production defaults to the
+  `Catalog`, which already expands shared `{{partial:_}}` includes when it
+  loads a skill. A skill that names an input the node never bound is a
+  render error, so a half-rendered prompt never reaches an engine.
+
+  ## status/1 and restart reattach
+
+  The synchronous `/api/agent/turns` path the room-server exposes today
+  runs the whole turn in one request and has no probe-by-thread route, so
+  `status/1` cannot ask the engine whether an orphaned thread is still
+  alive. It returns `:unknown`, the conservative answer: recovery strands
+  the node (or auto-retries only under the opt-in side-effect-free
+  policy). A real reattach probe needs a room-server status route and
+  lands with the streaming client.
+  """
+
+  @behaviour SymphonyElixir.Runtime.EngineClient
+
+  alias SymphonyElixir.{Catalog, Prompt}
+  alias SymphonyElixir.Engine.Client
+  alias SymphonyElixir.IR.Node
+
+  @impl true
+  def run_node(%Node{kind: :agent, envelope: envelope} = node, run_opts) when not is_nil(envelope) do
+    # Resolve everything that can fail locally first, so a bad prompt or a
+    # missing working directory never reaches the room-server.
+    with {:ok, body} <- resolve_prompt(node.prompt_ref, run_opts),
+         {:ok, cwd} <- fetch_cwd(run_opts) do
+      turn = engine_turn(node, body, cwd, run_opts)
+      outcome = Client.submit_turn(envelope, turn, client_opts(run_opts))
+      to_result(outcome)
+    else
+      {:error, reason} -> {:error, reason, nil}
+    end
+  end
+
+  # An :agent node without an envelope cannot be lowered to an engine turn.
+  def run_node(%Node{kind: :agent, id: id}, _run_opts) do
+    {:error, {:missing_envelope, id}, nil}
+  end
+
+  # Only :agent nodes go through the engine host. :exec/:subrun/:gate nodes
+  # have their own executors; one arriving here is a wiring bug, so fail
+  # loudly instead of submitting a meaningless engine turn.
+  def run_node(%Node{kind: kind, id: id}, _run_opts) do
+    {:error, {:not_an_agent_node, kind, id}, nil}
+  end
+
+  # The turn map handed to `Client.submit_turn/3`: the rendered prompt (with
+  # the trigger appended as an `<input>` block when present) plus the
+  # per-attempt context taken from `run_opts`.
+  defp engine_turn(%Node{id: node_id}, body, cwd, run_opts) do
+    %{
+      prompt: append_input_block(body, Map.get(run_opts, :trigger)),
+      cwd: cwd,
+      tools: Map.get(run_opts, :tools, []),
+      run_id: Map.get(run_opts, :run_id),
+      node_id: node_id
+    }
+  end
+
+  # The synchronous path has no probe-by-thread route (see the moduledoc),
+  # so every thread reports `:unknown`.
+  @impl true
+  def status(_thread_id), do: :unknown
+
+  # Render `prompt_ref` through `SymphonyElixir.Prompt`, passing the skill
+  # resolver chosen by `skill_resolver/1`: the one injected through
+  # `run_opts[:skill_resolver]` when present (tests pass a fake), otherwise
+  # the `Catalog`-backed default. No partial resolver is passed here.
+  defp resolve_prompt(prompt_ref, run_opts) do
+    resolver = skill_resolver(run_opts)
+    Prompt.build(prompt_ref, resolver: resolver)
+  end
+
+  # Append the run's trigger to the prompt as a pretty-printed JSON `<input>`
+  # block. `run_node/2` passes `run_opts[:trigger]`; when that is `nil` the
+  # prompt is returned untouched, so the skill body stays verbatim.
+  defp append_input_block(prompt, nil), do: prompt
+
+  defp append_input_block(prompt, trigger) do
+    payload = Jason.encode!(trigger, pretty: true)
+    prompt <> "\n\n<input>\n" <> payload <> "\n</input>\n"
+  end
+
+  # Use the injected one-argument resolver when `run_opts` carries one;
+  # anything else (absent, wrong arity, not a function) selects the
+  # `Catalog`-backed default.
+  defp skill_resolver(run_opts) do
+    injected = Map.get(run_opts, :skill_resolver)
+    if is_function(injected, 1), do: injected, else: &catalog_skill_body/1
+  end
+
+  # Default skill resolver: fetch the skill from `Catalog` and return its
+  # body, or tag a missing skill with the name that was asked for.
+  # NOTE(review): only `{:ok, skill}` and `{:error, :not_found}` are handled;
+  # any other return raises `CaseClauseError` - confirm against
+  # `Catalog.skill/1`.
+  defp catalog_skill_body(name) do
+    case Catalog.skill(name) do
+      {:ok, skill} -> {:ok, skill.body}
+      {:error, :not_found} -> {:error, {:skill_not_found, name}}
+    end
+  end
+
+  # The working directory must be a non-empty string; anything else is
+  # reported as `:missing_cwd`.
+  defp fetch_cwd(run_opts) do
+    cwd = Map.get(run_opts, :cwd)
+
+    if is_binary(cwd) and cwd != "" do
+      {:ok, cwd}
+    else
+      {:error, :missing_cwd}
+    end
+  end
+
+  # Build the keyword options for `Client.submit_turn/3` from the per-attempt
+  # context. Keys are emitted in a fixed order; `req_options` defaults to
+  # `[]`, every other key defaults to `nil`, and any key whose value ends up
+  # `nil` is left out so the client's own defaults apply.
+  defp client_opts(run_opts) do
+    Enum.flat_map(
+      [room_server_url: nil, req_options: [], timeout_ms: nil, run_id: nil, placement: nil],
+      fn {key, default} ->
+        case Map.get(run_opts, key, default) do
+          nil -> []
+          value -> [{key, value}]
+        end
+      end
+    )
+  end
+
+  # Map the `Client.submit_turn/3` outcome onto the behaviour's result
+  # triple. A success carries its `thread_id` in the third slot; the two
+  # error shapes that embed a thread id (`:turn_error`, `:turn_cancelled`)
+  # keep it there too; every other error reports `nil`.
+  defp to_result({:ok, %{thread_id: thread_id} = output}), do: {:ok, output, thread_id}
+  defp to_result({:error, {:turn_error, _msg, thread_id} = reason}), do: {:error, reason, thread_id}
+  defp to_result({:error, {:turn_cancelled, thread_id} = reason}), do: {:error, reason, thread_id}
+  defp to_result({:error, reason}), do: {:error, reason, nil}
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/runtime_registry.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/runtime_registry.ex
new file mode 100644
index 000000000..9749712b8
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/runtime_registry.ex
@@ -0,0 +1,167 @@
+defmodule SymphonyElixir.Runtime.RuntimeRegistry do
+  @moduledoc """
+  Registry of connected runtime workers, held on the control plane.
+
+  A runtime worker (a `Runtime.WorkerClient` running on another host) opens a
+  channel to the control plane and registers here, advertising the address the
+  engine wire can reach its per-run room-servers at, the labels it carries, and
+  its capacity. `Runtime.Placement` selects a worker from here when a run falls
+  back to the `:remote` placement.
+
+  Entries live in a `:public` ETS table keyed by `worker_id`, so a selection is
+  a direct read off the runtime path with no GenServer round-trip. The owning
+  GenServer monitors each worker's channel process and drops its entry when that
+  process goes down, so a disconnected or crashed worker is never selected.
+  """
+
+  use GenServer
+
+  require Logger
+
+  @table :symphony_runtime_workers
+
+  @typedoc """
+  A registered runtime worker. `pid` is the worker's channel process on the
+  control plane (monitored for liveness); `address` is the host the worker
+  binds its per-run room-servers to, which the engine wire targets.
+  """
+  @type worker :: %{
+          worker_id: String.t(),
+          pid: pid(),
+          address: String.t(),
+          labels: [String.t()],
+          capacity: non_neg_integer(),
+          registered_at: integer()
+        }
+
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []) do
+    GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+  end
+
+  @impl true
+  def init(_opts) do
+    :ets.new(@table, [:named_table, :public, :set, read_concurrency: true])
+    {:ok, %{monitors: %{}}}
+  end
+
+  @doc """
+  Register (or refresh) a worker. The given `pid` (the worker's channel
+  process) is monitored; when it goes down the entry is dropped. Re-registering
+  the same `worker_id` replaces the prior entry.
+  """
+  @spec register(%{
+          required(:worker_id) => String.t(),
+          required(:pid) => pid(),
+          required(:address) => String.t(),
+          optional(:labels) => [String.t()],
+          optional(:capacity) => non_neg_integer()
+        }) :: :ok
+  def register(%{worker_id: worker_id, pid: pid, address: address} = worker)
+      when is_binary(worker_id) and is_pid(pid) and is_binary(address) do
+    GenServer.call(__MODULE__, {:register, normalize(worker)})
+  end
+
+  @doc "Drop a worker by id. Idempotent."
+  @spec unregister(String.t()) :: :ok
+  def unregister(worker_id) when is_binary(worker_id) do
+    GenServer.call(__MODULE__, {:unregister, worker_id})
+  end
+
+  @doc "Look up a worker by id, or `:error` if it is not (or no longer) registered."
+  @spec get(String.t()) :: {:ok, worker()} | :error
+  def get(worker_id) when is_binary(worker_id) do
+    # A missing table (registry not started) and a missing row both read as
+    # "not registered".
+    with tid when tid != :undefined <- :ets.whereis(@table),
+         [{^worker_id, worker}] <- :ets.lookup(@table, worker_id) do
+      {:ok, worker}
+    else
+      _ -> :error
+    end
+  end
+
+  @doc "All currently registered workers."
+  @spec list() :: [worker()]
+  def list do
+    # Without a table (registry not started) there is nothing to list.
+    if :ets.whereis(@table) == :undefined do
+      []
+    else
+      for {_id, worker} <- :ets.tab2list(@table), do: worker
+    end
+  end
+
+  @doc """
+  Pick one registered worker. With a `label`, only workers whose `labels`
+  include it are candidates; with `nil`, every registered worker is. Among
+  the candidates the one with the smallest `registered_at` wins, which keeps
+  the choice stable. Returns `{:ok, worker}` or `{:error, :no_worker}`.
+  Capacity is not consulted; capacity-aware scheduling is a later refinement.
+  """
+  @spec select(String.t() | nil) :: {:ok, worker()} | {:error, :no_worker}
+  def select(label \\ nil) do
+    candidates = for worker <- list(), is_nil(label) or label in worker.labels, do: worker
+
+    if candidates == [] do
+      {:error, :no_worker}
+    else
+      {:ok, Enum.min_by(candidates, fn worker -> worker.registered_at end)}
+    end
+  end
+
+  # Server side of `register/1` and `unregister/1`. All ETS writes and all
+  # monitor bookkeeping happen here, inside the owning process.
+  @impl true
+  def handle_call({:register, worker}, _from, state) do
+    # Monitor the new channel process first: its ref is not in
+    # `state.monitors` yet, so the stale-monitor sweep below cannot drop it.
+    ref = Process.monitor(worker.pid)
+    :ets.insert(@table, {worker.worker_id, worker})
+
+    # Drop any stale monitor for a prior connection of the same worker id.
+    state = drop_monitor_for(state, worker.worker_id)
+    Logger.info("RuntimeRegistry: registered worker=#{worker.worker_id} address=#{worker.address} labels=#{inspect(worker.labels)}")
+    {:reply, :ok, put_in(state.monitors[ref], worker.worker_id)}
+  end
+
+  # Remove the row and every monitor recorded for this worker id; deleting an
+  # absent row is a no-op, which keeps the call idempotent.
+  def handle_call({:unregister, worker_id}, _from, state) do
+    :ets.delete(@table, worker_id)
+    Logger.info("RuntimeRegistry: unregistered worker=#{worker_id}")
+    {:reply, :ok, drop_monitor_for(state, worker_id)}
+  end
+
+  # A monitored channel process went down: drop the worker it registered so
+  # it can no longer be selected. A ref that is not tracked (already swept
+  # by a re-register or unregister) is ignored.
+  @impl true
+  def handle_info({:DOWN, ref, :process, _pid, _reason}, state) do
+    case Map.pop(state.monitors, ref) do
+      {nil, _monitors} ->
+        {:noreply, state}
+
+      {worker_id, monitors} ->
+        :ets.delete(@table, worker_id)
+        Logger.info("RuntimeRegistry: worker=#{worker_id} disconnected; dropped")
+        {:noreply, %{state | monitors: monitors}}
+    end
+  end
+
+  # Defining `handle_info/2` replaces the GenServer default, so without this
+  # clause any stray message would raise `FunctionClauseError`, crash the
+  # registry, and take the ETS table (every registered worker) down with it.
+  # Log and keep serving instead.
+  def handle_info(message, state) do
+    Logger.warning("RuntimeRegistry: ignoring unexpected message #{inspect(message)}")
+    {:noreply, state}
+  end
+
+  # Forget every monitor recorded for `worker_id`: demonitor each one (with
+  # `:flush`, so a `:DOWN` already in the mailbox is discarded) and keep the
+  # rest of the ref-to-worker map as it was.
+  defp drop_monitor_for(state, worker_id) do
+    {stale, kept} = Enum.split_with(state.monitors, fn {_ref, id} -> id == worker_id end)
+    Enum.each(stale, fn {ref, _id} -> Process.demonitor(ref, [:flush]) end)
+    %{state | monitors: Map.new(kept)}
+  end
+
+  # Shape a registration request into the stored worker map: the optional
+  # `labels` and `capacity` default to `[]` and `0`, and `registered_at` is
+  # stamped from the monotonic clock in milliseconds.
+  defp normalize(worker) do
+    optional = Map.merge(%{labels: [], capacity: 0}, Map.take(worker, [:labels, :capacity]))
+
+    Map.merge(optional, %{
+      worker_id: worker.worker_id,
+      pid: worker.pid,
+      address: worker.address,
+      registered_at: System.monotonic_time(:millisecond)
+    })
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/subrun_runner.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/subrun_runner.ex
new file mode 100644
index 000000000..1bbc9e9ca
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/subrun_runner.ex
@@ -0,0 +1,267 @@
+defmodule SymphonyElixir.Runtime.SubrunRunner do
+  @moduledoc """
+  Executor for `:subrun` IR nodes: a first-class nested run. This is the
+  IR-era replacement for the `{:error, {:subrun_unsupported, id}, nil}`
+  stub the runtime carried while the rest of the substrate landed.
+
+  A subrun node names a child workflow (`subrun "child.sym"`) and optional
+  extra inputs. The runner resolves the child against `WorkflowCatalog`,
+  starts it through `Runtime.Ingress.start_workflow/3` under the same
+  supervisor, waits for the child to settle, and maps the child's terminal
+  `RunGraph.status` back to the one result triple every node kind returns
+  (`{:ok, output, nil}` / `{:error, reason, nil}`). A subrun has no engine
+  thread of its own, so `thread_id` is always `nil`.
+
+  ## Guarding recursion
+
+  Two distinct guards keep a `subrun` from spawning an unbounded tree:
+
+  - A cycle guard rejects a child whose workflow name is already on the
+    ancestor chain (`{:subrun_cycle, name, chain}`). This catches direct
+    self-subruns and any loop back to a workflow already running above.
+  - A depth ceiling rejects a chain longer than `Config.subrun_max_depth`
+    (`{:subrun_depth_exceeded, depth, ceiling}`). This is the backstop the
+    cycle guard cannot provide: two workflows that call each other through
+    a third, or any mutually recursive set with no repeated name on a
+    single branch, would otherwise recurse forever.
+
+  Both the depth and the ancestor chain are threaded down through
+  `run_opts`; the parent runtime carries its own depth and chain in process
+  state and stamps the child's onto the start opts, so a child run knows
+  exactly how deep it sits and which workflows are open above it.
+
+  ## Why monitor instead of message
+
+  The child run is a supervised `Runtime` GenServer. A succeeded or
+  cancelled run stops its process; a failed run stays alive and idle so the
+  operator surface can reach it. The runner monitors the child pid and, on
+  the `:DOWN` (or immediately for a run that started already-failed), reads
+  the durable terminal graph from `IR.Store` rather than trusting an
+  in-memory snapshot, so the mapped result reflects the persisted truth.
+  """
+
+  require Logger
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.IR.{Node, RunGraph, Store}
+  alias SymphonyElixir.Runtime
+  alias SymphonyElixir.WorkflowCatalog
+
+  @type result :: {:ok, map(), nil} | {:error, term(), nil}
+
+  # Upper bound on how long a parent waits for a child run to settle. A child
+  # whose process never stops would otherwise block the parent's task
+  # forever; past this ceiling the subrun resolves to
+  # `{:subrun_timeout, run_id}`. The ceiling is generous: a real child run is
+  # bounded by its own node executors' timeouts, not this value.
+  @child_wait_ms 24 * 60 * 60 * 1_000
+
+  @doc """
+  Run a `:subrun` node. The steps, in order: resolve the child workflow
+  name, check the depth ceiling, check the ancestor chain for a cycle, look
+  the workflow up in `WorkflowCatalog`, then start the child and wait for its
+  result. The first step that returns `{:error, reason}` short-circuits to
+  `{:error, reason, nil}`, so no child is started for a rejected subrun.
+  """
+  @spec run(Node.t(), map()) :: result()
+  def run(%Node{kind: :subrun, inputs: inputs} = node, run_opts) when is_map(run_opts) do
+    with {:ok, name} <- fetch_child_name(node, run_opts),
+         :ok <- check_depth(run_opts),
+         :ok <- check_cycle(name, run_opts),
+         {:ok, entry} <- resolve_workflow(name) do
+      start_and_await(entry, name, inputs, run_opts)
+    else
+      {:error, reason} -> {:error, reason, nil}
+    end
+  end
+
+  # Find the child workflow name on the node's `source` input. A string
+  # under `run_opts[:resolved_inputs]["source"]` wins; otherwise the node's
+  # own `{:literal, name}` source is used. The name is trimmed and a trailing
+  # `.sym` is removed, since the catalog keys workflows by basename without
+  # the extension. A missing or empty name is `{:subrun_missing_source, id}`.
+  defp fetch_child_name(%Node{inputs: inputs, id: id}, run_opts) do
+    dynamic = run_opts |> Map.get(:resolved_inputs, %{}) |> Map.get("source")
+    raw = if is_binary(dynamic), do: dynamic, else: literal_source(inputs)
+    name = normalize_name(raw)
+
+    if is_binary(name) and name != "" do
+      {:ok, name}
+    else
+      {:error, {:subrun_missing_source, id}}
+    end
+  end
+
+  # The statically written source: the string inside a `{:literal, _}` under
+  # the "source" key, or `nil` for any other shape.
+  defp literal_source(inputs) do
+    with {:literal, value} when is_binary(value) <- Map.get(inputs, "source") do
+      value
+    else
+      _ -> nil
+    end
+  end
+
+  # Trim surrounding whitespace and strip one trailing ".sym"; anything that
+  # is not a string normalizes to `nil`.
+  defp normalize_name(value) do
+    if is_binary(value) do
+      String.replace_suffix(String.trim(value), ".sym", "")
+    end
+  end
+
+  # The child would sit one level below the parent; refuse it when that
+  # level is past the ceiling. This runs before anything is started, so an
+  # over-deep chain never allocates a run id or touches the store.
+  defp check_depth(run_opts) do
+    child_depth = current_depth(run_opts) + 1
+    ceiling = subrun_ceiling()
+
+    if child_depth <= ceiling do
+      :ok
+    else
+      {:error, {:subrun_depth_exceeded, child_depth, ceiling}}
+    end
+  end
+
+  # Refuse a child whose name is already on the ancestor chain carried in
+  # `run_opts`; starting it would loop back into a workflow that is still
+  # open above this run.
+  defp check_cycle(name, run_opts) do
+    chain = ancestors(run_opts)
+
+    case Enum.member?(chain, name) do
+      true -> {:error, {:subrun_cycle, name, chain}}
+      false -> :ok
+    end
+  end
+
+  # Look the child up in `WorkflowCatalog`; a miss is tagged with the name
+  # that was requested.
+  defp resolve_workflow(name) do
+    lookup = WorkflowCatalog.workflow(name)
+
+    case lookup do
+      {:error, :not_found} -> {:error, {:subrun_workflow_not_found, name}}
+      {:ok, _entry} = found -> found
+    end
+  end
+
+  # Start the child through `Runtime.Ingress.start_workflow/3` with its
+  # trigger context and start opts, then wait for it. A start failure is
+  # wrapped as `{:subrun_start_failed, name, reason}`.
+  defp start_and_await(entry, name, inputs, run_opts) do
+    started =
+      Runtime.Ingress.start_workflow(
+        entry,
+        trigger_context(inputs, run_opts),
+        child_opts(name, run_opts)
+      )
+
+    case started do
+      {:error, reason} -> {:error, {:subrun_start_failed, name, reason}, nil}
+      {:ok, %{run_id: run_id, pid: pid}} -> await_child(run_id, pid, run_opts)
+    end
+  end
+
+  # Build the child's trigger context from the node's extra bindings.
+  # Literal inputs form the base and `run_opts[:resolved_inputs]` is merged
+  # over them, so a resolved value wins over a literal with the same key.
+  # `source` selects the workflow and is not run input, so it is removed from
+  # both sides. An empty result is `nil` rather than an empty map.
+  defp trigger_context(inputs, run_opts) do
+    overrides = run_opts |> Map.get(:resolved_inputs, %{}) |> Map.delete("source")
+
+    base =
+      inputs
+      |> Enum.flat_map(fn
+        {key, {:literal, value}} when key != "source" -> [{key, value}]
+        _other -> []
+      end)
+      |> Map.new()
+
+    merged = Map.merge(base, overrides)
+    if map_size(merged) == 0, do: nil, else: merged
+  end
+
+  # Start opts for the child run. `:engine` and `:store_opts` are copied from
+  # the parent's `run_opts` when present, so the child uses the same engine
+  # and store dir (the latter keeps its terminal graph readable from here).
+  # The child's depth and its ancestor chain, with its own name at the head,
+  # are always set so its own subruns are guarded.
+  defp child_opts(name, run_opts) do
+    inherited =
+      Enum.reduce([:engine, :store_opts], [], fn key, acc ->
+        put_if_present(acc, key, Map.get(run_opts, key))
+      end)
+
+    guards = [
+      subrun_ancestors: [name | ancestors(run_opts)],
+      subrun_depth: current_depth(run_opts) + 1
+    ]
+
+    guards ++ inherited
+  end
+
+  # `Keyword.put/3` that leaves `opts` alone when the value is `nil`.
+  defp put_if_present(opts, key, value) do
+    if is_nil(value), do: opts, else: Keyword.put(opts, key, value)
+  end
+
+  # Wait for the child run to settle and map its durable graph to a result.
+  #
+  # A child whose process stops is picked up through the monitor's :DOWN. A
+  # failed run keeps its process alive, so it never sends one; waiting on
+  # :DOWN alone would hold the parent for the whole `@child_wait_ms`
+  # ceiling. Between :DOWN checks the store is therefore polled, and a
+  # persisted `:failed` graph resolves the subrun right away. The poll
+  # interval defaults to one second; a positive integer under
+  # `run_opts[:subrun_poll_ms]` overrides it.
+  defp await_child(run_id, pid, run_opts) do
+    ref = Process.monitor(pid)
+    deadline = System.monotonic_time(:millisecond) + @child_wait_ms
+    await_child_loop(run_id, pid, ref, deadline, run_opts)
+  end
+
+  # One wait slice: block for :DOWN up to the poll interval (never past the
+  # deadline), then check the store for a failed child before looping.
+  defp await_child_loop(run_id, pid, ref, deadline, run_opts) do
+    remaining = max(deadline - System.monotonic_time(:millisecond), 0)
+
+    receive do
+      {:DOWN, ^ref, :process, ^pid, _reason} -> finalize(run_id, run_opts)
+    after
+      min(remaining, child_poll_ms(run_opts)) ->
+        case failed_child_graph(run_id, run_opts) do
+          {:ok, graph} ->
+            Process.demonitor(ref, [:flush])
+            map_terminal(graph)
+
+          :none ->
+            if System.monotonic_time(:millisecond) >= deadline do
+              Process.demonitor(ref, [:flush])
+              # A child that outlives the ceiling is itself a runaway;
+              # surface it rather than block the parent's task forever.
+              {:error, {:subrun_timeout, run_id}, nil}
+            else
+              await_child_loop(run_id, pid, ref, deadline, run_opts)
+            end
+        end
+    end
+  end
+
+  # The child's persisted graph, but only when it is `:failed`. Load errors
+  # and every other status mean "keep waiting".
+  defp failed_child_graph(run_id, run_opts) do
+    case Store.load(run_id, Map.get(run_opts, :store_opts, [])) do
+      {:ok, %RunGraph{status: :failed} = graph} -> {:ok, graph}
+      _ -> :none
+    end
+  end
+
+  defp child_poll_ms(run_opts) do
+    case Map.get(run_opts, :subrun_poll_ms) do
+      ms when is_integer(ms) and ms > 0 -> ms
+      _ -> 1_000
+    end
+  end
+
+  # Read the child's durable graph from the store and map its status to the
+  # node result. The store, not an in-memory snapshot, is the source of
+  # truth; a load failure surfaces as `:subrun_result_unavailable`.
+  defp finalize(run_id, run_opts) do
+    loaded = Store.load(run_id, Map.get(run_opts, :store_opts, []))
+
+    case loaded do
+      {:error, reason} -> {:error, {:subrun_result_unavailable, run_id, reason}, nil}
+      {:ok, %RunGraph{} = graph} -> map_terminal(graph)
+    end
+  end
+
+  # Map the child graph's status to the node result: `:succeeded` yields the
+  # compact child output, `:failed` and `:cancelled` become `:subrun_failed`,
+  # and any other status is `:subrun_unresolved`. That last case means the
+  # child stopped without resolving, so it is treated as a failure rather
+  # than a silent success.
+  defp map_terminal(%RunGraph{status: status, run_id: run_id} = graph) do
+    cond do
+      status == :succeeded -> {:ok, child_output(graph), nil}
+      status in [:failed, :cancelled] -> {:error, {:subrun_failed, run_id, status}, nil}
+      true -> {:error, {:subrun_unresolved, run_id, status}, nil}
+    end
+  end
+
+  # The compact result a downstream parent node reads: the child's run id,
+  # its status, and the outputs its nodes produced. The full child graph
+  # stays in the child's own run record.
+  defp child_output(%RunGraph{run_id: run_id, status: status} = graph) do
+    outputs = node_outputs(graph)
+    %{kind: :subrun, run_id: run_id, status: status, outputs: outputs}
+  end
+
+  # Node id => output for every node that produced one; nodes whose output
+  # is `nil` are left out.
+  defp node_outputs(%RunGraph{nodes: nodes}) do
+    nodes
+    |> Enum.flat_map(fn
+      {id, %Node{output: output}} when not is_nil(output) -> [{id, output}]
+      _other -> []
+    end)
+    |> Map.new()
+  end
+
+  # This run's subrun depth from `run_opts`; anything that is not a
+  # non-negative integer counts as depth 0.
+  defp current_depth(run_opts) do
+    depth = Map.get(run_opts, :subrun_depth)
+    if is_integer(depth) and depth >= 0, do: depth, else: 0
+  end
+
+  # The ancestor chain carried in `run_opts`; anything that is not a list
+  # counts as an empty chain.
+  defp ancestors(run_opts) do
+    chain = Map.get(run_opts, :subrun_ancestors)
+    if is_list(chain), do: chain, else: []
+  end
+
+  # The configured depth ceiling, falling back to a conservative 8 whenever a
+  # usable value cannot be read.
+  #
+  # The value must be a non-negative integer. A `nil` or otherwise
+  # non-integer setting would silently disable the guard: in term ordering
+  # every number sorts below every atom, so `depth + 1 > nil` is always
+  # false. Such a value takes the fallback instead.
+  #
+  # `rescue` covers a raised error (for example a missing key); the `catch`
+  # covers the exit a call to a stopped process produces, which `rescue` does
+  # not intercept. Some unit tests start the runner without the full app tree.
+  defp subrun_ceiling do
+    case Config.get().subrun_max_depth do
+      ceiling when is_integer(ceiling) and ceiling >= 0 -> ceiling
+      _ -> 8
+    end
+  rescue
+    _ -> 8
+  catch
+    :exit, _ -> 8
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/supervisor.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/supervisor.ex
new file mode 100644
index 000000000..adbdaac0c
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/supervisor.ex
@@ -0,0 +1,88 @@
+defmodule SymphonyElixir.Runtime.Supervisor do
+  @moduledoc """
+  Dynamic supervisor for the per-run `Runtime` GenServers. Each active
+  `RunGraph` runs as one child here, so a crashing run kills only that
+  run, not the orchestrator.
+
+  The supervisor owns two operations the orchestrator needs:
+
+  - `start_run/2` schedules a fresh `RunGraph` (already materialized by
+    `IR.Materializer`) under supervision.
+  - `resume_pending/1` reloads non-terminal runs from `IR.Store` on boot
+    and restarts each with `recover: true`, so the runtime reconciles
+    orphaned `:running` nodes (the BEAM-restart half of #90) before
+    resuming. A run already live is left alone.
+
+  The engine client is injected, defaulting to `Runtime.RoomEngineClient`
+  for production. Tests pass a fake to avoid a live room-server.
+  """
+
+  use DynamicSupervisor
+  require Logger
+
+  alias SymphonyElixir.IR.{RunGraph, Store}
+  alias SymphonyElixir.Runtime
+  alias SymphonyElixir.Runtime.Placement
+
+  @default_engine SymphonyElixir.Runtime.RoomEngineClient
+
+  @spec start_link(keyword()) :: Supervisor.on_start()
+  def start_link(opts \\ []) do
+    DynamicSupervisor.start_link(__MODULE__, opts, name: __MODULE__)
+  end
+
+  @impl true
+  def init(_opts) do
+    DynamicSupervisor.init(strategy: :one_for_one)
+  end
+
+  @doc """
+  Start a run under supervision. `opts` are forwarded to `Runtime`
+  (`:engine`, `:store_opts`, `:recover`); `:engine` defaults to the
+  production room-server client.
+  """
+  @spec start_run(RunGraph.t(), keyword()) :: DynamicSupervisor.on_start_child()
+  def start_run(%RunGraph{} = graph, opts \\ []) do
+    DynamicSupervisor.start_child(__MODULE__, {Runtime, {graph, with_default_engine(opts)}})
+  end
+
+  @doc """
+  Reload every non-terminal run from `IR.Store` and resume it with
+  `recover: true`. Idempotent: a run with a live runtime (already
+  registered) is skipped. Called once at boot.
+  """
+  @spec resume_pending(keyword()) :: :ok
+  def resume_pending(opts \\ []) do
+    store_opts = Keyword.get(opts, :store_opts, [])
+    graphs = Store.load_all(store_opts)
+
+    # Reap room-server units orphaned by a prior restart and re-attach the
+    # ones whose run we are about to resume, before resuming. The placement
+    # registry is in-memory, so without this a resumed run would collide on
+    # its deterministic unit name and every terminal run's pre-restart unit
+    # would linger. Share the loaded set so the store is read once.
+    placement(opts).reconcile(graphs, opts)
+
+    graphs
+    |> Enum.filter(&resumable?/1)
+    |> Enum.each(fn graph -> resume_one(graph, opts) end)
+  end
+
+  # Restart one stored run with `recover: true`. A run that is already live
+  # counts as success; any other start failure is logged and skipped.
+  defp resume_one(%RunGraph{run_id: run_id} = graph, opts) do
+    resume_opts = with_default_engine(Keyword.put(opts, :recover, true))
+    outcome = start_run(graph, resume_opts)
+
+    case outcome do
+      {:error, {:already_started, _pid}} -> :ok
+      {:error, reason} -> Logger.warning("Failed to resume IR run #{run_id}: #{inspect(reason)}")
+      {:ok, _pid} -> :ok
+    end
+  end
+
+  # Only runs that have not reached a terminal status are resumed.
+  defp resumable?(%RunGraph{status: status}), do: status == :pending or status == :running
+
+  defp with_default_engine(opts), do: Keyword.put_new(opts, :engine, @default_engine)
+
+  # The placement module, overridable in tests with a stub so resume can be
+  # exercised without a real systemd host. Defaults to the real registry.
+  defp placement(opts), do: Keyword.get(opts, :placement, Placement)
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/trigger.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/trigger.ex
new file mode 100644
index 000000000..311174422
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/trigger.ex
@@ -0,0 +1,84 @@
+defmodule SymphonyElixir.Runtime.Trigger do
+  @moduledoc """
+  The one matcher every producer shares to resolve an inbound trigger event
+  to the `.sym` workflows that declared interest in it.
+
+  A producer (cron, a webhook, the operator dashboard) builds a trigger
+  event map carrying `kind:` plus the kind's selector fields (a Slack
+  channel, a GitHub `repo`/`label`, a Linear `label`, a cron `schedule`),
+  then hands it to `Runtime.Ingress.start_by_trigger/2`. That ingress asks
+  `WorkflowCatalog.for_trigger_kind/1` for the candidates of that kind and
+  keeps the ones `matches?/2` accepts.
+
+  Keeping this predicate in one place is the point of the cutover: every
+  producer used to re-implement its own `Catalog.dags() |> Enum.filter`
+  match against the declared trigger. Now the selector vocabulary lives
+  here, the producer carries only its event-shaped extraction and dedup,
+  and a new selector field is one clause here rather than a new filter in
+  each producer.
+
+  The declared trigger is the workflow's `on` clause as the DSL parser
+  normalizes it (`parser.ex` lifts it onto the AST and the catalog copies
+  it to `entry.trigger`). The event is the runtime trigger map the producer
+  builds; it stays the value stamped onto `RunGraph.trigger`, so a node can
+  read its scope from `<input>`.
+  """
+
+  @typedoc "A workflow's declared `on` trigger, normalized by the parser."
+  @type declared :: map() | nil
+
+  @typedoc "A producer's inbound trigger event."
+  @type event :: map()
+
+  @doc """
+  Does `declared` (a workflow's `on` clause) select the inbound `event`?
+
+  The kinds already agree (the ingress filters by `kind` first), so this
+  only compares the kind's selector fields:
+
+  - `:cron` matches when the declared `schedule` equals the event's
+    `schedule`. A cron tick fires one workflow at a time, so the producer
+    echoes the schedule it resolved and this re-selects exactly it.
+  - `:linear` matches when the declared `label` is present on the event.
+    The event carries the inbound issue's labels under `:labels`; a single
+    matched label is enough.
+  - `:github_pr_label` matches when both `repo` and `label` equal the
+    event's.
+  - `:slack_huddle_completed` and `:slack_app_mention` match when the
+    declared `channel` equals the event's `channel` (a producer that
+    resolves a channel name to an id stamps both so either compares equal).
+  - `:manual` always matches its kind; an operator-started run names the
+    workflow directly and never reaches this matcher.
+
+  An event missing a selector the declared trigger requires does not match,
+  so a malformed event fires nothing rather than fanning out to every
+  workflow of that kind.
+  """
+  @spec matches?(declared(), event()) :: boolean()
+  def matches?(declared, event) do
+    # One branch per declared kind, checked top to bottom; a pair that fits
+    # no branch (unknown kind, or an event missing a required selector)
+    # does not match.
+    case {declared, event} do
+      {%{kind: :cron, schedule: schedule}, %{schedule: event_schedule}} ->
+        schedule == event_schedule
+
+      {%{kind: :linear, label: label}, %{labels: labels}} when is_list(labels) ->
+        label in labels
+
+      {%{kind: :github_pr_label, repo: repo, label: label}, _event} ->
+        event[:repo] == repo and event[:label] == label
+
+      {%{kind: kind, channel: channel}, _event}
+      when kind in [:slack_huddle_completed, :slack_app_mention] ->
+        channel_matches?(channel, event)
+
+      {%{kind: :manual}, _event} ->
+        true
+
+      _no_match ->
+        false
+    end
+  end
+
+  # The declared channel matches when it equals either the event's `channel`
+  # or its `channel_id`. Checking both keeps this matcher independent of
+  # whether the producer worked in channel names or channel ids.
+  defp channel_matches?(channel, event) do
+    by_name = event[:channel]
+    by_id = event[:channel_id]
+    by_name == channel or by_id == channel
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/worker_client.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/worker_client.ex
new file mode 100644
index 000000000..db9748409
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/worker_client.ex
@@ -0,0 +1,196 @@
+defmodule SymphonyElixir.Runtime.WorkerClient do
+  @moduledoc """
+  Runtime-worker side of the channel: dials the control plane and serves
+  provision/teardown by running `Runtime.HostRuntime` on this host.
+
+  Booted only in the `:worker` role. On connect it joins `worker:lobby` with its
+  reachable address and labels (carried as URI query params, which the control
+  plane's `WorkerSocket.connect/3` reads). The control plane then pushes
+  `provision`/`teardown`; each runs in a supervised Task so a minutes-long clone
+  or room-server start never blocks the socket's heartbeat, and the result is
+  pushed back tagged with the request's `wire_id`.
+
+  The worker holds no secrets: the run's env arrives in the `provision` payload,
+  already resolved by the control plane, and is handed straight to HostRuntime.
+  """
+
+  use Slipstream
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.RepositoryCatalog
+  alias SymphonyElixir.Runtime.HostRuntime
+
+  require Logger
+
+  @topic "worker:lobby"
+
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []) do
+    config = Keyword.get(opts, :config) || Config.get()
+    Slipstream.start_link(__MODULE__, config, name: __MODULE__)
+  end
+
+  @impl Slipstream
+  def init(config) do
+    socket =
+      new_socket()
+      |> assign(:config, config)
+      |> assign(:handles, %{})
+
+    {:ok, connect!(socket, connect_opts(config))}
+  end
+
+  @impl Slipstream
+  def handle_connect(socket) do
+    {:ok, join(socket, @topic)}
+  end
+
+  @impl Slipstream
+  def handle_join(@topic, _response, socket) do
+    Logger.info("WorkerClient: joined #{@topic} as #{socket.assigns.config.worker.worker_id}")
+    {:ok, socket}
+  end
+
+  @impl Slipstream
+  def handle_disconnect(_reason, socket) do
+    # Ask Slipstream to reconnect; stop this client only when it refuses.
+    with {:error, why} <- reconnect(socket) do
+      {:stop, why, socket}
+    end
+  end
+
+  # Control-plane pushes: the host work runs in a supervised Task so the socket
+  # stays responsive; the Task's result message is pushed back by handle_info/2.
+  @impl Slipstream
+  def handle_message(@topic, "provision", payload, socket) do
+    %{"wire_id" => wire_id, "run_id" => run_id} = payload
+    config = with_bot_identity(socket.assigns.config, payload)
+    env = wire_env(Map.get(payload, "env", %{}))
+    token = Map.get(payload, "bot_token")
+    repositories = wire_repositories(Map.get(payload, "repositories", []))
+    client = self()
+    # `client` is captured here: inside the Task, self() would be the Task itself.
+    run_async(fn ->
+      result =
+        HostRuntime.provision(run_id,
+          config: config,
+          room_host: config.worker.worker_room_host,
+          env: env,
+          bot_token: token,
+          repositories: repositories
+        )
+
+      send(client, {:provision_done, wire_id, run_id, result})
+    end)
+
+    {:ok, socket}
+  end
+  # Teardown drops the run's handle from state up front; an unknown run_id is still acked.
+  def handle_message(@topic, "teardown", payload, socket) do
+    %{"wire_id" => wire_id, "run_id" => run_id} = payload
+    config = socket.assigns.config
+    {handle, handles} = Map.pop(socket.assigns.handles, run_id)
+    client = self()
+
+    run_async(fn ->
+      if handle, do: HostRuntime.teardown(handle, config: config)
+      send(client, {:teardown_done, wire_id})
+    end)
+
+    {:ok, assign(socket, :handles, handles)}
+  end
+  # Pushes on any other topic or event are ignored.
+  def handle_message(_topic, _event, _payload, socket), do: {:ok, socket}
+
+  @impl Slipstream
+  def handle_info({:provision_done, wire_id, run_id, {:ok, handle}}, socket) do
+    push(socket, @topic, "provision_result", %{
+      wire_id: wire_id,
+      ok: true,
+      base_url: handle.base_url,
+      primary_workspace: handle.primary_workspace
+    })
+    # Remember the handle so a later "teardown" for this run_id can find it.
+    {:noreply, assign(socket, :handles, Map.put(socket.assigns.handles, run_id, handle))}
+  end
+  # A failed provision reports the reason as an inspected string and stores no handle.
+  def handle_info({:provision_done, wire_id, _run_id, {:error, reason}}, socket) do
+    push(socket, @topic, "provision_result", %{wire_id: wire_id, ok: false, error: inspect(reason)})
+    {:noreply, socket}
+  end
+  # Teardown completion is always reported as ok: true.
+  def handle_info({:teardown_done, wire_id}, socket) do
+    push(socket, @topic, "teardown_result", %{wire_id: wire_id, ok: true})
+    {:noreply, socket}
+  end
+
+  defp run_async(fun) do
+    Task.Supervisor.start_child(SymphonyElixir.TaskSupervisor, fun)
+  end
+
+  # A worker carries no bot config of its own; the control plane owns the bot
+  # identity (it mints the matching App token). Overlay the dispatched
+  # user.name/user.email on this run's config so the clone is stamped with the
+  # bot identity. Without it the checkout keeps the worker host's personal git
+  # identity and the babysit skill's identity guard refuses to push. Fields an
+  # older control plane omits (or sends blank) leave the worker config as-is.
+  defp with_bot_identity(config, payload) do
+    username = present(Map.get(payload, "bot_username")) || config.github_app_bot_username
+    email = present(Map.get(payload, "bot_email")) || config.github_app_bot_email
+
+    # Update syntax (not Map.put) so a config lacking these keys still raises.
+    %{config | github_app_bot_username: username, github_app_bot_email: email}
+  end
+
+  defp present(value) when is_binary(value) and value != "", do: value
+  defp present(_), do: nil
+
+  # env crosses the wire as a JSON object; HostRuntime wants a list of
+  # {name, value} pairs.
+  defp wire_env(env) when is_map(env), do: Enum.map(env, fn {key, value} -> {to_string(key), to_string(value)} end)
+
+  # The run's repository catalog arrives over the channel from the control
+  # plane (the worker holds no pack of its own), so the clone targets the run's
+  # real repos instead of the worker's default pack. An empty list, as sent by
+  # an older control plane without the catalog, becomes nil so that
+  # `HostRuntime`/`Provision` fall back to the worker's local config.
+  defp wire_repositories([]), do: nil
+
+  defp wire_repositories(repositories) when is_list(repositories) do
+    # Non-empty catalog: decode each wire map into a RepositoryCatalog struct.
+    Enum.map(repositories, &wire_repository/1)
+  end
+
+  defp wire_repository(%{"name" => name, "owner_repo" => owner_repo, "default_branch" => default_branch} = repo) do
+    %RepositoryCatalog{
+      name: name,
+      owner_repo: owner_repo,
+      default_branch: default_branch,
+      primary?: Map.get(repo, "primary", false) == true
+    }
+  end
+
+  defp connect_opts(%Config{} = config) do
+    [uri: worker_uri(config), reconnect_after_msec: [1_000, 2_000, 5_000, 10_000]]
+  end
+
+  # Build the worker websocket URI from the control-plane base URL. The worker's
+  # id, address, labels, and capacity ride along as query params on connect.
+  defp worker_uri(%Config{worker: %{control_plane_url: base} = worker}) when is_binary(base) do
+    params = %{
+      "worker_id" => worker.worker_id,
+      "address" => worker.worker_room_host,
+      "labels" => Enum.join(worker.worker_labels, ","),
+      "capacity" => "0"
+    }
+
+    # http(s) becomes ws(s); trailing slashes are dropped before the path is appended.
+    ws_root =
+      base
+      |> String.replace_prefix("https://", "wss://")
+      |> String.replace_prefix("http://", "ws://")
+      |> String.trim_trailing("/")
+
+    "#{ws_root}/worker/websocket?#{URI.encode_query(params)}"
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/runtime/worker_dispatch.ex b/packages/symphony/elixir/lib/symphony_elixir/runtime/worker_dispatch.ex
new file mode 100644
index 000000000..28f1a2616
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/runtime/worker_dispatch.ex
@@ -0,0 +1,75 @@
+defmodule SymphonyElixir.Runtime.WorkerDispatch do
+  @moduledoc """
+  Dispatches per-run provision/teardown from the control plane to a runtime
+  worker, over the worker's channel process.
+
+  `Runtime.Placement` resolves a worker from `RuntimeRegistry` and asks this
+  module to provision or tear down a run on it. The request is delivered to the
+  worker's channel process (`worker.pid`) as a message; that process pushes it
+  down the worker's WebSocket, awaits the worker's reply, and answers back here.
+  This module only talks to a pid, so it carries no dependency on the channel
+  implementation and stays unit-testable: `Placement` calls it through its
+  driver seam, and tests inject a fake.
+
+  The wire is request/reply correlated by a unique `ref`. A worker that never
+  answers within `timeout` yields `{:error, :worker_dispatch_timeout}` rather
+  than blocking the run forever.
+  """
+
+  @type worker :: SymphonyElixir.Runtime.RuntimeRegistry.worker()
+
+  @typedoc """
+  What the worker needs to provision a run's room-server: the runtime env to
+  inject (resolved from the control plane's secrets), the bot token for the
+  clone, the bot commit identity (`user.name`/`user.email`) that token
+  authors as, and the run's repository catalog (resolved from the control
+  plane's workflow pack, so the worker clones the run's real repos rather than
+  its own default pack). The worker binds the room-server to its own
+  configured reachable address, so the bind host is not dictated here.
+
+  `bot_username`/`bot_email` travel here because a worker holds no bot config
+  of its own: without them the worker clone keeps its host's personal git
+  identity, and the babysit skill's identity guard refuses to push.
+  """
+  @type spec :: %{
+          required(:env) => [{String.t(), String.t()}],
+          optional(:bot_token) => String.t() | nil,
+          optional(:bot_username) => String.t() | nil,
+          optional(:bot_email) => String.t() | nil,
+          optional(:repositories) => [SymphonyElixir.RepositoryCatalog.t()]
+        }
+
+  @typedoc "The worker's provision result: where to reach the room-server and run."
+  @type provisioned :: %{base_url: String.t(), primary_workspace: String.t()}
+
+  @callback provision(worker(), run_id :: String.t(), spec(), timeout()) ::
+              {:ok, provisioned()} | {:error, term()}
+  @callback teardown(worker(), run_id :: String.t(), timeout()) :: :ok | {:error, term()}
+
+  @doc "Ask `worker` to provision `run_id`'s room-server. See the module doc."
+  @spec provision(worker(), String.t(), spec(), timeout()) :: {:ok, provisioned()} | {:error, term()}
+  def provision(%{pid: pid}, run_id, spec, timeout) when is_pid(pid) and is_binary(run_id) do
+    request(pid, :provision, %{run_id: run_id, spec: spec}, timeout)
+  end
+
+  @doc "Ask `worker` to tear down `run_id`'s room-server; an `:ok` or `{:ok, _}` reply yields `:ok`."
+  @spec teardown(worker(), String.t(), timeout()) :: :ok | {:error, term()}
+  def teardown(%{pid: pid}, run_id, timeout) when is_pid(pid) and is_binary(run_id) do
+    case request(pid, :teardown, %{run_id: run_id}, timeout) do
+      {:ok, _} -> :ok
+      :ok -> :ok
+      {:error, reason} -> {:error, reason}
+    end
+  end
+
+  defp request(pid, op, payload, timeout) do
+    ref = make_ref()
+    send(pid, {:runtime_dispatch, op, ref, self(), payload})
+    # Selective receive pinned on `ref`: only the reply to this request is consumed.
+    receive do
+      {:runtime_dispatch_reply, ^ref, result} -> result
+    after
+      timeout -> {:error, :worker_dispatch_timeout}
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/skill.ex b/packages/symphony/elixir/lib/symphony_elixir/skill.ex
new file mode 100644
index 000000000..93a7d61bd
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/skill.ex
@@ -0,0 +1,282 @@
+defmodule SymphonyElixir.Skill do
+  @moduledoc """
+  A skill is a markdown file under `skills/` whose YAML frontmatter declares
+  the codex runtime envelope (model, reasoning effort, sandbox, approval
+  policy, tools) and whose body is the system prompt for that node type.
+
+  Example `skills/implement.md`:
+
+      ---
+      codex_model: gpt-5-codex
+      reasoning_effort: medium
+      sandbox: workspace-write
+      approval_policy: never
+      tools: [linear_graphql]
+      ---
+
+      Take the Linear ticket in $INPUT. Land the change. Open a PR per
+      the PR-submission partial. On block, drop the symphony label and
+      exit.
+
+  The body is the lever for improving the agent without code changes.
+
+  ## Partials
+
+  A skill body can include a shared partial by writing
+  `{{partial:<name>}}` on its own line (or anywhere; the token is
+  replaced inline). The loader resolves the name to
+  `skills/_partials/<name>.md` and substitutes the partial's bytes. Use
+  partials for cross-skill contracts like the Linear-issue markdown
+  template.
+
+  Partials live alongside the skill files under `_partials/`. They are
+  not skills themselves: the catalog ignores files in `_partials/`
+  because it globs `*.md` non-recursively against the skills directory.
+
+  Partial files are NOT hot-reloaded on their own. To pick up a partial
+  edit, also touch the skill files that reference it.
+
+  ### Expansion algorithm
+
+  `expand_partials` runs to a fixpoint with a seen-set:
+
+  - The first `{{partial:NAME}}` token for a given NAME loads
+    `_partials/NAME.md`, substitutes its bytes, and marks NAME as seen.
+  - Any later `{{partial:NAME}}` whose NAME is already in the seen-set is
+    dropped (replaced with empty string). This covers the self-reference
+    case: a partial that documents its own token name on a prose line will
+    have that token removed rather than cause a missing-partial error or
+    an infinite loop. It also deduplicates repeated includes of the same
+    partial in one skill body.
+  - Tokens inside an inlined partial body are themselves expanded in the
+    next iteration, so nested partials work: partial A may include partial
+    B, which expands on the subsequent pass.
+  - Iteration stops when no `{{partial:...}}` tokens remain.
+  - A genuinely-missing partial (NAME not yet seen AND
+    `_partials/NAME.md` absent on disk) is a load error
+    (`{:error, {:missing_partial, name, reason}}`); the catalog refuses
+    to publish a skill with an unresolvable include.
+
+  The seen-set is what prevented the prod outage: partial files that
+  contained a literal self-reference token in their prose header would
+  leave residual tokens in the catalog body, which `Prompt.build` then
+  re-scanned and hard-errored on. The fixpoint + seen-set makes the
+  catalog body genuinely token-free regardless of partial prose content.
+
+  ## Reasoning effort
+
+  Optional. Accepts `none`, `minimal`, `low`, `medium`, `high`, or
+  `xhigh`, mirroring the codex app-server `ReasoningEffort` enum. When
+  set, the runtime passes it as the `effort` parameter on `turn/start`
+  so the codex session uses that reasoning budget. When absent, codex
+  falls back to its built-in default for the model.
+  """
+
+  @enforce_keys [
+    :name,
+    :path,
+    :codex_model,
+    :reasoning_effort,
+    :sandbox,
+    :approval_policy,
+    :tools,
+    :body,
+    :body_hash
+  ]
+  defstruct [
+    :name,
+    :path,
+    :codex_model,
+    :reasoning_effort,
+    :sandbox,
+    :approval_policy,
+    :tools,
+    :body,
+    :body_hash
+  ]
+
+  @type reasoning_effort :: nil | String.t()
+  @type t :: %__MODULE__{
+          name: String.t(),
+          path: Path.t(),
+          codex_model: String.t(),
+          reasoning_effort: reasoning_effort(),
+          sandbox: String.t(),
+          approval_policy: String.t(),
+          tools: [String.t()],
+          body: String.t(),
+          body_hash: binary()
+        }
+
+  @reasoning_efforts ~w(none minimal low medium high xhigh)
+
+  @spec load(Path.t()) :: {:ok, t()} | {:error, term()}
+  def load(path) when is_binary(path) do
+    with {:ok, raw} <- File.read(path),
+         {:ok, frontmatter_raw, body} <- split_frontmatter(raw),
+         {:ok, frontmatter} <- decode_yaml(frontmatter_raw),
+         {:ok, body} <- expand_partials(body, partials_dir(path)),
+         {:ok, parsed} <- from_parts(frontmatter, body, path) do
+      {:ok, %{parsed | body_hash: :crypto.hash(:sha256, raw)}}
+    end
+  end
+
+  @spec from_parts(map(), String.t(), Path.t()) :: {:ok, t()} | {:error, term()}
+  defp from_parts(frontmatter, body, path)
+       when is_map(frontmatter) and is_binary(body) and is_binary(path) do
+    with {:ok, codex_model} <- fetch_string(frontmatter, "codex_model"),
+         {:ok, reasoning_effort} <- fetch_reasoning_effort(frontmatter),
+         {:ok, sandbox} <- fetch_string(frontmatter, "sandbox"),
+         {:ok, approval_policy} <- fetch_string(frontmatter, "approval_policy"),
+         {:ok, tools} <- fetch_string_list(frontmatter, "tools") do
+      name =
+        path
+        |> Path.basename(".md")
+
+      {:ok,
+       %__MODULE__{
+         name: name,
+         path: path,
+         codex_model: codex_model,
+         reasoning_effort: reasoning_effort,
+         sandbox: sandbox,
+         approval_policy: approval_policy,
+         tools: tools,
+         body: body,
+         body_hash: <<>>
+       }}
+    end
+  end
+
+  defp split_frontmatter(raw) do
+    case String.split(raw, ~r/^---\s*\n/m, parts: 3) do
+      ["", frontmatter, body] -> {:ok, frontmatter, String.trim_leading(body)}
+      _ -> {:error, :missing_frontmatter}
+    end
+  end
+
+  defp decode_yaml(raw) do
+    case YamlElixir.read_from_string(raw) do
+      {:ok, decoded} when is_map(decoded) -> {:ok, decoded}
+      {:ok, _other} -> {:error, :invalid_frontmatter}
+      {:error, reason} -> {:error, {:yaml_decode_failed, reason}}
+    end
+  end
+
+  # Reads a required string field from the frontmatter map. The value is
+  # trimmed before use. A key that is absent, holds a non-string, or is blank
+  # after trimming is reported as `{:missing_field, key}`, so callers see one
+  # error shape for every "no usable value" case.
+  defp fetch_string(map, key) do
+    with value when is_binary(value) <- Map.get(map, key),
+         trimmed when trimmed != "" <- String.trim(value) do
+      {:ok, trimmed}
+    else
+      _ -> {:error, {:missing_field, key}}
+    end
+  end
+
+  # Reads an optional list-of-strings field; a missing key means an empty
+  # list. A list with any non-string member fails with the offending list
+  # attached (`{:invalid_field, key, list}`), while a value that is not a
+  # list at all fails with the key alone (`{:invalid_field, key}`).
+  defp fetch_string_list(map, key) do
+    value = Map.get(map, key, [])
+
+    cond do
+      not is_list(value) -> {:error, {:invalid_field, key}}
+      Enum.all?(value, &is_binary/1) -> {:ok, value}
+      true -> {:error, {:invalid_field, key, value}}
+    end
+  end
+
+  # Optional field. An absent or blank value yields nil. A value that, once
+  # trimmed and lower-cased, is one of the recognised efforts yields that
+  # normalised form. Anything else (an unknown string or a non-string) is an
+  # `{:invalid_reasoning_effort, value}` error carrying the value exactly as
+  # it was written in the frontmatter.
+  defp fetch_reasoning_effort(map), do: normalize_reasoning_effort(Map.get(map, "reasoning_effort"))
+
+  defp normalize_reasoning_effort(nil), do: {:ok, nil}
+
+  defp normalize_reasoning_effort(raw) when is_binary(raw) do
+    case raw |> String.trim() |> String.downcase() do
+      "" -> {:ok, nil}
+      effort when effort in @reasoning_efforts -> {:ok, effort}
+      _unknown -> {:error, {:invalid_reasoning_effort, raw}}
+    end
+  end
+
+  defp normalize_reasoning_effort(other), do: {:error, {:invalid_reasoning_effort, other}}
+
+  defp partials_dir(skill_path) do
+    skill_path
+    |> Path.dirname()
+    |> Path.join("_partials")
+  end
+
+  # Expand every `{{partial:<name>}}` occurrence with the bytes of
+  # `<partials_dir>/<name>.md`, running to a fixpoint with a seen-set so
+  # each named partial is inlined at most once.
+  #
+  # Names are limited to `[A-Za-z0-9_-]+` so the resolver cannot escape
+  # the partials directory.
+  #
+  # Resolving the leftmost token one at a time is what makes "at most
+  # once" exact. The first occurrence of a name is replaced with its
+  # partial bytes and the name is marked seen; every later occurrence of
+  # that name is dropped. A later occurrence is either a repeat include in
+  # the skill body or the self-reference token a partial carries in its
+  # own prose. Dropping that self-reference is what prevented the prod
+  # outage: under the old single-pass loader the token survived in the
+  # catalog body and `Prompt.build` then re-scanned and hard-errored on
+  # it. Tokens carried in from an inlined body are resolved on a later
+  # pass, so nested partials expand.
+  #
+  # Each step either marks one new name seen (finite) or removes one
+  # token, so the loop terminates. A genuinely-missing partial (NAME not
+  # yet seen and the file absent) is a load error so the catalog refuses
+  # to publish a half-rendered skill body.
+  @partial_token ~r/\{\{partial:([A-Za-z0-9_-]+)\}\}/
+
+  defp expand_partials(body, partials_dir) when is_binary(body) and is_binary(partials_dir) do
+    expand_partials_loop(body, partials_dir, [])
+  end
+
+  # `seen` lists the partial names already inlined. A plain list keeps the
+  # recursive boundary free of MapSet's opaque type, which dialyzer rejects
+  # here as a `call_without_opaque` mismatch even with a `MapSet.t()` spec;
+  # a skill includes only a handful of partials, so the linear-time
+  # membership check costs nothing that matters.
+  @spec expand_partials_loop(String.t(), String.t(), [String.t()]) ::
+          {:ok, String.t()} | {:error, term()}
+  defp expand_partials_loop(body, partials_dir, seen) do
+    case Regex.run(@partial_token, body) do
+      nil ->
+        {:ok, body}
+
+      [token, name] ->
+        if name in seen do
+          expand_partials_loop(replace_first(body, token, ""), partials_dir, seen)
+        else
+          partial_path = Path.join(partials_dir, name <> ".md")
+
+          case File.read(partial_path) do
+            {:ok, contents} ->
+              inlined = replace_first(body, token, String.trim_trailing(contents))
+              expand_partials_loop(inlined, partials_dir, [name | seen])
+
+            {:error, reason} ->
+              {:error, {:missing_partial, name, reason}}
+          end
+        end
+    end
+  end
+
+  # Replace only the matched (leftmost) token. `Regex.run` returns the
+  # leftmost match, so a literal first-occurrence replace rewrites exactly
+  # that token and leaves any later occurrence for a subsequent pass.
+  defp replace_first(body, token, replacement) do
+    String.replace(body, token, replacement, global: false)
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/slack/client.ex b/packages/symphony/elixir/lib/symphony_elixir/slack/client.ex
new file mode 100644
index 000000000..0650da42f
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/slack/client.ex
@@ -0,0 +1,163 @@
+defmodule SymphonyElixir.Slack.Client do
+  @moduledoc """
+  Thin Slack Web API client used by the huddle-completion trigger.
+
+  Two responsibilities:
+
+  - Resolve a channel name to an id via `conversations.list`.
+  - Page `conversations.history` for that channel id over a recent window.
+
+  Auth comes from `Config.get().slack_bot_token`. When the bot token is
+  absent the client returns `{:error, :missing_slack_token}` and the
+  trigger stays idle.
+
+  Skills that need a Slack user token (e.g. `focus_route` for fetching
+  `huddle_transcript` files via `files.sharedPublicURL`) read
+  `SLACK_USER_OAUTH_TOKEN` directly from the inherited subprocess env;
+  Symphony does not proxy it through Config.
+
+  This module knows nothing about huddles or DAG triggering. Filtering
+  for completed huddles lives in `SymphonyElixir.Triggers.Slack`.
+  """
+
+  require Logger
+  alias SymphonyElixir.Config
+
+  @page_size 100
+
+  @spec resolve_channel_id(String.t()) :: {:ok, String.t()} | {:error, term()}
+  def resolve_channel_id(channel_name) when is_binary(channel_name) do
+    trimmed = String.trim_leading(channel_name, "#")
+
+    with {:ok, token} <- bot_token() do
+      walk_channel_list(token, trimmed, nil)
+    end
+  end
+
+  @doc "Fetch one page of `conversations.history`; `opts` may set `:oldest`, `:latest`, `:limit`."
+  @spec conversations_history(String.t(), keyword()) :: {:ok, [map()]} | {:error, term()}
+  def conversations_history(channel_id, opts \\ []) when is_binary(channel_id) do
+    with {:ok, token} <- bot_token() do
+      # Stringify the caller's options, then merge them over the defaults so an explicit
+      # `:limit` wins. Mixing atom and string keys let the default overwrite it.
+      overrides = opts |> Keyword.take([:oldest, :latest, :limit]) |> Map.new(fn {k, v} -> {to_string(k), v} end)
+      params = Map.merge(%{"channel" => channel_id, "limit" => @page_size}, overrides)
+
+      case slack_get(token, "conversations.history", params) do
+        {:ok, %{"messages" => messages}} -> {:ok, messages}
+        {:error, _} = err -> err
+      end
+    end
+  end
+
+  @doc "Fetch one page of a thread's `conversations.replies`; `opts` may set `:limit`."
+  @spec conversations_replies(String.t(), String.t(), keyword()) :: {:ok, [map()]} | {:error, term()}
+  def conversations_replies(channel_id, thread_ts, opts \\ []) when is_binary(channel_id) and is_binary(thread_ts) do
+    with {:ok, token} <- bot_token() do
+      # Stringify the caller's options, then merge them over the defaults so an explicit
+      # `:limit` wins. Mixing atom and string keys let the default overwrite it.
+      overrides = opts |> Keyword.take([:limit]) |> Map.new(fn {k, v} -> {to_string(k), v} end)
+      params = Map.merge(%{"channel" => channel_id, "ts" => thread_ts, "limit" => @page_size}, overrides)
+
+      case slack_get(token, "conversations.replies", params) do
+        {:ok, %{"messages" => messages}} -> {:ok, messages}
+        {:error, _} = err -> err
+      end
+    end
+  end
+
+  @spec post_message(String.t(), map()) :: {:ok, map()} | {:error, term()}
+  def post_message(channel_id, payload) when is_binary(channel_id) and is_map(payload) do
+    with {:ok, token} <- bot_token() do
+      payload = Map.put(payload, "channel", channel_id)
+      slack_post(token, "chat.postMessage", payload)
+    end
+  end
+
+  defp walk_channel_list(token, name, cursor) do
+    params =
+      %{
+        "limit" => 1000,
+        "exclude_archived" => "true",
+        "types" => "public_channel,private_channel"
+      }
+      |> maybe_put_cursor(cursor)
+    # Fetch one page of channels; a nil or empty cursor requests the first page.
+    case slack_get(token, "conversations.list", params) do
+      {:ok, %{"channels" => channels} = body} ->
+        case Enum.find(channels, fn ch -> ch["name"] == name end) do
+          %{"id" => id} ->
+            {:ok, id}
+          # Not on this page: follow next_cursor, or give up when there is none.
+          nil ->
+            case get_in(body, ["response_metadata", "next_cursor"]) do
+              c when is_binary(c) and c != "" -> walk_channel_list(token, name, c)
+              _ -> {:error, {:channel_not_found, name}}
+            end
+        end
+      # Errors from slack_get are returned to the caller unchanged.
+      {:error, _} = err ->
+        err
+    end
+  end
+
+  defp maybe_put_cursor(params, nil), do: params
+  defp maybe_put_cursor(params, ""), do: params
+  defp maybe_put_cursor(params, cursor), do: Map.put(params, "cursor", cursor)
+
+  defp slack_get(token, method, params) do
+    config = Config.get()
+    url = config.slack_endpoint <> "/" <> method
+
+    case Req.get(url,
+           headers: [{"Authorization", "Bearer " <> token}],
+           params: params,
+           connect_options: [timeout: 30_000]
+         ) do
+      {:ok, %{status: 200, body: %{"ok" => true} = body}} ->
+        {:ok, body}
+
+      {:ok, %{status: 200, body: %{"ok" => false, "error" => slack_err}}} ->
+        {:error, {:slack_api_error, method, slack_err}}
+
+      {:ok, %{status: status, body: body}} ->
+        {:error, {:slack_http_status, status, body}}
+
+      {:error, reason} ->
+        {:error, {:slack_request_failed, reason}}
+    end
+  end
+
+  defp slack_post(token, method, payload) do
+    config = Config.get()
+    url = config.slack_endpoint <> "/" <> method
+
+    case Req.post(url,
+           headers: [
+             {"Authorization", "Bearer " <> token},
+             {"Content-Type", "application/json; charset=utf-8"}
+           ],
+           json: payload,
+           connect_options: [timeout: 30_000]
+         ) do
+      {:ok, %{status: 200, body: %{"ok" => true} = body}} ->
+        {:ok, body}
+
+      {:ok, %{status: 200, body: %{"ok" => false, "error" => slack_err}}} ->
+        {:error, {:slack_api_error, method, slack_err}}
+
+      {:ok, %{status: status, body: body}} ->
+        {:error, {:slack_http_status, status, body}}
+
+      {:error, reason} ->
+        {:error, {:slack_request_failed, reason}}
+    end
+  end
+
+  # The bot token from Config, or `:missing_slack_token` when it is nil.
+  defp bot_token do
+    token = Config.get().slack_bot_token
+
+    if is_nil(token), do: {:error, :missing_slack_token}, else: {:ok, token}
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/statistics.ex b/packages/symphony/elixir/lib/symphony_elixir/statistics.ex
new file mode 100644
index 000000000..91ab9acdf
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/statistics.ex
@@ -0,0 +1,203 @@
+defmodule SymphonyElixir.Statistics do
+  @moduledoc "Builds deterministic assignment statistics from GitHub and Linear."
+
+  alias SymphonyElixir.{Config, Linear}
+
+  @github_graphql_endpoint "https://api.github.com/graphql"
+  @github_page_size 100
+
+  @github_query """
+  query SymphonyStatisticsPullRequests($query: String!, $first: Int!, $after: String) {
+    search(type: ISSUE, query: $query, first: $first, after: $after) {
+      issueCount
+      pageInfo { hasNextPage endCursor }
+      nodes {
+        ... on PullRequest {
+          title
+          body
+          reviewRequests(first: 20) {
+            nodes {
+              requestedReviewer {
+                ... on User { login avatarUrl }
+              }
+            }
+          }
+        }
+      }
+    }
+  }
+  """
+
+  @type person_count :: %{
+          id: String.t(),
+          label: String.t(),
+          avatar_url: String.t() | nil,
+          count: non_neg_integer()
+        }
+
+  @type snapshot :: %{
+          github: %{items: [person_count()], total: non_neg_integer(), error: term() | nil},
+          linear: %{items: [person_count()], total: non_neg_integer(), error: term() | nil}
+        }
+
+  @spec snapshot() :: snapshot()
+  def snapshot do
+    case github_playbook_prs() do
+      {:ok, prs} ->
+        identifiers = prs |> Enum.flat_map(&extract_linear_identifiers/1) |> Enum.uniq()
+
+        %{
+          github: %{items: count_people(Enum.flat_map(prs, & &1.reviewers)), total: length(prs), error: nil},
+          linear: linear_snapshot(identifiers)
+        }
+
+      {:error, reason} ->
+        %{
+          github: %{items: [], total: 0, error: reason},
+          linear: %{items: [], total: 0, error: :github_prs_unavailable}
+        }
+    end
+  end
+
+  @spec linear_snapshot([String.t()]) :: %{items: [person_count()], total: non_neg_integer(), error: term() | nil}
+  def linear_snapshot(identifiers) when is_list(identifiers) do
+    case linear_assignees(identifiers) do
+      {:ok, people} -> %{items: count_people(people), total: length(identifiers), error: nil}
+      {:error, reason} -> %{items: [], total: length(identifiers), error: reason}
+    end
+  end
+
+  @doc "Tally people by id, skipping nils; sorted by count descending, then case-insensitive label."
+  @spec count_people([map()]) :: [person_count()]
+  def count_people(people) when is_list(people) do
+    # Group the records by id. The first record seen for an id supplies the
+    # label and avatar of the tally entry, and the size of its group becomes
+    # the `:count`.
+    tallies =
+      people
+      |> Enum.reject(&is_nil/1)
+      |> Enum.group_by(&person_id/1)
+      |> Enum.map(fn {_id, [first | _] = same_person} -> Map.put(first, :count, length(same_person)) end)
+
+    Enum.sort_by(tallies, fn %{count: count, label: label} -> {-count, String.downcase(label)} end)
+  end
+
+  defp github_playbook_prs, do: github_playbook_prs(nil, [])
+
+  defp github_playbook_prs(after_cursor, acc) do
+    config = Config.get()
+    # Fetch one search page; `acc` holds the PRs from earlier pages, in page order.
+    with token when is_binary(token) <- config.github_token,
+         query when is_binary(query) <- config.github_stats_query,
+         {:ok, body} <- github_graphql(token, @github_query, %{query: query, first: @github_page_size, after: after_cursor}) do
+      case body do
+        %{"data" => %{"search" => %{"nodes" => nodes, "pageInfo" => page_info}}} ->
+          prs = Enum.map(nodes, &github_pr/1)
+          next_acc = acc ++ prs
+          # Keep paging only while GitHub reports another page and gives a cursor.
+          case page_info do
+            %{"hasNextPage" => true, "endCursor" => cursor} when is_binary(cursor) ->
+              github_playbook_prs(cursor, next_acc)
+
+            _ ->
+              {:ok, next_acc}
+          end
+
+        %{"errors" => errors} ->
+          {:error, {:github_graphql_errors, errors}}
+
+        other ->
+          {:error, {:github_unknown_payload, other}}
+      end
+    else
+      nil ->
+        # A nil here is whichever setting was unset. Classify it against the same
+        # `config` snapshot the `with` read instead of fetching Config a second time.
+        reason = if is_nil(config.github_token), do: :missing_github_token, else: :missing_github_stats_query
+        {:error, reason}
+
+      {:error, reason} ->
+        {:error, reason}
+    end
+  end
+
+  defp github_graphql(token, query, variables) do
+    Req.post(@github_graphql_endpoint,
+      headers: [
+        {"authorization", "Bearer " <> token},
+        {"accept", "application/vnd.github+json"},
+        {"user-agent", "symphony-statistics/0.1.0"}
+      ],
+      json: %{query: query, variables: variables},
+      connect_options: [timeout: 30_000]
+    )
+    |> case do
+      {:ok, %{status: 200, body: body}} -> {:ok, body}
+      {:ok, %{status: status, body: body}} -> {:error, {:github_status, status, body}}
+      {:error, reason} -> {:error, {:github_request_failed, reason}}
+    end
+  end
+
+  defp github_pr(%{"title" => title, "body" => body, "reviewRequests" => %{"nodes" => nodes}}) do
+    %{title: title || "", body: body || "", reviewers: Enum.map(nodes, &github_review_request/1)}
+  end
+
+  defp github_pr(_), do: %{title: "", body: "", reviewers: []}
+
+  defp github_review_request(%{"requestedReviewer" => %{"login" => login} = user}) when is_binary(login) do
+    %{id: "github:" <> login, label: login, avatar_url: user["avatarUrl"]}
+  end
+
+  defp github_review_request(_), do: nil
+
+  # Every `ENG-<digits>` reference in the PR title or body, in order of appearance.
+  defp extract_linear_identifiers(%{title: title, body: body}) do
+    haystack = title <> "\n" <> body
+    for [identifier] <- Regex.scan(~r/\bENG-\d+\b/, haystack), do: identifier
+  end
+
+  defp linear_assignees([]), do: {:ok, []}
+
+  defp linear_assignees(identifiers) do
+    identifiers
+    |> Enum.chunk_every(25)
+    |> Enum.reduce_while({:ok, []}, fn chunk, {:ok, acc} ->
+      case fetch_linear_issue_chunk(chunk) do
+        {:ok, people} -> {:cont, {:ok, acc ++ people}}
+        {:error, reason} -> {:halt, {:error, reason}}
+      end
+    end)
+  end
+
+  defp fetch_linear_issue_chunk(identifiers) do
+    query = linear_issue_query(identifiers)
+
+    with {:ok, %{"data" => data}} <- Linear.Client.graphql(query, %{}) do
+      {:ok, data |> Map.values() |> Enum.map(&linear_person/1) |> Enum.reject(&is_nil/1)}
+    else
+      {:ok, %{"errors" => errors}} -> {:error, {:linear_graphql_errors, errors}}
+      {:ok, other} -> {:error, {:linear_unknown_payload, other}}
+      {:error, reason} -> {:error, reason}
+    end
+  end
+
+  # One aliased `issue(...)` selection per identifier (i0, i1, ...) in a single query document.
+  defp linear_issue_query(identifiers) do
+    selections =
+      for {identifier, index} <- Enum.with_index(identifiers) do
+        "i#{index}: issue(id: #{inspect(identifier)}) { assignee { id name displayName avatarUrl } }"
+      end
+
+    # Each identifier is embedded through inspect/1, i.e. as a quoted string literal.
+    "{\n" <> Enum.join(selections, "\n") <> "\n}"
+  end
+
+  defp linear_person(%{"assignee" => %{"id" => id} = assignee}) when is_binary(id) do
+    label = assignee["displayName"] || assignee["name"] || id
+    %{id: "linear:" <> id, label: label, avatar_url: assignee["avatarUrl"]}
+  end
+
+  defp linear_person(_), do: nil
+
+  defp person_id(%{id: id}) when is_binary(id), do: id
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/triggers/cron.ex b/packages/symphony/elixir/lib/symphony_elixir/triggers/cron.ex
new file mode 100644
index 000000000..f7cb5413a
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/triggers/cron.ex
@@ -0,0 +1,168 @@
+defmodule SymphonyElixir.Triggers.Cron do
+  @moduledoc """
+  Time-based trigger. Ticks every `Config.cron_poll_ms` (default 60s),
+  walks every `.sym` workflow with `trigger.kind = :cron`, and starts one
+  IR run per workflow when a scheduled fire moment has passed since the
+  last recorded fire.
+
+  ## Fire semantics
+
+  Per workflow we persist `last_fired_at` via `SymphonyElixir.CronState`,
+  keyed by workflow name. On each tick:
+
+  - if the workflow has no `last_fired_at` yet, we SEED it to the current
+    moment without firing. This is the boot-time "do not catch up just
+    because we deployed" behaviour. A brand new cron workflow fires for the
+    first time at its next scheduled match after deployment.
+  - if `last_fired_at` is set, we compute `next_fire_after(last_fired_at)`
+    via `CronExpression`. If that moment is <= now, we start one run,
+    set `last_fired_at = now`, and skip any intermediate missed windows.
+    This is the `systemd Persistent=true` semantic: at most one catch-up
+    fire per workflow per restart, not N firings for N missed monthly slots.
+
+  ## Trigger context
+
+  The started run's trigger map carries:
+
+      %{
+        kind: :cron,
+        schedule: "@monthly",            # the workflow's declared schedule
+        timezone: "UTC",                 # currently always UTC; reserved
+        scheduled_for: "2026-06-01T00:00:00Z",  # ISO 8601 string, the cron-matching moment we caught up to
+        fired_at: "2026-06-01T00:00:14Z",       # ISO 8601 string, actual wall clock when we started
+        input: %{...}                    # whatever the workflow's `input` block says
+      }
+
+  Datetimes are serialized as ISO 8601 strings because the trigger
+  round-trips through JSON via `IR.Store`, and `Jason` has no built-in
+  encoder for `DateTime`. Callers that need the datetime back parse it
+  with `DateTime.from_iso8601/1`. The `schedule` field is load-bearing for
+  resolution: `start_by_trigger/2` re-selects the workflow whose declared
+  cron schedule equals it, so the tick fires exactly the workflow it
+  evaluated.
+
+  ## Dedupe
+
+  Ingress is unconditional; dedupe is by `last_fired_at`. Two ticks racing
+  for the same calendar minute is not a real risk because
+  `CronState.record_fire/2` is serialized through its GenServer, and the
+  next tick reads the updated value through ETS. If `record_fire` fails
+  we log and skip; the next tick will see the old `last_fired_at` and
+  retry.
+  """
+
+  use GenServer
+  require Logger
+
+  alias SymphonyElixir.{Config, CronExpression, CronState, WorkflowCatalog}
+  alias SymphonyElixir.Runtime.Ingress
+
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []) do
+    GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+  end
+
+  @doc """
+  Manually trigger one poll cycle. Test hook; production fires via the
+  internal :tick message.
+  """
+  @spec poll_now() :: :ok
+  def poll_now do
+    GenServer.call(__MODULE__, :poll_now)
+  end
+
+  @impl true
+  def init(_opts) do
+    # The interval is read once at boot; every later tick re-arms with it.
+    poll_ms = Config.get().cron_poll_ms
+    schedule_tick(poll_ms)
+    {:ok, %{poll_ms: poll_ms}}
+  end
+
+  @impl true
+  def handle_info(:tick, state) do
+    tick_once()
+    schedule_tick(state.poll_ms)
+    {:noreply, state}
+  end
+
+  @impl true
+  def handle_call(:poll_now, _from, state) do
+    tick_once()
+    {:reply, :ok, state}
+  end
+
+  # Arms the next `:tick` message for this process.
+  defp schedule_tick(ms), do: Process.send_after(self(), :tick, ms)
+
+  # One evaluation pass: every cron workflow is checked against the same `now`.
+  defp tick_once do
+    now = DateTime.utc_now()
+
+    WorkflowCatalog.for_trigger_kind(:cron)
+    |> Enum.each(fn entry -> evaluate_workflow(entry, now) end)
+  end
+
+  # Seeds a never-seen workflow without firing; otherwise fires once when the
+  # next match after the recorded watermark is not in the future.
+  defp evaluate_workflow(entry, now) do
+    case CronExpression.parse(entry.trigger.schedule) do
+      {:ok, parsed} ->
+        case CronState.get_last_fired(entry.name) do
+          nil ->
+            # First time we observe this workflow; do NOT fire on boot. Seed
+            # the watermark so the first fire happens at the next match.
+            :ok = CronState.seed_if_unset(entry.name, now)
+
+          %DateTime{} = last_fired ->
+            case CronExpression.next_fire_after(parsed, last_fired) do
+              {:ok, next} ->
+                if DateTime.compare(next, now) != :gt do
+                  fire(entry, next, now)
+                end
+
+              {:error, reason} ->
+                Logger.warning("Cron next_fire_after failed for workflow=#{entry.name} schedule=#{entry.trigger.schedule}: #{inspect(reason)}")
+            end
+        end
+
+      {:error, reason} ->
+        Logger.warning("Cron schedule unparseable for workflow=#{entry.name} schedule=#{inspect(entry.trigger.schedule)}: #{inspect(reason)}")
+    end
+  end
+
+  # Starts the run(s) for one due workflow and advances its watermark.
+  defp fire(entry, %DateTime{} = scheduled_for, %DateTime{} = now) do
+    trigger = %{
+      kind: :cron,
+      schedule: entry.trigger.schedule,
+      timezone: entry.trigger.timezone,
+      scheduled_for: DateTime.to_iso8601(scheduled_for),
+      fired_at: DateTime.to_iso8601(now),
+      input: entry.trigger.input
+    }
+
+    case Ingress.start_by_trigger(trigger) do
+      {:ok, started} ->
+        record_watermark(entry, now)
+
+        Logger.info("Cron started runs=#{Enum.map_join(started, ",", & &1.run_id)} workflow=#{entry.name} scheduled_for=#{DateTime.to_iso8601(scheduled_for)}")
+
+      {:error, reason} ->
+        Logger.warning("Cron failed to start workflow=#{entry.name}: #{inspect(reason)}")
+    end
+  end
+
+  # Persists the new watermark. A failed write is logged instead of asserted:
+  # the moduledoc promises "log and skip", and a raise here would abort the
+  # tick for every workflow still waiting to be evaluated.
+  defp record_watermark(entry, %DateTime{} = now) do
+    case CronState.record_fire(entry.name, now) do
+      :ok ->
+        :ok
+
+      other ->
+        Logger.warning("Cron failed to record fire for workflow=#{entry.name}: #{inspect(other)}")
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/triggers/slack.ex b/packages/symphony/elixir/lib/symphony_elixir/triggers/slack.ex
new file mode 100644
index 000000000..1a2d6d6d0
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/triggers/slack.ex
@@ -0,0 +1,188 @@
+defmodule SymphonyElixir.Triggers.Slack do
+  @moduledoc """
+  Polls Slack for completed huddles in channels referenced by any `.sym`
+  workflow whose `trigger.kind = :slack_huddle_completed`, and starts one
+  IR run per fresh huddle.
+
+  A huddle is "completed" when its `huddle_thread` message has
+  `room.has_ended = true` and the Slack-AI summary has reached
+  `room.recording.summary_status = "complete"`. We dedupe on the
+  message timestamp by checking for an existing IR run (any status) that
+  references the same `message_ts`.
+
+  Polls every `Config.slack_poll_ms`. Stays idle when
+  `SLACK_BOT_OAUTH_TOKEN` is absent. Sibling to the Linear webhook.
+  """
+
+  use GenServer
+  require Logger
+
+  alias SymphonyElixir.{Config, Slack.Client, WorkflowCatalog}
+  alias SymphonyElixir.Runtime.Ingress
+
+  # How far back each poll looks: two days, in seconds.
+  @history_window_seconds 86_400 * 2
+
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []) do
+    GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+  end
+
+  @impl true
+  def init(_opts) do
+    config = Config.get()
+    schedule_poll(config.slack_poll_ms)
+    {:ok, %{poll_ms: config.slack_poll_ms, channel_ids: %{}}}
+  end
+
+  @impl true
+  def handle_info(:poll, state) do
+    state = poll_once(state)
+    schedule_poll(state.poll_ms)
+    {:noreply, state}
+  end
+
+  defp schedule_poll(ms), do: Process.send_after(self(), :poll, ms)
+
+  # Does nothing (state returned untouched) while no bot token is configured.
+  defp poll_once(state) do
+    if is_nil(Config.get().slack_bot_token) do
+      state
+    else
+      WorkflowCatalog.for_trigger_kind(:slack_huddle_completed)
+      |> Enum.reduce(state, &poll_workflow/2)
+    end
+  end
+
+  # Polls one workflow's channel. At most 50 messages inside the history
+  # window are requested per poll.
+  # NOTE(review): there is no pagination here, so a huddle beyond those 50 would be missed; confirm channel volume.
+  defp poll_workflow(entry, state) do
+    channel_name = entry.trigger.channel
+
+    case resolve_channel_id(channel_name, state.channel_ids) do
+      {:ok, channel_id, new_cache} ->
+        case Client.conversations_history(channel_id,
+               oldest: oldest_window(),
+               limit: 50
+             ) do
+          {:ok, messages} ->
+            Enum.each(messages, fn msg ->
+              maybe_enqueue(channel_name, channel_id, msg)
+            end)
+
+            %{state | channel_ids: new_cache}
+
+          {:error, reason} ->
+            Logger.warning("Slack huddle poll for workflow=#{entry.name} channel=#{channel_name} failed: #{inspect(reason)}")
+
+            %{state | channel_ids: new_cache}
+        end
+
+      {:error, reason} ->
+        Logger.warning("Slack channel resolution for workflow=#{entry.name} channel=#{channel_name} failed: #{inspect(reason)}")
+
+        state
+    end
+  end
+
+  # Resolves a channel name to its id, memoizing successful lookups in `cache`.
+  defp resolve_channel_id(channel_name, cache) do
+    case Map.fetch(cache, channel_name) do
+      {:ok, id} ->
+        {:ok, id, cache}
+
+      :error ->
+        case Client.resolve_channel_id(channel_name) do
+          {:ok, id} -> {:ok, id, Map.put(cache, channel_name, id)}
+          {:error, _} = err -> err
+        end
+    end
+  end
+
+  defp oldest_window do
+    System.system_time(:second) - @history_window_seconds
+  end
+
+  # Starts a run for a huddle message once the huddle has ended and its summary
+  # is complete, unless a run already exists for the same `ts`.
+  defp maybe_enqueue(channel_name, channel_id, %{"subtype" => "huddle_thread"} = msg) do
+    # `|| %{}` also covers an explicit JSON null, which Map.get/3's default does not.
+    room = Map.get(msg, "room") || %{}
+    recording = Map.get(room, "recording") || %{}
+
+    cond do
+      Map.get(room, "has_ended") != true ->
+        :ok
+
+      Map.get(recording, "summary_status") != "complete" ->
+        :ok
+
+      true ->
+        message_ts = Map.get(msg, "ts")
+
+        cond do
+          is_nil(message_ts) ->
+            :ok
+
+          already_seen?(message_ts) ->
+            :ok
+
+          true ->
+            trigger = build_trigger(channel_name, channel_id, msg, room, recording)
+            enqueue(trigger)
+        end
+    end
+  end
+
+  defp maybe_enqueue(_channel_name, _channel_id, _msg), do: :ok
+
+  # Flattens the Slack message into the trigger map the run is started with.
+  defp build_trigger(channel_name, channel_id, msg, room, _recording) do
+    files = Map.get(msg, "files") || []
+
+    canvas_file_id =
+      Enum.find_value(files, fn f -> if f["filetype"] == "quip", do: f["id"] end)
+
+    transcript_file_id =
+      Map.get(room, "huddle_transcript_file_id") ||
+        Enum.find_value(files, fn f ->
+          if f["filetype"] == "huddle_transcript", do: f["id"]
+        end)
+
+    %{
+      kind: :slack_huddle_completed,
+      channel: channel_name,
+      channel_id: channel_id,
+      message_ts: Map.get(msg, "ts"),
+      date_start: Map.get(room, "date_start") || 0,
+      date_end: Map.get(room, "date_end") || 0,
+      canvas_file_id: canvas_file_id,
+      transcript_file_id: transcript_file_id,
+      permalink: Map.get(msg, "permalink"),
+      participants: Map.get(room, "participant_history", []) || []
+    }
+  end
+
+  defp enqueue(trigger) do
+    case Ingress.start_by_trigger(trigger) do
+      {:ok, started} ->
+        Logger.info("Started runs=#{Enum.map_join(started, ",", & &1.run_id)} for huddle channel=#{trigger.channel} ts=#{trigger.message_ts}")
+
+      {:error, reason} ->
+        Logger.warning("Failed to start huddle run channel=#{trigger.channel} ts=#{trigger.message_ts}: #{inspect(reason)}")
+    end
+  end
+
+  # Dedupe across every IR run, not per workflow: a completed huddle should
+  # fire each interested workflow once, and a second poll of the same
+  # `message_ts` must start nothing new. A run started for this huddle
+  # carries the `message_ts` on its trigger, so its presence (any status)
+  # is the watermark.
+  defp already_seen?(message_ts) do
+    Ingress.seen_trigger?(fn
+      {_status, %{kind: :slack_huddle_completed, message_ts: ts}} -> ts == message_ts
+      {_status, _trigger} -> false
+    end)
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/workflow_catalog.ex b/packages/symphony/elixir/lib/symphony_elixir/workflow_catalog.ex
new file mode 100644
index 000000000..204e1bc6f
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/workflow_catalog.ex
@@ -0,0 +1,215 @@
+defmodule SymphonyElixir.WorkflowCatalog do
+  @moduledoc """
+  Watches `workflows/*.sym` under the active pack and publishes the latest
+  parsed `DSL.AST` for each, hot-reloaded the same way `Catalog` reloads
+  YAML DAGs and markdown skills.
+
+  This is the DSL-era ingress index. A producer (cron, a webhook, the
+  enqueue UI) resolves an event to a workflow by matching the event against
+  each workflow's declared `trigger`, then hands the workflow to the
+  ingress to materialize and start an IR run. The catalog owns parsing and
+  freshness; it does not start runs.
+
+  Reload semantics match `Catalog`: a new file is parsed and added, changed
+  bytes are re-parsed, a deleted file is removed, and a parse error is
+  logged while the last good version stays in place. A run snapshots its
+  workflow source hash at start, so editing the pack only affects new runs.
+
+  Entries are keyed by file basename and carry the parsed `ast`, the
+  declared `trigger` (lifted from the AST for cheap matching), the raw
+  `source`, and the `hash` the run records as `RunGraph.source_hash`.
+
+  When a file fails to parse, the last-good entry stays published and the
+  located diagnostic (`message`, `line`, `column`, `file`) is recorded
+  separately, keyed by basename. `errors/0` and `error/1` expose those so a
+  workflows view can show an author exactly where a broken `.sym` failed
+  while every other workflow keeps working. A parse error stamps the file's
+  basename so the diagnostic names the source even though the parser only
+  sees bytes; the error is cleared once the file parses again.
+  """
+
+  use GenServer
+  require Logger
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.DSL.Parser
+
+  @table :symphony_workflows
+  @errors :symphony_workflow_errors
+
+  defstruct [:workflows_dir, :poll_ms]
+
+  @typedoc "A published workflow: its parsed AST plus the freshness metadata."
+  @type entry :: %{
+          name: String.t(),
+          ast: map(),
+          trigger: map() | nil,
+          source: String.t(),
+          hash: binary()
+        }
+
+  @typedoc "A recorded parse failure for one file, keyed by basename."
+  @type parse_error :: %{
+          name: String.t(),
+          message: String.t(),
+          line: pos_integer(),
+          column: pos_integer(),
+          file: String.t()
+        }
+
+  @spec start_link(keyword()) :: GenServer.on_start()
+  def start_link(opts \\ []) do
+    GenServer.start_link(__MODULE__, opts, name: __MODULE__)
+  end
+
+  @doc "One workflow by file basename."
+  @spec workflow(String.t()) :: {:ok, entry()} | {:error, :not_found}
+  def workflow(name) when is_binary(name) do
+    case :ets.lookup(@table, name) do
+      [{_key, entry}] -> {:ok, entry}
+      [] -> {:error, :not_found}
+    end
+  end
+
+  @doc "Every published workflow."
+  @spec workflows() :: [entry()]
+  def workflows do
+    @table |> :ets.tab2list() |> Enum.map(fn {_name, entry} -> entry end)
+  end
+
+  @doc "Workflows whose declared trigger has the given `kind`. The producer's first filter."
+  @spec for_trigger_kind(atom()) :: [entry()]
+  def for_trigger_kind(kind) when is_atom(kind) do
+    Enum.filter(workflows(), fn entry -> match?(%{kind: ^kind}, entry.trigger) end)
+  end
+
+  @doc "Every currently broken file's located parse diagnostic."
+  @spec errors() :: [parse_error()]
+  def errors do
+    @errors |> :ets.tab2list() |> Enum.map(fn {_name, err} -> err end)
+  end
+
+  @doc "The last parse error for one file basename, if it is currently broken."
+  @spec error(String.t()) :: {:ok, parse_error()} | {:error, :not_found}
+  def error(name) when is_binary(name) do
+    case :ets.lookup(@errors, name) do
+      [{_key, err}] -> {:ok, err}
+      [] -> {:error, :not_found}
+    end
+  end
+
+  @impl true
+  def init(opts) do
+    :ets.new(@table, [:named_table, :public, read_concurrency: true])
+    :ets.new(@errors, [:named_table, :public, read_concurrency: true])
+
+    state = %__MODULE__{
+      workflows_dir: Keyword.get_lazy(opts, :workflows_dir, fn -> Config.get().workflows_dir end),
+      poll_ms: Keyword.get_lazy(opts, :poll_ms, fn -> Config.get().catalog_poll_ms end)
+    }
+
+    schedule_scan(0)
+    {:ok, state}
+  end
+
+  @impl true
+  def handle_info(:scan, %__MODULE__{} = state) do
+    scan(state.workflows_dir)
+    schedule_scan(state.poll_ms)
+    {:noreply, state}
+  end
+
+  @doc "Scan the workflows directory once, synchronously. Exposed for tests."
+  @spec scan(Path.t()) :: :ok
+  def scan(dir) do
+    files = Path.wildcard(Path.join(dir, "*.sym"))
+
+    seen =
+      Enum.reduce(files, MapSet.new(), fn path, acc ->
+        name = Path.basename(path, ".sym")
+        load_if_changed(name, path)
+        MapSet.put(acc, name)
+      end)
+
+    remove_missing(seen)
+  end
+
+  defp schedule_scan(after_ms), do: Process.send_after(self(), :scan, after_ms)
+
+  # Re-parses a file only when its bytes differ from the published entry. A
+  # file that currently fails to parse never matches the published hash, so it
+  # is re-parsed (and its warning re-logged) on every scan until it is fixed.
+  defp load_if_changed(name, path) do
+    case File.read(path) do
+      {:ok, raw} ->
+        hash = :crypto.hash(:sha256, raw)
+
+        if current_hash(name) == hash do
+          # The bytes match the published last-good entry again (a broken edit
+          # was reverted), so any diagnostic recorded for that edit is stale.
+          :ets.delete(@errors, name)
+        else
+          parse_and_store(name, path, raw, hash)
+        end
+
+      {:error, reason} ->
+        Logger.warning("WorkflowCatalog failed to read #{path}: #{inspect(reason)}")
+    end
+  end
+
+  defp parse_and_store(name, path, raw, hash) do
+    case Parser.parse(raw, file: Path.basename(path)) do
+      {:ok, ast} ->
+        entry = %{name: ast.name || name, ast: ast, trigger: ast.trigger, source: raw, hash: hash}
+        :ets.insert(@table, {name, entry})
+        # A file that parses again clears its prior diagnostic so the
+        # workflows view stops showing a stale error.
+        :ets.delete(@errors, name)
+        Logger.info("WorkflowCatalog loaded workflow=#{name} hash=#{short_hash(hash)}")
+
+      {:error, diag} ->
+        # Keep the last-good entry in @table; record the located diagnostic
+        # so an author can see where this file broke without losing the
+        # workflows that still parse.
+        :ets.insert(@errors, {name, error_entry(name, diag)})
+        Logger.warning("WorkflowCatalog failed to parse workflow=#{name}: #{inspect(diag)}")
+    end
+  end
+
+  defp error_entry(name, diag) do
+    %{
+      name: name,
+      message: diag.message,
+      line: diag.line,
+      column: diag.column,
+      file: Map.get(diag, :file) || "#{name}.sym"
+    }
+  end
+
+  defp current_hash(name) do
+    case :ets.lookup(@table, name) do
+      [{_key, %{hash: hash}}] -> hash
+      _ -> nil
+    end
+  end
+
+  defp remove_missing(seen) do
+    # A deleted file drops both its published entry and any recorded
+    # diagnostic; the union of both tables is the set of names a scan might
+    # need to retire, since a file can be broken (only in @errors) without a
+    # last-good entry in @table.
+    (table_names(@table) ++ table_names(@errors))
+    |> Enum.uniq()
+    |> Enum.each(fn name ->
+      unless MapSet.member?(seen, name) do
+        :ets.delete(@table, name)
+        :ets.delete(@errors, name)
+        Logger.info("WorkflowCatalog removed workflow=#{name} (file deleted)")
+      end
+    end)
+  end
+
+  defp table_names(table), do: table |> :ets.tab2list() |> Enum.map(fn {name, _} -> name end)
+
+  defp short_hash(hash), do: hash |> Base.encode16(case: :lower) |> binary_part(0, 8)
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/workspace.ex b/packages/symphony/elixir/lib/symphony_elixir/workspace.ex
new file mode 100644
index 000000000..48b4672ef
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/workspace.ex
@@ -0,0 +1,94 @@
+defmodule SymphonyElixir.Workspace do
+  @moduledoc """
+  Creates and destroys per-run multi-repo workspaces.
+
+  Layout:
+
+      $SYMPHONY_WORKSPACES_DIR/
+        <run_id>/
+          <primary>/ primary checkout and Codex cwd
+          docs/     sibling checkout
+          index/    sibling checkout
+          ...
+
+  Repository membership comes from `RepositoryCatalog`. Each checkout has
+  local refs and a run-scoped branch, so agents can branch, commit, and open
+  PRs in any repository included in the catalog.
+  """
+
+  alias SymphonyElixir.{Config, PathSafety, Workspace.RepoCloner}
+  require Logger
+
+  @spec create(String.t()) :: {:ok, Path.t()} | {:error, term()}
+  def create(run_id) when is_binary(run_id) do
+    config = Config.get()
+
+    if is_binary(config.primary_repo) and not File.dir?(config.primary_repo) do
+      {:error, {:primary_repo_not_directory, config.primary_repo}}
+    else
+      do_create(config, run_id)
+    end
+  end
+
+  @spec destroy(String.t()) :: :ok
+  def destroy(run_id) when is_binary(run_id) do
+    config = Config.get()
+    path = Path.join(config.workspaces_dir, run_id)
+
+    case canonicalize_under_root(path, config.workspaces_dir) do
+      {:ok, canonical} ->
+        if File.exists?(canonical), do: File.rm_rf!(canonical)
+        :ok
+
+      {:error, reason} ->
+        Logger.warning("Refusing to destroy workspace #{path}: #{inspect(reason)}")
+        :ok
+    end
+  end
+
+  defp do_create(config, run_id) do
+    workspace_path = Path.join(config.workspaces_dir, run_id)
+
+    with :ok <- ensure_workspace_absent(workspace_path),
+         {:ok, canonical} <- canonicalize_under_root(workspace_path, config.workspaces_dir),
+         {:ok, primary_checkout} <- RepoCloner.clone_all(config, canonical, run_id) do
+      {:ok, primary_checkout}
+    end
+  end
+
+  defp ensure_workspace_absent(path) do
+    case File.exists?(path) do
+      false -> :ok
+      true -> {:error, {:workspace_already_exists, path}}
+    end
+  end
+
+  # Resolves `path` and `root` through PathSafety and accepts the path only when
+  # it sits strictly below the root.
+  defp canonicalize_under_root(path, root) do
+    expanded_root = Path.expand(root)
+    root_prefix = expanded_root <> "/"
+
+    with {:ok, canonical_path} <- PathSafety.canonicalize(path),
+         {:ok, canonical_root} <- PathSafety.canonicalize(expanded_root) do
+      canonical_root_prefix = canonical_root <> "/"
+
+      cond do
+        # The root itself is never a run workspace. An empty run id joins to the
+        # root, which would pass the prefix test below and let destroy/1 remove
+        # every workspace at once.
+        canonical_path == canonical_root ->
+          {:error, {:workspace_equals_root, canonical_path}}
+
+        String.starts_with?(canonical_path <> "/", canonical_root_prefix) ->
+          {:ok, canonical_path}
+
+        String.starts_with?(Path.expand(path) <> "/", root_prefix) ->
+          {:error, :symlink_escape}
+
+        true ->
+          {:error, {:outside_workspaces_root, canonical_path, canonical_root}}
+      end
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir/workspace/repo_cloner.ex b/packages/symphony/elixir/lib/symphony_elixir/workspace/repo_cloner.ex
new file mode 100644
index 000000000..24881ee3e
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir/workspace/repo_cloner.ex
@@ -0,0 +1,106 @@
+defmodule SymphonyElixir.Workspace.RepoCloner do
+  @moduledoc """
+  Populates a run workspace with one checkout per catalogued repository.
+
+  Every checkout is an independent clone with its own refs, switched onto a
+  run-scoped `symphony/<run_id>` branch. A repository that has a checkout under
+  the configured local paths is cloned from it with shared objects; any other
+  repository is fetched from GitHub as a depth-1 clone.
+  """
+
+  alias SymphonyElixir.{Config, RepositoryCatalog}
+
+  @spec clone_all(Config.t(), Path.t(), String.t()) :: {:ok, Path.t()} | {:error, term()}
+  def clone_all(%Config{} = config, workspace_path, run_id) when is_binary(workspace_path) do
+    primary = RepositoryCatalog.primary(config)
+
+    with :ok <- File.mkdir_p(workspace_path),
+         :ok <- clone_repos(config, workspace_path, run_id),
+         do: {:ok, Path.join(workspace_path, primary.name)}
+  end
+
+  # Clones repositories in catalog order and stops at the first failure.
+  defp clone_repos(config, workspace_path, run_id) do
+    config
+    |> RepositoryCatalog.all()
+    |> Enum.find_value(:ok, fn repo ->
+      case clone_repo(config, workspace_path, repo, run_id) do
+        :ok -> nil
+        {:error, _reason} = failure -> failure
+      end
+    end)
+  end
+
+  # One repository: refuse an existing target, clone, point `origin` at GitHub,
+  # then create the run branch.
+  defp clone_repo(config, workspace_path, repo, run_id) do
+    checkout = Path.join(workspace_path, repo.name)
+    run_branch = "symphony/#{run_id}"
+
+    with :ok <- ensure_absent(checkout),
+         :ok <- run_git_clone(config, repo, checkout),
+         :ok <- set_origin_url(checkout, repo) do
+      create_run_branch(checkout, run_branch)
+    end
+  end
+
+  defp ensure_absent(path) do
+    if File.exists?(path), do: {:error, {:repo_workspace_already_exists, path}}, else: :ok
+  end
+
+  # A local checkout is cloned with shared objects; without one, a depth-1
+  # clone is taken from the GitHub origin.
+  defp run_git_clone(config, repo, target) do
+    {mode_flags, source} =
+      case local_checkout(config, repo) do
+        {:ok, path} -> {["--local", "--shared"], path}
+        :error -> {["--depth", "1"], origin_url(repo)}
+      end
+
+    args = ["clone"] ++ mode_flags ++ ["--branch", repo.default_branch, source, target]
+
+    with {:failed, status, output} <- git(args) do
+      {:error, {:git_clone_failed, repo.name, status, output}}
+    end
+  end
+
+  # Local source for a repository, if one exists on disk: the configured primary
+  # path for the primary repository, otherwise `<repo_root>/<name>`.
+  defp local_checkout(%Config{primary_repo: primary_repo}, %{primary?: true})
+       when is_binary(primary_repo) do
+    existing_dir(primary_repo)
+  end
+
+  defp local_checkout(%Config{repo_root: root}, repo) when is_binary(root) do
+    existing_dir(Path.join(root, repo.name))
+  end
+
+  defp local_checkout(_config, _repo), do: :error
+
+  defp existing_dir(path) do
+    if File.dir?(path), do: {:ok, path}, else: :error
+  end
+
+  defp set_origin_url(path, repo) do
+    with {:failed, status, output} <- git(["-C", path, "remote", "set-url", "origin", origin_url(repo)]) do
+      {:error, {:git_remote_set_url_failed, repo.name, status, output}}
+    end
+  end
+
+  defp create_run_branch(path, branch) do
+    with {:failed, status, output} <- git(["-C", path, "checkout", "-b", branch]) do
+      {:error, {:git_checkout_b_failed, path, status, output}}
+    end
+  end
+
+  # Runs git with stderr folded into stdout. Exit status 0 is `:ok`; any other
+  # status comes back with the trimmed output for the caller's error tuple.
+  defp git(args) do
+    case System.cmd("git", args, stderr_to_stdout: true) do
+      {_output, 0} -> :ok
+      {output, status} -> {:failed, status, String.trim(output)}
+    end
+  end
+
+  defp origin_url(repo), do: "https://github.com/" <> repo.owner_repo <> ".git"
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/channels/worker_channel.ex b/packages/symphony/elixir/lib/symphony_elixir_web/channels/worker_channel.ex
new file mode 100644
index 000000000..7da1ae064
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/channels/worker_channel.ex
@@ -0,0 +1,112 @@
+defmodule SymphonyElixirWeb.WorkerChannel do
+  @moduledoc """
+  Control-plane side of the runtime-worker channel.
+
+  On join, the worker is recorded in `Runtime.RuntimeRegistry` (this channel
+  process is the monitored handle, so a disconnect drops the worker). The
+  channel then bridges `Runtime.WorkerDispatch`'s in-process request/reply to
+  the wire: a `{:runtime_dispatch, op, ref, from, payload}` message is pushed to
+  the worker tagged with a `wire_id`, and the worker's `*_result` reply is
+  correlated back by that `wire_id` and delivered to the original caller.
+  """
+
+  use Phoenix.Channel
+
+  alias SymphonyElixir.Runtime.RuntimeRegistry
+
+  require Logger
+
+  @impl true
+  def join("worker:lobby", _payload, socket) do
+    assigns = socket.assigns
+
+    if is_binary(assigns.address) and assigns.address != "" do
+      :ok =
+        RuntimeRegistry.register(%{
+          worker_id: assigns.worker_id,
+          pid: self(),
+          address: assigns.address,
+          labels: assigns.labels,
+          capacity: assigns.capacity
+        })
+
+      Logger.info("WorkerChannel: worker=#{assigns.worker_id} joined address=#{assigns.address}")
+      {:ok, assign(socket, :pending, %{})}
+    else
+      {:error, %{reason: "address required"}}
+    end
+  end
+
+  # A dispatch from the control plane (WorkerDispatch sent this to our pid).
+  # Push it to the worker tagged with a wire id and remember who to answer.
+  @impl true
+  def handle_info({:runtime_dispatch, op, ref, from, payload}, socket) do
+    wire_id = System.unique_integer([:positive])
+    push(socket, Atom.to_string(op), wire_payload(op, wire_id, payload))
+    {:noreply, assign(socket, :pending, Map.put(socket.assigns.pending, wire_id, {ref, from}))}
+  end
+
+  @impl true
+  def handle_in("provision_result", payload, socket), do: settle(socket, payload)
+  def handle_in("teardown_result", payload, socket), do: settle(socket, payload)
+
+  @impl true
+  def terminate(_reason, socket) do
+    RuntimeRegistry.unregister(socket.assigns.worker_id)
+    :ok
+  end
+
+  # env is an in-process keyword-style list of {name, value}; the wire is JSON,
+  # so it crosses as a map and the worker rebuilds the list.
+  defp wire_payload(:provision, wire_id, %{run_id: run_id, spec: spec}) do
+    %{
+      wire_id: wire_id,
+      run_id: run_id,
+      env: Map.new(Map.get(spec, :env, [])),
+      bot_token: Map.get(spec, :bot_token),
+      bot_username: Map.get(spec, :bot_username),
+      bot_email: Map.get(spec, :bot_email),
+      repositories: Enum.map(Map.get(spec, :repositories, []), &wire_repository/1)
+    }
+  end
+
+  defp wire_payload(:teardown, wire_id, %{run_id: run_id}) do
+    %{wire_id: wire_id, run_id: run_id}
+  end
+
+  # A RepositoryCatalog struct crosses the wire as a plain JSON map; the worker
+  # rebuilds the struct from these keys.
+  defp wire_repository(%{name: name, owner_repo: owner_repo, default_branch: default_branch, primary?: primary?}) do
+    %{name: name, owner_repo: owner_repo, default_branch: default_branch, primary: primary?}
+  end
+
+  # Correlates a worker reply with the caller recorded under its `wire_id` and
+  # forwards the decoded result; an unknown `wire_id` is ignored.
+  defp settle(socket, %{"wire_id" => wire_id} = payload) do
+    case Map.pop(socket.assigns.pending, wire_id) do
+      {nil, _pending} ->
+        {:noreply, socket}
+
+      {{ref, from}, pending} ->
+        send(from, {:runtime_dispatch_reply, ref, decode_result(payload)})
+        {:noreply, assign(socket, :pending, pending)}
+    end
+  end
+
+  # A reply without a `wire_id` cannot be matched to any caller. It is dropped
+  # with a warning so a malformed frame does not crash the channel, which would
+  # unregister the worker and strand every other pending dispatch.
+  defp settle(socket, _payload) do
+    Logger.warning("WorkerChannel: worker=#{socket.assigns.worker_id} sent a result without wire_id")
+    {:noreply, socket}
+  end
+
+  # Turns the worker's JSON reply into the `{:ok, map} | {:error, reason}`
+  # value delivered to the waiting caller.
+  defp decode_result(%{"ok" => true} = payload) do
+    {:ok, %{base_url: payload["base_url"], primary_workspace: payload["primary_workspace"]}}
+  end
+
+  defp decode_result(%{"ok" => false} = payload), do: {:error, payload["error"] || "worker_error"}
+  defp decode_result(_payload), do: {:error, "malformed_worker_reply"}
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/channels/worker_socket.ex b/packages/symphony/elixir/lib/symphony_elixir_web/channels/worker_socket.ex
new file mode 100644
index 000000000..37595bdec
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/channels/worker_socket.ex
@@ -0,0 +1,74 @@
+defmodule SymphonyElixirWeb.WorkerSocket do
+  @moduledoc """
+  The socket runtime workers connect to.
+
+  A worker dials `/worker` and joins the `worker:lobby` channel, advertising the
+  address its per-run room-servers are reachable at, its labels, and capacity.
+  Identity is the mTLS client-cert CN that the nginx boundary forwards as the
+  `x-worker-cn` header; the connection is refused without it. In dev/test, where
+  the socket is not behind mTLS, the `worker_id` connect param stands in.
+  """
+
+  use Phoenix.Socket
+
+  channel("worker:lobby", SymphonyElixirWeb.WorkerChannel)
+
+  @impl true
+  def connect(params, socket, connect_info) do
+    case worker_id(params, connect_info) do
+      nil ->
+        :error
+
+      worker_id ->
+        {:ok,
+         assign(socket, %{
+           worker_id: worker_id,
+           address: params["address"],
+           labels: parse_labels(params["labels"]),
+           capacity: parse_capacity(params["capacity"])
+         })}
+    end
+  end
+
+  @impl true
+  def id(socket), do: "worker_socket:#{socket.assigns.worker_id}"
+
+  # The mTLS-verified CN nginx forwards is authoritative; the connect param is
+  # the dev/test fallback when the socket is not behind mTLS.
+  # NOTE(review): the param fallback is not gated on the environment here, so it
+  # is only safe while the boundary always sets `x-worker-cn`; confirm.
+  defp worker_id(params, connect_info) do
+    header_cn(connect_info) || empty_to_nil(params["worker_id"])
+  end
+
+  defp header_cn(connect_info) do
+    connect_info
+    |> Map.get(:x_headers, [])
+    |> Enum.find_value(fn {name, value} -> if name == "x-worker-cn", do: empty_to_nil(value) end)
+  end
+
+  # Labels arrive as one comma-separated string; blanks are dropped.
+  defp parse_labels(value) when is_binary(value) do
+    value |> String.split(",", trim: true) |> Enum.map(&String.trim/1) |> Enum.reject(&(&1 == ""))
+  end
+
+  # Connect params are client-controlled. A missing value, or one that is not a
+  # string (for example a `labels[]=` list), yields no labels instead of
+  # raising in connect/3, mirroring parse_capacity/1.
+  defp parse_labels(_), do: []
+
+  defp parse_capacity(value) when is_binary(value) do
+    case Integer.parse(value) do
+      {n, _} when n >= 0 -> n
+      _ -> 0
+    end
+  end
+
+  defp parse_capacity(_), do: 0
+
+  # Normalizes an identity candidate: only a non-empty string counts. Anything
+  # else (nil, "", or a non-string connect param) becomes nil, which refuses
+  # the connection when no other identity is available.
+  defp empty_to_nil(value) when is_binary(value) and value != "", do: value
+  defp empty_to_nil(_), do: nil
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/components/ir_graph.ex b/packages/symphony/elixir/lib/symphony_elixir_web/components/ir_graph.ex
new file mode 100644
index 000000000..65a2745b6
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/components/ir_graph.ex
@@ -0,0 +1,488 @@
+defmodule SymphonyElixirWeb.Components.IRGraph do
+  @moduledoc """
+  Server-rendered SVG IR-graph component.
+
+  Accepts a list of node maps as produced by `IR.View.render_node/1` and
+  lays them out in a left-to-right layered DAG using a longest-path-from-roots
+  algorithm. Edges are cubic bezier curves. No JavaScript library is required;
+  the SVG is emitted directly from the server on every live update.
+
+  State classes on each `<g class="gnode ...">` element match the `.gnode.*`
+  CSS rules in the application layout so colors track live node state without
+  a client-side refresh.
+
+  When a trigger label is provided, a synthetic trigger node (class `gtrigger`)
+  is prepended as the entry that feeds all root nodes. The trigger node is not
+  part of the IR; it only appears in the visual graph.
+
+  The placement map (with `"declared"` and `"effective"` keys) is forwarded
+  to agent nodes so the graph can show a fallback label when the effective
+  location differs from what was declared.
+  """
+
+  use Phoenix.Component
+
+  # Layout spacing. Node boxes are sized to their content (see node_width/1
+  # and node_height/1) so a long cron schedule or script path never spills
+  # past the rect; @min_node_w keeps short graphs from looking cramped.
+  @min_node_w 180
+  @h_gap 80
+  @v_gap 20
+  @pad_x 30
+  @pad_y 22
+
+  # Text geometry, shared between the SVG template and the box-sizing helpers.
+  # Monospace advance is about 0.6em; the per-char widths are biased slightly
+  # wide so a glyph never crosses the border. @label_char_w sizes the bold
+  # 12px label line, @detail_char_w the 10px id and detail lines.
+  @label_char_w 7.6
+  @detail_char_w 6.4
+  @text_left 10
+  @text_right 14
+  @id_y 29
+  @detail_top 44
+  @detail_step 13
+  @bottom_pad 13
+
+  @doc """
+  Render an inline SVG graph for a list of IR nodes.
+
+  `nodes` is the `"nodes"` list from `IR.View.detail/1`: each element is a
+  string-keyed map with at least `"id"`, `"kind"`, `"state"`, `"deps"`, and
+  (for agent nodes) `"envelope"` and `"label"`.
+
+  `trigger` is the human-readable trigger string from `IR.View.detail/1`
+  (e.g. `"cron 30 * * * *"`, `"manual"`, `"linear: [sym] implement"`). When
+  provided, a distinct trigger node is drawn as the entry feeding all roots.
+
+  `placement` is the placement map from `IR.View.detail/1` (keys
+  `"declared"` and `"effective"`), forwarded to agent nodes so a fallback can
+  be shown when effective differs from declared.
+
+  `base_path` is unused in rendering but kept as an attribute to allow
+  future click-through links without a breaking interface change.
+  """
+  attr(:nodes, :list, required: true)
+  attr(:trigger, :string, default: nil)
+  attr(:placement, :map, default: nil)
+  attr(:base_path, :string, default: "/ir")
+
+  def graph(assigns) do
+    # Inside ~H, `@name` reads an assign rather than a module attribute, so the
+    # text geometry the box-sizing helpers use is passed in as `@geo`. Text
+    # positions and box sizes then cannot drift apart when a constant changes.
+    assigns =
+      assigns
+      |> assign(:layout, layout(assigns.nodes, assigns.trigger, assigns.placement))
+      |> assign(:geo, %{left: @text_left, id_y: @id_y, detail_top: @detail_top, detail_step: @detail_step})
+
+    ~H"""
+    <svg
+      class="graph"
+      viewBox={@layout.viewbox}
+      style={"max-width: #{@layout.natural_width}px"}
+      role="img"
+      aria-label="IR graph"
+    >
+      <defs>
+        <marker id="arrow" markerWidth="8" markerHeight="8" refX="6" refY="3" orient="auto">
+          <path class="garrow" d="M0,0 L6,3 L0,6 Z" />
+        </marker>
+      </defs>
+      <path :for={edge <- @layout.edges} class="gedge" d={edge.d} marker-end="url(#arrow)" />
+      <g :for={n <- @layout.nodes} class={"gnode " <> n.state_class} transform={"translate(#{n.x},#{n.y})"}>
+        <rect width={@layout.node_w} height={@layout.node_h} />
+        <text x={@geo.left} y={if n.is_trigger, do: div(@layout.node_h, 2) + 4, else: 16} class="gnode-label">{n.label}</text>
+        <text :if={not n.is_trigger} x={@geo.left} y={@geo.id_y} class="gnode-id" opacity=".55">{n.id}</text>
+        <text :for={{line, idx} <- Enum.with_index(n.detail_lines)} x={@geo.left} y={@geo.detail_top + idx * @geo.detail_step} class="gnode-detail" opacity=".7">{line}</text>
+      </g>
+    </svg>
+    """
+  end
+
+  @doc """
+  Pure layout computation. Each node gets a layer equal to its longest path
+  from a root over `deps`; nodes within a layer keep the order of the input
+  list. The result carries pixel coordinates plus bezier edge paths.
+
+  When `trigger` is a non-nil string, a synthetic trigger node is prepended
+  in layer -1 (rendered as layer 0 with all real nodes shifted right), and
+  edges are drawn from it to every root node. The trigger node carries the
+  class `gtrigger`.
+
+  Returns a map with:
+  - `viewbox` - the SVG `viewBox` attribute string
+  - `natural_width` - the numeric pixel width so the caller can cap `max-width`
+  - `node_w` / `node_h` - the content-fitted box dimensions the template draws
+  - `nodes` - list of maps with `:id`, `:x`, `:y`, `:state_class`, `:label`,
+    `:detail_lines`, `:is_trigger`
+  - `edges` - list of maps with `:d` (SVG path data string)
+
+  The function is public so it can be unit-tested independently of the
+  LiveView/component machinery.
+  """
+  @spec layout([map()], String.t() | nil, map() | nil) :: %{
+          viewbox: String.t(),
+          natural_width: integer(),
+          node_w: integer(),
+          node_h: integer(),
+          nodes: [map()],
+          edges: [map()]
+        }
+  def layout(nodes, trigger \\ nil, placement \\ nil)
+
+  def layout([], nil, _placement) do
+    %{nodes: [], edges: [], node_w: @min_node_w, node_h: 80, natural_width: 200, viewbox: "0 0 200 80"}
+  end
+
+  def layout([], trigger, _placement) when is_binary(trigger) do
+    # A lone trigger box, sized from the same entry the general clause adds for a trigger.
+    lone = [%{id: nil, label: trigger, detail_lines: []}]
+    {box_w, box_h} = {node_width(lone), node_height(lone)}
+    canvas_w = box_w + 2 * @pad_x
+    canvas_h = box_h + 2 * @pad_y
+
+    %{
+      viewbox: "0 0 #{canvas_w} #{canvas_h}",
+      natural_width: canvas_w,
+      node_w: box_w,
+      node_h: box_h,
+      edges: [],
+      nodes: [
+        %{
+          id: "__trigger__",
+          x: @pad_x,
+          y: @pad_y,
+          state_class: "gtrigger",
+          label: trigger,
+          detail_lines: [],
+          is_trigger: true
+        }
+      ]
+    }
+  end
+
+  def layout(nodes, trigger, placement) when is_list(nodes) do
+    # General case. Map each node id to its deps and derive a layer per id.
+    deps_map = Map.new(nodes, fn n -> {n["id"], n["deps"] || []} end)
+    layers = assign_layers(deps_map)
+
+    # When a trigger is provided, shift all real node layers by 1 to make
+    # room for the synthetic trigger node at layer 0.
+    layers =
+      if trigger do
+        Map.new(layers, fn {id, layer} -> {id, layer + 1} end)
+      else
+        layers
+      end
+
+    # Group node ids by layer, preserving original list order within a layer.
+    id_order = nodes |> Enum.with_index() |> Map.new(fn {n, i} -> {n["id"], i} end)
+
+    layer_groups =
+      layers
+      |> Enum.group_by(fn {_id, layer} -> layer end, fn {id, _layer} -> id end)
+      |> Map.new(fn {layer, ids} -> {layer, Enum.sort_by(ids, &Map.get(id_order, &1, 0))} end)
+
+    max_layer = layers |> Map.values() |> Enum.max(fn -> 0 end)
+
+    # The trigger is never an entry in `layers`, and with a trigger every real
+    # node was shifted to layer >= 1 above, so layer_groups has no layer 0 and
+    # the drop below is a no-op: both branches yield the tallest real layer.
+    real_max_per_layer =
+      layer_groups
+      |> Map.drop([0])
+      |> Map.values()
+      |> Enum.map(&length/1)
+      |> Enum.max(fn -> 1 end)
+
+    max_per_layer =
+      if trigger do
+        max(real_max_per_layer, 1)
+      else
+        layer_groups |> Map.values() |> Enum.map(&length/1) |> Enum.max(fn -> 1 end)
+      end
+
+    # Index the raw nodes by id for the positioning and edge passes below.
+    node_index = Map.new(nodes, fn n -> {n["id"], n} end)
+
+    # Pre-compute each node's render data (label, id, detail lines) so the box
+    # can be sized to its content before positioning. A fixed rect width would
+    # be overflowed by a long label such as a verbose cron schedule.
+    render_by_id =
+      Map.new(nodes, fn raw ->
+        {raw["id"],
+         %{
+           id: raw["id"],
+           state_class: state_class(raw),
+           label: primary_label(raw),
+           detail_lines: detail_lines(raw, placement)
+         }}
+      end)
+
+    sizing =
+      Map.values(render_by_id) ++
+        if(trigger, do: [%{id: nil, label: trigger, detail_lines: []}], else: [])
+
+    node_w = node_width(sizing)
+    node_h = node_height(sizing)
+
+    positioned =
+      for {id, raw} <- node_index do
+        layer = Map.get(layers, id, 0)
+        pos_in_layer = Enum.find_index(layer_groups[layer], &(&1 == id)) || 0
+        total_in_layer = length(layer_groups[layer])
+
+        x = @pad_x + layer * (node_w + @h_gap)
+        # Center nodes vertically within their layer relative to the tallest layer.
+        offset_y = div((max_per_layer - total_in_layer) * (node_h + @v_gap), 2)
+        y = @pad_y + pos_in_layer * (node_h + @v_gap) + offset_y
+
+        {id, %{x: x, y: y, raw: raw}}
+      end
+      |> Map.new()
+
+    # One bezier per dep edge between real nodes; deps missing from the graph are skipped.
+    edges =
+      for {id, %{x: tx, y: ty}} <- positioned,
+          dep_id <- node_index[id]["deps"] || [],
+          is_binary(dep_id),
+          Map.has_key?(positioned, dep_id) do
+        %{x: sx, y: sy} = positioned[dep_id]
+        bezier_edge(sx, sy, tx, ty, node_w, node_h)
+      end
+
+    # Find root real nodes (those with no real deps) to connect from trigger.
+    root_ids =
+      if trigger do
+        Enum.filter(nodes, fn n ->
+          known_deps = Enum.filter(n["deps"] || [], &Map.has_key?(node_index, &1))
+          known_deps == []
+        end)
+        |> Enum.map(& &1["id"])
+      else
+        []
+      end
+
+    # Synthetic trigger node sits in column 0; real nodes start at column 1.
+    trigger_x = @pad_x
+    trigger_y = @pad_y + div((max_per_layer - 1) * (node_h + @v_gap), 2)
+
+    trigger_edges =
+      for root_id <- root_ids,
+          Map.has_key?(positioned, root_id) do
+        %{x: tx, y: ty} = positioned[root_id]
+        bezier_edge(trigger_x, trigger_y, tx, ty, node_w, node_h)
+      end
+
+    all_edges = edges ++ trigger_edges
+
+    # Build the layout node list.
+    layout_nodes =
+      Enum.map(nodes, fn raw ->
+        id = raw["id"]
+        %{x: x, y: y} = positioned[id]
+        render = render_by_id[id]
+
+        %{
+          id: id,
+          x: x,
+          y: y,
+          state_class: render.state_class,
+          label: render.label,
+          detail_lines: render.detail_lines,
+          is_trigger: false
+        }
+      end)
+
+    # Prepend the trigger node when present.
+    all_nodes =
+      if trigger do
+        trigger_node = %{
+          id: "__trigger__",
+          x: trigger_x,
+          y: trigger_y,
+          state_class: "gtrigger",
+          label: trigger,
+          detail_lines: [],
+          is_trigger: true
+        }
+
+        [trigger_node | layout_nodes]
+      else
+        layout_nodes
+      end
+
+    # Size the viewBox to fit all content.
+    width = @pad_x + (max_layer + 1) * (node_w + @h_gap) - @h_gap + @pad_x
+    height = @pad_y + max_per_layer * (node_h + @v_gap) - @v_gap + @pad_y
+
+    %{
+      viewbox: "0 0 #{width} #{height}",
+      natural_width: width,
+      node_w: node_w,
+      node_h: node_h,
+      nodes: all_nodes,
+      edges: all_edges
+    }
+  end
+
+  # Cubic bezier from the source box's right-edge midpoint to the target box's
+  # left-edge midpoint; (sx, sy) and (tx, ty) are the boxes' top-left corners.
+  defp bezier_edge(sx, sy, tx, ty, node_w, node_h) do
+    half_h = div(node_h, 2)
+    {from_x, from_y} = {sx + node_w, sy + half_h}
+    {to_x, to_y} = {tx, ty + half_h}
+    # Both control points share the horizontal midpoint between the two ends.
+    ctrl_x = div(from_x + to_x, 2)
+    %{d: "M#{from_x},#{from_y} C#{ctrl_x},#{from_y} #{ctrl_x},#{to_y} #{to_x},#{to_y}"}
+  end
+
+  # Width shared by every box: the widest text line anywhere in the graph plus
+  # the left/right text padding, never narrower than @min_node_w so short
+  # graphs do not look cramped.
+  defp node_width(renders) do
+    widths = for render <- renders, px <- line_pixel_widths(render), do: px
+    widest = Enum.max(widths, fn -> 0.0 end)
+
+    max(@min_node_w, ceil(widest) + @text_left + @text_right)
+  end
+
+  # Estimated pixel width of each text line of one node: the label at the bold
+  # 12px advance, then the id (when the render has one) and every detail line
+  # at the 10px advance.
+  defp line_pixel_widths(render) do
+    small_lines = [render[:id] | render.detail_lines]
+    [text_px(render.label, @label_char_w) | Enum.map(small_lines, &text_px(&1, @detail_char_w))]
+  end
+
+  # Grapheme count times the per-character advance; a missing line has no width.
+  defp text_px(nil, _char_w), do: 0.0
+  defp text_px(text, char_w) when is_binary(text), do: char_w * String.length(text)
+
+  # Height shared by every box. With no detail lines anywhere, the id row is
+  # the lowest text baseline; otherwise it is the last row of the deepest
+  # detail block in the graph. @bottom_pad is added below that baseline.
+  defp node_height(renders) do
+    deepest = renders |> Enum.map(&length(&1.detail_lines)) |> Enum.max(fn -> 0 end)
+
+    lowest_baseline =
+      case deepest do
+        0 -> @id_y
+        rows -> @detail_top + (rows - 1) * @detail_step
+      end
+
+    lowest_baseline + @bottom_pad
+  end
+
+  # Assigns each node a layer by the longest path from any root (a node with
+  # no known deps). Roots are in layer 0; every other node sits one layer past
+  # its deepest dependency. Returns a map of node_id => layer_number.
+  #
+  # The input is expected to be a DAG, but it arrives from outside this module,
+  # so the walk must terminate on malformed data too: a dep that points back
+  # at a node still being resolved (a cycle, including a self-dep) is ignored
+  # for layering instead of recursing forever inside a render.
+  defp assign_layers(deps_map) when is_map(deps_map) do
+    deps_map
+    |> Map.keys()
+    |> Enum.reduce(%{}, fn id, memo -> compute_layer(id, deps_map, memo, MapSet.new()) end)
+  end
+
+  # Depth-first, memoized layer computation. `memo` holds finished nodes;
+  # `in_progress` holds the ids on the current recursion path. Recursion depth
+  # is bounded by the longest dependency chain.
+  defp compute_layer(id, deps_map, memo, in_progress) do
+    case Map.fetch(memo, id) do
+      {:ok, _layer} ->
+        memo
+
+      :error ->
+        in_progress = MapSet.put(in_progress, id)
+
+        # Skip dangling edges (dep not in the graph) and back edges (dep is an
+        # ancestor on the current path, i.e. the edge closes a cycle).
+        followed =
+          deps_map
+          |> Map.get(id, [])
+          |> Enum.filter(&(Map.has_key?(deps_map, &1) and not MapSet.member?(in_progress, &1)))
+
+        memo = Enum.reduce(followed, memo, &compute_layer(&1, deps_map, &2, in_progress))
+
+        layer =
+          followed
+          |> Enum.map(&(Map.fetch!(memo, &1) + 1))
+          |> Enum.max(fn -> 0 end)
+
+        Map.put(memo, id, layer)
+    end
+  end
+
+  # CSS state class for a node. Gate nodes additionally carry `gate` so the
+  # dashed border rule fires; a node without a "state" key renders as
+  # pending (and, lacking a state, gets no `gate` prefix either).
+  defp state_class(%{"state" => state} = node) do
+    prefix = if node["kind"] == "gate", do: "gate ", else: ""
+    prefix <> normalize_state(state)
+  end
+
+  defp state_class(_), do: "pending"
+
+  # Only states with a `.gnode.*` CSS rule pass through; anything else (for
+  # example upstream_failed, stranded, cancelled) is drawn as "pending" so the
+  # SVG never references an undefined class.
+  defp normalize_state(state) when state in ~w(succeeded running pending failed skipped), do: state
+  defp normalize_state(_), do: "pending"
+
+  # Text for the bold first line: the node's "label" (skill name for agent
+  # nodes, script path for exec nodes, kind otherwise) when it is a non-empty
+  # string, else the node id (older view shapes carry no label field).
+  defp primary_label(%{"label" => <<_, _::binary>> = label}), do: label
+  defp primary_label(%{"id" => id}), do: id
+
+  # Detail lines drawn under the id. An agent node with an envelope map lists,
+  # in order, "engine model" (or just the engine when the model is nil),
+  # effort, permissions, and location; entries that are not non-empty strings
+  # are dropped. The location line is annotated by location_line/2 when the
+  # run's effective placement differs from the declared one. Any other node
+  # with a string kind (gate, map_fanout, exec, an agent without an envelope
+  # map, ...) shows that kind as its single detail line.
+  defp detail_lines(%{"kind" => "agent", "envelope" => env}, placement) when is_map(env) do
+    candidates = [
+      engine_model_line(env["engine"], env["model"]),
+      env["effort"],
+      env["permissions"],
+      location_line(env["location"], placement)
+    ]
+
+    for line <- candidates, is_binary(line) and line != "", do: line
+  end
+
+  defp detail_lines(%{"kind" => kind}, _placement) when is_binary(kind), do: [kind]
+  defp detail_lines(_, _placement), do: []
+
+  # "engine model", the bare engine when the model is nil, otherwise no line.
+  defp engine_model_line(engine, model) when is_binary(engine) and is_binary(model), do: "#{engine} #{model}"
+  defp engine_model_line(engine, nil) when is_binary(engine), do: engine
+  defp engine_model_line(_engine, _model), do: nil
+
+  # Location detail line, annotated when the run fell back to another
+  # placement. The declared location may be typed, e.g. `host:hil-compute-2`,
+  # so only the part before the first `:` is compared with the placement's
+  # "effective" value. On a mismatch (e.g. declared `ixvm`, effective `host`)
+  # the line reads `ixvm (fallback host)`; on a match it is the declared
+  # location unchanged.
+  #
+  # Without a placement map carrying a string "effective" (for instance a
+  # preview before any run), or when the location is not a string, the
+  # location is passed through untouched.
+  defp location_line(location, %{"effective" => effective})
+       when is_binary(location) and is_binary(effective) do
+    case String.split(location, ":", parts: 2) do
+      [^effective | _target] -> location
+      _differs -> "#{location} (fallback #{effective})"
+    end
+  end
+
+  defp location_line(location, _placement), do: location
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/components/layouts.ex b/packages/symphony/elixir/lib/symphony_elixir_web/components/layouts.ex
new file mode 100644
index 000000000..f93e174a8
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/components/layouts.ex
@@ -0,0 +1,258 @@
+defmodule SymphonyElixirWeb.Layouts do
+  @moduledoc "Root and app layouts for the runs dashboard."
+
+  use Phoenix.Component
+
+  @spec root(map()) :: Phoenix.LiveView.Rendered.t()
+  def root(assigns) do
+    assigns = assign(assigns, :csrf_token, Plug.CSRFProtection.get_csrf_token())
+
+    ~H"""
+    <!DOCTYPE html>
+    <html lang="en">
+      <head>
+        <meta charset="utf-8" />
+        <meta name="viewport" content="width=device-width, initial-scale=1" />
+        <meta name="csrf-token" content={@csrf_token} />
+        <title>symphony</title>
+        <link
+          rel="icon"
+          type="image/svg+xml"
+          href="data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' viewBox='0 0 100 100'%3E%3Ctext x='50%25' y='50%25' dominant-baseline='central' text-anchor='middle' font-size='90'%3E%F0%9F%8E%B7%3C/text%3E%3C/svg%3E"
+        />
+        <style>
+          :root { --bg: #000000; --fg: #e7e7ea; --muted: #6a6a72; --accent: #e7e7ea; --good: #6ad28a; --bad: #ff6b6b; --warn: #d8a45a; --card: #0a0a0a; --border: #1a1a1c; }
+          * { box-sizing: border-box; }
+          body { margin: 0; background: var(--bg); color: var(--fg); font: 14px/1.5 ui-sans-serif, system-ui, -apple-system, "Inter", sans-serif; }
+          a { color: var(--fg); text-decoration: none; }
+          a:hover { text-decoration: underline; }
+          main.shell { max-width: none; margin: 0; padding: 32px 32px; }
+          header.bar { display: flex; align-items: baseline; justify-content: space-between; margin-bottom: 24px; }
+          header.bar h1 { font-size: 18px; font-weight: 600; margin: 0; letter-spacing: -0.01em; display: flex; align-items: baseline; gap: 8px; }
+          header.bar h1 .logo-mark { font-size: 18px; line-height: 1; }
+          header.bar h1 .logo-bracket { color: var(--muted); font-weight: 500; }
+          header.bar h1 .logo-name { color: var(--fg); }
+          table.runs { width: 100%; border-collapse: collapse; }
+          table.runs th, table.runs td { text-align: left; padding: 10px 12px; border-bottom: 1px solid var(--border); }
+          table.runs th { font-weight: 500; color: var(--muted); font-size: 12px; text-transform: uppercase; letter-spacing: 0.04em; }
+          table.runs tr:hover td { background: var(--card); }
+          table.runs td a.ref { font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 12px; color: var(--fg); }
+          table.runs td a.ref:hover { text-decoration: underline; }
+          table.runs td .ref-empty { color: var(--muted); font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 12px; }
+          .pager { display: flex; justify-content: space-between; align-items: center; padding: 10px 12px; color: var(--muted); font-size: 12px; }
+          .pager .pages { display: flex; gap: 6px; align-items: center; }
+          .pager a, .pager span.page-num { display: inline-block; padding: 4px 10px; border: 1px solid var(--border); color: var(--muted); font-variant-numeric: tabular-nums; }
+          .pager a:hover { color: var(--fg); border-color: var(--fg); text-decoration: none; }
+          .pager span.page-num.current { color: var(--fg); border-color: var(--fg); }
+          .pager a.disabled { opacity: 0.4; pointer-events: none; }
+          .pill { display: inline-block; padding: 2px 8px; font-size: 11px; font-weight: 500; letter-spacing: 0.02em; border: 1px solid var(--border); }
+          .pill.pending { color: var(--muted); }
+          .pill.running { color: var(--fg); border-color: var(--border); }
+          .pill.succeeded { color: var(--good); border-color: rgba(106,210,138,0.35); }
+          .pill.failed { color: var(--bad); border-color: rgba(255,107,107,0.35); }
+          .pill.skipped { color: var(--warn); border-color: rgba(216,164,90,0.35); }
+          .card { background: var(--card); border: 1px solid var(--border); padding: 16px; margin-bottom: 16px; }
+          .card-header { display: flex; align-items: baseline; justify-content: space-between; gap: 12px; margin-bottom: 10px; }
+          .card-header .title { color: var(--muted); font-size: 12px; text-transform: uppercase; letter-spacing: 0.04em; }
+          .node-grid { display: grid; gap: 10px; grid-template-columns: 1fr; }
+          .node-row { display: grid; grid-template-columns: 160px 100px minmax(0, 1fr) 140px; gap: 12px; align-items: center; padding: 8px 10px; background: var(--bg); }
+          .mono { font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 12px; }
+          .muted { color: var(--muted); }
+          .empty { color: var(--muted); padding: 24px; text-align: center; border: 1px dashed var(--border); }
+          .actions { display: flex; gap: 8px; align-items: center; }
+          .btn { display: inline-block; padding: 6px 12px; background: var(--card); color: var(--fg); border: 1px solid var(--border); cursor: pointer; font-size: 13px; text-decoration: none; }
+          .btn:hover { border-color: var(--fg); text-decoration: none; }
+          .btn.btn-primary { background: var(--fg); color: var(--bg); border-color: var(--fg); }
+          .btn.btn-primary:hover { opacity: 0.9; }
+          form.enqueue { display: flex; flex-direction: column; gap: 12px; align-items: stretch; }
+          form.enqueue select, form.enqueue input { background: var(--card); color: var(--fg); border: 1px solid var(--border); padding: 6px 10px; font: inherit; }
+          form.enqueue .row { display: flex; gap: 12px; align-items: center; width: 100%; }
+          form.enqueue label { color: var(--muted); font-size: 12px; min-width: 110px; }
+          /* min-width:0 lets the select shrink below its widest <option>; a flex
+             item defaults to min-width:auto and otherwise forces the row (and the
+             popover) wider than its width, which is the horizontal-scroll overflow. */
+          form.enqueue .field-input { flex: 1; min-width: 0; }
+          form.enqueue select.field-input { width: 100%; max-width: 100%; text-overflow: ellipsis; }
+          form.enqueue .hint { color: var(--muted); font-size: 12px; margin-left: 122px; }
+          form.enqueue .field-group { padding: 12px; border: 1px solid var(--border); background: var(--bg); }
+          form.enqueue .field-group .field-group-title { color: var(--muted); font-size: 12px; margin-bottom: 10px; text-transform: uppercase; letter-spacing: 0.04em; }
+          form.enqueue .submit-row { display: flex; justify-content: flex-end; gap: 8px; }
+          .toolbar { display: flex; justify-content: flex-end; margin-bottom: 16px; }
+          /* Native popover: a compact launcher anchored top-right so the runs table stays the page. */
+          .launcher-popover { position: fixed; inset: 64px 24px auto auto; width: 420px; max-width: calc(100vw - 48px); margin: 0; background: var(--card); color: var(--fg); border: 1px solid var(--border); padding: 20px; box-shadow: 0 12px 32px rgba(0,0,0,0.55); }
+          .launcher-popover .launcher-title { color: var(--muted); font-size: 12px; text-transform: uppercase; letter-spacing: 0.04em; margin-bottom: 12px; }
+          .launcher-popover::backdrop { background: rgba(0,0,0,0.2); }
+          nav.tabs { display: flex; gap: 16px; margin-top: 6px; }
+          nav.tabs a { color: var(--muted); padding: 4px 0; border-bottom: 1px solid transparent; font-size: 13px; }
+          nav.tabs a.active { color: var(--fg); border-bottom-color: var(--fg); }
+          nav.tabs a:hover { color: var(--fg); text-decoration: none; }
+          .dag-grid { display: grid; gap: 10px; grid-template-columns: 1fr; }
+          .dag-row { display: grid; grid-template-columns: 180px minmax(0, 280px) minmax(0, 1fr) 90px; gap: 12px; align-items: center; padding: 10px 12px; background: var(--bg); border: 1px solid var(--border); }
+          .dag-row > * { min-width: 0; overflow: hidden; text-overflow: ellipsis; white-space: nowrap; }
+          .dag-row .name { font-weight: 500; }
+          .dag-row .right-align { text-align: right; }
+          .skill-body { white-space: pre-wrap; font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 12px; padding: 12px; background: var(--bg); border: 1px solid var(--border); max-height: 480px; overflow: auto; }
+          .kv { display: grid; grid-template-columns: 140px 1fr; gap: 6px 16px; }
+          .kv dt { color: var(--muted); font-size: 12px; }
+          .kv dd { margin: 0; }
+          .dag-diagram { overflow: auto; background: var(--bg); border: 1px solid var(--border); padding: 16px; }
+          .dag-diagram svg { display: block; margin: 0 auto; color: var(--muted); }
+          .dag-diagram .dnode { fill: var(--card); stroke: var(--border); stroke-width: 1; }
+          .dag-diagram .dnode-id { fill: var(--fg); font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 13px; font-weight: 500; }
+          .dag-diagram .dnode-skill { fill: var(--muted); font-family: ui-sans-serif, system-ui, sans-serif; font-size: 11px; }
+          .dag-diagram .dedge { stroke: var(--muted); stroke-width: 1.5; fill: none; }
+          .dag-diagram .darrow { fill: var(--muted); }
+          .back-link { display: inline-flex; align-items: center; gap: 4px; color: var(--muted); font-size: 13px; }
+          .back-link:hover { color: var(--fg); }
+          .codex-sessions { list-style: none; padding: 0; margin: 0; }
+          .codex-sessions li { border-top: 1px solid var(--border); margin: 0; }
+          .codex-sessions li:last-child { border-bottom: 1px solid var(--border); }
+          .codex-sessions li > a { display: block; padding: 10px 0; color: inherit; }
+          .codex-sessions li > a:hover { background: var(--bg); text-decoration: none; }
+          .codex-sessions .row { display: flex; justify-content: space-between; align-items: baseline; gap: 12px; }
+          .codex-sessions .row.top { margin-bottom: 2px; }
+          .codex-sessions .row.meta { font-size: 12px; color: var(--muted); gap: 8px; justify-content: flex-start; }
+          .codex-sessions .cwd { color: var(--fg); font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 13px; background: none; padding: 0; overflow-wrap: anywhere; }
+          .codex-sessions .time { color: var(--muted); font-size: 12px; font-variant-numeric: tabular-nums; white-space: nowrap; flex-shrink: 0; }
+          .codex-sessions li.live .time { color: var(--fg); font-weight: 500; }
+          .codex-sessions li.live .time::before { content: '\25cf  '; color: var(--warn); font-size: 0.6em; vertical-align: 0.2em; }
+          .codex-sessions .version { font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; }
+          .codex-sessions .preview { margin: 6px 0 0; color: var(--fg); font-size: 13px; line-height: 1.5; display: -webkit-box; -webkit-line-clamp: 2; line-clamp: 2; -webkit-box-orient: vertical; overflow: hidden; }
+          .codex-head { display: flex; justify-content: space-between; align-items: center; margin-bottom: 16px; }
+          .codex-head .state { display: inline-flex; align-items: center; gap: 6px; font-size: 12px; color: var(--muted); font-variant-numeric: tabular-nums; }
+          .codex-head .state .dot { width: 8px; height: 8px; background: var(--muted); }
+          .codex-head .state.live .dot { background: var(--warn); box-shadow: 0 0 0 3px rgba(216,164,90,0.2); }
+          .codex-head .state.live .label { color: var(--fg); font-weight: 500; }
+          .codex-log { padding: 8px 12px; max-height: calc(100vh - 280px); overflow-y: auto; }
+          .codex-event { display: inline-block; font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 11px; color: var(--muted); text-transform: lowercase; letter-spacing: 0.04em; background: var(--bg); padding: 2px 6px; margin: 6px 0; }
+          .codex-event.tokens { background: none; border: 1px dashed var(--border); }
+          .codex-msg { margin: 10px 0; background: var(--bg); border: 1px solid var(--border); padding: 8px 12px; }
+          .codex-msg header, .codex-msg summary { color: var(--muted); font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 11px; text-transform: uppercase; letter-spacing: 0.06em; margin-bottom: 4px; cursor: default; }
+          details.codex-msg > summary { cursor: pointer; list-style: none; display: flex; align-items: baseline; gap: 8px; }
+          details.codex-msg > summary::-webkit-details-marker { display: none; }
+          details.codex-msg > summary::before { content: '\25b8'; display: inline-block; font-size: 0.7em; transition: transform 0.12s ease; }
+          details.codex-msg[open] > summary::before { transform: rotate(90deg); }
+          details.codex-msg .name { color: var(--fg); text-transform: none; letter-spacing: 0; font-size: 12px; }
+          .codex-msg pre { margin: 0; border: none; padding: 0; background: none; color: var(--fg); white-space: pre-wrap; overflow-wrap: anywhere; font-size: 13px; line-height: 1.45; font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; }
+          .codex-msg[data-role='user'] { border-color: var(--fg); border-left: 2px solid var(--fg); }
+          .codex-msg[data-role='assistant'] { background: var(--card); }
+          .codex-msg[data-role='developer'] { opacity: 0.7; }
+          .codex-msg[data-role='developer'] pre { color: var(--muted); }
+          .codex-msg.reasoning { border-style: dashed; }
+          .codex-msg.reasoning pre { color: var(--muted); font-style: italic; }
+          .codex-msg.tool-output pre { max-height: 280px; overflow: auto; }
+          .codex-msg.unknown { opacity: 0.6; }
+          /* Rendered markdown (skill bodies, codex message/reasoning text).
+             Resets the pre-wrap/monospace container styling these used to
+             inherit so block elements lay out as prose. */
+          .markdown { white-space: normal; font-family: ui-sans-serif, system-ui, -apple-system, "Inter", sans-serif; font-size: 13px; line-height: 1.55; color: var(--fg); overflow-wrap: anywhere; }
+          .markdown > :first-child { margin-top: 0; }
+          .markdown > :last-child { margin-bottom: 0; }
+          .markdown p { margin: 0 0 10px; }
+          .markdown h1, .markdown h2, .markdown h3, .markdown h4, .markdown h5, .markdown h6 { margin: 16px 0 8px; line-height: 1.3; font-weight: 600; }
+          .markdown h1 { font-size: 18px; }
+          .markdown h2 { font-size: 16px; }
+          .markdown h3 { font-size: 14px; }
+          .markdown h4, .markdown h5, .markdown h6 { font-size: 13px; color: var(--muted); }
+          .markdown ul, .markdown ol { margin: 0 0 10px; padding-left: 22px; }
+          .markdown li { margin: 2px 0; }
+          .markdown li > ul, .markdown li > ol { margin: 2px 0; }
+          .markdown a { color: var(--fg); text-decoration: underline; text-underline-offset: 2px; }
+          .markdown code { font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 0.92em; background: var(--bg); border: 1px solid var(--border); border-radius: 2px; padding: 1px 4px; }
+          .markdown pre { margin: 0 0 10px; padding: 10px 12px; background: var(--bg); border: 1px solid var(--border); overflow-x: auto; }
+          .markdown pre code { background: none; border: none; padding: 0; font-size: 12px; line-height: 1.45; }
+          .markdown blockquote { margin: 0 0 10px; padding: 2px 12px; border-left: 2px solid var(--border); color: var(--muted); }
+          .markdown hr { border: none; border-top: 1px solid var(--border); margin: 16px 0; }
+          .markdown table { border-collapse: collapse; margin: 0 0 10px; }
+          .markdown th, .markdown td { border: 1px solid var(--border); padding: 6px 10px; text-align: left; }
+          .markdown th { color: var(--muted); font-weight: 500; }
+          .markdown img { max-width: 100%; }
+          .codex-msg .markdown { font-size: 13px; }
+          .codex-msg.reasoning .markdown { color: var(--muted); font-style: italic; }
+          .codex-msg[data-role='developer'] .markdown { color: var(--muted); }
+          .stats-grid { display: grid; grid-template-columns: repeat(2, minmax(0, 1fr)); gap: 16px; align-items: start; }
+          .stats-card { min-width: 0; }
+          .bar-chart { display: grid; gap: 10px; }
+          .bar-row { display: grid; grid-template-columns: minmax(150px, 220px) minmax(120px, 1fr) 48px; gap: 12px; align-items: center; min-height: 36px; }
+          .bar-person { display: flex; align-items: center; gap: 10px; min-width: 0; }
+          .bar-person img { width: 28px; height: 28px; border: 1px solid var(--border); background: var(--bg); flex: 0 0 auto; }
+          .bar-person span { overflow: hidden; text-overflow: ellipsis; white-space: nowrap; }
+          .bar-track { height: 12px; background: var(--bg); border: 1px solid var(--border); overflow: hidden; }
+          .bar-fill { height: 100%; min-width: 3px; background: var(--fg); }
+          .bar-count { text-align: right; font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; font-size: 12px; color: var(--fg); font-variant-numeric: tabular-nums; }
+          /* Inline IR graph - server-rendered SVG, no JS library */
+          /* max-width is set inline on the SVG element to the natural content width
+             so a single-node workflow does not stretch to fill the card. */
+          .graph { display: block; width: 100%; }
+          .gnode rect { fill: #101012; stroke: var(--border); }
+          .gnode text { fill: var(--fg); font-family: ui-monospace, "SF Mono", "JetBrains Mono", monospace; }
+          .gnode .gnode-label { font-size: 12px; font-weight: 600; }
+          .gnode .gnode-id { font-size: 10px; }
+          .gnode .gnode-detail { font-size: 10px; }
+          .gnode.succeeded rect { stroke: rgba(106,210,138,0.5); }
+          .gnode.running rect { stroke: rgba(216,164,90,0.6); }
+          .gnode.pending rect { stroke: var(--border); }
+          .gnode.failed rect { stroke: rgba(255,107,107,0.5); }
+          .gnode.skipped rect { stroke: rgba(216,164,90,0.35); }
+          .gnode.gate rect { stroke-dasharray: 4 3; }
+          .gnode.gtrigger rect { fill: #0a0a12; stroke: rgba(106,138,210,0.55); stroke-dasharray: 4 3; }
+          .gnode.gtrigger .gnode-label { fill: rgba(106,138,210,0.9); }
+          .gedge { stroke: var(--border); fill: none; }
+          .garrow { fill: var(--muted); }
+          @media (max-width: 800px) {
+            main.shell { padding: 20px 16px; }
+            header.bar { align-items: flex-start; }
+            nav.tabs { flex-wrap: wrap; gap: 10px 14px; }
+            .stats-grid { grid-template-columns: 1fr; }
+            .bar-row { grid-template-columns: minmax(0, 1fr) 72px 36px; }
+          }
+        </style>
+        <script defer src="/vendor/phoenix/phoenix.js"></script>
+        <script defer src="/vendor/phoenix_html/phoenix_html.js"></script>
+        <script defer src="/vendor/phoenix_live_view/phoenix_live_view.js"></script>
+        <script>
+          window.addEventListener("DOMContentLoaded", function () {
+            var csrfToken = document.querySelector("meta[name='csrf-token']")?.getAttribute("content");
+            if (!window.Phoenix || !window.LiveView) return;
+            var liveSocket = new window.LiveView.LiveSocket("/live", window.Phoenix.Socket, { params: { _csrf_token: csrfToken } });
+            liveSocket.connect();
+            window.liveSocket = liveSocket;
+          });
+        </script>
+      </head>
+      <body>
+        {@inner_content}
+      </body>
+    </html>
+    """
+  end
+
+  # App shell layout: logo, tab navigation, then the page's inner content.
+  @spec app(map()) :: Phoenix.LiveView.Rendered.t()
+  def app(assigns) do
+    # Default :active_tab to :ir when a caller omits it. Uses Map.put_new, not
+    # assign_new: assign_new expects a socket / change-tracked assigns map and
+    # crashed on a plain one (every LiveView route returned 500 after PR #21).
+    assigns = Map.put_new(assigns, :active_tab, :ir)
+
+    ~H"""
+    <main class="shell">
+      <header class="bar">
+        <div>
+          <h1>
+            <span class="logo-mark" aria-hidden="true">🎷</span>
+            <span><span class="logo-bracket">[</span><span class="logo-name">sym</span><span class="logo-bracket">]</span>phony</span>
+          </h1>
+          <nav class="tabs">
+            <a href="/" class={if @active_tab == :ir, do: "active", else: ""}>runs</a>
+            <a href="/workflows" class={if @active_tab == :workflows, do: "active", else: ""}>workflows</a>
+            <a href="/skills" class={if @active_tab == :skills, do: "active", else: ""}>skills</a>
+            <a href="/statistics" class={if @active_tab == :statistics, do: "active", else: ""}>statistics</a>
+          </nav>
+        </div>
+      </header>
+      {@inner_content}
+    </main>
+    """
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/controllers/api_controller.ex b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/api_controller.ex
new file mode 100644
index 000000000..e18a7ec8d
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/api_controller.ex
@@ -0,0 +1,56 @@
+defmodule SymphonyElixirWeb.ApiController do
+  @moduledoc """
+  The manual-trigger enqueue producer onto the IR runtime.
+
+      POST /api/v1/runs   start IR run(s) from a manual trigger;
+                          body: {"workflow": "...", "input": {...}}
+
+  A caller naming a `workflow` starts exactly that `.sym`; a caller without
+  one fires every `on manual` workflow through the shared trigger matcher.
+  Input rides on the trigger context so a node can read it as `<input>`.
+  An absent, `null`, or non-object `input` is treated as an empty map, so the
+  trigger always carries a map.
+  """
+
+  use Phoenix.Controller, formats: [:json]
+
+  alias SymphonyElixir.Runtime.Ingress
+
+  # Starts one named workflow, or every manual-trigger workflow when no usable
+  # name is given. The workflow name is read from "workflow", falling back to
+  # the "dag" key.
+  @spec enqueue_run(Plug.Conn.t(), map()) :: Plug.Conn.t()
+  def enqueue_run(conn, params) do
+    trigger = %{kind: :manual, input: manual_input(params)}
+
+    case Map.get(params, "workflow") || Map.get(params, "dag") do
+      name when is_binary(name) and name != "" ->
+        name |> Ingress.start_by_name(trigger, []) |> respond_started(conn)
+
+      _ ->
+        trigger |> Ingress.start_by_trigger([]) |> respond_started(conn)
+    end
+  end
+
+  # Only a JSON object is accepted as input. Map.get/3's default covers a
+  # missing key only, so an explicit `null`, string, or array would otherwise
+  # reach the runtime as the trigger input.
+  defp manual_input(%{"input" => %{} = input}), do: input
+  defp manual_input(_params), do: %{}
+
+  # One run started by name -> 201 with a single-element run_ids list.
+  defp respond_started({:ok, %{run_id: run_id}}, conn),
+    do: conn |> put_status(:created) |> json(%{run_ids: [run_id]})
+
+  # Trigger fan-out -> 201 with the run id of every started run.
+  defp respond_started({:ok, started}, conn) when is_list(started),
+    do: conn |> put_status(:created) |> json(%{run_ids: Enum.map(started, & &1.run_id)})
+
+  # Unknown workflow name -> 404; the body carries the inspected error tuple.
+  defp respond_started({:error, {:workflow_not_found, _}} = reason, conn),
+    do: conn |> put_status(:not_found) |> json(%{error: inspect(reason)})
+
+  # Any other start failure -> 422.
+  defp respond_started({:error, reason}, conn),
+    do: conn |> put_status(:unprocessable_entity) |> json(%{error: inspect(reason)})
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/controllers/github_webhook_controller.ex b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/github_webhook_controller.ex
new file mode 100644
index 000000000..1fd6b366a
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/github_webhook_controller.ex
@@ -0,0 +1,158 @@
+defmodule SymphonyElixirWeb.GithubWebhookController do
+  @moduledoc """
+  Receives GitHub pull-request label webhooks and starts matching IR runs.
+
+  Only pull_request.labeled events are actionable. Matching is driven by
+  `.sym` workflows declaring trigger.kind = github_pr_label with a
+  trigger.repo and trigger.label that match the incoming event, resolved
+  through the shared `Runtime.Trigger` matcher.
+
+  Every request must carry an `X-Hub-Signature-256` header equal to
+  `sha256=` followed by `hex(hmac_sha256(secret, raw_body))`. An absent or
+  empty secret fails closed with `401`.
+  """
+
+  use Phoenix.Controller, formats: [:json]
+
+  require Logger
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.Runtime.Ingress
+
+  # Verifies the signature and the event type, then answers with the JSON
+  # summary from handle_event/1. A failed check is logged and answered with its
+  # own status and reason.
+  @spec accept(Plug.Conn.t(), map()) :: Plug.Conn.t()
+  def accept(conn, params) do
+    with :ok <- verify_signature(conn),
+         :ok <- verify_event(conn) do
+      json(conn, handle_event(params))
+    else
+      {:error, status, reason} ->
+        Logger.warning("GitHub webhook rejected: #{reason}")
+
+        conn
+        |> put_status(status)
+        |> json(%{error: reason})
+    end
+  end
+
+  # Checks X-Hub-Signature-256 against the HMAC of the raw request body.
+  defp verify_signature(conn) do
+    secret = Config.get().github_webhook_secret
+    raw_body = conn.assigns[:raw_body]
+    provided = conn |> Plug.Conn.get_req_header("x-hub-signature-256") |> List.first()
+
+    cond do
+      # An empty secret is an HMAC key any sender can reproduce, so it is
+      # rejected exactly like an absent one.
+      secret in [nil, ""] ->
+        {:error, :unauthorized, "github webhook secret not configured"}
+
+      is_nil(raw_body) ->
+        {:error, :bad_request, "missing raw body"}
+
+      is_nil(provided) ->
+        {:error, :unauthorized, "missing X-Hub-Signature-256 header"}
+
+      # secure_compare/2 already returns false for binaries of different
+      # sizes, so no separate length check is needed.
+      not Plug.Crypto.secure_compare(provided, expected_signature(secret, raw_body)) ->
+        {:error, :unauthorized, "signature mismatch"}
+
+      true ->
+        :ok
+    end
+  end
+
+  # GitHub's signature format: "sha256=" followed by the lowercase hex
+  # HMAC-SHA256 of the raw body.
+  defp expected_signature(secret, raw_body) do
+    digest = :crypto.mac(:hmac, :sha256, secret, raw_body) |> Base.encode16(case: :lower)
+    "sha256=" <> digest
+  end
+
+  # Only pull_request deliveries proceed. Any other event type is answered with
+  # 202 and a reason through the same logged branch in accept/2.
+  defp verify_event(conn) do
+    case conn |> Plug.Conn.get_req_header("x-github-event") |> List.first() do
+      "pull_request" -> :ok
+      nil -> {:error, :bad_request, "missing X-GitHub-Event header"}
+      other -> {:error, :accepted, "ignored GitHub event #{other}"}
+    end
+  end
+
+  # A `labeled` action on an open, numbered PR with no active run starts the
+  # matching workflows; every other payload is acknowledged without a start.
+  defp handle_event(%{"action" => "labeled", "pull_request" => pr, "repository" => repo, "label" => label})
+       when is_map(pr) and is_map(repo) and is_map(label) do
+    repo_name = Map.get(repo, "full_name")
+    label_name = label |> Map.get("name", "") |> normalize_label()
+    pr_number = Map.get(pr, "number")
+
+    cond do
+      Map.get(pr, "state") != "open" ->
+        %{ok: true, results: [format_result({:ignored, "PR is not open"})]}
+
+      not is_integer(pr_number) ->
+        %{ok: true, results: [format_result({:ignored, "PR number missing"})]}
+
+      active_run_exists?(repo_name, pr_number) ->
+        %{ok: true, results: [format_result({:deduped, pr_number})]}
+
+      true ->
+        start_label(build_trigger(repo_name, label_name, pr_number, pr), repo_name, pr_number)
+    end
+  end
+
+  defp handle_event(_event), do: %{ok: true, ignored: true}
+
+  # The trigger context handed to Ingress.start_by_trigger/1.
+  defp build_trigger(repo_name, label_name, pr_number, pr) do
+    %{
+      kind: :github_pr_label,
+      repo: repo_name,
+      label: label_name,
+      pr_number: pr_number,
+      pr_url: Map.get(pr, "html_url"),
+      title: Map.get(pr, "title"),
+      head_ref: get_in(pr, ["head", "ref"]),
+      head_repo: get_in(pr, ["head", "repo", "full_name"]),
+      base_ref: get_in(pr, ["base", "ref"])
+    }
+  end
+
+  # Start failures are reported inside a 200 body (status "error") rather than
+  # as an HTTP error status.
+  defp start_label(trigger, repo_name, pr_number) do
+    case Ingress.start_by_trigger(trigger) do
+      {:ok, started} ->
+        Logger.info("Started runs=#{Enum.map_join(started, ",", & &1.run_id)} for #{repo_name}##{pr_number} via github label")
+        %{ok: true, enqueued: length(started), results: Enum.map(started, &format_result({:enqueued, &1.run_id}))}
+
+      {:error, reason} ->
+        Logger.warning("Failed to start github label run for #{repo_name}##{pr_number}: #{inspect(reason)}")
+        %{ok: true, results: [format_result({:error, inspect(reason)})]}
+    end
+  end
+
+  # Asks Ingress whether a pending or running github_pr_label run is already
+  # recorded for this repo and PR number, whatever label started it.
+  defp active_run_exists?(repo, pr_number) do
+    Ingress.seen_trigger?(fn
+      {status, %{kind: :github_pr_label, repo: r, pr_number: n}} ->
+        status in [:pending, :running] and r == repo and n == pr_number
+
+      {_status, _trigger} ->
+        false
+    end)
+  end
+
+  defp normalize_label(name) when is_binary(name), do: name |> String.trim() |> String.downcase()
+  defp normalize_label(_), do: ""
+
+  defp format_result({:enqueued, run_id}), do: %{status: "enqueued", run_id: run_id}
+  defp format_result({:deduped, pr_number}), do: %{status: "deduped", pr_number: pr_number}
+  defp format_result({:ignored, reason}), do: %{status: "ignored", reason: reason}
+  defp format_result({:error, reason}), do: %{status: "error", reason: reason}
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/controllers/ir_run_controller.ex b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/ir_run_controller.ex
new file mode 100644
index 000000000..6a9c23a48
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/ir_run_controller.ex
@@ -0,0 +1,148 @@
+defmodule SymphonyElixirWeb.IRRunController do
+  @moduledoc """
+  JSON API over IR runs (the `RunGraph` model): read-only views plus the
+  operator control endpoints.
+
+      GET  /api/v1/ir/schema               the runtime's enum vocabulary
+      GET  /api/v1/ir/runs                 list IR runs (summaries)
+      POST /api/v1/ir/runs                 start a run from a workflow name
+      GET  /api/v1/ir/runs/:run_id         one IR run (full detail)
+      POST /api/v1/ir/runs/:run_id/cancel        operator: cancel
+      POST /api/v1/ir/runs/:run_id/rerun         operator: re-run all
+      POST /api/v1/ir/runs/:run_id/clear-failed  operator: clear failed nodes
+      POST /api/v1/ir/runs/:run_id/nodes/:node_id/retry  operator: retry one node
+
+  The surface sits alongside the legacy `/api/v1/runs` one (the old `Run`
+  model). Canonical IR facts are rendered through `IR.View`, which keeps the
+  protocol emitter out of the runtime. Reads are served from `IR.Store`, so a
+  finished or restarted run stays visible. Operator actions are sent to the
+  live `Runtime` process and answer 409 when the run has no live process to
+  act on (a succeeded or cancelled run that already stopped).
+  """
+
+  use Phoenix.Controller, formats: [:json]
+
+  alias SymphonyElixir.DSL.Schema
+  alias SymphonyElixir.IR.{Store, View}
+  alias SymphonyElixir.Runtime
+
+  # Serves the runtime's enum vocabulary: engines, efforts, permissions,
+  # locations, node kinds/states, effect kinds, and trigger kinds. It is the
+  # single source for a form's option lists, so a value added at its owner
+  # reaches the UI without a form edit.
+  def schema(conn, _params), do: json(conn, Schema.to_map())
+
+  # Lists every stored run as a summary, ordered by run id.
+  def index(conn, _params) do
+    runs =
+      Store.load_all()
+      |> Enum.sort_by(fn graph -> graph.run_id end)
+      |> Enum.map(fn graph -> View.summary(graph) end)
+
+    json(conn, %{runs: runs})
+  end
+
+  # The manual/operator door onto the IR runtime: resolve the named workflow
+  # through the catalog, materialize it, and start it under
+  # Runtime.Supervisor. The run carries `%{kind: :manual}` plus whatever input
+  # the caller supplied.
+  def create(conn, %{"workflow" => name}) when is_binary(name) do
+    trigger = trigger_context(conn.params)
+
+    case Runtime.Ingress.start_by_name(name, trigger, []) do
+      {:ok, %{run_id: started_id}} ->
+        conn
+        |> put_status(:created)
+        |> json(%{run_id: started_id})
+
+      {:error, {:workflow_not_found, _}} = missing ->
+        conn
+        |> put_status(:not_found)
+        |> json(%{error: inspect(missing)})
+
+      {:error, cause} ->
+        conn
+        |> put_status(:unprocessable_entity)
+        |> json(%{error: inspect(cause)})
+    end
+  end
+
+  def create(conn, _params) do
+    conn
+    |> put_status(:unprocessable_entity)
+    |> json(%{error: "missing required field: workflow"})
+  end
+
+  # Trigger context for a manual run: always `kind: :manual`, with the
+  # caller's `input` when it is a map and an empty map otherwise, so the
+  # graph trigger shape is stable and a node can read it as `<input>`.
+  defp trigger_context(params), do: %{kind: :manual, input: input_map(params["input"])}
+
+  defp input_map(%{} = given), do: given
+  defp input_map(_absent_or_other), do: %{}
+
+  def show(conn, %{"run_id" => run_id}), do: render_stored(conn, run_id)
+
+  def cancel(conn, %{"run_id" => run_id}) do
+    operate(conn, run_id, fn id -> Runtime.cancel(id, actor(conn)) end)
+  end
+
+  def rerun(conn, %{"run_id" => run_id}) do
+    operate(conn, run_id, fn id -> Runtime.rerun(id, actor(conn)) end)
+  end
+
+  def clear_failed(conn, %{"run_id" => run_id}) do
+    operate(conn, run_id, fn id -> Runtime.clear_failed(id, actor(conn)) end)
+  end
+
+  def retry_node(conn, %{"run_id" => run_id, "node_id" => node_id}) do
+    operate(conn, run_id, fn id -> Runtime.retry_node(id, node_id, actor(conn)) end)
+  end
+
+  # Runs the operator action against the live run, then answers with the
+  # run's persisted detail. A :noproc exit - the run has no live process -
+  # becomes a 409 with a clear reason instead of a 500.
+  defp operate(conn, run_id, action) do
+    action.(run_id)
+    render_stored(conn, run_id)
+  catch
+    :exit, {:noproc, _} -> run_not_live(conn, run_id)
+    :exit, {{:noproc, _}, _} -> run_not_live(conn, run_id)
+  end
+
+  # Loads the run from the store and renders its detail view; an unknown run
+  # is a 404 and any other load error a 422.
+  defp render_stored(conn, run_id) do
+    case Store.load(run_id) do
+      {:ok, graph} ->
+        json(conn, View.detail(graph))
+
+      {:error, :not_found} ->
+        not_found(conn)
+
+      {:error, other} ->
+        conn |> put_status(:unprocessable_entity) |> json(%{error: inspect(other)})
+    end
+  end
+
+  # The operator identity: the first `x-operator` header value when it is
+  # non-empty, else the atom :operator.
+  defp actor(conn), do: conn |> get_req_header("x-operator") |> operator_name()
+
+  defp operator_name([name | _rest]) when name != "", do: name
+  defp operator_name(_headers), do: :operator
+
+  defp not_found(conn) do
+    conn
+    |> put_status(:not_found)
+    |> json(%{error: "run not found"})
+  end
+
+  defp run_not_live(conn, run_id) do
+    message = "run #{run_id} has no live process; it has already finished or is not running"
+
+    conn
+    |> put_status(:conflict)
+    |> json(%{error: message})
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/controllers/linear_webhook_controller.ex b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/linear_webhook_controller.ex
new file mode 100644
index 000000000..c8ade8615
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/linear_webhook_controller.ex
@@ -0,0 +1,157 @@
+defmodule SymphonyElixirWeb.LinearWebhookController do
+  @moduledoc """
+  Receives Linear webhook events and starts IR runs for any `.sym`
+  workflow whose `trigger.kind = :linear` label matches a label on the
+  inbound issue.
+
+  Replaces the old `Triggers.Linear` poller. Linear's 2500-req/hr quota
+  is plenty when the poller is gone; webhooks add zero scheduled
+  traffic.
+
+  Setup, in Linear's webhook admin:
+
+  - URL: `https://<symphony-host>/api/v1/triggers/linear`
+  - Resource types: `Issue` (at minimum)
+  - Copy the signing secret into `LINEAR_WEBHOOK_SECRET` on the
+    symphony host
+
+  Security:
+
+  - Every request must carry a `Linear-Signature` header that is
+    `hex(hmac_sha256(secret, raw_body))`. Mismatched signatures get
+    `401`. The raw body is preserved by
+    `SymphonyElixirWeb.RawBodyReader` so HMAC is over the exact bytes
+    Linear signed.
+  - Absent or empty secret -> we refuse to authenticate any request and
+    return `401`; this fail-closed default keeps an empty-secret
+    deployment from silently accepting unsigned traffic.
+
+  Dedupe: an issue with an active run (status `:pending` or
+  `:running`) is skipped, matching the previous poller's contract.
+  """
+
+  use Phoenix.Controller, formats: [:json]
+
+  require Logger
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.Runtime.Ingress
+
+  # Verifies the signature, handles the event, and answers every verified
+  # request with `%{ok: true}`; whether a run started is only logged.
+  @spec accept(Plug.Conn.t(), map()) :: Plug.Conn.t()
+  def accept(conn, params) do
+    with :ok <- verify_signature(conn) do
+      handle_event(params)
+      json(conn, %{ok: true})
+    else
+      {:error, status, reason} ->
+        Logger.warning("Linear webhook rejected: #{reason}")
+
+        conn
+        |> put_status(status)
+        |> json(%{error: reason})
+    end
+  end
+
+  # Checks the Linear-Signature header against the HMAC of the raw body.
+  defp verify_signature(conn) do
+    secret = Config.get().linear_webhook_secret
+    raw_body = conn.assigns[:raw_body]
+    provided = conn |> Plug.Conn.get_req_header("linear-signature") |> List.first()
+
+    cond do
+      # An empty secret is an HMAC key any sender can reproduce, so it is
+      # rejected exactly like an absent one.
+      secret in [nil, ""] ->
+        {:error, :unauthorized, "linear webhook secret not configured"}
+
+      is_nil(raw_body) ->
+        {:error, :bad_request, "missing raw body"}
+
+      is_nil(provided) ->
+        {:error, :unauthorized, "missing Linear-Signature header"}
+
+      not Plug.Crypto.secure_compare(provided, expected_signature(secret, raw_body)) ->
+        {:error, :unauthorized, "signature mismatch"}
+
+      true ->
+        :ok
+    end
+  end
+
+  # Lowercase hex HMAC-SHA256 of the raw body, keyed by the webhook secret.
+  defp expected_signature(secret, raw_body) do
+    :hmac
+    |> :crypto.mac(:sha256, secret, raw_body)
+    |> Base.encode16(case: :lower)
+  end
+
+  # Only Issue create/update events can start runs; all others are no-ops.
+  defp handle_event(%{"type" => "Issue", "action" => action} = event)
+       when action in ["create", "update"] do
+    data = Map.get(event, "data", %{})
+    labels = extract_labels(data)
+
+    maybe_enqueue(data, labels)
+  end
+
+  defp handle_event(_event), do: :ok
+
+  # Trimmed, lowercased label names; entries without a string name are
+  # dropped.
+  defp extract_labels(%{"labels" => labels}) when is_list(labels) do
+    labels
+    |> Enum.map(fn
+      %{"name" => name} when is_binary(name) -> String.downcase(String.trim(name))
+      _ -> nil
+    end)
+    |> Enum.reject(&is_nil/1)
+  end
+
+  defp extract_labels(%{"labelIds" => _ids}) do
+    # Linear sends label ids only on some event shapes (e.g. older webhook
+    # versions). We do not have the names locally, so such an event yields
+    # no labels here. The next full update with a `labels` array will
+    # re-fire.
+    []
+  end
+
+  defp extract_labels(_), do: []
+
+  # Skips an issue that already has an active run; otherwise hands the
+  # trigger to the shared matcher and logs the outcome.
+  defp maybe_enqueue(%{"id" => issue_id} = data, labels) do
+    if active_run_exists?(issue_id) do
+      :ok
+    else
+      # The issue's labels ride on the event so the shared matcher can keep
+      # the workflows whose declared label is present, fanning out to each.
+      trigger = %{
+        kind: :linear,
+        labels: labels,
+        issue_id: issue_id,
+        identifier: Map.get(data, "identifier"),
+        title: Map.get(data, "title"),
+        url: Map.get(data, "url")
+      }
+
+      case Ingress.start_by_trigger(trigger) do
+        {:ok, started} ->
+          Logger.info("Started runs=#{Enum.map_join(started, ",", & &1.run_id)} for #{trigger.identifier} via webhook")
+
+        {:error, reason} ->
+          Logger.warning("Failed to start webhook run for #{trigger.identifier}: #{inspect(reason)}")
+      end
+    end
+  end
+
+  defp maybe_enqueue(_data, _labels), do: :ok
+
+  defp active_run_exists?(linear_issue_id) do
+    Ingress.seen_trigger?(fn
+      {status, %{kind: :linear, issue_id: id}} -> id == linear_issue_id and status in [:pending, :running]
+      {_status, _trigger} -> false
+    end)
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/controllers/slack_events_controller.ex b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/slack_events_controller.ex
new file mode 100644
index 000000000..725e4a033
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/slack_events_controller.ex
@@ -0,0 +1,191 @@
+defmodule SymphonyElixirWeb.SlackEventsController do
+  @moduledoc """
+  Receives Slack Events API callbacks and starts app-mention IR runs.
+
+  Every request is authenticated before it is answered: the
+  `X-Slack-Signature` header must equal `v0=` followed by
+  `hex(hmac_sha256(secret, "v0:" <> timestamp <> ":" <> raw_body))`, and the
+  `X-Slack-Request-Timestamp` must lie within five minutes of local time so
+  a captured request cannot be replayed later. An absent or empty signing
+  secret fails closed with `401`.
+  """
+
+  use Phoenix.Controller, formats: [:json]
+
+  require Logger
+
+  alias SymphonyElixir.{Config, Slack, WorkflowCatalog}
+  alias SymphonyElixir.Runtime.Ingress
+
+  # Slack's documented replay window: a request whose timestamp differs from
+  # local time by more than five minutes is rejected.
+  @max_timestamp_skew_seconds 300
+
+  # Three request shapes: the URL-verification handshake (echo the
+  # challenge), an app_mention event (start matching runs), and anything else
+  # (acknowledged and ignored). All three verify the signature first.
+  @spec accept(Plug.Conn.t(), map()) :: Plug.Conn.t()
+  def accept(conn, %{"type" => "url_verification", "challenge" => challenge}) do
+    with :ok <- verify_signature(conn) do
+      json(conn, %{challenge: challenge})
+    else
+      {:error, status, reason} ->
+        conn |> put_status(status) |> json(%{error: reason})
+    end
+  end
+
+  def accept(conn, %{"event" => %{"type" => "app_mention"} = event}) do
+    with :ok <- verify_signature(conn) do
+      json(conn, handle_app_mention(event))
+    else
+      {:error, status, reason} ->
+        Logger.warning("Slack event rejected: #{reason}")
+        conn |> put_status(status) |> json(%{error: reason})
+    end
+  end
+
+  def accept(conn, _params) do
+    with :ok <- verify_signature(conn) do
+      json(conn, %{ok: true, ignored: true})
+    else
+      {:error, status, reason} ->
+        conn |> put_status(status) |> json(%{error: reason})
+    end
+  end
+
+  # Turns one mention into a trigger and starts it, unless the event lacks a
+  # channel/ts or an active run already exists for the same message.
+  defp handle_app_mention(event) do
+    channel = Map.get(event, "channel")
+    ts = Map.get(event, "ts")
+    thread_ts = Map.get(event, "thread_ts") || ts
+
+    cond do
+      not is_binary(channel) or not is_binary(ts) ->
+        %{ok: true, results: [format_result({:ignored, "missing channel or ts"})]}
+
+      active_run_exists?(channel, ts) ->
+        %{ok: true, results: [format_result({:deduped, ts})]}
+
+      true ->
+        # Stamp both the raw channel id the event carries and any declared
+        # channel name resolved to it, so the shared matcher accepts a
+        # workflow that declared either spelling.
+        trigger = %{
+          kind: :slack_app_mention,
+          channel: resolved_channel_name(channel) || channel,
+          channel_id: channel,
+          message_ts: ts,
+          thread_ts: thread_ts,
+          user: Map.get(event, "user"),
+          text: Map.get(event, "text", "")
+        }
+
+        start_mention(trigger)
+    end
+  end
+
+  defp start_mention(trigger) do
+    case Ingress.start_by_trigger(trigger) do
+      {:ok, started} ->
+        %{ok: true, enqueued: length(started), results: Enum.map(started, &format_result({:enqueued, &1.run_id}))}
+
+      {:error, reason} ->
+        %{ok: true, results: [format_result({:error, inspect(reason)})]}
+    end
+  end
+
+  # Resolve the channel id back to the `#name` a workflow's `on` clause
+  # might declare, so a name-based trigger and the event's id compare
+  # equal. The candidate names come from the loaded `:slack_app_mention`
+  # workflows, so this only resolves names symphony actually watches.
+  defp resolved_channel_name(channel_id) do
+    WorkflowCatalog.for_trigger_kind(:slack_app_mention)
+    |> Enum.map(& &1.trigger.channel)
+    |> Enum.uniq()
+    |> Enum.find(fn declared -> channel_matches?(declared, channel_id) end)
+  end
+
+  defp channel_matches?("#" <> channel_name, channel_id) do
+    case Slack.Client.resolve_channel_id(channel_name) do
+      {:ok, ^channel_id} -> true
+      _ -> false
+    end
+  end
+
+  defp channel_matches?(configured, channel_id), do: configured == channel_id
+
+  defp active_run_exists?(channel, ts) do
+    Ingress.seen_trigger?(fn
+      {status, %{kind: :slack_app_mention, channel_id: cid, message_ts: mts}} ->
+        status in [:pending, :running] and cid == channel and mts == ts
+
+      {_status, _trigger} ->
+        false
+    end)
+  end
+
+  # Authenticates a request: a configured secret, a captured raw body, both
+  # Slack signature headers, a fresh timestamp, and a matching signature are
+  # all required.
+  defp verify_signature(conn) do
+    secret = Config.get().slack_signing_secret
+    raw_body = conn.assigns[:raw_body]
+    timestamp = conn |> Plug.Conn.get_req_header("x-slack-request-timestamp") |> List.first()
+    provided = conn |> Plug.Conn.get_req_header("x-slack-signature") |> List.first()
+
+    cond do
+      # An empty secret is an HMAC key any sender can reproduce, so it is
+      # rejected exactly like an absent one.
+      secret in [nil, ""] ->
+        {:error, :unauthorized, "slack signing secret not configured"}
+
+      is_nil(raw_body) ->
+        {:error, :bad_request, "missing raw body"}
+
+      is_nil(timestamp) or is_nil(provided) ->
+        {:error, :unauthorized, "missing Slack signature headers"}
+
+      # Replay protection: the signature covers the timestamp, not the clock.
+      not fresh_timestamp?(timestamp) ->
+        {:error, :unauthorized, "stale Slack request timestamp"}
+
+      not valid_signature?(secret, timestamp, raw_body, provided) ->
+        {:error, :unauthorized, "signature mismatch"}
+
+      true ->
+        :ok
+    end
+  end
+
+  # True when the header is a whole number of Unix seconds no more than
+  # @max_timestamp_skew_seconds away from the local clock, in either direction.
+  defp fresh_timestamp?(timestamp) do
+    case Integer.parse(timestamp) do
+      {seconds, ""} ->
+        abs(System.system_time(:second) - seconds) <= @max_timestamp_skew_seconds
+
+      _ ->
+        false
+    end
+  end
+
+  # secure_compare/2 is constant-time and already returns false for binaries
+  # of different sizes, so no separate length check is needed.
+  defp valid_signature?(secret, timestamp, raw_body, provided) do
+    Plug.Crypto.secure_compare(provided, expected_signature(secret, timestamp, raw_body))
+  end
+
+  # Slack's v0 scheme: "v0=" followed by the lowercase hex HMAC-SHA256 of
+  # "v0:<timestamp>:<raw body>".
+  defp expected_signature(secret, timestamp, body) do
+    base = "v0:" <> timestamp <> ":" <> body
+    digest = :crypto.mac(:hmac, :sha256, secret, base) |> Base.encode16(case: :lower)
+    "v0=" <> digest
+  end
+
+  defp format_result({:enqueued, run_id}), do: %{status: "enqueued", run_id: run_id}
+  defp format_result({:deduped, ts}), do: %{status: "deduped", message_ts: ts}
+  defp format_result({:ignored, reason}), do: %{status: "ignored", reason: reason}
+  defp format_result({:error, reason}), do: %{status: "error", reason: reason}
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/controllers/static_asset_controller.ex b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/static_asset_controller.ex
new file mode 100644
index 000000000..13939c1e7
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/controllers/static_asset_controller.ex
@@ -0,0 +1,33 @@
+defmodule SymphonyElixirWeb.StaticAssetController do
+  @moduledoc """
+  Serves the JavaScript bundles Phoenix LiveView needs straight out of each
+  dependency's checkout, so v0 needs no asset build pipeline.
+  """
+
+  use Phoenix.Controller, formats: []
+
+  def phoenix(conn, _params) do
+    send_dep_js(conn, :phoenix, "priv/static/phoenix.js")
+  end
+
+  def phoenix_html(conn, _params) do
+    send_dep_js(conn, :phoenix_html, "priv/static/phoenix_html.js")
+  end
+
+  def phoenix_live_view(conn, _params) do
+    send_dep_js(conn, :phoenix_live_view, "priv/static/phoenix_live_view.js")
+  end
+
+  # Sends one bundle from the given OTP app. `relative_path` is relative to
+  # the app's root, taken as the parent of its priv directory. The response
+  # is typed as JavaScript and publicly cacheable for an hour.
+  defp send_dep_js(conn, app, relative_path) do
+    app_root = app |> :code.priv_dir() |> to_string() |> Path.dirname()
+    bundle_path = Path.join(app_root, relative_path)
+
+    conn
+    |> put_resp_content_type("application/javascript")
+    |> put_resp_header("cache-control", "public, max-age=3600")
+    |> send_file(200, bundle_path)
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/endpoint.ex b/packages/symphony/elixir/lib/symphony_elixir_web/endpoint.ex
new file mode 100644
index 000000000..23344911f
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/endpoint.ex
@@ -0,0 +1,40 @@
+defmodule SymphonyElixirWeb.Endpoint do
+  @moduledoc """
+  Phoenix endpoint for Symphony's optional observability UI and API.
+  """
+
+  use Phoenix.Endpoint, otp_app: :symphony_elixir
+
+  # Cookie-backed session settings. The same list is handed to the LiveView
+  # socket's `connect_info` and to `Plug.Session` below, so both sides use
+  # one cookie definition.
+  @session_options [
+    store: :cookie,
+    key: "_symphony_elixir_key",
+    signing_salt: "symphony-session"
+  ]
+
+  # LiveView transport: websocket only, long-polling disabled.
+  socket("/live", Phoenix.LiveView.Socket,
+    websocket: [connect_info: [session: @session_options]],
+    longpoll: false
+  )
+
+  # Runtime workers dial in here and join `worker:lobby`. `:x_headers` exposes
+  # the mTLS client-cert CN that the nginx boundary forwards as `x-worker-cn`.
+  socket("/worker", SymphonyElixirWeb.WorkerSocket,
+    websocket: [connect_info: [:x_headers]],
+    longpoll: false
+  )
+
+  plug(Plug.RequestId)
+  plug(Plug.Telemetry, event_prefix: [:phoenix, :endpoint])
+
+  # Parses urlencoded, multipart and JSON bodies (JSON via Jason);
+  # `pass: ["*/*"]` lets every other content type through unparsed. Bodies
+  # are read through `RawBodyReader` instead of the default reader.
+  # NOTE(review): presumably so the unparsed payload stays available for
+  # request-signature checks; confirm in `RawBodyReader`.
+  plug(Plug.Parsers,
+    parsers: [:urlencoded, :multipart, :json],
+    pass: ["*/*"],
+    json_decoder: Jason,
+    body_reader: {SymphonyElixirWeb.RawBodyReader, :read_body, []}
+  )
+
+  plug(Plug.MethodOverride)
+  plug(Plug.Head)
+  plug(Plug.Session, @session_options)
+  # The router runs last, after parsing and session setup.
+  plug(SymphonyElixirWeb.Router)
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/error_html.ex b/packages/symphony/elixir/lib/symphony_elixir_web/error_html.ex
new file mode 100644
index 000000000..5b2722a26
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/error_html.ex
@@ -0,0 +1,8 @@
+defmodule SymphonyElixirWeb.ErrorHTML do
+  @moduledoc false
+
+  # The HTML error body is the status message Phoenix derives from the
+  # template name; the assigns are not consulted.
+  @spec render(String.t(), map()) :: String.t()
+  def render(template, _assigns), do: Phoenix.Controller.status_message_from_template(template)
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/error_json.ex b/packages/symphony/elixir/lib/symphony_elixir_web/error_json.ex
new file mode 100644
index 000000000..5babea4c2
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/error_json.ex
@@ -0,0 +1,8 @@
+defmodule SymphonyElixirWeb.ErrorJSON do
+  @moduledoc false
+
+  # Every error renders the same envelope: a fixed `request_failed` code and
+  # the status message Phoenix derives from the template name.
+  @spec render(String.t(), map()) :: map()
+  def render(template, _assigns) do
+    message = Phoenix.Controller.status_message_from_template(template)
+
+    %{error: %{code: "request_failed", message: message}}
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/live/ir_runs_live.ex b/packages/symphony/elixir/lib/symphony_elixir_web/live/ir_runs_live.ex
new file mode 100644
index 000000000..3b50669bc
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/live/ir_runs_live.ex
@@ -0,0 +1,513 @@
+defmodule SymphonyElixirWeb.IRRunsLive do
+  @moduledoc """
+  Dashboard LiveView over IR runs (the `RunGraph` model), the live-page
+  counterpart to the read-only `IRRunController` JSON API.
+
+  Two actions:
+
+  - `:index` - every IR run as a table, plus a "run" control that starts a
+    workflow from the `WorkflowCatalog` by name.
+  - `:show` - one run in detail with per-node state pills, mirroring the
+    `node-grid` layout the legacy `RunsLive` uses.
+
+  Live updates ride `Runtime.Events`: `Runtime` broadcasts an
+  `{:ir_run_event, run_id, summary}` on every persisted transition. This
+  LiveView subscribes to the index topic on mount and to the open run's
+  topic when navigating to `:show`, so pills move from running to succeeded
+  with no polling. The data shapes come straight from `IR.View` so the page
+  renders the same facts the JSON API serves.
+  """
+
+  use Phoenix.LiveView
+
+  alias SymphonyElixir.IR.{Store, View}
+  alias SymphonyElixir.Runtime.Events
+  alias SymphonyElixir.{Runtime, WorkflowCatalog}
+
+  # The runs table paginates at this many rows per page, navigated via the
+  # `?page=N` query param. The full sorted list still loads on every render
+  # (the store scan is cheap) so the total count and "latest first" order
+  # stay exact; only the rendered slice is bounded.
+  @per_page 50
+
+  @impl true
+  def mount(_params, _session, socket) do
+    # Subscribe to the index topic (every run's transitions) only on the
+    # connected mount; the first, static render runs disconnected.
+    if connected?(socket) do
+      Events.subscribe_index()
+    end
+
+    initial = [
+      runs: load_runs(),
+      workflows: load_workflows(),
+      workflow_errors: load_workflow_errors(),
+      subscribed_run: nil,
+      page: 1,
+      path: "/",
+      form_error: nil
+    ]
+
+    {:ok, assign(socket, initial)}
+  end
+
+  @impl true
+  def handle_params(%{"run_id" => run_id}, _uri, socket) do
+    # Detail page: point the per-run subscription at this run, then read its
+    # graph from the store. A failed load leaves `detail` as nil, which the
+    # show template renders as "run not found".
+    socket =
+      socket
+      |> resubscribe_run(run_id)
+      |> assign(live_action: :show, run_id: run_id, detail: reload_detail(run_id))
+
+    {:noreply, socket}
+  end
+
+  def handle_params(params, uri, socket) do
+    # Index page: drop any per-run subscription, then re-read everything the
+    # table and the launcher show.
+    socket = resubscribe_run(socket, nil)
+
+    index_assigns = [
+      live_action: :index,
+      page: parse_page(params["page"]),
+      path: URI.parse(uri).path,
+      runs: load_runs(),
+      workflows: load_workflows(),
+      workflow_errors: load_workflow_errors()
+    ]
+
+    {:noreply, assign(socket, index_assigns)}
+  end
+
+  @impl true
+  def handle_info({:ir_run_event, run_id, _summary}, %{assigns: %{live_action: :show, run_id: run_id}} = socket) do
+    # The open run transitioned. The event only carries the summary, but the
+    # node grid needs per-node state, so read the full graph again. If the
+    # read fails, the detail already on screen is kept.
+    case Store.load(run_id) do
+      {:ok, graph} -> {:noreply, assign(socket, detail: View.detail(graph))}
+      {:error, _} -> {:noreply, assign(socket, detail: socket.assigns[:detail])}
+    end
+  end
+
+  def handle_info({:ir_run_event, _run_id, _summary}, %{assigns: %{live_action: :index}} = socket) do
+    # Some run transitioned while the table is showing. Reloading the whole
+    # list (instead of patching one row) keeps ordering right and lets new
+    # runs appear; the catalog's parse errors are refreshed at the same time
+    # so the broken-workflow panel follows hot-reloads.
+    refreshed = [runs: load_runs(), workflow_errors: load_workflow_errors()]
+
+    {:noreply, assign(socket, refreshed)}
+  end
+
+  # Any other run event (for example another run's transition while a detail
+  # page is open) is ignored.
+  def handle_info({:ir_run_event, _run_id, _summary}, socket) do
+    {:noreply, socket}
+  end
+
+  @impl true
+  def handle_event("run", %{"workflow" => name}, socket) when is_binary(name) and name != "" do
+    # Start the chosen workflow as a manual run with empty input. Success
+    # navigates to the new run's detail page; failure is shown in the form.
+    trigger = %{kind: :manual, input: %{}}
+
+    socket =
+      case Runtime.Ingress.start_by_name(name, trigger, []) do
+        {:ok, %{run_id: run_id}} ->
+          push_navigate(socket, to: "/ir/" <> run_id)
+
+        {:error, reason} ->
+          assign(socket, form_error: "could not start #{name}: #{inspect(reason)}")
+      end
+
+    {:noreply, socket}
+  end
+
+  # A submit with no usable workflow name (missing, empty or not a string).
+  def handle_event("run", _params, socket) do
+    message = "pick a workflow to run"
+    {:noreply, assign(socket, form_error: message)}
+  end
+
+  # Run-level actions from the detail page. Each asks the runtime to act on
+  # the open run (tagged with the "dashboard" actor string) and then
+  # refreshes the detail view through `run_action/2`.
+  def handle_event("cancel", _params, %{assigns: %{run_id: id}} = socket) do
+    run_action(socket, fn -> Runtime.cancel(id, "dashboard") end)
+  end
+
+  def handle_event("retry_failed", _params, %{assigns: %{run_id: id}} = socket) do
+    run_action(socket, fn -> Runtime.clear_failed(id, "dashboard") end)
+  end
+
+  def handle_event("rerun", _params, %{assigns: %{run_id: id}} = socket) do
+    run_action(socket, fn -> Runtime.rerun(id, "dashboard") end)
+  end
+
+  # Shared body of the run-level actions: invoke `action`, then re-read the
+  # run's detail from the store.
+  #
+  # The call is best-effort: its result is discarded and an `:exit` raised
+  # by it is swallowed, so the handler always replies.
+  # NOTE(review): the exit is presumably the runtime process for this run
+  # being gone; confirm against `Runtime`.
+  #
+  # A read miss keeps the detail already on screen (as the run-event handler
+  # does) instead of flipping the page to "run not found".
+  defp run_action(%{assigns: %{run_id: id}} = socket, action) when is_function(action, 0) do
+    try do
+      _ = action.()
+    catch
+      :exit, _ -> :ok
+    end
+
+    detail = reload_detail(id) || socket.assigns[:detail]
+
+    {:noreply, assign(socket, detail: detail)}
+  end
+
+  @impl true
+  # Both actions render inside the shared app layout with the `:ir` tab
+  # active; only the inner content differs. `:show` renders the run detail,
+  # anything else renders the runs table.
+  def render(%{live_action: :show} = assigns) do
+    ~H"""
+    {SymphonyElixirWeb.Layouts.app(%{inner_content: render_show(assigns), active_tab: :ir})}
+    """
+  end
+
+  def render(assigns) do
+    ~H"""
+    {SymphonyElixirWeb.Layouts.app(%{inner_content: render_index(assigns), active_tab: :ir})}
+    """
+  end
+
+  # Index page body: the "start a run" launcher popover, one page of the
+  # runs table with a pager when there is more than one page, and a panel
+  # listing workflows that failed to parse. Reads `runs`, `page`, `path`,
+  # `workflows`, `workflow_errors` and `form_error` from the assigns.
+  defp render_index(assigns) do
+    # Bound the rendered slice to one page. `page` is clamped against the
+    # live total so a stale `?page=N` (or a run count that shrank under the
+    # current page) falls back to the last real page instead of an empty
+    # table.
+    total = length(assigns.runs)
+    total_pages = max(1, div(total + @per_page - 1, @per_page))
+    page = assigns.page |> max(1) |> min(total_pages)
+    page_runs = assigns.runs |> Enum.drop((page - 1) * @per_page) |> Enum.take(@per_page)
+
+    # Expose the derived paging values to the template below.
+    assigns =
+      assigns
+      |> assign(:page, page)
+      |> assign(:total_pages, total_pages)
+      |> assign(:total_runs, total)
+      |> assign(:page_runs, page_runs)
+      |> assign(:per_page, @per_page)
+
+    ~H"""
+    <div class="toolbar">
+      <button class="btn btn-primary" popovertarget="run-launcher">start a run</button>
+    </div>
+
+    <div popover id="run-launcher" class="launcher-popover">
+      <div class="launcher-title">start a run</div>
+      <%= if @workflows == [] do %>
+        <div class="muted">
+          no <code class="mono">.sym</code> workflows loaded. drop a file under
+          <code class="mono">workflows/</code> and the catalog will pick it up within a second.
+        </div>
+      <% else %>
+        <form class="enqueue" phx-submit="run">
+          <div class="row">
+            <label for="ir-workflow">workflow</label>
+            <select id="ir-workflow" name="workflow" class="field-input">
+              <%= for wf <- @workflows do %>
+                <option value={wf.name}>{wf.name} - {trigger_label(wf.trigger)}</option>
+              <% end %>
+            </select>
+          </div>
+          <%= if @form_error do %>
+            <div class="hint" style="color: var(--bad); margin-left: 0">{@form_error}</div>
+          <% end %>
+          <div class="submit-row">
+            <button class="btn btn-primary" type="submit">run</button>
+          </div>
+        </form>
+      <% end %>
+    </div>
+
+    <%= if @runs == [] do %>
+      <div class="empty">no IR runs yet. start one with the button above.</div>
+    <% else %>
+      <div class="card">
+        <div class="card-header">
+          <div class="title">{run_count_label(@runs)}</div>
+        </div>
+        <table class="runs">
+          <thead>
+            <tr>
+              <th>run</th>
+              <th>status</th>
+              <th>nodes</th>
+              <th>cost</th>
+              <th>updated</th>
+            </tr>
+          </thead>
+          <tbody>
+            <%= for run <- @page_runs do %>
+              <tr>
+                <td class="mono"><a href={"/ir/" <> run["run_id"]}>{run["run_id"]}</a></td>
+                <td><span class={"pill " <> run["status"]}>{run["status"]}</span></td>
+                <td>{node_counts(run)}</td>
+                <td class="muted">{cost_label(run["cost_usd"])}</td>
+                <td class="muted">{relative_time(run["updated_at"])}</td>
+              </tr>
+            <% end %>
+          </tbody>
+        </table>
+        <%= if @total_pages > 1 do %>
+          <div class="pager">
+            <div>
+              showing {(@page - 1) * @per_page + 1}-{min(@page * @per_page, @total_runs)} of {@total_runs}
+            </div>
+            <div class="pages">
+              <.link
+                class={if @page <= 1, do: "disabled", else: ""}
+                patch={page_path(@path, @page - 1)}
+              >prev</.link>
+              <span class="page-num current">{@page} / {@total_pages}</span>
+              <.link
+                class={if @page >= @total_pages, do: "disabled", else: ""}
+                patch={page_path(@path, @page + 1)}
+              >next</.link>
+            </div>
+          </div>
+        <% end %>
+      </div>
+    <% end %>
+
+    <%= if @workflow_errors != [] do %>
+      <div class="card">
+        <div class="card-header">
+          <div class="title">broken workflows</div>
+        </div>
+        <div class="hint" style="margin-left: 0">
+          these <code class="mono">.sym</code> files failed to parse. the last
+          working version of each stays loaded; fix the location below and the
+          catalog reloads it within a second.
+        </div>
+        <div class="node-grid">
+          <%= for err <- @workflow_errors do %>
+            <div class="node-row">
+              <div class="mono">{error_location(err)}</div>
+              <div><span class="pill failed">parse error</span></div>
+              <div class="muted">{err.message}</div>
+              <div></div>
+            </div>
+          <% end %>
+        </div>
+      </div>
+    <% end %>
+    """
+  end
+
+  # Detail page body for one run. A nil `detail` renders a "run not found"
+  # notice. Otherwise it renders a summary card, the graph component, and a
+  # node grid whose action buttons depend on the run status: cancel while
+  # pending/running, retry/rerun once failed.
+  defp render_show(assigns) do
+    case assigns.detail do
+      nil ->
+        ~H"""
+        <div class="empty">run not found. <a href="/ir">back to IR runs</a></div>
+        """
+
+      _detail ->
+        ~H"""
+        <div class="card">
+          <div class="card-header">
+            <div class="title">run</div>
+            <span class={"pill " <> @detail["status"]}>{@detail["status"]}</span>
+          </div>
+          <div class="card-body">
+            <dl class="kv">
+              <dt>run id</dt><dd class="mono">{@detail["run_id"]}</dd>
+              <dt>trigger</dt><dd>{@detail["trigger"]}</dd>
+              <dt>placement</dt><dd>{placement_label(@detail["placement"])}</dd>
+              <dt>nodes</dt><dd>{detail_node_counts(@detail)}</dd>
+              <dt>cost</dt><dd class="mono">{cost_label(@detail["cost_usd"])}</dd>
+              <dt>started</dt><dd class="muted">{@detail["created_at"] || "-"}</dd>
+            </dl>
+          </div>
+        </div>
+
+        <div class="card">
+          <div class="card-header">
+            <div class="title">graph</div>
+          </div>
+          <div class="card-body">
+            <SymphonyElixirWeb.Components.IRGraph.graph
+              nodes={@detail["nodes"]}
+              trigger={@detail["trigger"]}
+              placement={@detail["placement"]}
+            />
+          </div>
+        </div>
+
+        <div class="card">
+          <div class="card-header">
+            <div class="title">nodes</div>
+            <div class="actions">
+              <%= if @detail["status"] in ["pending", "running"] do %>
+                <button class="btn" phx-click="cancel">cancel run</button>
+              <% end %>
+              <%= if @detail["status"] in ["failed"] do %>
+                <button class="btn" phx-click="retry_failed">retry failed</button>
+                <button class="btn" phx-click="rerun">rerun</button>
+              <% end %>
+            </div>
+          </div>
+          <div class="node-grid">
+            <%= for node <- @detail["nodes"] do %>
+              <div class="node-row">
+                <div class="mono">{node["id"]}</div>
+                <div>
+                  <span class={"pill " <> node["state"]}>{node["state"]}</span>
+                </div>
+                <div class="muted mono">{node["kind"]}{engine_label(node["envelope"])}</div>
+                <div class="muted">{node_cost(node)}</div>
+              </div>
+            <% end %>
+          </div>
+        </div>
+
+        <div><a class="back-link" href="/ir">&larr; back to IR runs</a></div>
+        """
+    end
+  end
+
+  # Hold at most one per-run subscription while the operator moves between
+  # pages. When the target run changes, the previous run's topic is dropped
+  # and the new one (if any) is joined, so this LiveView is not woken by a
+  # run it no longer shows. Passing nil just drops the current one. The
+  # index topic from mount is never touched, and a disconnected socket is
+  # returned unchanged.
+  defp resubscribe_run(socket, run_id) do
+    previous = socket.assigns[:subscribed_run]
+
+    cond do
+      not connected?(socket) ->
+        socket
+
+      previous == run_id ->
+        socket
+
+      true ->
+        if is_binary(previous) do
+          Phoenix.PubSub.unsubscribe(SymphonyElixir.PubSub, Events.run_topic(previous))
+        end
+
+        if is_binary(run_id) do
+          Events.subscribe_run(run_id)
+        end
+
+        assign(socket, subscribed_run: run_id)
+    end
+  end
+
+  # Read one run from the store and shape it for the detail page; nil when
+  # the store reports an error for that id.
+  defp reload_detail(run_id) do
+    loaded = Store.load(run_id)
+
+    case loaded do
+      {:error, _} -> nil
+      {:ok, graph} -> View.detail(graph)
+    end
+  end
+
+  # Every stored run as a summary map, newest `updated_at` first so the
+  # table order matches its "updated" column; `run_id` breaks ties between
+  # runs that share a timestamp.
+  defp load_runs do
+    summaries = Enum.map(Store.load_all(), &View.summary/1)
+
+    Enum.sort_by(summaries, fn run -> {run["updated_at"], run["run_id"]} end, :desc)
+  end
+
+  # `?page=N` is operator-supplied, so anything that is not a positive
+  # integer (absent, empty, negative, garbage) falls back to the first page.
+  # The whole string must be the number: `Integer.parse/1` also returns the
+  # unparsed remainder, and requiring it to be empty keeps input such as
+  # "3abc" from being read as page 3.
+  # The upper bound is clamped against the live total in render_index.
+  defp parse_page(raw) when is_binary(raw) do
+    case Integer.parse(raw) do
+      {n, ""} when n > 0 -> n
+      _ -> 1
+    end
+  end
+
+  # Absent or non-string values (the param is missing) mean the first page.
+  defp parse_page(_), do: 1
+
+  # Build the link for `page` on the active index path (`/` or `/ir`). The
+  # first page (and anything below it) is the bare path, so its canonical
+  # URL carries no query string; later pages append `?page=N`.
+  defp page_path(path, page) do
+    if page <= 1 do
+      path
+    else
+      path <> "?page=" <> Integer.to_string(page)
+    end
+  end
+
+  # Catalog workflows, ordered by name.
+  defp load_workflows do
+    Enum.sort_by(WorkflowCatalog.workflows(), fn workflow -> workflow.name end)
+  end
+
+  # Catalog parse errors, ordered by name.
+  defp load_workflow_errors do
+    Enum.sort_by(WorkflowCatalog.errors(), fn error -> error.name end)
+  end
+
+  # Format a diagnostic's position as `file:line:column`, the form an editor
+  # can jump to from a build log.
+  defp error_location(%{file: file, line: line, column: column}) do
+    Enum.join([file, line, column], ":")
+  end
+
+  # Card title for the runs table: "1 run" or "N runs".
+  defp run_count_label(runs) do
+    case length(runs) do
+      1 -> "1 run"
+      n -> "#{n} runs"
+    end
+  end
+
+  # Compact "succeeded/total" node tally for a table row, read from the
+  # summary's per-state counts. A summary without a `states` map shows 0/0.
+  defp node_counts(%{"states" => states}) when is_map(states) do
+    succeeded = Map.get(states, "succeeded", 0)
+    total = Enum.sum(Map.values(states))
+
+    "#{succeeded}/#{total}"
+  end
+
+  defp node_counts(_summary), do: "0/0"
+
+  # Per-state node tally for the detail header, e.g.
+  # "2 running - 1 pending - 1 succeeded". States are listed in a fixed
+  # order and those with a zero (or missing) count are left out, so the
+  # operator sees the breakdown without scrolling to the node grid.
+  defp detail_node_counts(%{"states" => states}) when is_map(states) do
+    display_order = ["running", "pending", "succeeded", "failed", "skipped", "upstream_failed", "stranded", "cancelled"]
+
+    labels =
+      Enum.flat_map(display_order, fn state ->
+        count = Map.get(states, state, 0)
+
+        if count && count > 0 do
+          ["#{count} #{state}"]
+        else
+          []
+        end
+      end)
+
+    if labels == [] do
+      "0 nodes"
+    else
+      Enum.join(labels, " - ")
+    end
+  end
+
+  defp detail_node_counts(_detail), do: "0 nodes"
+
+  # Human-readable placement. When the effective placement is absent or
+  # equal to the declared one, only the declared value is shown ("-" if
+  # that is missing too). When they differ, a fallback happened and both
+  # are shown. Anything that is not a declared/effective map, including nil
+  # (placement never recorded), renders as "-".
+  defp placement_label(%{"declared" => declared, "effective" => effective}) do
+    cond do
+      is_nil(effective) or declared == effective -> declared || "-"
+      true -> "#{declared} (fallback #{effective})"
+    end
+  end
+
+  defp placement_label(_placement), do: "-"
+
+  # Dollar amount with four decimals; a missing cost is a dash. Dividing by
+  # 1 turns an integer into the float `float_to_binary` requires.
+  defp cost_label(usd) when is_number(usd) do
+    formatted = :erlang.float_to_binary(usd / 1, decimals: 4)
+    "$" <> formatted
+  end
+
+  defp cost_label(nil), do: "-"
+
+  # Total cost of a node: the sum of the numeric `cost.usd` of its attempts.
+  # A node with no priced attempt (or no attempts list) shows a dash instead
+  # of "$0.0000".
+  defp node_cost(%{"attempts" => attempts}) when is_list(attempts) do
+    priced = for %{"cost" => %{"usd" => usd}} <- attempts, is_number(usd), do: usd
+
+    total = if priced == [], do: nil, else: Enum.sum(priced)
+
+    cost_label(total)
+  end
+
+  defp node_cost(_node), do: "-"
+
+  # Suffix appended after a node's kind: " - <engine>" when the envelope
+  # names an engine as a string, otherwise nothing.
+  defp engine_label(envelope) do
+    case envelope do
+      %{"engine" => engine} when is_binary(engine) -> " - " <> engine
+      _ -> ""
+    end
+  end
+
+  # Thin wrapper over the shared formatter in View, so the launcher dropdown
+  # shows the same label for a trigger as the summary card does.
+  defp trigger_label(trigger) do
+    View.trigger_label(trigger)
+  end
+
+  # Render an ISO 8601 timestamp as a coarse age relative to now (UTC):
+  # seconds below a minute, minutes below an hour, hours beyond that. `nil`
+  # renders as an empty cell, and a string that does not parse is shown
+  # verbatim rather than hidden.
+  defp relative_time(nil), do: ""
+
+  defp relative_time(iso) when is_binary(iso) do
+    case DateTime.from_iso8601(iso) do
+      {:ok, dt, _} ->
+        # Clamp at zero: a timestamp slightly ahead of this node's clock
+        # would otherwise render as a negative age such as "-3s ago".
+        s = max(DateTime.diff(DateTime.utc_now(), dt, :second), 0)
+
+        cond do
+          s < 60 -> "#{s}s ago"
+          s < 3600 -> "#{div(s, 60)}m ago"
+          true -> "#{div(s, 3600)}h ago"
+        end
+
+      _ ->
+        iso
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/live/skills_live.ex b/packages/symphony/elixir/lib/symphony_elixir_web/live/skills_live.ex
new file mode 100644
index 000000000..f5201c204
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/live/skills_live.ex
@@ -0,0 +1,120 @@
+defmodule SymphonyElixirWeb.SkillsLive do
+  @moduledoc """
+  Skill catalog view.
+
+  - `:index` lists every skill the catalog has loaded with its codex
+    envelope (model, sandbox, approval policy, tools).
+  - `:show` renders the full system-prompt body for one skill so the
+    operator can read what the agent is being told without leaving the
+    dashboard.
+
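+  Reads through `Catalog` once, at mount. The view holds no subscription,
+  so a change to `skills/*.md` shows up on the next page load rather than
+  on an already-open page, even though Catalog refreshes its own list on a
+  1s tick.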
+  """
+
+  use Phoenix.LiveView
+
+  alias SymphonyElixir.Catalog
+
+  @impl true
+  def mount(_params, _session, socket) do
+    # Snapshot the catalog's skill list for this mount.
+    skills = Catalog.skills()
+
+    {:ok, assign(socket, :skills, skills)}
+  end
+
+  @impl true
+  def handle_params(%{"name" => name}, _uri, socket) do
+    # Detail page: look the skill up by name in the list loaded at mount.
+    # `skill` is nil when nothing matches; `skill_name` is kept so the page
+    # can say which name was not found.
+    skill = Enum.find(socket.assigns.skills, &(&1.name == name))
+
+    socket =
+      socket
+      |> assign(:live_action, :show)
+      |> assign(:skill, skill)
+      |> assign(:skill_name, name)
+
+    {:noreply, socket}
+  end
+
+  # No `name` param: the list page.
+  def handle_params(_params, _uri, socket) do
+    {:noreply, assign(socket, :live_action, :index)}
+  end
+
+  @impl true
+  # Both actions render inside the shared app layout with the `:skills` tab
+  # active. `:show` renders one skill, anything else renders the list.
+  def render(%{live_action: :show} = assigns) do
+    ~H"""
+    {SymphonyElixirWeb.Layouts.app(%{inner_content: render_show(assigns), active_tab: :skills})}
+    """
+  end
+
+  def render(assigns) do
+    ~H"""
+    {SymphonyElixirWeb.Layouts.app(%{inner_content: render_index(assigns), active_tab: :skills})}
+    """
+  end
+
+  # List page body: one row per skill with its name (linking to the detail
+  # page), model summary, sandbox and tool list. An empty catalog renders a
+  # hint instead.
+  defp render_index(assigns) do
+    ~H"""
+    <%= if @skills == [] do %>
+      <div class="empty">
+        no skills loaded. add a file under <code class="mono">skills/</code> and the catalog will pick it up within a second.
+      </div>
+    <% else %>
+      <div class="dag-grid">
+        <%= for skill <- @skills do %>
+          <div class="dag-row">
+            <div class="name"><a href={"/skills/" <> skill.name}>{skill.name}</a></div>
+            <div class="muted mono" title={model_summary(skill)}>{model_summary(skill)}</div>
+            <div class="muted" title={skill.sandbox}>{skill.sandbox}</div>
+            <div class="muted right-align" title={tool_summary(skill.tools)}>{tool_summary(skill.tools)}</div>
+          </div>
+        <% end %>
+      </div>
+    <% end %>
+    """
+  end
+
+  # Detail page body for one skill. A nil `skill` renders a "no skill named
+  # ..." notice using `skill_name`. Otherwise it renders the skill's settings
+  # (model, reasoning effort, sandbox, approval policy, tools) followed by
+  # its prompt body passed through `Markdown.to_html/1`.
+  defp render_show(assigns) do
+    case assigns.skill do
+      nil ->
+        ~H"""
+        <div class="empty">
+          no skill named <span class="mono">{@skill_name}</span>. <a href="/skills">back to skills</a>
+        </div>
+        """
+
+      _skill ->
+        ~H"""
+        <div class="card">
+          <div style="display:flex; justify-content:space-between; align-items:baseline">
+            <div class="mono">{@skill.name}</div>
+            <div class="muted mono">{Path.relative_to_cwd(@skill.path)}</div>
+          </div>
+          <dl class="kv" style="margin-top:12px">
+            <dt>codex model</dt>
+            <dd class="mono">{@skill.codex_model}</dd>
+            <dt>reasoning effort</dt>
+            <dd class="mono">{effort_label(@skill.reasoning_effort)}</dd>
+            <dt>sandbox</dt>
+            <dd class="mono">{@skill.sandbox}</dd>
+            <dt>approval policy</dt>
+            <dd class="mono">{@skill.approval_policy}</dd>
+            <dt>tools</dt>
+            <dd class="mono">{tool_summary(@skill.tools)}</dd>
+          </dl>
+        </div>
+
+        <div class="card">
+          <div class="card-header">
+            <div class="title">prompt body</div>
+          </div>
+          <div class="skill-body markdown">{SymphonyElixirWeb.Markdown.to_html(@skill.body)}</div>
+        </div>
+
+        <div><a class="back-link" href="/skills">&larr; back to skills</a></div>
+        """
+    end
+  end
+
+  # Comma-separated tool names, or a placeholder when the list is empty.
+  defp tool_summary(tools) do
+    case tools do
+      [] -> "(no tools)"
+      _ -> Enum.join(tools, ", ")
+    end
+  end
+
+  # "<model> (<effort>)" for the list row and its tooltip.
+  defp model_summary(skill) do
+    model = skill.codex_model
+    effort = effort_label(skill.reasoning_effort)
+
+    "#{model} (#{effort})"
+  end
+
+  # An unset reasoning effort (nil or empty string) reads as "default"; any
+  # other string is shown as-is.
+  defp effort_label(effort) when effort in [nil, ""] do
+    "default"
+  end
+
+  defp effort_label(effort) when is_binary(effort) do
+    effort
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/live/statistics_live.ex b/packages/symphony/elixir/lib/symphony_elixir_web/live/statistics_live.ex
new file mode 100644
index 000000000..112a73a1f
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/live/statistics_live.ex
@@ -0,0 +1,112 @@
+defmodule SymphonyElixirWeb.StatisticsLive do
+  @moduledoc "Statistics dashboard for playbook-created assignments."
+
+  use Phoenix.LiveView
+
+  alias SymphonyElixir.Statistics
+
+  @impl true
+  def mount(_params, _session, socket) do
+    # On the connected mount, compute the snapshot in a separate task and
+    # have it message this process when done, so the page can render its
+    # loading state first.
+    # NOTE(review): `Task.start/1` is unlinked, and nothing else clears
+    # `loading?`, so if `Statistics.snapshot/0` raises the page stays on
+    # "loading statistics...". Worth confirming that is acceptable.
+    if connected?(socket) do
+      live_view = self()
+      Task.start(fn -> send(live_view, {:statistics_snapshot, Statistics.snapshot()}) end)
+    end
+
+    {:ok, socket |> assign(:loading?, true) |> assign(:snapshot, nil)}
+  end
+
+  @impl true
+  def handle_info({:statistics_snapshot, snapshot}, socket) do
+    # The background task finished: store its result and leave the loading
+    # state.
+    socket =
+      socket
+      |> assign(:loading?, false)
+      |> assign(:snapshot, snapshot)
+
+    {:noreply, socket}
+  end
+
+  @impl true
+  # Renders the page body inside the shared app layout with the
+  # `:statistics` tab active.
+  def render(assigns) do
+    ~H"""
+    {SymphonyElixirWeb.Layouts.app(%{inner_content: render_page(assigns), active_tab: :statistics})}
+    """
+  end
+
+  # Page body. While `loading?` is true only a placeholder is shown; once
+  # the snapshot has arrived, one chart is rendered for `@snapshot.github`
+  # and one for `@snapshot.linear`.
+  defp render_page(%{loading?: true} = assigns) do
+    ~H"""
+    <div class="empty">loading statistics...</div>
+    """
+  end
+
+  defp render_page(assigns) do
+    ~H"""
+    <div class="stats-grid">
+      <.chart
+        title="GitHub review requests"
+        stat={@snapshot.github}
+        empty="no requested reviewers found"
+      />
+      <.chart
+        title="Linear assignees from PR tickets"
+        stat={@snapshot.linear}
+        empty="no ticket assignees found"
+      />
+    </div>
+    """
+  end
+
+  # Function component for one bar chart card. Takes `title`, `stat` (read
+  # for `items`, `total` and `error`) and `empty` (the text shown when there
+  # are no items). Shows the formatted error if the stat carries one, else
+  # the empty text, else one bar per item scaled against the largest count.
+  defp chart(assigns) do
+    # Precompute the scale for the bars and the user-facing error text.
+    assigns =
+      assigns
+      |> assign(:max_count, max_count(assigns.stat.items))
+      |> assign(:error, format_error(assigns.stat.error))
+
+    ~H"""
+    <section class="card stats-card">
+      <div class="card-header">
+        <div>
+          <div class="title">{@title}</div>
+          <div class="muted mono">{@stat.total} refs scanned</div>
+        </div>
+      </div>
+
+      <%= cond do %>
+        <% @error -> %>
+          <div class="empty">{@error}</div>
+        <% @stat.items == [] -> %>
+          <div class="empty">{@empty}</div>
+        <% true -> %>
+          <div class="bar-chart">
+            <%= for person <- @stat.items do %>
+              <div class="bar-row">
+                <div class="bar-person">
+                  <img src={person.avatar_url || fallback_avatar(person.label)} alt="" loading="lazy" />
+                  <span>{person.label}</span>
+                </div>
+                <div class="bar-track" aria-hidden="true">
+                  <div class="bar-fill" style={"width: " <> bar_width(person.count, @max_count)}></div>
+                </div>
+                <div class="bar-count">{person.count}</div>
+              </div>
+            <% end %>
+          </div>
+      <% end %>
+    </section>
+    """
+  end
+
+  # Largest `count` among the items, used as the 100% mark for the bars.
+  # The result is never below 1: an empty list, or a list whose counts are
+  # all zero, would otherwise give `bar_width/2` a zero divisor, which its
+  # `max_count > 0` guard rejects and the render would crash.
+  defp max_count([]), do: 1
+  defp max_count(items), do: items |> Enum.map(& &1.count) |> Enum.max() |> max(1)
+
+  # CSS width for a bar: `count` as a whole-number percentage of
+  # `max_count`. Only defined for a positive `max_count`.
+  defp bar_width(count, max_count) when max_count > 0 do
+    percent = round(count / max_count * 100)
+
+    "#{percent}%"
+  end
+
+  # Identicon URL used when a person has no avatar of their own. The label
+  # becomes a single path segment, so everything outside the unreserved set
+  # is percent-encoded. Plain `URI.encode/1` leaves reserved characters such
+  # as `/`, `?` and `#` untouched, which would change the URL's structure.
+  defp fallback_avatar(label) do
+    "https://github.com/identicons/" <> URI.encode(label, &URI.char_unreserved?/1) <> ".png"
+  end
+
+  # User-facing text for a stat's error: nil when there is none, a fixed
+  # sentence for the known reasons, and the inspected term for anything
+  # else.
+  defp format_error(reason) do
+    case reason do
+      nil -> nil
+      :missing_github_token -> "GITHUB_TOKEN is not configured."
+      :github_prs_unavailable -> "GitHub PR statistics are not available."
+      :missing_linear_api_token -> "LINEAR_API_KEY is not configured."
+      other -> "unable to load statistics: " <> inspect(other)
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/live/workflows_live.ex b/packages/symphony/elixir/lib/symphony_elixir_web/live/workflows_live.ex
new file mode 100644
index 000000000..9c22946d3
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/live/workflows_live.ex
@@ -0,0 +1,173 @@
+defmodule SymphonyElixirWeb.WorkflowsLive do
+  @moduledoc """
+  Workflow catalog view.
+
+  - `:index` lists every workflow the catalog has loaded with its name and
+    trigger label, plus a panel for broken `.sym` files showing their located
+    parse diagnostics.
+  - `:show` materializes one workflow's AST into a static IR graph and renders
+    it with the `IRGraph` component, so an operator can inspect the DAG shape
+    without starting a run.
+
+  Reads through `WorkflowCatalog` on mount and again each time the index
+  route's params are handled. This module registers no subscription or timer
+  of its own, so an already-open page reflects catalog changes on the next
+  navigation or reload.
+  """
+
+  use Phoenix.LiveView
+
+  alias SymphonyElixir.IR.{Materializer, View}
+  alias SymphonyElixir.WorkflowCatalog
+
+  # Snapshot the catalog once so both actions have `workflows` and
+  # `workflow_errors` assigned before the first render.
+  @impl true
+  def mount(_params, _session, socket) do
+    {:ok,
+     socket
+     |> assign(workflows: load_workflows())
+     |> assign(workflow_errors: load_workflow_errors())}
+  end
+
+  # A `name` path param means the detail route. The workflow list from mount
+  # is reused; only the requested name is recorded.
+  @impl true
+  def handle_params(%{"name" => name}, _uri, socket) do
+    {:noreply, assign(socket, live_action: :show, workflow_name: name)}
+  end
+
+  # Any other params are the index route: re-read the catalog so the list and
+  # the broken-workflow panel are current.
+  def handle_params(_params, _uri, socket) do
+    {:noreply,
+     assign(socket,
+       live_action: :index,
+       workflows: load_workflows(),
+       workflow_errors: load_workflow_errors()
+     )}
+  end
+
+  # Both actions render inside the shared app layout with the workflows tab
+  # marked active; only the inner content differs.
+  @impl true
+  def render(%{live_action: :show} = assigns) do
+    ~H"""
+    {SymphonyElixirWeb.Layouts.app(%{inner_content: render_show(assigns), active_tab: :workflows})}
+    """
+  end
+
+  def render(assigns) do
+    ~H"""
+    {SymphonyElixirWeb.Layouts.app(%{inner_content: render_index(assigns), active_tab: :workflows})}
+    """
+  end
+
+  # Index body: an empty-state hint when nothing is loaded and nothing is
+  # broken; otherwise the broken-workflow card (if any) followed by the list
+  # of loaded workflows (if any).
+  defp render_index(assigns) do
+    ~H"""
+    <%= if @workflows == [] and @workflow_errors == [] do %>
+      <div class="empty">
+        no workflows loaded. add a <code class="mono">.sym</code> file under
+        <code class="mono">workflows/</code> and the catalog will pick it up within a second.
+      </div>
+    <% else %>
+      <%= if @workflow_errors != [] do %>
+        <div class="card">
+          <div class="card-header">
+            <div class="title">broken workflows</div>
+          </div>
+          <div class="hint" style="margin-left: 0">
+            these <code class="mono">.sym</code> files failed to parse. the last
+            working version of each stays loaded; fix the location below and the
+            catalog reloads it within a second.
+          </div>
+          <div class="node-grid">
+            <%= for err <- @workflow_errors do %>
+              <div class="node-row">
+                <div class="mono">{error_location(err)}</div>
+                <div><span class="pill failed">parse error</span></div>
+                <div class="muted">{err.message}</div>
+                <div></div>
+              </div>
+            <% end %>
+          </div>
+        </div>
+      <% end %>
+
+      <%= if @workflows != [] do %>
+        <div class="dag-grid">
+          <%= for wf <- @workflows do %>
+            <div class="dag-row">
+              <div class="name"><a href={workflow_path(wf.name)}>{wf.name}</a></div>
+              <div class="muted">{trigger_label(wf.trigger)}</div>
+              <div></div>
+              <div></div>
+            </div>
+          <% end %>
+        </div>
+      <% end %>
+    <% end %>
+    """
+  end
+
+  # Detail body: looks the requested name up in the workflows assigned at
+  # mount. An unknown name renders a not-found hint; a known one renders a
+  # header card plus the graph preview (or the reason it cannot be previewed).
+  defp render_show(assigns) do
+    case Enum.find(assigns.workflows, &(&1.name == assigns.workflow_name)) do
+      nil ->
+        ~H"""
+        <div class="empty">
+          no workflow named <span class="mono">{@workflow_name}</span>. <a href="/workflows">back to workflows</a>
+        </div>
+        """
+
+      entry ->
+        assigns =
+          assigns
+          |> assign(:graph_result, preview_graph(entry))
+          |> assign(:workflow_trigger, trigger_label(entry.trigger))
+
+        ~H"""
+        <div class="card">
+          <div style="display:flex; justify-content:space-between; align-items:baseline">
+            <div class="mono">{@workflow_name}</div>
+            <div class="muted">{@workflow_trigger}</div>
+          </div>
+        </div>
+
+        <div class="card">
+          <div class="card-header">
+            <div class="title">graph</div>
+          </div>
+          <div class="card-body">
+            <%= case @graph_result do %>
+              <% {:ok, detail} -> %>
+                <SymphonyElixirWeb.Components.IRGraph.graph
+                  nodes={detail["nodes"]}
+                  trigger={detail["trigger"]}
+                  placement={detail["placement"]}
+                  base_path="/workflows"
+                />
+              <% {:error, reason} -> %>
+                <div class="empty">cannot preview: {inspect(reason)}</div>
+            <% end %>
+          </div>
+        </div>
+
+        <div><a class="back-link" href="/workflows">&larr; back to workflows</a></div>
+        """
+    end
+  end
+
+  # Materializes the entry's AST under a synthetic "preview-<name>" id and
+  # converts the graph to the view detail map. Errors pass through unchanged.
+  defp preview_graph(entry) do
+    case Materializer.materialize("preview-#{entry.name}", entry.hash, entry.ast) do
+      {:ok, graph} -> {:ok, View.detail(graph)}
+      {:error, reason} -> {:error, reason}
+    end
+  end
+
+  # Loaded workflows, ordered by name for a stable listing.
+  defp load_workflows do
+    WorkflowCatalog.workflows() |> Enum.sort_by(& &1.name)
+  end
+
+  # Parse failures reported by the catalog, ordered by name.
+  defp load_workflow_errors do
+    WorkflowCatalog.errors() |> Enum.sort_by(& &1.name)
+  end
+
+  # Link target for one workflow's detail page. The name becomes a single
+  # path segment, so everything outside the unreserved set is percent-encoded;
+  # a raw `/`, `?`, `#` or space in a name would otherwise change or truncate
+  # the route. The router decodes the segment back into the `name` param.
+  defp workflow_path(name) do
+    "/workflows/" <> URI.encode(name, &URI.char_unreserved?/1)
+  end
+
+  # `file:line:column`, the shape an editor jumps to from a build log.
+  defp error_location(%{file: file, line: line, column: column}) do
+    "#{file}:#{line}:#{column}"
+  end
+
+  # Delegate to the shared formatter in View so the form dropdown and the
+  # workflows index always show the same label for a given trigger.
+  defp trigger_label(trigger), do: View.trigger_label(trigger)
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/markdown.ex b/packages/symphony/elixir/lib/symphony_elixir_web/markdown.ex
new file mode 100644
index 000000000..68a65249e
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/markdown.ex
@@ -0,0 +1,43 @@
+defmodule SymphonyElixirWeb.Markdown do
+  @moduledoc """
+  Markdown-to-HTML rendering for the dashboard, with sanitized output.
+
+  Skill bodies and codex message/reasoning text are written as markdown.
+  Printing them verbatim in a `<pre>` left headings, lists, fenced code,
+  and emphasis visible as raw syntax, so this module lowers the source to
+  HTML at render time instead.
+
+  Two layers keep the result safe: Earmark's default `escape: true`
+  neutralizes raw HTML in the source, and the rendered HTML is then
+  passed through `HtmlSanitizeEx.markdown_html/1`. The second layer is
+  kept because the dashboard is served read-only on a public host and
+  the codex transcript text is agent-authored.
+  """
+
+  @doc """
+  Render `source` to a `{:safe, iodata}` tuple that HEEx emits without
+  escaping it again. `nil` and whitespace-only input produce empty
+  output, so optional fields can be passed in directly.
+  """
+  # sobelow reports the raw/1 call in this module as XSS.Raw (Low
+  # Confidence). That call is the purpose of the module: what it wraps is
+  # Earmark output (escape: true) that has already gone through
+  # HtmlSanitizeEx.markdown_html/1, so the sink is sanitized. sobelow
+  # runs reporting-only per .sobelow-conf, so the finding is left as a
+  # documented, expected one rather than silenced with a skip annotation.
+  @spec to_html(String.t() | nil) :: Phoenix.HTML.safe()
+  def to_html(nil), do: blank()
+
+  def to_html(source) when is_binary(source) do
+    if String.trim(source) == "" do
+      blank()
+    else
+      rendered = Earmark.as_html!(source, compact_output: true)
+      Phoenix.HTML.raw(HtmlSanitizeEx.markdown_html(rendered))
+    end
+  end
+
+  # Empty safe value shared by the nil and blank-input cases.
+  defp blank, do: Phoenix.HTML.raw("")
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/raw_body_reader.ex b/packages/symphony/elixir/lib/symphony_elixir_web/raw_body_reader.ex
new file mode 100644
index 000000000..86c860b24
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/raw_body_reader.ex
@@ -0,0 +1,47 @@
+defmodule SymphonyElixirWeb.RawBodyReader do
+  @moduledoc """
+  A `Plug.Parsers` body reader that retains the raw request body in
+  `conn.assigns.raw_body`.
+
+  Plug.Parsers consumes the request body to decode JSON, which means
+  controllers can't recompute an HMAC over the bytes the caller signed.
+  Inserting this reader keeps the raw body around so the Linear
+  webhook controller can verify `Linear-Signature` before trusting any
+  parsed field.
+
+  Only enabled for paths under `/api/v1/triggers/`; other routes pay no
+  cost.
+
+  Every chunk that is read is appended to what has been retained so far.
+  A caller that loops over `{:more, ...}` results therefore ends up with
+  the complete body once the final `{:ok, ...}` chunk arrives.
+  """
+
+  @retain_prefix "/api/v1/triggers/"
+
+  @doc """
+  Reads the next body chunk with `Plug.Conn.read_body/2` and returns its
+  result unchanged, except that the returned conn carries the chunk
+  appended to `assigns.raw_body` when the request path is under the
+  retained prefix. Errors are passed through untouched.
+  """
+  @spec read_body(Plug.Conn.t(), keyword()) :: {:ok, binary(), Plug.Conn.t()} | {:more, binary(), Plug.Conn.t()} | {:error, term()}
+  def read_body(conn, opts) do
+    case Plug.Conn.read_body(conn, opts) do
+      {:ok, body, conn} ->
+        # The final chunk must extend, not replace, earlier `:more` chunks;
+        # replacing would leave only the tail of the body in `raw_body`.
+        {:ok, body, maybe_retain(conn, body)}
+
+      {:more, body, conn} ->
+        {:more, body, maybe_retain(conn, body)}
+
+      {:error, _} = err ->
+        err
+    end
+  end
+
+  # Appends `chunk` to the retained raw body for trigger paths; returns the
+  # conn untouched for every other path. On the first chunk nothing is
+  # assigned yet, so the accumulator starts from the empty binary.
+  defp maybe_retain(conn, chunk) do
+    if String.starts_with?(conn.request_path, @retain_prefix) do
+      Plug.Conn.assign(conn, :raw_body, (conn.assigns[:raw_body] || "") <> chunk)
+    else
+      conn
+    end
+  end
+end
diff --git a/packages/symphony/elixir/lib/symphony_elixir_web/router.ex b/packages/symphony/elixir/lib/symphony_elixir_web/router.ex
new file mode 100644
index 000000000..f856cef60
--- /dev/null
+++ b/packages/symphony/elixir/lib/symphony_elixir_web/router.ex
@@ -0,0 +1,62 @@
+defmodule SymphonyElixirWeb.Router do
+  @moduledoc "Routes for the runs dashboard and the JSON API."
+
+  use Phoenix.Router
+  import Phoenix.LiveView.Router
+
+  # Plugs for the LiveView dashboard pages: session and live flash, the root
+  # layout, CSRF protection, and the secure browser headers.
+  pipeline :browser do
+    plug(:fetch_session)
+    plug(:fetch_live_flash)
+    plug(:put_root_layout, html: {SymphonyElixirWeb.Layouts, :root})
+    plug(:protect_from_forgery)
+    plug(:put_secure_browser_headers)
+  end
+
+  # JSON API requests only negotiate the "json" format; no session or CSRF
+  # plugs run for them.
+  pipeline :api do
+    plug(:accepts, ["json"])
+  end
+
+  # Vendored Phoenix JavaScript bundles, served by StaticAssetController.
+  # This scope has no `pipe_through`, so none of the pipelines above apply.
+  scope "/", SymphonyElixirWeb do
+    get("/vendor/phoenix/phoenix.js", StaticAssetController, :phoenix)
+    get("/vendor/phoenix_html/phoenix_html.js", StaticAssetController, :phoenix_html)
+    get("/vendor/phoenix_live_view/phoenix_live_view.js", StaticAssetController, :phoenix_live_view)
+  end
+
+  # Dashboard pages (LiveViews) behind the :browser pipeline.
+  scope "/", SymphonyElixirWeb do
+    pipe_through(:browser)
+
+    # The IR runs view is the default dashboard. It carries the
+    # schema-driven run control, so there is no separate enqueue form.
+    # "/" and "/ir" both resolve to the same :index action.
+    live("/", IRRunsLive, :index)
+    live("/ir", IRRunsLive, :index)
+    live("/ir/:run_id", IRRunsLive, :show)
+
+    live("/workflows", WorkflowsLive, :index)
+    live("/workflows/:name", WorkflowsLive, :show)
+
+    live("/skills", SkillsLive, :index)
+    live("/skills/:name", SkillsLive, :show)
+    live("/statistics", StatisticsLive, :index)
+  end
+
+  # JSON API under /api/v1, behind the :api pipeline.
+  scope "/api/v1", SymphonyElixirWeb do
+    pipe_through(:api)
+
+    # The manual-trigger producer onto the IR runtime.
+    post("/runs", ApiController, :enqueue_run)
+
+    # IR runs (the RunGraph model).
+    get("/ir/schema", IRRunController, :schema)
+    get("/ir/runs", IRRunController, :index)
+    post("/ir/runs", IRRunController, :create)
+    get("/ir/runs/:run_id", IRRunController, :show)
+    post("/ir/runs/:run_id/cancel", IRRunController, :cancel)
+    post("/ir/runs/:run_id/rerun", IRRunController, :rerun)
+    post("/ir/runs/:run_id/clear-failed", IRRunController, :clear_failed)
+    post("/ir/runs/:run_id/nodes/:node_id/retry", IRRunController, :retry_node)
+
+    # Inbound webhook endpoints, one controller per external source.
+    post("/triggers/linear", LinearWebhookController, :accept)
+    post("/triggers/github", GithubWebhookController, :accept)
+    post("/triggers/slack/events", SlackEventsController, :accept)
+  end
+end
diff --git a/packages/symphony/elixir/mise.toml b/packages/symphony/elixir/mise.toml
new file mode 100644
index 000000000..439bbb261
--- /dev/null
+++ b/packages/symphony/elixir/mise.toml
@@ -0,0 +1,3 @@
+[tools]
+erlang = "28"
+elixir = "1.19.5-otp-28"
diff --git a/packages/symphony/elixir/mix.exs b/packages/symphony/elixir/mix.exs
new file mode 100644
index 000000000..c505267ea
--- /dev/null
+++ b/packages/symphony/elixir/mix.exs
@@ -0,0 +1,88 @@
+defmodule SymphonyElixir.MixProject do
+  use Mix.Project
+
+  # Coverage tasks that must run in the :test environment.
+  @coveralls_tasks [
+    :coveralls,
+    :"coveralls.detail",
+    :"coveralls.post",
+    :"coveralls.html",
+    :"coveralls.json"
+  ]
+
+  # Project definition read by Mix. The LiveView compiler is placed ahead of
+  # the default compilers.
+  def project do
+    [
+      app: :symphony_elixir,
+      version: "0.2.0",
+      elixir: "~> 1.19",
+      compilers: [:phoenix_live_view | Mix.compilers()],
+      start_permanent: Mix.env() == :prod,
+      deps: deps(),
+      aliases: aliases(),
+      test_coverage: [tool: ExCoveralls],
+      dialyzer: dialyzer()
+    ]
+  end
+
+  # Pins every coveralls task to the :test environment.
+  def cli do
+    [preferred_envs: Enum.map(@coveralls_tasks, fn task -> {task, :test} end)]
+  end
+
+  # OTP application: started through SymphonyElixir.Application, with
+  # :logger as the only extra application.
+  def application do
+    [
+      mod: {SymphonyElixir.Application, []},
+      extra_applications: [:logger]
+    ]
+  end
+
+  # Dialyzer adds :mix and :ex_unit to the PLT and keeps both the core and
+  # the local PLT files under priv/plts.
+  defp dialyzer do
+    [
+      plt_add_apps: [:mix, :ex_unit],
+      plt_core_path: "priv/plts",
+      plt_local_path: "priv/plts"
+    ]
+  end
+
+  # Full dependency list: runtime libraries first, then test/tooling-only ones.
+  defp deps do
+    runtime_deps() ++ tooling_deps()
+  end
+
+  defp runtime_deps do
+    [
+      {:bandit, "~> 1.8"},
+      {:phoenix, "~> 1.8.0"},
+      {:phoenix_html, "~> 4.2"},
+      {:phoenix_live_view, "~> 1.1.0"},
+      {:req, "~> 0.5"},
+      {:jason, "~> 1.4"},
+      {:yaml_elixir, "~> 2.12"},
+      # Markdown render + sanitize for the dashboard, both pure BEAM and
+      # NIF-free (earmark is pure Elixir, html_sanitize_ex rides on the
+      # pure-Erlang mochiweb). That keeps the runtime mix build portable on
+      # NixOS, where precompiled dynamically-linked NIFs break.
+      {:earmark, "~> 1.4"},
+      {:html_sanitize_ex, "~> 1.5"},
+      # Phoenix channel client: a runtime worker dials the control plane's
+      # /worker socket and serves provision/teardown over it.
+      {:slipstream, "~> 1.1"}
+    ]
+  end
+
+  defp tooling_deps do
+    [
+      {:lazy_html, ">= 0.1.0", only: :test},
+      {:credo, "~> 1.7", only: [:dev, :test], runtime: false},
+      {:dialyxir, "~> 1.4", only: [:dev, :test], runtime: false},
+      {:sobelow, "~> 0.13", only: [:dev, :test], runtime: false},
+      {:mix_audit, "~> 2.1", only: [:dev, :test], runtime: false},
+      {:excoveralls, "~> 0.18", only: :test}
+    ]
+  end
+
+  # Task shortcuts; `quality` chains the checks listed in quality_steps/0.
+  defp aliases do
+    [
+      setup: ["deps.get", "compile --warnings-as-errors"],
+      build: ["compile --warnings-as-errors"],
+      lint: ["credo"],
+      quality: quality_steps()
+    ]
+  end
+
+  defp quality_steps do
+    [
+      "format --check-formatted",
+      # Non-strict so credo respects the :low priority the checks carry in
+      # .credo.exs; --strict surfaces and fails on those informational
+      # refactor/readability suggestions, defeating that config.
+      "credo",
+      "sobelow --config",
+      # decimal 2.x is pinned by ecto and solid (both require ~> 2.0), so the
+      # only patched release (3.0.0) is unreachable until they move upstream.
+      # https://github.com/advisories/GHSA-rhv4-8758-jx7v
+      "deps.audit --ignore-advisory-ids GHSA-rhv4-8758-jx7v",
+      "dialyzer"
+    ]
+  end
+end
diff --git a/packages/symphony/elixir/mix.lock b/packages/symphony/elixir/mix.lock
new file mode 100644
index 000000000..a8a6d06e6
--- /dev/null
+++ b/packages/symphony/elixir/mix.lock
@@ -0,0 +1,47 @@
+%{
+  "bandit": {:hex, :bandit, "1.11.1", "1eb33123cc3c17ae0c3447874eb83399ee530f960c39711ed240342fbd4865fa", [:mix], [{:hpax, "~> 1.0", [hex: :hpax, repo: "hexpm", optional: false]}, {:plug, "~> 1.18", [hex: :plug, repo: "hexpm", optional: false]}, {:telemetry, "~> 0.4 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}, {:thousand_island, "~> 1.0", [hex: :thousand_island, repo: "hexpm", optional: false]}, {:websock, "~> 0.5", [hex: :websock, repo: "hexpm", optional: false]}], "hexpm", "d4401016df9abbc6dcd325c0b78b2b193e7c7c96bb68f31e576112be025d84a5"},
+  "bunt": {:hex, :bunt, "1.0.0", "081c2c665f086849e6d57900292b3a161727ab40431219529f13c4ddcf3e7a44", [:mix], [], "hexpm", "dc5f86aa08a5f6fa6b8096f0735c4e76d54ae5c9fa2c143e5a1fc7c1cd9bb6b5"},
+  "cc_precompiler": {:hex, :cc_precompiler, "0.1.11", "8c844d0b9fb98a3edea067f94f616b3f6b29b959b6b3bf25fee94ffe34364768", [:mix], [{:elixir_make, "~> 0.7", [hex: :elixir_make, repo: "hexpm", optional: false]}], "hexpm", "3427232caf0835f94680e5bcf082408a70b48ad68a5f5c0b02a3bea9f3a075b9"},
+  "credo": {:hex, :credo, "1.7.16", "a9f1389d13d19c631cb123c77a813dbf16449a2aebf602f590defa08953309d4", [:mix], [{:bunt, "~> 0.2.1 or ~> 1.0", [hex: :bunt, repo: "hexpm", optional: false]}, {:file_system, "~> 0.2 or ~> 1.0", [hex: :file_system, repo: "hexpm", optional: false]}, {:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: false]}], "hexpm", "d0562af33756b21f248f066a9119e3890722031b6d199f22e3cf95550e4f1579"},
+  "date_time_parser": {:hex, :date_time_parser, "1.3.0", "6ba16850b5ab83dd126576451023ab65349e29af2336ca5084aa1e37025b476e", [:mix], [{:kday, "~> 1.0", [hex: :kday, repo: "hexpm", optional: false]}], "hexpm", "93c8203a8ddc66b1f1531fc0e046329bf0b250c75ffa09567ef03d2c09218e8c"},
+  "decimal": {:hex, :decimal, "2.3.0", "3ad6255aa77b4a3c4f818171b12d237500e63525c2fd056699967a3e7ea20f62", [:mix], [], "hexpm", "a4d66355cb29cb47c3cf30e71329e58361cfcb37c34235ef3bf1d7bf3773aeac"},
+  "dialyxir": {:hex, :dialyxir, "1.4.7", "dda948fcee52962e4b6c5b4b16b2d8fa7d50d8645bbae8b8685c3f9ecb7f5f4d", [:mix], [{:erlex, ">= 0.2.8", [hex: :erlex, repo: "hexpm", optional: false]}], "hexpm", "b34527202e6eb8cee198efec110996c25c5898f43a4094df157f8d28f27d9efe"},
+  "earmark": {:hex, :earmark, "1.4.48", "5f41e579d85ef812351211842b6e005f6e0cef111216dea7d4b9d58af4608434", [:mix], [], "hexpm", "a461a0ddfdc5432381c876af1c86c411fd78a25790c75023c7a4c035fdc858f9"},
+  "ecto": {:hex, :ecto, "3.13.5", "9d4a69700183f33bf97208294768e561f5c7f1ecf417e0fa1006e4a91713a834", [:mix], [{:decimal, "~> 2.0", [hex: :decimal, repo: "hexpm", optional: false]}, {:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: true]}, {:telemetry, "~> 0.4 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}], "hexpm", "df9efebf70cf94142739ba357499661ef5dbb559ef902b68ea1f3c1fabce36de"},
+  "elixir_make": {:hex, :elixir_make, "0.9.0", "6484b3cd8c0cee58f09f05ecaf1a140a8c97670671a6a0e7ab4dc326c3109726", [:mix], [], "hexpm", "db23d4fd8b757462ad02f8aa73431a426fe6671c80b200d9710caf3d1dd0ffdb"},
+  "erlex": {:hex, :erlex, "0.2.8", "cd8116f20f3c0afe376d1e8d1f0ae2452337729f68be016ea544a72f767d9c12", [:mix], [], "hexpm", "9d66ff9fedf69e49dc3fd12831e12a8a37b76f8651dd21cd45fcf5561a8a7590"},
+  "excoveralls": {:hex, :excoveralls, "0.18.5", "e229d0a65982613332ec30f07940038fe451a2e5b29bce2a5022165f0c9b157e", [:mix], [{:castore, "~> 1.0", [hex: :castore, repo: "hexpm", optional: true]}, {:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: false]}], "hexpm", "523fe8a15603f86d64852aab2abe8ddbd78e68579c8525ae765facc5eae01562"},
+  "file_system": {:hex, :file_system, "1.1.1", "31864f4685b0148f25bd3fbef2b1228457c0c89024ad67f7a81a3ffbc0bbad3a", [:mix], [], "hexpm", "7a15ff97dfe526aeefb090a7a9d3d03aa907e100e262a0f8f7746b78f8f87a5d"},
+  "finch": {:hex, :finch, "0.21.0", "b1c3b2d48af02d0c66d2a9ebfb5622be5c5ecd62937cf79a88a7f98d48a8290c", [:mix], [{:mime, "~> 1.0 or ~> 2.0", [hex: :mime, repo: "hexpm", optional: false]}, {:mint, "~> 1.6.2 or ~> 1.7", [hex: :mint, repo: "hexpm", optional: false]}, {:nimble_options, "~> 0.4 or ~> 1.0", [hex: :nimble_options, repo: "hexpm", optional: false]}, {:nimble_pool, "~> 1.1", [hex: :nimble_pool, repo: "hexpm", optional: false]}, {:telemetry, "~> 0.4 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}], "hexpm", "87dc6e169794cb2570f75841a19da99cfde834249568f2a5b121b809588a4377"},
+  "fine": {:hex, :fine, "0.1.4", "b19a89c1476c7c57afb5f9314aed5960b5bc95d5277de4cb5ee8e1d1616ce379", [:mix], [], "hexpm", "be3324cc454a42d80951cf6023b9954e9ff27c6daa255483b3e8d608670303f5"},
+  "floki": {:hex, :floki, "0.38.0", "62b642386fa3f2f90713f6e231da0fa3256e41ef1089f83b6ceac7a3fd3abf33", [:mix], [], "hexpm", "a5943ee91e93fb2d635b612caf5508e36d37548e84928463ef9dd986f0d1abd9"},
+  "hpax": {:hex, :hpax, "1.0.3", "ed67ef51ad4df91e75cc6a1494f851850c0bd98ebc0be6e81b026e765ee535aa", [:mix], [], "hexpm", "8eab6e1cfa8d5918c2ce4ba43588e894af35dbd8e91e6e55c817bca5847df34a"},
+  "html_sanitize_ex": {:hex, :html_sanitize_ex, "1.5.1", "70d7a817eca4850b330361e1f85ca02422a25d6564fc43dd0915dadac55a16f8", [:mix], [{:mochiweb, "~> 2.15 or ~> 3.1", [hex: :mochiweb, repo: "hexpm", optional: false]}], "hexpm", "c32e0a7f1c479ee4f387a3468b3f27a89715a96e71ee4f0d6a7a9d5658a083ef"},
+  "jason": {:hex, :jason, "1.4.5", "2e3a008590b0b8d7388c20293e9dcc9cf3e5d642fd2a114e4cbbb52e595d940a", [:mix], [{:decimal, "~> 1.0 or ~> 2.0 or ~> 3.0", [hex: :decimal, repo: "hexpm", optional: true]}], "hexpm", "b0c823996102bcd0239b3c2444eb00409b72f6a140c1950bc8b457d836b30684"},
+  "kday": {:hex, :kday, "1.1.0", "64efac85279a12283eaaf3ad6f13001ca2dff943eda8c53288179775a8c057a0", [:mix], [{:ex_doc, "~> 0.21", [hex: :ex_doc, repo: "hexpm", optional: true]}], "hexpm", "69703055d63b8d5b260479266c78b0b3e66f7aecdd2022906cd9bf09892a266d"},
+  "lazy_html": {:hex, :lazy_html, "0.1.10", "ffe42a0b4e70859cf21a33e12a251e0c76c1dff76391609bd56702a0ef5bc429", [:make, :mix], [{:cc_precompiler, "~> 0.1", [hex: :cc_precompiler, repo: "hexpm", optional: false]}, {:elixir_make, "~> 0.9.0", [hex: :elixir_make, repo: "hexpm", optional: false]}, {:fine, "~> 0.1.0", [hex: :fine, repo: "hexpm", optional: false]}], "hexpm", "50f67e5faa09d45a99c1ddf3fac004f051997877dc8974c5797bb5ccd8e27058"},
+  "mime": {:hex, :mime, "2.0.7", "b8d739037be7cd402aee1ba0306edfdef982687ee7e9859bee6198c1e7e2f128", [:mix], [], "hexpm", "6171188e399ee16023ffc5b76ce445eb6d9672e2e241d2df6050f3c771e80ccd"},
+  "mint": {:hex, :mint, "1.7.1", "113fdb2b2f3b59e47c7955971854641c61f378549d73e829e1768de90fc1abf1", [:mix], [{:castore, "~> 0.1.0 or ~> 1.0", [hex: :castore, repo: "hexpm", optional: true]}, {:hpax, "~> 0.1.1 or ~> 0.2.0 or ~> 1.0", [hex: :hpax, repo: "hexpm", optional: false]}], "hexpm", "fceba0a4d0f24301ddee3024ae116df1c3f4bb7a563a731f45fdfeb9d39a231b"},
+  "mint_web_socket": {:hex, :mint_web_socket, "1.0.5", "60354efeb49b1eccf95dfb75f55b08d692e211970fe735a5eb3188b328be2a90", [:mix], [{:mint, ">= 1.4.1 and < 2.0.0-0", [hex: :mint, repo: "hexpm", optional: false]}], "hexpm", "04b35663448fc758f3356cce4d6ac067ca418bbafe6972a3805df984b5f12e61"},
+  "mix_audit": {:hex, :mix_audit, "2.1.5", "c0f77cee6b4ef9d97e37772359a187a166c7a1e0e08b50edf5bf6959dfe5a016", [:make, :mix], [{:jason, "~> 1.4", [hex: :jason, repo: "hexpm", optional: false]}, {:yaml_elixir, "~> 2.11", [hex: :yaml_elixir, repo: "hexpm", optional: false]}], "hexpm", "87f9298e21da32f697af535475860dc1d3617a010e0b418d2ec6142bc8b42d69"},
+  "mochiweb": {:hex, :mochiweb, "3.3.0", "2898ad0bfeee234e4cbae623c7052abc3ff0d73d499ba6e6ffef445b13ffd07a", [:rebar3], [], "hexpm", "aa85b777fb23e9972ebc424e40b5d35106f19bc998873e026dedd876df8ee50c"},
+  "nimble_options": {:hex, :nimble_options, "1.1.1", "e3a492d54d85fc3fd7c5baf411d9d2852922f66e69476317787a7b2bb000a61b", [:mix], [], "hexpm", "821b2470ca9442c4b6984882fe9bb0389371b8ddec4d45a9504f00a66f650b44"},
+  "nimble_pool": {:hex, :nimble_pool, "1.1.0", "bf9c29fbdcba3564a8b800d1eeb5a3c58f36e1e11d7b7fb2e084a643f645f06b", [:mix], [], "hexpm", "af2e4e6b34197db81f7aad230c1118eac993acc0dae6bc83bac0126d4ae0813a"},
+  "phoenix": {:hex, :phoenix, "1.8.7", "d8d755b4ff4b449f610223dd706b4ae64155cb720d3dc09c706c079ecea189e4", [:mix], [{:bandit, "~> 1.0", [hex: :bandit, repo: "hexpm", optional: true]}, {:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: true]}, {:phoenix_pubsub, "~> 2.1", [hex: :phoenix_pubsub, repo: "hexpm", optional: false]}, {:phoenix_template, "~> 1.0", [hex: :phoenix_template, repo: "hexpm", optional: false]}, {:phoenix_view, "~> 2.0", [hex: :phoenix_view, repo: "hexpm", optional: true]}, {:plug, "~> 1.14", [hex: :plug, repo: "hexpm", optional: false]}, {:plug_cowboy, "~> 2.7", [hex: :plug_cowboy, repo: "hexpm", optional: true]}, {:plug_crypto, "~> 1.2 or ~> 2.0", [hex: :plug_crypto, repo: "hexpm", optional: false]}, {:telemetry, "~> 0.4 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}, {:websock_adapter, "~> 0.5.3", [hex: :websock_adapter, repo: "hexpm", optional: false]}], "hexpm", "47352f72d6ab31009ef77516b1b3a14745be97b54061fd458031b9d8294869d5"},
+  "phoenix_html": {:hex, :phoenix_html, "4.3.0", "d3577a5df4b6954cd7890c84d955c470b5310bb49647f0a114a6eeecc850f7ad", [:mix], [], "hexpm", "3eaa290a78bab0f075f791a46a981bbe769d94bc776869f4f3063a14f30497ad"},
+  "phoenix_live_view": {:hex, :phoenix_live_view, "1.1.25", "abc1bdf7f148d7f9a003f149834cc858b24290c433b10ef6d1cbb1d6e9a211ca", [:mix], [{:igniter, ">= 0.6.16 and < 1.0.0-0", [hex: :igniter, repo: "hexpm", optional: true]}, {:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: true]}, {:lazy_html, "~> 0.1.0", [hex: :lazy_html, repo: "hexpm", optional: true]}, {:phoenix, "~> 1.6.15 or ~> 1.7.0 or ~> 1.8.0-rc", [hex: :phoenix, repo: "hexpm", optional: false]}, {:phoenix_html, "~> 3.3 or ~> 4.0", [hex: :phoenix_html, repo: "hexpm", optional: false]}, {:phoenix_template, "~> 1.0", [hex: :phoenix_template, repo: "hexpm", optional: false]}, {:phoenix_view, "~> 2.0", [hex: :phoenix_view, repo: "hexpm", optional: true]}, {:plug, "~> 1.15", [hex: :plug, repo: "hexpm", optional: false]}, {:telemetry, "~> 0.4.2 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}], "hexpm", "b8946e474799da1f874eab7e9ce107502c96ca318ed46d19f811f847df270865"},
+  "phoenix_pubsub": {:hex, :phoenix_pubsub, "2.2.0", "ff3a5616e1bed6804de7773b92cbccfc0b0f473faf1f63d7daf1206c7aeaaa6f", [:mix], [], "hexpm", "adc313a5bf7136039f63cfd9668fde73bba0765e0614cba80c06ac9460ff3e96"},
+  "phoenix_template": {:hex, :phoenix_template, "1.0.4", "e2092c132f3b5e5b2d49c96695342eb36d0ed514c5b252a77048d5969330d639", [:mix], [{:phoenix_html, "~> 2.14.2 or ~> 3.0 or ~> 4.0", [hex: :phoenix_html, repo: "hexpm", optional: true]}], "hexpm", "2c0c81f0e5c6753faf5cca2f229c9709919aba34fab866d3bc05060c9c444206"},
+  "plug": {:hex, :plug, "1.19.2", "e4950525b22c6789dfb38a3f95d47171ba159da3fc5a33be9643b43d5e8adb98", [:mix], [{:mime, "~> 1.0 or ~> 2.0", [hex: :mime, repo: "hexpm", optional: false]}, {:plug_crypto, "~> 1.1.1 or ~> 1.2 or ~> 2.0", [hex: :plug_crypto, repo: "hexpm", optional: false]}, {:telemetry, "~> 0.4.3 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}], "hexpm", "b6fce20a56af5e60fa5dfecf3f907bb98ec981be43c79a3809a499bc3d133de0"},
+  "plug_crypto": {:hex, :plug_crypto, "2.1.1", "19bda8184399cb24afa10be734f84a16ea0a2bc65054e23a62bb10f06bc89491", [:mix], [], "hexpm", "6470bce6ffe41c8bd497612ffde1a7e4af67f36a15eea5f921af71cf3e11247c"},
+  "req": {:hex, :req, "0.5.17", "0096ddd5b0ed6f576a03dde4b158a0c727215b15d2795e59e0916c6971066ede", [:mix], [{:brotli, "~> 0.3.1", [hex: :brotli, repo: "hexpm", optional: true]}, {:ezstd, "~> 1.0", [hex: :ezstd, repo: "hexpm", optional: true]}, {:finch, "~> 0.17", [hex: :finch, repo: "hexpm", optional: false]}, {:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: false]}, {:mime, "~> 2.0.6 or ~> 2.1", [hex: :mime, repo: "hexpm", optional: false]}, {:nimble_csv, "~> 1.0", [hex: :nimble_csv, repo: "hexpm", optional: true]}, {:plug, "~> 1.0", [hex: :plug, repo: "hexpm", optional: true]}], "hexpm", "0b8bc6ffdfebbc07968e59d3ff96d52f2202d0536f10fef4dc11dc02a2a43e39"},
+  "slipstream": {:hex, :slipstream, "1.2.2", "6b07124ac5f62a50327aa38c84edd0284920ac8aba548e04738827838f233ed0", [:mix], [{:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: true]}, {:mint_web_socket, "~> 0.2 or ~> 1.0", [hex: :mint_web_socket, repo: "hexpm", optional: false]}, {:nimble_options, "~> 0.1 or ~> 1.0", [hex: :nimble_options, repo: "hexpm", optional: false]}, {:telemetry, "~> 0.4 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}], "hexpm", "ccb873ddb21aadb37c5c7745014febe6da0aa2cef0c4e73e7d08ce11d18aacd0"},
+  "sobelow": {:hex, :sobelow, "0.14.1", "2f81e8632f15574cba2402bcddff5497b413c01e6f094bc0ab94e83c2f74db81", [:mix], [{:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: false]}], "hexpm", "8fac9a2bd90fdc4b15d6fca6e1608efb7f7c600fa75800813b794ee9364c87f2"},
+  "solid": {:hex, :solid, "1.2.2", "615d3fb75e12b575d99976ca49f242b1e603f98489d30bf8634b5ab47d85e33f", [:mix], [{:date_time_parser, "~> 1.2", [hex: :date_time_parser, repo: "hexpm", optional: false]}, {:decimal, "~> 2.0", [hex: :decimal, repo: "hexpm", optional: false]}], "hexpm", "410d0af6c0cdfd9d58ed2d22158f4fb0733a49f7b59b8e3bdb26f05919ae38ae"},
+  "telemetry": {:hex, :telemetry, "1.4.2", "a0cb522801dffb1c49fe6e30561badffc7b6d0e180db1300df759faa22062855", [:rebar3], [], "hexpm", "928f6495066506077862c0d1646609eed891a4326bee3126ba54b60af61febb1"},
+  "thousand_island": {:hex, :thousand_island, "1.4.3", "2158209580f633be38d43ec4e3ce0a01079592b9657afff9080d5d8ca149a3af", [:mix], [{:telemetry, "~> 0.4 or ~> 1.0", [hex: :telemetry, repo: "hexpm", optional: false]}], "hexpm", "6e4ce09b0fd761a58594d02814d40f77daff460c48a7354a15ab353bb998ea0b"},
+  "websock": {:hex, :websock, "0.5.3", "2f69a6ebe810328555b6fe5c831a851f485e303a7c8ce6c5f675abeb20ebdadc", [:mix], [], "hexpm", "6105453d7fac22c712ad66fab1d45abdf049868f253cf719b625151460b8b453"},
+  "websock_adapter": {:hex, :websock_adapter, "0.5.9", "43dc3ba6d89ef5dec5b1d0a39698436a1e856d000d84bf31a3149862b01a287f", [:mix], [{:bandit, ">= 0.6.0", [hex: :bandit, repo: "hexpm", optional: true]}, {:plug, "~> 1.14", [hex: :plug, repo: "hexpm", optional: false]}, {:plug_cowboy, "~> 2.6", [hex: :plug_cowboy, repo: "hexpm", optional: true]}, {:websock, "~> 0.5", [hex: :websock, repo: "hexpm", optional: false]}], "hexpm", "5534d5c9adad3c18a0f58a9371220d75a803bf0b9a3d87e6fe072faaeed76a08"},
+  "yamerl": {:hex, :yamerl, "0.10.0", "4ff81fee2f1f6a46f1700c0d880b24d193ddb74bd14ef42cb0bcf46e81ef2f8e", [:rebar3], [], "hexpm", "346adb2963f1051dc837a2364e4acf6eb7d80097c0f53cbdc3046ec8ec4b4e6e"},
+  "yaml_elixir": {:hex, :yaml_elixir, "2.12.0", "30343ff5018637a64b1b7de1ed2a3ca03bc641410c1f311a4dbdc1ffbbf449c7", [:mix], [{:yamerl, "~> 0.10", [hex: :yamerl, repo: "hexpm", optional: false]}], "hexpm", "ca6bacae7bac917a7155dca0ab6149088aa7bc800c94d0fe18c5238f53b313c6"},
+}
diff --git a/packages/symphony/elixir/priv/static/dashboard.css b/packages/symphony/elixir/priv/static/dashboard.css
new file mode 100644
index 000000000..bc191c0ca
--- /dev/null
+++ b/packages/symphony/elixir/priv/static/dashboard.css
@@ -0,0 +1,463 @@
+:root { /* Design tokens; the rules in this stylesheet read them through var(). */
+  color-scheme: light; /* only a light palette is defined below */
+  --page: #f7f7f8; /* html background and middle stop of the body gradient */
+  --page-soft: #fbfbfc; /* top stop of the body gradient */
+  --page-deep: #ececf1; /* NOTE(review): not referenced by any rule in this stylesheet */
+  --card: rgba(255, 255, 255, 0.94); /* slightly translucent card surface */
+  --card-muted: #f3f4f6; /* default badge fill */
+  --ink: #202123; /* primary text */
+  --muted: #6e6e80; /* secondary text */
+  --line: #ececf1; /* hairline borders */
+  --line-strong: #d9d9e3; /* stronger borders on secondary controls and the offline badge */
+  --accent: #10a37f; /* primary button fill and link hover color */
+  --accent-ink: #0f513f; /* text placed on --accent-soft surfaces */
+  --accent-soft: #e8faf4; /* fill of the live and active badges */
+  --danger: #b42318; /* error and danger text */
+  --danger-soft: #fef3f2; /* error and danger surfaces */
+  --shadow-sm: 0 1px 2px rgba(16, 24, 40, 0.05); /* resting card elevation */
+  --shadow-lg: 0 20px 50px rgba(15, 23, 42, 0.08); /* hero card elevation */
+}
+
+* { /* border-box sizing for every element */
+  box-sizing: border-box;
+}
+
+html { /* flat page color behind the body gradients */
+  background: var(--page);
+}
+
+body { /* page canvas: layered background, base text color and font stack */
+  margin: 0;
+  min-height: 100vh;
+  background:
+    radial-gradient(circle at top, rgba(16, 163, 127, 0.12) 0%, rgba(16, 163, 127, 0) 30%), /* accent-colored glow, fully transparent by 30% */
+    linear-gradient(180deg, var(--page-soft) 0%, var(--page) 24%, #f3f4f6 100%);
+  color: var(--ink);
+  font-family: "Sohne", "SF Pro Text", "Helvetica Neue", "Segoe UI", sans-serif;
+  line-height: 1.5;
+}
+
+a { /* links take the text color and carry no underline */
+  color: var(--ink);
+  text-decoration: none;
+  transition: color 140ms ease;
+}
+
+a:hover { /* hover switches the link to the accent color */
+  color: var(--accent);
+}
+
+button { /* Primary action: accent-filled pill with an accent-tinted shadow. */
+  appearance: none;
+  border: 1px solid var(--accent);
+  background: var(--accent);
+  color: white;
+  border-radius: 999px;
+  padding: 0.72rem 1.08rem;
+  cursor: pointer;
+  font: inherit;
+  font-weight: 600; /* must follow `font: inherit`, which also resets the weight */
+  letter-spacing: -0.01em;
+  box-shadow: 0 8px 20px rgba(16, 163, 127, 0.18);
+  transition:
+    transform 140ms ease,
+    box-shadow 140ms ease,
+    background 140ms ease,
+    border-color 140ms ease;
+}
+
+button:hover { /* lift by 1px and deepen the shadow */
+  transform: translateY(-1px);
+  box-shadow: 0 12px 24px rgba(16, 163, 127, 0.22);
+}
+
+button.secondary { /* neutral variant: card surface, ink text, small shadow */
+  background: var(--card);
+  color: var(--ink);
+  border-color: var(--line-strong);
+  box-shadow: var(--shadow-sm);
+}
+
+button.secondary:hover { /* neutral hover shadow instead of the accent-tinted one */
+  box-shadow: 0 6px 16px rgba(15, 23, 42, 0.08);
+}
+
+.subtle-button { /* compact, muted pill with no shadow */
+  appearance: none;
+  border: 1px solid var(--line-strong);
+  background: rgba(255, 255, 255, 0.72);
+  color: var(--muted);
+  border-radius: 999px;
+  padding: 0.34rem 0.72rem;
+  cursor: pointer;
+  font: inherit;
+  font-size: 0.82rem;
+  font-weight: 600;
+  letter-spacing: 0.01em;
+  box-shadow: none;
+  transition:
+    background 140ms ease,
+    border-color 140ms ease,
+    color 140ms ease;
+}
+
+.subtle-button:hover { /* the two `none` values override the button:hover lift when this class sits on a <button> */
+  transform: none;
+  box-shadow: none;
+  background: white;
+  border-color: var(--muted);
+  color: var(--ink);
+}
+
+pre { /* Preformatted text: keep authored whitespace, but wrap instead of overflowing. */
+  margin: 0;
+  white-space: pre-wrap;
+  overflow-wrap: anywhere; /* standard replacement for the deprecated `word-break: break-word` */
+}
+
+code,
+pre,
+.mono { /* shared monospace font stack */
+  font-family: "Sohne Mono", "SFMono-Regular", "SF Mono", Consolas, "Liberation Mono", monospace;
+}
+
+.mono,
+.numeric { /* fixed-width digits and a slashed zero, requested two ways */
+  font-variant-numeric: tabular-nums slashed-zero;
+  font-feature-settings: "tnum" 1, "zero" 1; /* same features through the low-level property */
+}
+
+.app-shell { /* horizontally centered page container, at most 1280px wide */
+  max-width: 1280px;
+  margin: 0 auto;
+  padding: 2rem 1rem 3.5rem;
+}
+
+.dashboard-shell { /* single-column grid: children stack with a 1rem gap */
+  display: grid;
+  gap: 1rem;
+}
+
+.hero-card,
+.section-card,
+.metric-card,
+.error-card { /* surface shared by all four card types */
+  background: var(--card);
+  border: 1px solid rgba(217, 217, 227, 0.82);
+  box-shadow: var(--shadow-sm);
+  backdrop-filter: blur(18px); /* blurs whatever shows through the translucent --card fill */
+}
+
+.hero-card { /* declared after the shared rule, so its large shadow replaces the small one */
+  border-radius: 28px;
+  padding: clamp(1.25rem, 3vw, 2rem);
+  box-shadow: var(--shadow-lg);
+}
+
+.hero-grid { /* flexible first column plus an auto-sized second column */
+  display: grid;
+  grid-template-columns: minmax(0, 1fr) auto;
+  gap: 1.25rem;
+  align-items: start;
+}
+
+.eyebrow { /* small, muted, uppercase label */
+  margin: 0;
+  color: var(--muted);
+  text-transform: uppercase;
+  letter-spacing: 0.08em;
+  font-size: 0.76rem;
+  font-weight: 600;
+}
+
+.hero-title { /* fluid heading size between 2rem and 3.3rem */
+  margin: 0.35rem 0 0;
+  font-size: clamp(2rem, 4vw, 3.3rem);
+  line-height: 0.98;
+  letter-spacing: -0.04em;
+}
+
+.hero-copy { /* muted paragraph capped at 46rem wide */
+  margin: 0.75rem 0 0;
+  max-width: 46rem;
+  color: var(--muted);
+  font-size: 1rem;
+}
+
+.status-stack { /* grid whose items align to the inline end; the 860px breakpoint flips this to start */
+  display: grid;
+  justify-items: end;
+  align-content: start;
+  min-width: min(100%, 9rem);
+}
+
+.status-badge { /* pill-shaped status indicator; muted colors by default */
+  display: inline-flex;
+  align-items: center;
+  gap: 0.45rem;
+  min-height: 2rem;
+  padding: 0.35rem 0.78rem;
+  border-radius: 999px;
+  border: 1px solid var(--line);
+  background: var(--card-muted);
+  color: var(--muted);
+  font-size: 0.82rem;
+  font-weight: 700;
+  letter-spacing: 0.01em;
+}
+
+.status-badge-dot { /* round dot painted in the surrounding text color */
+  width: 0.52rem;
+  height: 0.52rem;
+  border-radius: 999px;
+  background: currentColor;
+  opacity: 0.9;
+}
+
+.status-badge-live { /* hidden by default; the .phx-connected rule below reveals it */
+  display: none;
+  background: var(--accent-soft);
+  border-color: rgba(16, 163, 127, 0.18);
+  color: var(--accent-ink);
+}
+
+.status-badge-offline { /* visible by default; the .phx-connected rule below hides it */
+  background: #f5f5f7;
+  border-color: var(--line-strong);
+  color: var(--muted);
+}
+
+[data-phx-main].phx-connected .status-badge-live { /* shown while the [data-phx-main] ancestor has .phx-connected */
+  display: inline-flex;
+}
+
+[data-phx-main].phx-connected .status-badge-offline { /* hidden under the same condition */
+  display: none;
+}
+
+.metric-grid { /* as many equal columns as fit, each at least 180px wide */
+  display: grid;
+  gap: 0.85rem;
+  grid-template-columns: repeat(auto-fit, minmax(180px, 1fr));
+}
+
+.metric-card { /* radius and padding only; the surface comes from the shared card rule */
+  border-radius: 22px;
+  padding: 1rem 1.05rem 1.1rem;
+}
+
+.metric-label { /* small muted caption */
+  margin: 0;
+  color: var(--muted);
+  font-size: 0.82rem;
+  font-weight: 600;
+  letter-spacing: 0.01em;
+}
+
+.metric-value { /* large figure, fluid between 1.6rem and 2.1rem */
+  margin: 0.35rem 0 0;
+  font-size: clamp(1.6rem, 2vw, 2.1rem);
+  line-height: 1.05;
+  letter-spacing: -0.03em;
+}
+
+.metric-detail { /* muted supporting line */
+  margin: 0.45rem 0 0;
+  color: var(--muted);
+  font-size: 0.88rem;
+}
+
+.section-card { /* radius and padding only; the surface comes from the shared card rule */
+  border-radius: 24px;
+  padding: 1.15rem;
+}
+
+.section-header { /* children pushed to opposite ends; wraps when space runs out */
+  display: flex;
+  justify-content: space-between;
+  align-items: flex-start;
+  gap: 1rem;
+  flex-wrap: wrap;
+}
+
+.section-title { /* section heading text */
+  margin: 0;
+  font-size: 1.08rem;
+  line-height: 1.2;
+  letter-spacing: -0.02em;
+}
+
+.section-copy { /* muted description text */
+  margin: 0.35rem 0 0;
+  color: var(--muted);
+  font-size: 0.94rem;
+}
+
+.table-wrap { /* horizontal scroll container; presumably wraps a .data-table (markup not visible here) */
+  overflow-x: auto;
+  margin-top: 1rem;
+}
+
+.data-table { /* full width, but never narrower than 720px */
+  width: 100%;
+  min-width: 720px;
+  border-collapse: collapse;
+}
+
+.data-table-running { /* fixed column layout with a wider 980px minimum */
+  table-layout: fixed;
+  min-width: 980px;
+}
+
+.data-table th { /* small uppercase muted column headers */
+  padding: 0 0.5rem 0.75rem 0;
+  text-align: left;
+  color: var(--muted);
+  font-size: 0.78rem;
+  font-weight: 600;
+  text-transform: uppercase;
+  letter-spacing: 0.04em;
+}
+
+.data-table td { /* top-aligned cells separated by a hairline above each row */
+  padding: 0.9rem 0.5rem 0.9rem 0;
+  border-top: 1px solid var(--line);
+  vertical-align: top;
+  font-size: 0.94rem;
+}
+
+.issue-stack,
+.session-stack,
+.detail-stack,
+.token-stack { /* tight vertical stacks of text lines */
+  display: grid;
+  gap: 0.24rem;
+  min-width: 0; /* lets the stack shrink below its content width when it is a grid or flex item */
+}
+
+.event-text { /* one line only; overflow is cut off with an ellipsis */
+  font-weight: 500;
+  line-height: 1.45;
+  max-width: 100%;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+
+.event-meta { /* same single-line ellipsis truncation as .event-text */
+  max-width: 100%;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+
+.state-badge { /* neutral pill; the three modifier classes below recolor it */
+  display: inline-flex;
+  align-items: center;
+  min-height: 1.85rem;
+  padding: 0.3rem 0.68rem;
+  border-radius: 999px;
+  border: 1px solid var(--line);
+  background: var(--card-muted);
+  color: var(--ink);
+  font-size: 0.8rem;
+  font-weight: 600;
+  line-height: 1;
+}
+
+.state-badge-active { /* accent (green) palette */
+  background: var(--accent-soft);
+  border-color: rgba(16, 163, 127, 0.18);
+  color: var(--accent-ink);
+}
+
+.state-badge-warning { /* amber palette; literal colors, no tokens are defined for it */
+  background: #fff7e8;
+  border-color: #f1d8a6;
+  color: #8a5a00;
+}
+
+.state-badge-danger { /* red palette built on the danger tokens */
+  background: var(--danger-soft);
+  border-color: #f6d3cf;
+  color: var(--danger);
+}
+
+.issue-id { /* semi-bold identifier text */
+  font-weight: 600;
+  letter-spacing: -0.01em;
+}
+
+.issue-link { /* smaller muted text */
+  color: var(--muted);
+  font-size: 0.86rem;
+}
+
+.muted { /* utility: muted text color */
+  color: var(--muted);
+}
+
+.code-panel { /* rounded grey box with a hairline border and dark grey text */
+  margin-top: 1rem;
+  padding: 1rem;
+  border-radius: 18px;
+  background: #f5f5f7;
+  border: 1px solid var(--line);
+  color: #353740;
+  font-size: 0.9rem;
+}
+
+.empty-state { /* muted placeholder text */
+  margin: 1rem 0 0;
+  color: var(--muted);
+}
+
+.error-card { /* declared after the shared card rule, so this background and border color win */
+  border-radius: 24px;
+  padding: 1.25rem;
+  background: linear-gradient(180deg, #fff8f7 0%, var(--danger-soft) 100%);
+  border-color: #f6d3cf;
+}
+
+.error-title { /* danger-colored heading */
+  margin: 0;
+  color: var(--danger);
+  font-size: 1.15rem;
+  letter-spacing: -0.02em;
+}
+
+.error-copy { /* danger-colored body text */
+  margin: 0.45rem 0 0;
+  color: var(--danger);
+}
+
+@media (max-width: 860px) { /* viewports up to 860px wide */
+  .app-shell { /* tighter page padding */
+    padding: 1rem 0.85rem 2rem;
+  }
+
+  .hero-grid { /* collapse the two hero columns into one */
+    grid-template-columns: 1fr;
+  }
+
+  .status-stack { /* align to the inline start instead of the end */
+    justify-items: start;
+  }
+
+  .metric-grid { /* exactly two equal columns instead of auto-fit */
+    grid-template-columns: repeat(2, minmax(0, 1fr));
+  }
+}
+
+@media (max-width: 560px) { /* viewports up to 560px wide */
+  .metric-grid { /* single column; later in source than the 860px rule, so it wins */
+    grid-template-columns: 1fr;
+  }
+
+  .section-card,
+  .hero-card,
+  .error-card { /* smaller radius and uniform 1rem padding; .metric-card is not included */
+    border-radius: 20px;
+    padding: 1rem;
+  }
+}
diff --git a/packages/symphony/elixir/test/catalog_assets_test.exs b/packages/symphony/elixir/test/catalog_assets_test.exs
new file mode 100644
index 000000000..905da8bf9
--- /dev/null
+++ b/packages/symphony/elixir/test/catalog_assets_test.exs
@@ -0,0 +1,48 @@
+defmodule SymphonyElixir.CatalogAssetsTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.DSL.Parser
+  alias SymphonyElixir.Skill
+
+  @root Path.expand("../..", __DIR__)
+  @example_workflows_dir Path.join([@root, "workflows", "example", "workflows"])
+  @example_skills_dir Path.join([@root, "workflows", "example", "skills"])
+
+  test "all shipped workflow files parse" do
+    paths = @root |> Path.join("workflows/*/workflows/*.sym") |> Path.wildcard() |> Enum.sort()
+
+    # An empty glob would let the loop below pass without checking anything.
+    refute paths == [], "no workflow files matched workflows/*/workflows/*.sym under #{@root}"
+
+    for path <- paths do
+      result = Parser.parse(File.read!(path), file: path)
+
+      # assert/2 evaluates its first argument before looking at the message, so a failed
+      # `pattern = result` there raises MatchError and drops the path; match?/2 keeps it.
+      assert match?({:ok, %{kind: :workflow}}, result), "expected #{path} to parse, got #{inspect(result)}"
+    end
+  end
+
+  test "all shipped skill files load" do
+    paths = @root |> Path.join("workflows/*/skills/*.md") |> Path.wildcard() |> Enum.sort()
+
+    # Enum.all?/2 is true for [], so without this a wrong glob would pass silently.
+    refute paths == [], "no skill files matched workflows/*/skills/*.md under #{@root}"
+
+    for path <- paths, do: assert(match?({:ok, %Skill{}}, Skill.load(path)), "expected #{path} to load")
+  end
+
+  test "example workflow pack is safe and manual-only" do
+    source = File.read!(Path.join(@example_workflows_dir, "inspect.sym"))
+    assert {:ok, workflow} = Parser.parse(source, file: "inspect.sym")
+    assert {:ok, skill} = Skill.load(Path.join(@example_skills_dir, "inspect.md"))
+
+    assert workflow.name == "inspect"
+    assert workflow.trigger == %{kind: :manual}
+
+    binds = for {:bind, name, _expr} <- workflow.statements, do: name
+    assert binds == ["inspect"]
+
+    assert skill.tools == []
+  end
+end
diff --git a/packages/symphony/elixir/test/claude/code_test.exs b/packages/symphony/elixir/test/claude/code_test.exs
new file mode 100644
index 000000000..1a82b8625
--- /dev/null
+++ b/packages/symphony/elixir/test/claude/code_test.exs
@@ -0,0 +1,31 @@
+defmodule SymphonyElixir.Claude.CodeTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Claude.Code
+  alias SymphonyElixir.Config
+
+  test "command pipes the prompt on stdin and reads prompt/model from env" do
+    shell_line = Code.command("claude")
+
+    # The prompt travels through a pipe instead of argv, so neither a leading
+    # dash nor an argv length limit can corrupt the invocation.
+    required_fragments = [
+      ~s(printf '%s' "$SYMPHONY_CLAUDE_PROMPT" | claude),
+      "--print",
+      "--output-format json",
+      "--dangerously-skip-permissions",
+      ~s(--model "$SYMPHONY_CLAUDE_MODEL")
+    ]
+    for fragment <- required_fragments, do: assert(shell_line =~ fragment)
+    refute shell_line =~ "SYMPHONY_CLAUDE_PROMPT="
+  end
+
+  test "command honors an overridden claude executable" do
+    assert Code.command("/opt/bin/claude") =~ "| /opt/bin/claude --print"
+  end
+
+  test "run errors without an Anthropic API key rather than spawning claude" do
+    opts = [config: %Config{anthropic_api_key: nil}, model: "claude-opus-4-8"]
+    assert {:error, :anthropic_api_key_not_configured} = Code.run(File.cwd!(), "hello", %{}, opts)
+  end
+end
diff --git a/packages/symphony/elixir/test/codex/provision_test.exs b/packages/symphony/elixir/test/codex/provision_test.exs
new file mode 100644
index 000000000..5e209b5d3
--- /dev/null
+++ b/packages/symphony/elixir/test/codex/provision_test.exs
@@ -0,0 +1,247 @@
+defmodule SymphonyElixir.Codex.ProvisionTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.{Codex.Provision, Config, RepositoryCatalog}
+
+  # Builds a Config whose repositories_file is a throwaway one-repo catalog; `extra` overrides fields.
+  defp config_with_repos(extra \\ %{}) do
+    dir = Path.join(System.tmp_dir!(), "provision_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(dir)
+    path = Path.join(dir, "repositories.yaml")
+    File.write!(path, """
+    repositories:
+      - name: app
+        owner_repo: acme/app
+        default_branch: main
+        primary: true
+    """)
+
+    on_exit(fn -> File.rm_rf!(dir) end)
+
+    struct(
+      Config,
+      Map.merge(
+        %{
+          repositories_file: path,
+          github_token: nil,
+          ix_env_passthrough: [],
+          github_app_bot_username: "acme-bot[bot]",
+          github_app_bot_email: "bot@acme.dev"
+        },
+        extra
+      )
+    )
+  end
+
+  test "sh single-quotes and escapes embedded quotes" do
+    assert Provision.sh("plain") == "'plain'"
+    assert Provision.sh("a'b") == "'a'\\''b'"
+  end
+
+  test "env_export_lines renders a no-op for an empty env" do
+    assert Provision.env_export_lines([]) == ":"
+  end
+
+  test "env_export_lines quotes values" do
+    assert Provision.env_export_lines([{"K", "a b"}]) == "export K='a b'"
+  end
+
+  test "runtime_env falls back to the static github_token when no bot token is minted" do
+    config = config_with_repos(%{github_token: "ghs_main"})
+
+    env = Provision.runtime_env(config, [])
+
+    assert {"GITHUB_TOKEN", "ghs_main"} in env
+    assert {"GH_TOKEN", "ghs_main"} in env
+  end
+
+  test "runtime_env: the minted bot token owns both GITHUB_TOKEN and GH_TOKEN over the static token" do
+    config = config_with_repos(%{github_token: "ghs_human"})
+
+    env = Provision.runtime_env(config, bot_token: "ghs_app")
+
+    # gh pr create authors as GH_TOKEN, so both vars must carry the App
+    # token; neither may fall back to the static host token (ENG-2012).
+    assert {"GITHUB_TOKEN", "ghs_app"} in env
+    assert {"GH_TOKEN", "ghs_app"} in env
+    refute Enum.any?(env, fn {_key, value} -> value == "ghs_human" end)
+    keys = Enum.map(env, &elem(&1, 0))
+    assert keys == Enum.uniq(keys)
+  end
+
+  test "runtime_env: a passthrough of the same name cannot shadow the bot token" do
+    var = "GH_TOKEN"
+    previous = System.get_env(var)
+    System.put_env(var, "ghs_inherited")
+    # Restore rather than delete: a GH_TOKEN exported in the caller's shell must survive this test.
+    on_exit(fn -> if previous, do: System.put_env(var, previous), else: System.delete_env(var) end)
+    config = config_with_repos(%{github_token: nil, ix_env_passthrough: [var]})
+    env = Provision.runtime_env(config, bot_token: "ghs_app")
+
+    assert {"GH_TOKEN", "ghs_app"} in env
+    refute {"GH_TOKEN", "ghs_inherited"} in env
+  end
+
+  test "repo_blocks stamps the auth header and bot identity when a token is given" do
+    config = config_with_repos()
+    blocks = Provision.repo_blocks(config, "/home/u/symphony-workspaces/run1", "symphony/run1", "ghs_tok")
+
+    assert blocks =~ "clone --depth 1 --branch 'main' 'https://github.com/acme/app.git'"
+    assert blocks =~ "http.https://github.com/.extraheader"
+    assert blocks =~ "checkout -b 'symphony/run1'"
+    assert blocks =~ "user.name' 'acme-bot[bot]'"
+    assert blocks =~ "user.email' 'bot@acme.dev'"
+    assert blocks =~ Base.encode64("x-access-token:ghs_tok")
+  end
+
+  test "repo_blocks omits the auth header when no token is available" do
+    config = config_with_repos()
+    blocks = Provision.repo_blocks(config, "/home/u/symphony-workspaces/run1", "symphony/run1", nil)
+
+    refute blocks =~ "extraheader"
+  end
+
+  test "repo_blocks clones an explicit repository list, overriding the config catalog" do
+    config = config_with_repos()
+
+    repositories = [
+      %RepositoryCatalog{name: "ix", owner_repo: "indexable-inc/ix", default_branch: "main", primary?: true}
+    ]
+
+    blocks =
+      Provision.repo_blocks(config, "/home/u/symphony-workspaces/run1", "symphony/run1", "ghs_tok", repositories)
+
+    assert blocks =~ "clone --depth 1 --branch 'main' 'https://github.com/indexable-inc/ix.git'"
+    refute blocks =~ "acme/app"
+  end
+
+  test "host_primary_workspace uses the explicit list's primary, falling back to the config catalog when absent" do
+    config = config_with_repos()
+
+    repositories = [
+      %RepositoryCatalog{name: "docs", owner_repo: "indexable-inc/docs", default_branch: "main", primary?: false},
+      %RepositoryCatalog{name: "ix", owner_repo: "indexable-inc/ix", default_branch: "main", primary?: true}
+    ]
+
+    assert Provision.host_primary_workspace(config, "/home/u/symphony-workspaces/run1", "run1", repositories) ==
+             "/home/u/symphony-workspaces/run1/ix"
+
+    assert Provision.host_primary_workspace(config, "/home/u/symphony-workspaces/run1", "run1") ==
+             "/home/u/symphony-workspaces/run1/app"
+  end
+
+  test "backend id and name follow the symphony scheme" do
+    assert Provision.backend_id("run1", "impl") == "symphony:run1:impl"
+    assert Provision.backend_name(%{identifier: "ENG-1", title: "Do it"}, "run1", "impl") == "ENG-1: Do it / impl"
+    assert Provision.backend_name(%{identifier: "ENG-1"}, "run1", "impl") == "ENG-1 / impl"
+    assert Provision.backend_name(%{}, "run1", "impl") == "run1 / impl"
+  end
+
+  # Redaction and the room-start pkill behavior were asserted through the
+  # `Codex.IxVm` / `Codex.Host` delegates before those modules were deleted
+  # in the `.sym`/IR cutover. The behavior is owned here, so the coverage
+  # moved to the owner.
+  test "sanitize_ix_args redacts --env values in ix command args" do
+    assert Provision.sanitize_ix_args([
+             "new",
+             "ix/symphony-codex:2026-05-27",
+             "--env",
+             "GITHUB_TOKEN=ghs_secret",
+             "--env",
+             "OPENAI_API_KEY=sk-secret",
+             "--name",
+             "worker"
+           ]) == [
+             "new",
+             "ix/symphony-codex:2026-05-27",
+             "--env",
+             "GITHUB_TOKEN=<redacted>",
+             "--env",
+             "OPENAI_API_KEY=<redacted>",
+             "--name",
+             "worker"
+           ]
+  end
+
+  test "sanitize_ix_args redacts sensitive shell exports in ix command args" do
+    assert Provision.sanitize_ix_args([
+             "shell",
+             "worker",
+             "--",
+             "bash",
+             "-lc",
+             "export GITHUB_TOKEN='ghs_secret'\nexport OPENAI_API_KEY='sk-secret'\necho ok"
+           ]) == [
+             "shell",
+             "worker",
+             "--",
+             "bash",
+             "-lc",
+             "export GITHUB_TOKEN='<redacted>'\nexport OPENAI_API_KEY='<redacted>'\necho ok"
+           ]
+  end
+
+  test "sanitize_setenv_args redacts --setenv values but keeps other args" do
+    args = [
+      "--collect",
+      "--uid=hari",
+      "--setenv=GITHUB_TOKEN=ghs_secret",
+      "--setenv=PATH=/usr/bin",
+      "--unit=symphony-host-abc.service",
+      "--",
+      "room-server"
+    ]
+
+    assert Provision.sanitize_setenv_args(args) == [
+             "--collect",
+             "--uid=hari",
+             "--setenv=GITHUB_TOKEN=<redacted>",
+             "--setenv=PATH=<redacted>",
+             "--unit=symphony-host-abc.service",
+             "--",
+             "room-server"
+           ]
+  end
+
+  test "ix_room_start_script stops only the room-server process name" do
+    script =
+      Provision.ix_room_start_script(
+        %Config{ix_room_server_command: "room-server", ix_room_port: 8080, github_token: nil, ix_env_passthrough: []},
+        "run_test",
+        []
+      )
+
+    assert script =~ "pkill -x room-server || true"
+    refute script =~ "pkill -f room-server"
+    # The per-run engine host serves the HTTP /api surface only, so it
+    # opts out of the WebTransport listener (room-server #232).
+    assert script =~ "--no-wt"
+  end
+
+  test "host_room_server_command binds the picked port and disables WebTransport" do
+    argv =
+      Provision.host_room_server_command(
+        %Config{host_room_server_command: "room-server"},
+        "127.0.0.1",
+        54_321,
+        "/home/u/.local/state/room/run1"
+      )
+
+    assert argv == [
+             System.find_executable("room-server") || "room-server",
+             "--host",
+             "127.0.0.1",
+             "--port",
+             "54321",
+             "--state-dir",
+             "/home/u/.local/state/room/run1",
+             "--no-wt"
+           ]
+
+    # --no-wt opts out of the WebTransport listener, so per-run host
+    # servers do not collide on the fixed UDP port that the standalone
+    # server now binds by default (room-server #232).
+    assert "--no-wt" in argv
+    refute "--wt-port" in argv
+  end
+end
diff --git a/packages/symphony/elixir/test/command_test.exs b/packages/symphony/elixir/test/command_test.exs
new file mode 100644
index 000000000..efb45977c
--- /dev/null
+++ b/packages/symphony/elixir/test/command_test.exs
@@ -0,0 +1,49 @@
+defmodule SymphonyElixir.CommandTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Command
+
+  test "captures successful command output" do
+    assert Command.run("/bin/sh", ["-c", "printf 'ok\n'"], 1_000) == {:ok, "ok\n"}
+  end
+
+  test "captures stderr with failed command output" do
+    assert Command.run("/bin/sh", ["-c", "printf 'bad\n' >&2; exit 7"], 1_000) == {:error, {:exit, 7, "bad\n"}}
+  end
+
+  test "terminates commands after the timeout" do
+    assert {:error, {:timeout, 50, _output}} = Command.run("/bin/sh", ["-c", "sleep 5"], 50)
+  end
+
+  test "kills the spawned process on timeout so it does not orphan" do
+    pid_file = Path.join(System.tmp_dir!(), "command_test_#{System.unique_integer([:positive])}.pid")
+    on_exit(fn -> File.rm(pid_file) end)
+    # `exec` swaps the shell for sleep, so the recorded $$ is the very process the port owns.
+    script = "echo $$ > #{pid_file}; exec sleep 30"
+    assert {:error, {:timeout, 50, _output}} = Command.run("/bin/sh", ["-c", script], 50)
+    os_pid = wait_for_pid(pid_file)
+    assert eventually_dead?(os_pid), "spawned process #{os_pid} was left running after timeout"
+  end
+
+  defp wait_for_pid(pid_file, attempts \\ 50) do
+    case File.read(pid_file) do
+      {:ok, recorded} when recorded != "" ->
+        recorded |> String.trim() |> String.to_integer()
+
+      _ when attempts > 0 ->
+        Process.sleep(10)
+        wait_for_pid(pid_file, attempts - 1)
+
+      _ ->
+        flunk("spawned process never recorded its pid in #{pid_file}")
+    end
+  end
+
+  defp eventually_dead?(os_pid, attempts \\ 50) do
+    Enum.any?(1..attempts//1, fn _attempt ->
+      {_output, status} = System.cmd("kill", ["-0", Integer.to_string(os_pid)], stderr_to_stdout: true)
+      if status == 0, do: Process.sleep(10)
+      status != 0
+    end)
+  end
+end
diff --git a/packages/symphony/elixir/test/config_test.exs b/packages/symphony/elixir/test/config_test.exs
new file mode 100644
index 000000000..5991f000a
--- /dev/null
+++ b/packages/symphony/elixir/test/config_test.exs
@@ -0,0 +1,132 @@
+defmodule SymphonyElixir.ConfigTest do
+  use ExUnit.Case, async: false
+  # Not async: these tests stop/restart the process registered as Config and edit OS env vars.
+  alias SymphonyElixir.Config
+
+  test "captures default codex runtime knobs" do
+    config = Config.get()
+
+    assert config.ix_command == "ix"
+    assert config.ix_image == "ix/symphony-codex:latest"
+    assert config.ix_room_server_command == "room-server"
+    assert config.ix_room_port == 8080
+    assert config.ix_room_connect == "direct"
+    assert config.ix_local_port_base == 18_080
+    refute config.ix_keep_vm?
+    assert config.ix_env_passthrough == ["OPENAI_API_KEY", "CODEX_API_KEY"]
+    assert config.host_user == nil
+    assert config.host_group == nil
+    assert config.host_workspaces_dir == nil
+    assert config.host_room_server_command == "room-server"
+    assert config.host_systemd_run_command == "systemd-run"
+    refute config.host_keep?
+    assert config.claude_command == "claude"
+  end
+
+  test "reads the room advertise host and registry url from the environment" do
+    original = Config.get()
+    # Registered before the env is touched, so the cleanup also runs if a later step raises.
+    on_exit(fn ->
+      System.delete_env("SYMPHONY_ROOM_ADVERTISE_HOST")
+      System.delete_env("SYMPHONY_ROOM_REGISTRY_URL")
+      restart_config!(original)
+    end)
+
+    System.put_env("SYMPHONY_ROOM_ADVERTISE_HOST", "100.0.0.7")
+    System.put_env("SYMPHONY_ROOM_REGISTRY_URL", "https://room.ix.dev")
+    restart_config!(original)
+
+    config = Config.get()
+    assert config.room.advertise_host == "100.0.0.7"
+    assert config.room.registry_url == "https://room.ix.dev"
+  end
+
+  test "creates mutable runtime dirs without mutating workflow pack assets" do
+    original = Config.get()
+    root = tmp_dir("config_pack_state")
+    pack_dir = write_pack!(Path.join(root, "pack"))
+    workspaces_dir = Path.join(root, "state/workspaces")
+    runs_dir = Path.join(root, "state/runs")
+
+    on_exit(fn -> restart_config!(original) end)
+    restart_config!(root: root, pack_dir: pack_dir, workspaces_dir: workspaces_dir, runs_dir: runs_dir)
+    # Checked after the restart: both runtime dirs exist and the pack still has workflows/ and skills/.
+    assert File.dir?(workspaces_dir)
+    assert File.dir?(runs_dir)
+    assert File.dir?(Path.join(pack_dir, "workflows"))
+    assert File.dir?(Path.join(pack_dir, "skills"))
+  end
+
+  test "fails clearly when workflow pack assets are missing" do
+    original = Config.get()
+    root = tmp_dir("config_missing_pack_asset")
+    pack_dir = Path.join(root, "pack")
+    File.mkdir_p!(Path.join(pack_dir, "skills"))
+    File.write!(Path.join(pack_dir, "repositories.yaml"), "repositories: []\n")
+    # At this point the pack has skills/ and repositories.yaml but no workflows/ directory.
+    on_exit(fn -> restart_config!(original) end)
+    stop_config()
+    # Trap exits so the linked start_link failure arrives as a message instead of crashing this process.
+    previous_flag = Process.flag(:trap_exit, true)
+
+    assert {:error, {%RuntimeError{message: message}, _stack}} =
+             Config.start_link(root: root, pack_dir: pack_dir)
+    # Drain that EXIT message if it is already in the mailbox; `after 0` never waits.
+    receive do
+      {:EXIT, _pid, {%RuntimeError{}, _stack}} -> :ok
+    after
+      0 -> :ok
+    end
+
+    Process.flag(:trap_exit, previous_flag)
+    # The error names the env var, and the failed start did not create workflows/.
+    assert message =~ "SYMPHONY_WORKFLOWS_DIR must point at an existing directory"
+    refute File.exists?(Path.join(pack_dir, "workflows"))
+  end
+  # Creates workflows/, skills/ and an empty repositories.yaml under pack_dir, then returns pack_dir.
+  defp write_pack!(pack_dir) do
+    File.mkdir_p!(Path.join(pack_dir, "workflows"))
+    File.mkdir_p!(Path.join(pack_dir, "skills"))
+    File.write!(Path.join(pack_dir, "repositories.yaml"), "repositories: []\n")
+    pack_dir
+  end
+  # Struct clause: turns a captured %Config{} into a {field, value} list and restarts with it.
+  defp restart_config!(%Config{} = snapshot) do
+    opts =
+      snapshot
+      |> Map.from_struct()
+      |> Map.to_list()
+
+    restart_config!(opts)
+  end
+
+  defp restart_config!(opts) do
+    stop_config()
+    assert {:ok, pid} = Config.start_link(opts)
+    Process.unlink(pid)
+  end
+  # Stops the process registered as Config, if any, and fails the test if no :DOWN arrives within 1s.
+  defp stop_config do
+    case Process.whereis(Config) do
+      nil ->
+        :ok
+
+      pid ->
+        ref = Process.monitor(pid)
+        GenServer.stop(pid, :normal)
+
+        receive do
+          {:DOWN, ^ref, :process, ^pid, _reason} -> :ok
+        after
+          1_000 -> flunk("timed out stopping SymphonyElixir.Config")
+        end
+    end
+  end
+
+  defp tmp_dir(name) do
+    dir = Path.join(System.tmp_dir!(), "symphony_#{name}_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(dir)
+    on_exit(fn -> File.rm_rf!(dir) end)
+    dir
+  end
+end
diff --git a/packages/symphony/elixir/test/cron_expression_test.exs b/packages/symphony/elixir/test/cron_expression_test.exs
new file mode 100644
index 000000000..bf0ef2637
--- /dev/null
+++ b/packages/symphony/elixir/test/cron_expression_test.exs
@@ -0,0 +1,111 @@
+defmodule SymphonyElixir.CronExpressionTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.CronExpression
+
+  describe "parse/1" do
+    test "accepts the nicknames" do
+      Enum.each(~w(@yearly @annually @monthly @weekly @daily @midnight @hourly), fn nickname ->
+        assert {:ok, %{source: ^nickname}} = CronExpression.parse(nickname)
+      end)
+    end
+
+    test "trims whitespace before resolving nicknames" do
+      # The recorded source is the nickname without the surrounding spaces.
+      assert {:ok, %{source: "@monthly"}} = CronExpression.parse("  @monthly  ")
+    end
+
+    test "accepts standard 5-field cron strings" do
+      for expression <- ["0 0 1 * *", "*/15 * * * *", "0 9-17 * * 1-5", "0,15,30,45 * * * *"] do
+        assert {:ok, _} = CronExpression.parse(expression)
+      end
+    end
+
+    test "rejects malformed expressions" do
+      # Free text, a four-field string, then one value per field position the parser must reject.
+      malformed = ["not a cron", "0 0 1 *", "60 0 1 * *", "0 24 1 * *", "0 0 32 * *", "0 0 1 13 *", "0 0 1 * 7"]
+
+      for expression <- malformed do
+        assert {:error, _} = CronExpression.parse(expression)
+      end
+    end
+
+    test "rejects inverted ranges" do
+      assert {:error, _} = CronExpression.parse("10-5 0 1 * *")
+    end
+
+    test "rejects non-positive step" do
+      assert {:error, _} = CronExpression.parse("*/0 0 1 * *")
+    end
+  end
+
+  describe "next_fire_after/2 with @hourly" do
+    test "advances to the next hour boundary" do
+      from = ~U[2026-05-17 14:23:00Z]
+      assert next_fire("@hourly", from) == {:ok, ~U[2026-05-17 15:00:00Z]}
+    end
+
+    test "never returns the from moment itself" do
+      # `from` already sits on an hour boundary, so the answer must be the following one.
+      from = ~U[2026-05-17 14:00:00Z]
+      assert next_fire("@hourly", from) == {:ok, ~U[2026-05-17 15:00:00Z]}
+    end
+  end
+
+  describe "next_fire_after/2 with @daily" do
+    test "advances to midnight UTC the next day" do
+      from = ~U[2026-05-17 14:00:00Z]
+      assert next_fire("@daily", from) == {:ok, ~U[2026-05-18 00:00:00Z]}
+    end
+  end
+
+  describe "next_fire_after/2 with @monthly" do
+    test "advances to the 1st of the next month at 00:00 UTC" do
+      from = ~U[2026-05-17 14:00:00Z]
+      assert next_fire("@monthly", from) == {:ok, ~U[2026-06-01 00:00:00Z]}
+    end
+
+    test "rolls into the next year correctly" do
+      # Starting in December, the next 1st of a month falls in the following year.
+      from = ~U[2026-12-15 09:30:00Z]
+      assert next_fire("@monthly", from) == {:ok, ~U[2027-01-01 00:00:00Z]}
+    end
+  end
+
+  describe "next_fire_after/2 with explicit 5-field" do
+    test "*/15 * * * * fires on the next quarter-hour" do
+      from = ~U[2026-05-17 14:07:00Z]
+      assert next_fire("*/15 * * * *", from) == {:ok, ~U[2026-05-17 14:15:00Z]}
+    end
+
+    test "weekday business hours respects day-of-week" do
+      # 2026-05-17 is a Sunday, so the first 09:00 on a Mon-Fri day is Monday the 18th.
+      from = ~U[2026-05-17 12:00:00Z]
+      assert next_fire("0 9 * * 1-5", from) == {:ok, ~U[2026-05-18 09:00:00Z]}
+    end
+
+    test "POSIX OR semantics for DOM and DOW when both restricted" do
+      # "0 0 1 * 5" means midnight on the 1st of the month OR on any Friday.
+      # From Thursday 2026-05-14 the earliest match is therefore Friday the 15th.
+      from = ~U[2026-05-14 12:00:00Z]
+      assert next_fire("0 0 1 * 5", from) == {:ok, ~U[2026-05-15 00:00:00Z]}
+    end
+  end
+
+  describe "matches?/2" do
+    test "@hourly matches every wall-clock hour" do
+      {:ok, hourly} = CronExpression.parse("@hourly")
+
+      # Only minute 0 of an hour is expected to match: 03:00 does, 03:01 does not.
+      assert CronExpression.matches?(hourly, ~U[2026-05-17 03:00:00Z])
+      refute CronExpression.matches?(hourly, ~U[2026-05-17 03:01:00Z])
+    end
+  end
+
+  # Parses `expression` (a failed parse crashes the calling test with a MatchError) and
+  # returns whatever CronExpression.next_fire_after/2 yields for it from `from`.
+  defp next_fire(expression, from) do
+    {:ok, parsed} = CronExpression.parse(expression)
+    CronExpression.next_fire_after(parsed, from)
+  end
+end
diff --git a/packages/symphony/elixir/test/github_app_test.exs b/packages/symphony/elixir/test/github_app_test.exs
new file mode 100644
index 000000000..a71b6214d
--- /dev/null
+++ b/packages/symphony/elixir/test/github_app_test.exs
@@ -0,0 +1,45 @@
+defmodule SymphonyElixir.GithubAppTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.GithubApp
+
+  describe "configured?/1" do
+    test "false when app id is missing" do
+      refute GithubApp.configured?(%{
+               github_app_id: nil,
+               github_app_private_key_pem: "irrelevant"
+             })
+    end
+
+    test "false when key is missing" do
+      refute GithubApp.configured?(%{
+               github_app_id: "123",
+               github_app_private_key_pem: nil
+             })
+    end
+
+    test "false when either is empty string" do
+      refute GithubApp.configured?(%{
+               github_app_id: "",
+               github_app_private_key_pem: "pem"
+             })
+
+      refute GithubApp.configured?(%{
+               github_app_id: "123",
+               github_app_private_key_pem: ""
+             })
+    end
+
+    test "true when both id and key are present" do
+      assert GithubApp.configured?(%{
+               github_app_id: "123",
+               github_app_private_key_pem: "-----BEGIN RSA PRIVATE KEY-----\n..."
+             })
+    end
+
+    test "false when passed a non-config-shaped term" do
+      refute GithubApp.configured?(nil)
+      refute GithubApp.configured?(%{})
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/slack_events_controller_test.exs b/packages/symphony/elixir/test/slack_events_controller_test.exs
new file mode 100644
index 000000000..9c70d2b9c
--- /dev/null
+++ b/packages/symphony/elixir/test/slack_events_controller_test.exs
@@ -0,0 +1,18 @@
+defmodule SymphonyElixirWeb.SlackEventsControllerTest do
+  use ExUnit.Case, async: true
+  import Plug.Conn
+  import Plug.Test
+
+  @opts SymphonyElixirWeb.Endpoint.init([])
+
+  test "rejects Slack events when the signing secret is not configured" do
+    payload = Jason.encode!(%{type: "event_callback"})
+    request = conn(:post, "/api/v1/triggers/slack/events", payload)
+    json_request = put_req_header(request, "content-type", "application/json")
+    response = SymphonyElixirWeb.Endpoint.call(json_request, @opts)
+
+    # The request carries no signature headers; it must be refused with the explicit error body.
+    assert response.status == 401
+    assert Jason.decode!(response.resp_body) == %{"error" => "slack signing secret not configured"}
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/dsl/fixtures/release.sym b/packages/symphony/elixir/test/symphony_elixir/dsl/fixtures/release.sym
new file mode 100644
index 000000000..475bd783a
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/dsl/fixtures/release.sym
@@ -0,0 +1,33 @@
+# A small workflow exercising binds, an envelope, a skill prompt, an
+# inline prompt with interpolation, and a when gate. The inspect and
+# report binds read disjoint inputs, so the interpreter is free to run
+# them in parallel: report has no edge to inspect's output.
+
+workflow "release" {
+  inspect <- agent {
+    engine: codex
+    model: "gpt-5.3-codex"
+    effort: medium
+    permissions: workspace_write
+    location: local
+    prompt: skill "inspect" { repo: "symphony" }
+  }
+
+  report <- agent {
+    engine: claude
+    model: haiku
+    permissions: read_only
+    prompt: inline "write a status report and stop"
+  }
+
+  summary <- agent {
+    engine: codex
+    model: "gpt-5.3-codex"
+    permissions: read_only
+    prompt: inline "summarize ${inspect.area}"
+  }
+
+  when ${inspect.changed} {
+    notify <- exec "./scripts/notify.sh" timeout 30
+  }
+}
diff --git a/packages/symphony/elixir/test/symphony_elixir/dsl/interpreter_test.exs b/packages/symphony/elixir/test/symphony_elixir/dsl/interpreter_test.exs
new file mode 100644
index 000000000..0f9fb966c
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/dsl/interpreter_test.exs
@@ -0,0 +1,455 @@
+defmodule SymphonyElixir.DSL.InterpreterTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.DSL.Interpreter
+  alias SymphonyElixir.DSL.Parser
+  alias SymphonyElixir.IR.Node
+
+  defp parse!(source) do
+    {:ok, ast} = Parser.parse(source)
+    ast
+  end
+
+  # Wall-clock created_at/updated_at on a Node vary from one expand call to
+  # the next and sit outside the determinism contract, so comparisons project
+  # each node down to the structural fields the interpreter actually decides.
+  @structural_fields ~w(id ast_origin kind envelope prompt_ref inputs deps expansion_key state output)a
+
+  defp structural(%Node{} = node), do: Map.take(node, @structural_fields)
+
+  defp structural(nodes) when is_list(nodes), do: Enum.map(nodes, &structural/1)
+
+  describe "expand/3 effect emission" do
+    test "only effectful constructors become IR nodes; lets do not" do
+      ast =
+        parse!("""
+        workflow "w" {
+          label = "build-1"
+          run <- agent { engine: codex, model: "m", prompt: inline "go" }
+        }
+        """)
+
+      {delta, _pending, _log} = Interpreter.expand(ast, %{}, [])
+
+      assert [%Node{kind: :agent, id: "agent-0"}] = delta
+    end
+
+    test "agent node carries the envelope spec map and prompt ref" do
+      ast =
+        parse!("""
+        workflow "w" {
+          run <- agent {
+            engine: codex
+            model: "m"
+            permissions: read_only
+            prompt: skill "inspect" { repo: "symphony" }
+          }
+        }
+        """)
+
+      {[node], _pending, _log} = Interpreter.expand(ast, %{}, [])
+
+      assert node.envelope == %{"engine" => "codex", "model" => "m", "permissions" => "read_only"}
+      assert {:skill, "inspect", %{"repo" => "symphony"}} = node.prompt_ref
+      assert node.inputs["repo"] == {:literal, "symphony"}
+    end
+  end
+
+  describe "derived deps and parallelism" do
+    test "a downstream read of a binding becomes a node edge" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          b <- agent { engine: codex, model: "m", prompt: skill "next" { ctx: ${a.area} } }
+        }
+        """)
+
+      {delta, _pending, _log} = Interpreter.expand(ast, %{}, [])
+      by_id = Map.new(delta, &{&1.id, &1})
+
+      a = by_id["agent-0"]
+      b = by_id["agent-1"]
+
+      assert a.deps == []
+      assert b.inputs["ctx"] == {:node, "agent-0", ["area"]}
+      assert b.deps == ["agent-0"]
+    end
+
+    test "two data-independent binds have no edge and run in parallel" do
+      {nodes, _pending, _log} =
+        """
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "one" }
+          b <- agent { engine: claude, model: "haiku", prompt: inline "two" }
+        }
+        """
+        |> parse!()
+        |> Interpreter.expand(%{}, [])
+
+      refute Enum.any?(nodes, &(&1.deps != []))
+      assert nodes |> Enum.map(& &1.id) |> Enum.sort() == ["agent-0", "agent-1"]
+    end
+  end
+
+  describe "when gate" do
+    test "emits a placeholder while the gating input is unresolved" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "do" }
+          when ${a.changed} {
+            n <- exec "./n.sh"
+          }
+        }
+        """)
+
+      {delta, pending, log} = Interpreter.expand(ast, %{}, [])
+      by_kind = Enum.group_by(delta, & &1.kind)
+
+      assert [gate] = by_kind[:gate]
+      assert gate.inputs["gate"] == {:node, "agent-0", ["changed"]}
+      assert gate.deps == ["agent-0"]
+      # the body exec is not emitted yet
+      assert by_kind[:exec] == nil
+      assert {:awaiting, "when-1", ["agent-0"]} in pending
+      assert log == []
+    end
+
+    test "expands the body only when the input resolves truthy" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "do" }
+          when ${a.changed} {
+            n <- exec "./n.sh"
+          }
+        }
+        """)
+
+      known = %{"agent-0" => %{"changed" => true}}
+      {delta, _pending, log} = Interpreter.expand(ast, known, [])
+
+      assert Enum.any?(delta, &(&1.kind == :exec))
+      assert [%{observed: %{gate: :when, opened: true}}] = log
+    end
+
+    test "skips the body when the input resolves falsy" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "do" }
+          when ${a.changed} {
+            n <- exec "./n.sh"
+          }
+        }
+        """)
+
+      known = %{"agent-0" => %{"changed" => false}}
+      {delta, _pending, log} = Interpreter.expand(ast, known, [])
+
+      refute Enum.any?(delta, &(&1.kind == :exec))
+      assert [%{observed: %{gate: :when, opened: false}}] = log
+    end
+  end
+
+  describe "every_nth gate" do
+    # `every n` is one tick per run, evaluated at materialize against an
+    # empty log. A run drives `expand_dynamic/1` several times (init, then
+    # after each node success), re-feeding the grown log, so a re-pass must
+    # reproduce the materialize decision and never advance the tick. The
+    # cross-run tick advance is a separate concern (a future run would seed
+    # its counter from the prior run's terminal log); the runtime today
+    # never carries one run's log into the next run's materialize.
+    test "evaluates one tick per run at the empty-log materialize pass" do
+      ast =
+        parse!("""
+        workflow "w" {
+          every 3 of gc {
+            run <- exec "./gc.sh"
+          }
+        }
+        """)
+
+      # tick 1 (every 3): empty log -> skip.
+      {d1, _p1, _log1} = Interpreter.expand(ast, %{}, [])
+      refute Enum.any?(d1, &(&1.kind == :exec))
+
+      one =
+        parse!("""
+        workflow "w" {
+          every 1 of gc {
+            run <- exec "./gc.sh"
+          }
+        }
+        """)
+
+      # tick 1 (every 1): fires immediately on the materialize pass.
+      {d2, _p2, _log2} = Interpreter.expand(one, %{}, [])
+      assert Enum.any?(d2, &(&1.kind == :exec))
+    end
+
+    test "re-expansion within a run reproduces the tick, never advancing it" do
+      ast =
+        parse!("""
+        workflow "w" {
+          every 2 of c {
+            run <- exec "./x.sh"
+          }
+        }
+        """)
+
+      # The first (materialize) pass against an empty log skips (tick 1 of 2)
+      # and records the decision in the log.
+      {d0, _p0, log_after_skip} = Interpreter.expand(ast, %{}, [])
+      refute Enum.any?(d0, &(&1.kind == :exec))
+
+      # Re-feeding that log (what `expand_dynamic/1` does on every later
+      # pass) reproduces the recorded skip rather than advancing to a fire,
+      # so the live graph and a cold replay stay identical. This is the
+      # replay invariant from `IR.RunGraph`.
+      {a, _, log_a} = Interpreter.expand(ast, %{}, log_after_skip)
+      {b, _, log_b} = Interpreter.expand(ast, %{}, log_after_skip)
+      assert structural(a) == structural(b)
+      refute Enum.any?(a, &(&1.kind == :exec))
+      # No duplicate tick event is appended on a reproduction pass.
+      assert length(log_a) == length(log_after_skip)
+      assert log_a == log_b
+    end
+
+    test "a fired tick re-emits its body idempotently on re-expansion" do
+      ast =
+        parse!("""
+        workflow "w" {
+          every 1 of c {
+            run <- exec "./x.sh"
+          }
+        }
+        """)
+
+      # tick 1 fires; the body exec is emitted and one fire event is logged.
+      {d0, _p0, log0} = Interpreter.expand(ast, %{}, [])
+      assert Enum.any?(d0, &(&1.kind == :exec))
+
+      # A re-pass re-emits the same body (so the materializer re-derives and
+      # merges it) without appending a second fire event.
+      {d1, _p1, log1} = Interpreter.expand(ast, %{}, log0)
+      assert Enum.any?(d1, &(&1.kind == :exec))
+      assert structural(d0) == structural(d1)
+      assert length(log1) == length(log0)
+    end
+  end
+
+  describe "map fan-out" do
+    test "emits one keyed child per element once the list resolves" do
+      ast =
+        parse!("""
+        workflow "w" {
+          seed <- agent { engine: codex, model: "m", prompt: inline "list repos" }
+          map ${seed.repos} as repo {
+            child <- exec "./audit.sh" { target: ${repo} }
+          }
+        }
+        """)
+
+      # unresolved: a single placeholder
+      {d0, pending, _l0} = Interpreter.expand(ast, %{}, [])
+      assert Enum.any?(d0, &(&1.kind == :map_fanout))
+      assert {:awaiting, "map-1", ["agent-0"]} in pending
+
+      # resolved: one exec per element, each binding the element literally
+      known = %{"agent-0" => %{"repos" => ["alpha", "beta"]}}
+      {d1, _p1, log} = Interpreter.expand(ast, known, [])
+
+      execs = Enum.filter(d1, &(&1.kind == :exec))
+      assert length(execs) == 2
+
+      targets = execs |> Enum.map(& &1.inputs["target"]) |> Enum.sort()
+      assert targets == [{:literal, "alpha"}, {:literal, "beta"}]
+
+      assert [%{observed: %{gate: :map, count: 2}}] = log
+      # children carry distinct ids derived from the fan-out key
+      assert execs |> Enum.map(& &1.id) |> Enum.uniq() |> length() == 2
+    end
+
+    test "an empty list resolves to zero children and no placeholder" do
+      ast =
+        parse!("""
+        workflow "w" {
+          seed <- agent { engine: codex, model: "m", prompt: inline "list repos" }
+          map ${seed.repos} as repo {
+            child <- exec "./audit.sh" { target: ${repo} }
+          }
+        }
+        """)
+
+      known = %{"agent-0" => %{"repos" => []}}
+      {delta, pending, log} = Interpreter.expand(ast, known, [])
+
+      # No body child and no leftover placeholder: an empty fan-out emits
+      # nothing for the materializer to schedule. The count event is still
+      # logged so a replay reproduces the zero-child decision.
+      refute Enum.any?(delta, &(&1.kind in [:exec, :map_fanout]))
+      assert pending == []
+      assert [%{observed: %{gate: :map, count: 0}}] = log
+    end
+
+    test "a non-list over folds to zero children rather than crashing" do
+      ast =
+        parse!("""
+        workflow "w" {
+          seed <- agent { engine: codex, model: "m", prompt: inline "scalar" }
+          map ${seed.value} as it {
+            child <- exec "./n.sh" { v: ${it} }
+          }
+        }
+        """)
+
+      # A scalar where a list is expected is a typed mismatch surfaced as an
+      # empty fan-out, not an exception in the expand pass.
+      known = %{"agent-0" => %{"value" => "not-a-list"}}
+      {delta, _pending, log} = Interpreter.expand(ast, known, [])
+
+      refute Enum.any?(delta, &(&1.kind in [:exec, :map_fanout]))
+      assert [%{observed: %{gate: :map, over: :not_a_list}}] = log
+    end
+
+    test "re-expanding a fanned-out map re-emits identical children for an idempotent merge" do
+      ast =
+        parse!("""
+        workflow "w" {
+          seed <- agent { engine: codex, model: "m", prompt: inline "list repos" }
+          map ${seed.repos} as repo {
+            child <- exec "./audit.sh" { target: ${repo} }
+          }
+        }
+        """)
+
+      known = %{"agent-0" => %{"repos" => ["alpha", "beta"]}}
+
+      # The fan-out is a pure function of the resolved list, so two passes
+      # against the same known outputs emit byte-identical children. This is
+      # what lets the materializer re-emit on every `expand_dynamic` pass and
+      # merge by stable id without duplicating a child.
+      {d1, p1, l1} = Interpreter.expand(ast, known, [])
+      {d2, p2, l2} = Interpreter.expand(ast, known, [])
+      assert structural(d1) == structural(d2)
+      assert p1 == p2
+      assert l1 == l2
+    end
+  end
+
+  describe "determinism invariant" do
+    test "expand is a pure function of its inputs" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "go" }
+          when ${a.ok} {
+            b <- exec "./b.sh"
+          }
+          map ${a.items} as it {
+            c <- exec "./c.sh" { v: ${it} }
+          }
+        }
+        """)
+      # NOTE(review): "a" => nil is keyed by a binding name, not a node id; confirm it is intentional.
+      known = %{"a" => nil, "agent-0" => %{"ok" => true, "items" => [1, 2, 3]}}
+
+      {d1, p1, l1} = Interpreter.expand(ast, known, [])
+      {d2, p2, l2} = Interpreter.expand(ast, known, [])
+
+      assert structural(d1) == structural(d2)
+      assert p1 == p2
+      assert l1 == l2
+    end
+  end
+
+  describe "bound gates" do
+    test "a bound when gate binds the resolved body node so downstream reads it" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "do" }
+          changed <- when ${a.flag} {
+            n <- exec "./n.sh"
+          }
+          post <- agent { engine: codex, model: "m", prompt: skill "s" { from: ${changed.path} } }
+        }
+        """)
+
+      known = %{"agent-0" => %{"flag" => true}}
+      {delta, _pending, _log} = Interpreter.expand(ast, known, [])
+
+      exec = Enum.find(delta, &(&1.kind == :exec))
+      post = Enum.find(delta, &(&1.kind == :agent and &1.id != "agent-0"))
+
+      assert exec, "the gate body exec should be emitted on the firing pass"
+      # The gate's binding (`changed`) must point at the body node, not the
+      # vanished placeholder, so the downstream edge resolves.
+      assert post.inputs["from"] == {:node, exec.id, ["path"]}
+      assert exec.id in post.deps
+    end
+
+    test "a bound every_nth gate binds the body node on the firing tick" do
+      ast =
+        parse!("""
+        workflow "w" {
+          tick <- every 1 of c {
+            n <- exec "./n.sh"
+          }
+          post <- agent { engine: codex, model: "m", prompt: skill "s" { from: ${tick.path} } }
+        }
+        """)
+
+      {delta, _pending, _log} = Interpreter.expand(ast, %{}, [])
+
+      exec = Enum.find(delta, &(&1.kind == :exec))
+      post = Enum.find(delta, &(&1.kind == :agent))
+
+      assert exec
+      assert post.inputs["from"] == {:node, exec.id, ["path"]}
+      assert exec.id in post.deps
+    end
+
+    test "the gate placeholder is gone once the when input resolves" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "do" }
+          when ${a.changed} {
+            n <- exec "./n.sh"
+          }
+        }
+        """)
+
+      known = %{"agent-0" => %{"changed" => true}}
+      {delta, _pending, _log} = Interpreter.expand(ast, known, [])
+
+      refute Enum.any?(delta, &(&1.kind == :gate))
+      assert Enum.any?(delta, &(&1.kind == :exec))
+    end
+  end
+
+  describe "deferred inline prompts" do
+    test "an inline prompt over an unresolved output defers, then folds to text" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          b <- agent { engine: codex, model: "m", prompt: inline "use ${a.result} now" }
+        }
+        """)
+
+      {d0, pending, _l0} = Interpreter.expand(ast, %{}, [])
+      b0 = Enum.find(d0, &(&1.id == "agent-1"))
+      assert b0.prompt_ref == {:inline, nil}
+      assert {:awaiting, "agent-1", ["agent-0"]} in pending
+
+      known = %{"agent-0" => %{"result" => "X"}}
+      {d1, _p1, _l1} = Interpreter.expand(ast, known, [])
+      b1 = Enum.find(d1, &(&1.id == "agent-1"))
+      assert b1.prompt_ref == {:inline, "use X now"}
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/dsl/parser_test.exs b/packages/symphony/elixir/test/symphony_elixir/dsl/parser_test.exs
new file mode 100644
index 000000000..0c27c897e
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/dsl/parser_test.exs
@@ -0,0 +1,195 @@
+defmodule SymphonyElixir.DSL.ParserTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.DSL.Parser
+
+  @fixture Path.join(__DIR__, "fixtures/release.sym")
+
+  describe "parse/1" do
+    test "parses the release fixture into a workflow AST" do
+      source = File.read!(@fixture)
+      assert {:ok, ast} = Parser.parse(source)
+
+      assert ast.kind == :workflow
+      assert ast.name == "release"
+      # three agent binds plus one when gate
+      assert length(ast.statements) == 4
+    end
+
+    test "binds introduce names and effects carry envelope and prompt" do
+      source = """
+      workflow "one" {
+        session <- agent {
+          engine: codex
+          model: "gpt-5.3-codex"
+          permissions: workspace_write
+          prompt: skill "inspect" { repo: "symphony" }
+        }
+      }
+      """
+
+      assert {:ok, ast} = Parser.parse(source)
+      assert [{:bind, "session", agent}] = ast.statements
+      assert agent.kind == :agent
+      assert agent.envelope == %{"engine" => "codex", "model" => "gpt-5.3-codex", "permissions" => "workspace_write"}
+      assert {:skill, "inspect", %{"repo" => {:literal, "symphony"}}} = agent.prompt
+    end
+
+    test "inline prompt interpolation lowers to a field read over a binding" do
+      source = """
+      workflow "two" {
+        a <- agent { engine: codex, model: "m", prompt: inline "x" }
+        b <- agent { engine: codex, model: "m", prompt: inline "use ${a.area} now" }
+      }
+      """
+
+      assert {:ok, ast} = Parser.parse(source)
+      assert [_a, {:bind, "b", agent_b}] = ast.statements
+      assert {:inline, {:concat, parts}} = agent_b.prompt
+      assert {:literal, "use "} = Enum.at(parts, 0)
+      assert {:field, {:var, "a"}, ["area"]} = Enum.at(parts, 1)
+      assert {:literal, " now"} = Enum.at(parts, 2)
+    end
+
+    test "every and map and exec parse with their combinator shape" do
+      source = """
+      workflow "combos" {
+        every 3 of gc_counter {
+          gc <- exec "./gc.sh" timeout 60
+        }
+
+        map ${seed.repos} as repo {
+          child <- subrun "audit.sym" { target: ${repo} }
+        }
+      }
+      """
+
+      assert {:ok, ast} = Parser.parse(source)
+      assert [every, map] = ast.statements
+      assert every.kind == :every_nth
+      assert every.n == 3
+      assert every.counter == "gc_counter"
+      assert {:bind, "gc", %{kind: :exec, timeout: {:literal, 60}}} = every.body
+
+      assert map.kind == :map
+      assert map.as == "repo"
+      assert {:field, {:var, "seed"}, ["repos"]} = map.over
+      assert {:bind, "child", %{kind: :subrun}} = map.body
+    end
+
+    test "diagnostics carry a 1-based line and column" do
+      source = """
+      workflow "bad" {
+        x <- agent {
+          engine: codex
+          model: "m"
+        }
+        oops
+      }
+      """
+
+      assert {:error, diag} = Parser.parse(source)
+      assert is_binary(diag.message)
+      assert is_integer(diag.line) and diag.line >= 1
+      assert is_integer(diag.column) and diag.column >= 1
+    end
+
+    test "the diagnostic carries the file name a caller passes" do
+      source = ~s(workflow "bad" { oops })
+
+      assert {:error, diag} = Parser.parse(source, file: "bad.sym")
+      assert diag.file == "bad.sym"
+
+      # An anonymous string parse has no file.
+      assert {:error, anon} = Parser.parse(source)
+      assert anon.file == nil
+    end
+
+    test "a tokenizer error also carries the caller's file name" do
+      # The unterminated string fails in the lexer, before a parse state
+      # exists; the file still lands on the diagnostic.
+      source = ~s(workflow "u" {\n  x <- agent { engine: codex, model: "oops\n}\n)
+
+      assert {:error, diag} = Parser.parse(source, file: "u.sym")
+      assert diag.file == "u.sym"
+      assert diag.message =~ "string"
+    end
+
+    test "a missing prompt is a load error" do
+      source = """
+      workflow "np" {
+        x <- agent { engine: codex, model: "m" }
+      }
+      """
+
+      assert {:error, diag} = Parser.parse(source)
+      assert diag.message =~ "prompt"
+    end
+
+    test "an unterminated string reports the open position" do
+      source = ~s(workflow "u" {\n  x <- agent { engine: codex, model: "oops\n}\n)
+      assert {:error, diag} = Parser.parse(source)
+      assert diag.message =~ "string"
+      assert diag.line == 2
+    end
+  end
+
+  describe "trigger header" do
+    defp parse!(source) do
+      {:ok, ast} = Parser.parse(source)
+      ast
+    end
+
+    test "a workflow with no `on` clause has a nil trigger" do
+      assert parse!(~s(workflow "w" { a <- agent { engine: codex, model: "m", prompt: inline "go" } })).trigger ==
+               nil
+    end
+
+    test "manual" do
+      assert parse!(~s(workflow "w" on manual { a <- exec "./x.sh" })).trigger == %{kind: :manual}
+    end
+
+    test "linear normalizes the label" do
+      assert parse!(~s(workflow "w" on linear label "[Sym] Implement" { a <- exec "./x.sh" })).trigger ==
+               %{kind: :linear, label: "[sym] implement"}
+    end
+
+    test "cron carries schedule, timezone, and input" do
+      source = ~s|workflow "w" on cron "0 9 * * *" tz "UTC" input { lookback_hours: 5 } { a <- exec "./x.sh" }|
+
+      assert parse!(source).trigger == %{
+               kind: :cron,
+               schedule: "0 9 * * *",
+               timezone: "UTC",
+               input: %{"lookback_hours" => 5}
+             }
+    end
+
+    test "cron defaults the timezone and input when omitted" do
+      assert parse!(~s|workflow "w" on cron "* * * * *" { a <- exec "./x.sh" }|).trigger == %{
+               kind: :cron,
+               schedule: "* * * * *",
+               timezone: "UTC",
+               input: %{}
+             }
+    end
+
+    test "slack_huddle and slack_mention map to the runtime kinds" do
+      assert parse!(~s(workflow "w" on slack_huddle channel "focus" { a <- exec "./x.sh" })).trigger ==
+               %{kind: :slack_huddle_completed, channel: "focus"}
+
+      assert parse!(~s(workflow "w" on slack_mention channel "#playbook" { a <- exec "./x.sh" })).trigger ==
+               %{kind: :slack_app_mention, channel: "#playbook"}
+    end
+
+    test "github_pr_label carries repo and normalized label" do
+      assert parse!(~s(workflow "w" on github_pr_label repo "indexable-inc/ix" label "Review-Loop" { a <- exec "./x.sh" })).trigger ==
+               %{kind: :github_pr_label, repo: "indexable-inc/ix", label: "review-loop"}
+    end
+
+    test "an unknown trigger kind is a diagnostic" do
+      assert {:error, diag} = Parser.parse(~s(workflow "w" on telepathy { a <- exec "./x.sh" }))
+      assert diag.message =~ "trigger kind"
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/dsl/schema_test.exs b/packages/symphony/elixir/test/symphony_elixir/dsl/schema_test.exs
new file mode 100644
index 000000000..02f0cd511
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/dsl/schema_test.exs
@@ -0,0 +1,61 @@
+defmodule SymphonyElixir.DSL.SchemaTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.DSL.{AST, Parser, Schema}
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.Node
+
+  describe "to_map/0" do
+    test "each field is the owner's accessor verbatim" do
+      # The point of the schema is that it does not restate the enums: it
+      # reads each owner's single source of truth. Asserting equality here
+      # means adding a value at the owner flows through with no schema edit
+      # and no UI edit.
+      schema = Schema.to_map()
+
+      assert schema.engines == Envelope.engines()
+      assert schema.efforts == Envelope.efforts()
+      assert schema.permissions == Envelope.permission_levels()
+      assert schema.locations == Envelope.locations()
+      assert schema.node_kinds == Node.kinds()
+      assert schema.node_states == Node.states()
+      assert schema.effect_kinds == AST.effect_kinds()
+      assert schema.trigger_kinds == Parser.trigger_kinds()
+    end
+
+    test "every value is a list of atoms, so it encodes to JSON as strings" do
+      schema = Schema.to_map()
+
+      for {_key, values} <- schema do
+        assert is_list(values)
+        assert Enum.all?(values, &is_atom/1)
+      end
+
+      assert {:ok, _json} = Jason.encode(schema)
+    end
+  end
+
+  describe "trigger_kinds/0" do
+    test "every advertised trigger kind parses through an `on` clause" do
+      # Guard against the accessor drifting from the parser's dispatch: a
+      # kind the schema offers but the parser rejects would be a dead UI
+      # option. Each kind gets its minimal valid params.
+      params = %{
+        manual: "",
+        cron: ~s|"0 * * * *"|,
+        linear: ~s|label "ready"|,
+        slack_huddle: ~s|channel "C123"|,
+        slack_mention: ~s|channel "C123"|,
+        github_pr_label: ~s|repo "owner/name" label "ship"|
+      }
+
+      for kind <- Parser.trigger_kinds() do
+        clause = Map.fetch!(params, kind)
+        source = ~s|workflow "w" on #{kind} #{clause} { a <- exec "./x" }|
+        result = Parser.parse(source)
+        # match?/2 keeps a mismatch on the assert/2 message path instead of raising MatchError.
+        assert match?({:ok, %{trigger: %{}}}, result), "expected #{kind} to parse, got: #{inspect(result)}"
+      end
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/engine/client_test.exs b/packages/symphony/elixir/test/symphony_elixir/engine/client_test.exs
new file mode 100644
index 000000000..4e3cee69e
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/engine/client_test.exs
@@ -0,0 +1,278 @@
+defmodule SymphonyElixir.Engine.ClientTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Engine.{Client, Envelope}
+
+  describe "request_body/2" do
+    test "lowers a codex envelope to the camelCase TurnRequest wire shape" do
+      {:ok, env} =
+        Envelope.validate(%Envelope{
+          engine: :codex,
+          model: "gpt-5.3-codex",
+          effort: :high,
+          permissions: :workspace_write,
+          location: :local
+        })
+
+      assert {:ok, body} =
+               Client.request_body(env, %{
+                 prompt: "write FOO to ./hello.txt and stop.",
+                 cwd: "/workspace",
+                 run_id: "run_1",
+                 node_id: "n0"
+               })
+
+      assert body == %{
+               "engine" => "codex",
+               "model" => "gpt-5.3-codex",
+               "effort" => "high",
+               "permissions" => "workspace_write",
+               "cwd" => "/workspace",
+               "prompt" => "write FOO to ./hello.txt and stop.",
+               "tools" => [],
+               "runId" => "run_1",
+               "nodeId" => "n0"
+             }
+    end
+
+    test "omits effort when the envelope leaves it nil" do
+      {:ok, env} =
+        Envelope.validate(%Envelope{engine: :claude, model: "haiku", permissions: :danger_full_access, location: :local})
+
+      assert {:ok, body} = Client.request_body(env, %{prompt: "hi", cwd: "/w"})
+      refute Map.has_key?(body, "effort")
+      assert body["engine"] == "claude"
+      assert body["permissions"] == "danger_full_access"
+    end
+
+    test "drops nil correlation ids rather than sending null" do
+      {:ok, env} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: :local})
+      assert {:ok, body} = Client.request_body(env, %{prompt: "hi", cwd: "/w"})
+      refute Map.has_key?(body, "runId")
+      refute Map.has_key?(body, "nodeId")
+    end
+
+    test "rejects a turn missing the prompt or cwd" do
+      {:ok, env} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: :local})
+      assert {:error, :missing_prompt} = Client.request_body(env, %{cwd: "/w"})
+      assert {:error, :missing_cwd} = Client.request_body(env, %{prompt: "hi"})
+    end
+  end
+
+  describe "submit_turn/3 location resolution" do
+    test "a host location resolves to the run's per-run room-server from the placement module" do
+      test_pid = self()
+
+      # The run's `Runtime.Placement` provisioned a host room-server (a
+      # systemd-run unit) and registered its loopback URL under run_id. The
+      # client reads it back the same way it resolves :ixvm; no real unit.
+      defmodule HostPlacement do
+        def base_url("run_host"), do: {:ok, "http://127.0.0.1:41234"}
+        def base_url(_), do: :error
+      end
+
+      {:ok, host} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: {:host, "box"}})
+
+      plug = fn conn ->
+        send(test_pid, {:hit, conn.host, conn.port})
+        respond(conn, %{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 0})
+      end
+
+      assert {:ok, _} =
+               Client.submit_turn(host, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://ignored.default",
+                 run_id: "run_host",
+                 placement: HostPlacement,
+                 req_options: [plug: plug]
+               )
+
+      assert_received {:hit, "127.0.0.1", 41_234}
+    end
+
+    test "a host location with no acquired placement fails loudly rather than routing to the default" do
+      defmodule UnresolvedHostPlacement do
+        def base_url(_run_id), do: :error
+      end
+
+      {:ok, host} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: {:host, "box"}})
+
+      assert {:error, {:unresolved_location, {:host, "box"}}} =
+               Client.submit_turn(host, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://ignored.default",
+                 run_id: "run_unknown",
+                 placement: UnresolvedHostPlacement
+               )
+    end
+
+    test "a host location without a run_id is unresolved (no context to look up)" do
+      {:ok, host} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: {:host, "box"}})
+
+      assert {:error, {:unresolved_location, {:host, "box"}}} =
+               Client.submit_turn(host, %{prompt: "hi", cwd: "/w"}, room_server_url: "http://ignored.default")
+    end
+
+    test "an ixvm location resolves to the run's per-run room-server from the placement module" do
+      test_pid = self()
+
+      # Stub the placement lookup: the run's `Runtime.Placement` would have
+      # provisioned this URL before the first agent turn. No real VM is
+      # created; the client just reads the resolved per-run base URL.
+      defmodule StubPlacement do
+        def base_url("run_42"), do: {:ok, "http://run-42-vm.test:8080"}
+        def base_url(_), do: :error
+      end
+
+      {:ok, ixvm} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: :ixvm})
+
+      plug = fn conn ->
+        send(test_pid, {:hit, conn.host, conn.port})
+        respond(conn, %{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 0})
+      end
+
+      assert {:ok, _} =
+               Client.submit_turn(ixvm, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://ignored.default",
+                 run_id: "run_42",
+                 placement: StubPlacement,
+                 req_options: [plug: plug]
+               )
+
+      assert_received {:hit, "run-42-vm.test", 8080}
+    end
+
+    test "an ixvm location with no acquired placement fails loudly rather than routing to the default" do
+      defmodule UnresolvedPlacement do
+        def base_url(_run_id), do: :error
+      end
+
+      {:ok, ixvm} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: :ixvm})
+
+      assert {:error, {:unresolved_location, :ixvm}} =
+               Client.submit_turn(ixvm, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://ignored.default",
+                 run_id: "run_unknown",
+                 placement: UnresolvedPlacement
+               )
+    end
+
+    test "an ixvm location without a run_id is unresolved (no context to look up)" do
+      {:ok, ixvm} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: :ixvm})
+
+      assert {:error, {:unresolved_location, :ixvm}} =
+               Client.submit_turn(ixvm, %{prompt: "hi", cwd: "/w"}, room_server_url: "http://ignored.default")
+    end
+
+    test "a local location with no configured url is a clear error" do
+      {:ok, env} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: :local})
+      assert {:error, :missing_room_server_url} = Client.submit_turn(env, %{prompt: "hi", cwd: "/w"})
+    end
+  end
+
+  describe "submit_turn/3 against a stub room-server" do
+    test "maps an ok outcome to {:ok, %{thread_id, event_count}}" do
+      plug = stub_plug(%{"threadId" => "thread_abc", "outcome" => %{"kind" => "ok"}, "eventCount" => 4})
+      {:ok, env} = Envelope.validate(%Envelope{engine: :codex, model: "gpt-5.3-codex", location: :local})
+
+      assert {:ok, %{thread_id: "thread_abc", event_count: 4}} =
+               Client.submit_turn(env, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://room.test",
+                 req_options: [plug: plug]
+               )
+    end
+
+    test "lowers the terminal usage totals to the IR.Attempt cost shape" do
+      plug =
+        stub_plug(%{
+          "threadId" => "thread_abc",
+          "outcome" => %{"kind" => "ok"},
+          "eventCount" => 4,
+          "usage" => %{
+            "tokensIn" => 1200,
+            "tokensOut" => 340,
+            "cacheRead" => 800,
+            "cacheCreation" => 64,
+            "costUsd" => 0.0123
+          }
+        })
+
+      {:ok, env} = Envelope.validate(%Envelope{engine: :codex, model: "gpt-5.3-codex", location: :local})
+
+      assert {:ok, %{cost: cost}} =
+               Client.submit_turn(env, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://room.test",
+                 req_options: [plug: plug]
+               )
+
+      assert cost == %{
+               usd: 0.0123,
+               tokens_in: 1200,
+               tokens_out: 340,
+               cache_read: 800,
+               cache_creation: 64
+             }
+    end
+
+    test "a response without usage records an unknown (nil) cost" do
+      plug = stub_plug(%{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 0})
+      {:ok, env} = Envelope.validate(%Envelope{engine: :codex, model: "gpt-5.3-codex", location: :local})
+
+      assert {:ok, %{cost: nil}} =
+               Client.submit_turn(env, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://room.test",
+                 req_options: [plug: plug]
+               )
+    end
+
+    test "maps an error outcome to {:error, {:turn_error, message, thread_id}}" do
+      plug =
+        stub_plug(%{
+          "threadId" => "thread_err",
+          "outcome" => %{"kind" => "error", "message" => "model refused"},
+          "eventCount" => 1
+        })
+
+      {:ok, env} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: {:room, "http://room.test"}})
+
+      assert {:error, {:turn_error, "model refused", "thread_err"}} =
+               Client.submit_turn(env, %{prompt: "hi", cwd: "/w"}, req_options: [plug: plug])
+    end
+
+    test "an explicit {:room, url} location overrides the default url" do
+      test_pid = self()
+
+      plug = fn conn ->
+        send(test_pid, {:hit, conn.host, conn.port})
+        respond(conn, %{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 0})
+      end
+
+      {:ok, env} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: {:room, "http://chosen.test:9999"}})
+
+      assert {:ok, _} =
+               Client.submit_turn(env, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://default.test",
+                 req_options: [plug: plug]
+               )
+
+      assert_received {:hit, "chosen.test", 9999}
+    end
+
+    test "a non-2xx status surfaces as an agent_turn_status error" do
+      plug = fn conn -> Plug.Conn.send_resp(conn, 503, "engine claude not configured") end
+      {:ok, env} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: :local})
+
+      assert {:error, {:agent_turn_status, 503, _}} =
+               Client.submit_turn(env, %{prompt: "hi", cwd: "/w"},
+                 room_server_url: "http://room.test",
+                 req_options: [plug: plug]
+               )
+    end
+  end
+
+  defp stub_plug(json), do: fn conn -> respond(conn, json) end
+
+  defp respond(conn, json) do
+    conn
+    |> Plug.Conn.put_resp_content_type("application/json")
+    |> Plug.Conn.send_resp(200, Jason.encode!(json))
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/engine/contract_fixtures_test.exs b/packages/symphony/elixir/test/symphony_elixir/engine/contract_fixtures_test.exs
new file mode 100644
index 000000000..2de999602
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/engine/contract_fixtures_test.exs
@@ -0,0 +1,85 @@
+defmodule SymphonyElixir.Engine.ContractFixturesTest do
+  @moduledoc """
+  The Elixir half of the cross-language contract guard (see
+  `docs/engine-contract.md`). It asserts that `Engine.Client.request_body/2`
+  reproduces the shared `contracts/fixtures/turn_request.json` shape the Rust
+  room-server parses, so a field rename on either side fails a check rather
+  than drifting silently at runtime.
+  """
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Engine.{Client, Envelope}
+
+  # contracts/ sits at the package root (packages/symphony), four levels up from this file's directory.
+  @fixtures Path.expand(Path.join([__DIR__, "..", "..", "..", "..", "contracts", "fixtures"]))
+
+  defp fixture(name) do
+    @fixtures |> Path.join(name) |> File.read!() |> Jason.decode!()
+  end
+
+  test "request_body/2 reproduces the shared turn_request fixture" do
+    expected = fixture("turn_request.json")
+
+    {:ok, envelope} =
+      Envelope.from_map(%{
+        "engine" => expected["engine"],
+        "model" => expected["model"],
+        "effort" => expected["effort"],
+        "permissions" => expected["permissions"],
+        "location" => "local"
+      })
+
+    turn = %{
+      prompt: expected["prompt"],
+      cwd: expected["cwd"],
+      tools: expected["tools"],
+      run_id: expected["runId"],
+      node_id: expected["nodeId"]
+    }
+
+    assert {:ok, body} = Client.request_body(envelope, turn)
+    # Compare on the wire shape (string keys, JSON scalars), not atom keys.
+    assert Jason.decode!(Jason.encode!(body)) == expected
+  end
+
+  test "submit_turn maps the shared agent_turn_response fixture's usage to cost" do
+    expected = fixture("agent_turn_response.json")
+    usage = expected["usage"]
+
+    plug = fn conn ->
+      conn
+      |> Plug.Conn.put_resp_content_type("application/json")
+      |> Plug.Conn.send_resp(200, Jason.encode!(expected))
+    end
+
+    {:ok, env} =
+      Envelope.from_map(%{"engine" => "codex", "model" => "gpt-5.3-codex", "location" => "local"})
+
+    assert {:ok, %{thread_id: thread_id, event_count: event_count, cost: cost}} =
+             Client.submit_turn(env, %{prompt: "hi", cwd: "/w"},
+               room_server_url: "http://room.test",
+               req_options: [plug: plug]
+             )
+
+    assert thread_id == expected["threadId"]
+    assert event_count == expected["eventCount"]
+
+    assert cost == %{
+             usd: usage["costUsd"],
+             tokens_in: usage["tokensIn"],
+             tokens_out: usage["tokensOut"],
+             cache_read: usage["cacheRead"],
+             cache_creation: usage["cacheCreation"]
+           }
+  end
+
+  test "an unset effort is omitted from the wire shape" do
+    {:ok, envelope} =
+      Envelope.from_map(%{"engine" => "codex", "model" => "gpt-5.3-codex", "location" => "local"})
+
+    turn = %{prompt: "go", cwd: "/w", tools: [], run_id: "r", node_id: "n"}
+
+    assert {:ok, body} = Client.request_body(envelope, turn)
+    refute Map.has_key?(body, "effort")
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/engine/envelope_test.exs b/packages/symphony/elixir/test/symphony_elixir/engine/envelope_test.exs
new file mode 100644
index 000000000..4d90e0ada
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/engine/envelope_test.exs
@@ -0,0 +1,73 @@
+defmodule SymphonyElixir.Engine.EnvelopeTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Engine.Envelope
+
+  describe "from_map/1" do
+    test "builds a valid codex envelope and defaults permissions and location" do
+      assert {:ok, env} =
+               Envelope.from_map(%{"engine" => "codex", "model" => "gpt-5.3-codex", "effort" => "medium"})
+
+      assert env.engine == :codex
+      assert env.model == "gpt-5.3-codex"
+      assert env.effort == :medium
+      assert env.permissions == :workspace_write
+      assert env.location == :local
+    end
+
+    test "builds a valid claude envelope" do
+      assert {:ok, env} =
+               Envelope.from_map(%{
+                 "engine" => "claude",
+                 "model" => "claude-opus-4-8",
+                 "permissions" => "danger_full_access",
+                 "location" => "local"
+               })
+
+      assert env.engine == :claude
+      assert env.permissions == :danger_full_access
+    end
+
+    test "parses host and room locations" do
+      assert {:ok, %{location: {:host, "hari"}}} =
+               Envelope.from_map(%{"engine" => "codex", "model" => "gpt-5.3-codex", "location" => %{"host" => "hari"}})
+
+      assert {:ok, %{location: {:room, "https://r"}}} =
+               Envelope.from_map(%{"engine" => "codex", "model" => "gpt-5.3-codex", "location" => %{"room" => "https://r"}})
+    end
+
+    test "rejects a claude model under engine: codex" do
+      assert {:error, {:engine_model_mismatch, :codex, "opus"}} =
+               Envelope.from_map(%{"engine" => "codex", "model" => "opus"})
+    end
+
+    test "rejects a non-claude model under engine: claude" do
+      assert {:error, {:engine_model_mismatch, :claude, "gpt-5.3-codex"}} =
+               Envelope.from_map(%{"engine" => "claude", "model" => "gpt-5.3-codex"})
+    end
+
+    test "rejects unknown keys instead of silently ignoring them" do
+      assert {:error, {:unknown_envelope_keys, ["sandbox"]}} =
+               Envelope.from_map(%{"engine" => "claude", "model" => "opus", "sandbox" => "workspace-write"})
+    end
+
+    test "rejects an out-of-range effort" do
+      assert {:error, {:invalid_effort, "ultra"}} =
+               Envelope.from_map(%{"engine" => "codex", "model" => "gpt-5.3-codex", "effort" => "ultra"})
+    end
+
+    test "requires engine and model" do
+      assert {:error, {:missing_envelope_field, "engine"}} = Envelope.from_map(%{"model" => "opus"})
+      assert {:error, {:missing_envelope_field, "model"}} = Envelope.from_map(%{"engine" => "claude"})
+    end
+  end
+
+  describe "claude_model?/1" do
+    test "matches claude prefixes and aliases" do
+      assert Envelope.claude_model?("claude-opus-4-8")
+      assert Envelope.claude_model?("opus")
+      assert Envelope.claude_model?("SONNET")
+      refute Envelope.claude_model?("gpt-5.3-codex")
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/ir/graph_test.exs b/packages/symphony/elixir/test/symphony_elixir/ir/graph_test.exs
new file mode 100644
index 000000000..1c93a67c2
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/ir/graph_test.exs
@@ -0,0 +1,142 @@
+defmodule SymphonyElixir.IR.GraphTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.IR.{Graph, Node, RunGraph}
+
+  defp node(id, opts) do
+    Node.new(
+      [id: id, ast_origin: {:test, id}, kind: :exec, inputs: Keyword.get(opts, :inputs, %{})] ++
+        Keyword.take(opts, [:state])
+    )
+  end
+
+  defp graph(nodes) do
+    RunGraph.new("run-1", "hash", nil) |> RunGraph.put_nodes(nodes)
+  end
+
+  describe "ready_nodes/1" do
+    test "a node with no deps is ready immediately" do
+      g = graph([node("a", state: :pending)])
+      assert [%Node{id: "a"}] = Graph.ready_nodes(g)
+    end
+
+    test "parallel-ready siblings are both returned" do
+      g = graph([node("a", state: :pending), node("b", state: :pending)])
+      ids = g |> Graph.ready_nodes() |> Enum.map(& &1.id)
+      assert ids == ["a", "b"]
+    end
+
+    test "a dependent is not ready until its dep succeeds" do
+      dep_input = %{"x" => {:node, "a", []}}
+      g = graph([node("a", state: :pending), node("b", state: :pending, inputs: dep_input)])
+
+      assert g |> Graph.ready_nodes() |> Enum.map(& &1.id) == ["a"]
+
+      g = Graph.apply_output(g, "a", {:ok, %{result: 1}})
+      assert g |> Graph.ready_nodes() |> Enum.map(& &1.id) == ["b"]
+    end
+
+    test "running and terminal nodes are excluded" do
+      g =
+        graph([
+          node("a", state: :running),
+          node("b", state: :succeeded),
+          node("c", state: :pending)
+        ])
+
+      assert g |> Graph.ready_nodes() |> Enum.map(& &1.id) == ["c"]
+    end
+
+    test "fan-out: two independent dependents of one parent are both ready together" do
+      inputs = %{"x" => {:node, "a", []}}
+
+      g =
+        graph([
+          node("a", state: :succeeded),
+          node("b", state: :pending, inputs: inputs),
+          node("c", state: :pending, inputs: inputs)
+        ])
+
+      assert g |> Graph.ready_nodes() |> Enum.map(& &1.id) == ["b", "c"]
+    end
+  end
+
+  describe "apply_output/3" do
+    test "success marks the node succeeded and records output" do
+      g = graph([node("a", state: :running)]) |> Graph.apply_output("a", {:ok, :done})
+      assert g.nodes["a"].state == :succeeded
+      assert g.nodes["a"].output == :done
+    end
+
+    test "failure propagates :upstream_failed to a waiting dependent" do
+      inputs = %{"x" => {:node, "a", []}}
+      g = graph([node("a", state: :running), node("b", state: :pending, inputs: inputs)])
+
+      g = Graph.apply_output(g, "a", {:error, :boom})
+
+      assert g.nodes["a"].state == :failed
+      assert g.nodes["b"].state == :upstream_failed
+    end
+
+    test "failure propagates transitively through a chain" do
+      g =
+        graph([
+          node("a", state: :running),
+          node("b", state: :pending, inputs: %{"x" => {:node, "a", []}}),
+          node("c", state: :pending, inputs: %{"y" => {:node, "b", []}})
+        ])
+
+      g = Graph.apply_output(g, "a", {:error, :boom})
+
+      assert g.nodes["b"].state == :upstream_failed
+      assert g.nodes["c"].state == :upstream_failed
+    end
+
+    test "a dependent that opts to run on failure is not propagated to" do
+      inputs = %{"x" => {:node, "a", []}, "__on_failure__" => {:literal, true}}
+      g = graph([node("a", state: :running), node("b", state: :pending, inputs: inputs)])
+
+      g = Graph.apply_output(g, "a", {:error, :boom})
+
+      assert g.nodes["b"].state == :pending
+    end
+  end
+
+  describe "reset_node/2" do
+    test "returns a terminal node to :pending and clears output" do
+      g = graph([node("a", state: :failed)])
+      g = %{g | nodes: %{"a" => %{g.nodes["a"] | output: {:error, :x}}}}
+
+      g = Graph.reset_node(g, "a")
+
+      assert g.nodes["a"].state == :pending
+      assert g.nodes["a"].output == nil
+    end
+  end
+
+  describe "finish detection" do
+    test "all_terminal? is true only when every node is terminal" do
+      refute Graph.all_terminal?(graph([node("a", state: :running)]))
+      assert Graph.all_terminal?(graph([node("a", state: :succeeded), node("b", state: :skipped)]))
+    end
+
+    test "finished_status reflects failure and success" do
+      assert Graph.finished_status(graph([node("a", state: :succeeded)])) == :succeeded
+      assert Graph.finished_status(graph([node("a", state: :failed)])) == :failed
+      assert Graph.finished_status(graph([node("a", state: :running)])) == :running
+    end
+
+    test "an empty node map is a no-op run that finishes succeeded" do
+      # A workflow whose only construct gated its body off (`when` falsy,
+      # `every n` that did not fire this tick) materializes to zero nodes.
+      # That is a completed no-op, not a run still in progress, so the
+      # runtime can finish it instead of tripping the deadlock guard.
+      assert Graph.finished_status(graph([])) == :succeeded
+
+      # The empty map stays non-terminal so the runtime never declares a run
+      # done before its first materialization; the two invariants are the
+      # deliberate pair the runtime relies on.
+      refute Graph.all_terminal?(graph([]))
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/ir/materializer_test.exs b/packages/symphony/elixir/test/symphony_elixir/ir/materializer_test.exs
new file mode 100644
index 000000000..9702af520
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/ir/materializer_test.exs
@@ -0,0 +1,296 @@
+defmodule SymphonyElixir.IR.MaterializerTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.DSL.Parser
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Graph, Materializer, RunGraph}
+
+  defp parse!(source) do
+    {:ok, ast} = Parser.parse(source)
+    ast
+  end
+
+  describe "materialize/3" do
+    test "builds a running RunGraph with the static nodes and a lowered envelope" do
+      ast =
+        parse!("""
+        workflow "w" {
+          run <- agent { engine: codex, model: "gpt-5.3-codex", permissions: workspace_write, prompt: inline "go" }
+        }
+        """)
+
+      assert {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+      assert graph.status == :running
+      assert [node] = Map.values(graph.nodes)
+      assert node.kind == :agent
+      # The raw spec map is lowered to a typed Engine.Envelope at this boundary.
+      assert %Envelope{engine: :codex, model: "gpt-5.3-codex", permissions: :workspace_write} = node.envelope
+    end
+
+    test "an invalid envelope fails the whole materialization with the node id" do
+      # A claude-looking model under engine: codex is a load error.
+      ast =
+        parse!("""
+        workflow "w" {
+          run <- agent { engine: codex, model: "claude-opus-4", prompt: inline "go" }
+        }
+        """)
+
+      assert {:error, {:invalid_envelope, "agent-0", {:engine_model_mismatch, :codex, "claude-opus-4"}}} =
+               Materializer.materialize("run_1", "hash", ast)
+    end
+  end
+
+  describe "expand_dynamic/1" do
+    test "a when-gate emits its body once the gating output is known" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          when ${a.ok} {
+            b <- agent { engine: codex, model: "m", prompt: inline "second" }
+          }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+
+      # Before a's output is known, the gate is a placeholder and the body
+      # agent node is absent (only agent-0 plus the gate exist).
+      assert Enum.any?(Map.values(graph.nodes), &(&1.kind == :gate))
+      agents_before = for {id, %{kind: :agent}} <- graph.nodes, do: id
+      assert agents_before == ["agent-0"]
+
+      # Succeed a with a truthy `ok`, then re-expand.
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"ok" => true}})
+      assert {:ok, expanded, new_ids} = Materializer.expand_dynamic(graph)
+
+      # Exactly one new agent node (the gate body) appears.
+      assert [body_id] = new_ids
+      assert expanded.nodes[body_id].kind == :agent
+      # The resolved gate placeholder is retired so it cannot deadlock the run.
+      gate = Enum.find(Map.values(expanded.nodes), &(&1.kind == :gate))
+      assert gate.state == :skipped
+    end
+
+    test "a falsey when-gate emits no body and retires the placeholder" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          when ${a.ok} {
+            b <- agent { engine: codex, model: "m", prompt: inline "second" }
+          }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"ok" => false}})
+
+      assert {:ok, expanded, new_ids} = Materializer.expand_dynamic(graph)
+      assert new_ids == []
+      refute Map.has_key?(expanded.nodes, "agent-1")
+      assert Enum.find(Map.values(expanded.nodes), &(&1.kind == :gate)).state == :skipped
+    end
+
+    test "re-expansion is idempotent: a second pass adds nothing new" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          when ${a.ok} {
+            b <- agent { engine: codex, model: "m", prompt: inline "second" }
+          }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"ok" => true}})
+
+      {:ok, once, _} = Materializer.expand_dynamic(graph)
+      {:ok, twice, second_ids} = Materializer.expand_dynamic(once)
+
+      assert second_ids == []
+      assert Map.keys(once.nodes) |> Enum.sort() == Map.keys(twice.nodes) |> Enum.sort()
+    end
+
+    test "a map fan-out emits one child per element and retires the placeholder" do
+      ast =
+        parse!("""
+        workflow "w" {
+          seed <- agent { engine: codex, model: "m", prompt: inline "list" }
+          map ${seed.repos} as repo {
+            child <- exec "./audit.sh" { target: ${repo} }
+          }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+
+      # Before the list is known the fan-out is a single placeholder and no
+      # body child exists.
+      assert Enum.any?(Map.values(graph.nodes), &(&1.kind == :map_fanout))
+      refute Enum.any?(Map.values(graph.nodes), &(&1.kind == :exec))
+
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"repos" => ["alpha", "beta", "gamma"]}})
+      assert {:ok, expanded, new_ids} = Materializer.expand_dynamic(graph)
+
+      # One exec child per element, each carrying its element literally, with
+      # distinct content-derived ids.
+      children = for {_id, %{kind: :exec} = n} <- expanded.nodes, do: n
+      assert length(children) == 3
+      assert length(new_ids) == 3
+      targets = children |> Enum.map(& &1.inputs["target"]) |> Enum.sort()
+      assert targets == [{:literal, "alpha"}, {:literal, "beta"}, {:literal, "gamma"}]
+
+      # The resolved fan-out placeholder is retired so it cannot deadlock the run.
+      assert Enum.find(Map.values(expanded.nodes), &(&1.kind == :map_fanout)).state == :skipped
+    end
+
+    test "re-expanding a fanned-out map merges idempotently, adding nothing new" do
+      ast =
+        parse!("""
+        workflow "w" {
+          seed <- agent { engine: codex, model: "m", prompt: inline "list" }
+          map ${seed.repos} as repo {
+            child <- exec "./audit.sh" { target: ${repo} }
+          }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"repos" => ["alpha", "beta"]}})
+
+      {:ok, once, first_ids} = Materializer.expand_dynamic(graph)
+      assert length(first_ids) == 2
+
+      # A second pass re-emits the same children (the interpreter re-derives
+      # them deterministically), but the merge-by-id adds nothing because the
+      # ids already exist. This pins the earlier design assumption that
+      # re-emitting children on each pass merges idempotently.
+      {:ok, twice, second_ids} = Materializer.expand_dynamic(once)
+      assert second_ids == []
+      assert Map.keys(once.nodes) |> Enum.sort() == Map.keys(twice.nodes) |> Enum.sort()
+    end
+
+    test "a map over an empty list emits no children and retires the placeholder" do
+      ast =
+        parse!("""
+        workflow "w" {
+          seed <- agent { engine: codex, model: "m", prompt: inline "list" }
+          map ${seed.repos} as repo {
+            child <- exec "./audit.sh" { target: ${repo} }
+          }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"repos" => []}})
+
+      assert {:ok, expanded, new_ids} = Materializer.expand_dynamic(graph)
+      assert new_ids == []
+      refute Enum.any?(Map.values(expanded.nodes), &(&1.kind == :exec))
+      assert Enum.find(Map.values(expanded.nodes), &(&1.kind == :map_fanout)).state == :skipped
+    end
+
+    test "a graph without a workflow AST is returned unchanged" do
+      graph = RunGraph.new("run_1", "hash", nil)
+      assert {:ok, ^graph, []} = Materializer.expand_dynamic(graph)
+    end
+
+    test "a deferred inline prompt waits on its input and folds to text once the output arrives" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          b <- agent { engine: codex, model: "m", prompt: inline "use ${a.result} now" }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+
+      # b interpolates a's output. The interpreter cannot fold the mixed
+      # literal/node concat into one input ref, so the edge arrives via the
+      # pending set; the materializer must still make b depend on a so it
+      # does not run with an unresolved prompt.
+      b = graph.nodes["agent-1"]
+      assert b.prompt_ref == {:inline, nil}
+      assert "agent-0" in b.deps
+      refute Enum.any?(Graph.ready_nodes(graph), &(&1.id == "agent-1"))
+
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"result" => "X"}})
+      assert {:ok, expanded, _ids} = Materializer.expand_dynamic(graph)
+
+      b = expanded.nodes["agent-1"]
+      assert b.prompt_ref == {:inline, "use X now"}
+      assert b.state == :pending
+      # The edge is kept for provenance even though the prompt now folds to a
+      # literal; it points at the succeeded agent-0 so b is schedulable.
+      assert "agent-0" in b.deps
+      assert Enum.any?(Graph.ready_nodes(expanded), &(&1.id == "agent-1"))
+    end
+
+    test "a deferred skill binding folds to the resolved value on re-expansion" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          b <- agent { engine: codex, model: "m", prompt: skill "next" { ctx: ${a.area} } }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+
+      # A skill binding that reads a node output already carries the edge as
+      # an input ref, so b depends on a from the first pass.
+      b = graph.nodes["agent-1"]
+      assert "agent-0" in b.deps
+      assert b.inputs["ctx"] == {:node, "agent-0", ["area"]}
+      assert {:skill, "next", %{"ctx" => unresolved}} = b.prompt_ref
+      refute unresolved == "DB"
+
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"area" => "DB"}})
+      assert {:ok, expanded, _ids} = Materializer.expand_dynamic(graph)
+
+      b = expanded.nodes["agent-1"]
+      assert b.prompt_ref == {:skill, "next", %{"ctx" => "DB"}}
+      assert b.inputs["ctx"] == {:literal, "DB"}
+    end
+
+    test "a node already running is not clobbered by re-expansion" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+          b <- agent { engine: codex, model: "m", prompt: inline "use ${a.result} now" }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+      # Force agent-0 into a live state, then re-expand: a running/terminal
+      # node keeps its state and is never replaced by the fresh expansion.
+      graph = put_in(graph.nodes["agent-0"].state, :running)
+
+      assert {:ok, expanded, new_ids} = Materializer.expand_dynamic(graph)
+      assert new_ids == []
+      assert expanded.nodes["agent-0"].state == :running
+    end
+  end
+
+  describe "known_outputs/1" do
+    test "exposes only succeeded node outputs" do
+      ast =
+        parse!("""
+        workflow "w" {
+          a <- agent { engine: codex, model: "m", prompt: inline "first" }
+        }
+        """)
+
+      {:ok, graph} = Materializer.materialize("run_1", "hash", ast)
+      assert Materializer.known_outputs(graph) == %{}
+
+      graph = Graph.apply_output(graph, "agent-0", {:ok, %{"area" => 42}})
+      assert Materializer.known_outputs(graph) == %{"agent-0" => %{"area" => 42}}
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/ir/recovery_test.exs b/packages/symphony/elixir/test/symphony_elixir/ir/recovery_test.exs
new file mode 100644
index 000000000..f402ec856
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/ir/recovery_test.exs
@@ -0,0 +1,107 @@
+defmodule SymphonyElixir.IR.RecoveryTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.IR.{Attempt, Graph, Node, RunGraph}
+  alias SymphonyElixir.Runtime.Recovery
+
+  defp node(id, opts) do
+    inputs = Keyword.get(opts, :inputs, %{})
+    overrides = Keyword.take(opts, [:state, :attempts])
+    # Only :inputs, :state and :attempts are honoured; any other opt is dropped.
+    Node.new([id: id, ast_origin: {:test, id}, kind: :agent, inputs: inputs] ++ overrides)
+  end
+
+  defp running_with_thread(id, thread_id, opts \\ []) do
+    defaults = [state: :running, attempts: [Attempt.start(1, :codex, thread_id)]]
+    node(id, Keyword.merge(defaults, opts))
+  end
+
+  defp graph(nodes), do: RunGraph.put_nodes(RunGraph.new("r", "h", {:ast, []}), nodes)
+
+  describe "replay/2" do
+    test "replaying an expansion log reproduces the same node set deterministically" do
+      root = node("root", state: :succeeded)
+      emitted = ["child-a", "child-b"]
+
+      log = RunGraph.append_expansion(graph([root]), {:fanout, "f"}, [:a, :b], emitted)
+
+      # Rebuilds one pending child per observed element of the logged fanout.
+      expand = fn {:fanout, "f"}, elements, _nodes ->
+        for element <- elements, do: node("child-#{element}", state: :pending)
+      end
+
+      first = Recovery.replay(log, expand)
+      second = Recovery.replay(log, expand)
+
+      assert Enum.sort(Map.keys(first.nodes)) == ["child-a", "child-b", "root"]
+      assert Map.keys(first.nodes) == Map.keys(second.nodes)
+    end
+
+    test "the default expander leaves a statically-materialized graph unchanged" do
+      g = graph([node("a", state: :pending), node("b", state: :pending)])
+      assert Recovery.replay(g).nodes == g.nodes
+    end
+  end
+
+  describe "reconcile/2 reattach probe" do
+    test "a :running node the engine still owns is left running" do
+      g = graph([running_with_thread("a", "t1")])
+      out = Recovery.reconcile(g, fn "t1" -> :running end)
+      assert out.nodes["a"].state == :running
+    end
+
+    test "a :running node the engine finished is harvested" do
+      g = graph([running_with_thread("a", "t1")])
+      out = Recovery.reconcile(g, fn "t1" -> {:finished, {:ok, :harvested}} end)
+      assert out.nodes["a"].state == :succeeded
+      assert out.nodes["a"].output == :harvested
+    end
+  end
+
+  describe "reconcile/2 strand policy (#90, non-idempotent safety)" do
+    test "an unknown thread with an opened thread_id is stranded, never auto-retried" do
+      # opted in but the attempt recorded a thread_id, so a side effect may
+      # have happened: route to human review, do not blind-retry.
+      g = graph([running_with_thread("a", "t1", inputs: %{"__retry__" => {:literal, true}})])
+      out = Recovery.reconcile(g, fn "t1" -> :unknown end)
+      assert out.nodes["a"].state == :stranded
+    end
+
+    test "an opted-in node with no observed side effect is auto-retried" do
+      # A nil thread_id stands for an attempt that never recorded an engine
+      # thread, i.e. no side effect was observed before the crash.
+      opted_in = %{"__retry__" => {:literal, true}}
+      running = running_with_thread("a", nil, inputs: opted_in)
+
+      # The probe is asked about the (absent) thread and knows nothing of it.
+      probe = fn nil -> :unknown end
+
+      out = Recovery.reconcile(graph([running]), probe)
+
+      # Opted in and no thread recorded: the node is retried, not stranded.
+      retried = out.nodes["a"]
+      assert retried.state == :retrying
+    end
+
+    test "a node that did not opt in is stranded even with no side effect" do
+      attempt = Attempt.start(1, :codex, nil)
+      g = graph([node("a", state: :running, attempts: [attempt])])
+      out = Recovery.reconcile(g, fn nil -> :unknown end)
+      assert out.nodes["a"].state == :stranded
+    end
+
+    test "the stranded attempt is recorded on the node" do
+      g = graph([running_with_thread("a", "t1")])
+      out = Recovery.reconcile(g, fn "t1" -> :unknown end)
+      [att] = out.nodes["a"].attempts
+      assert att.state == :stranded
+      assert att.outcome == :stranded
+    end
+
+    test "after reconcile no node remains :running" do
+      g = graph([running_with_thread("a", "t1"), running_with_thread("b", "t2")])
+      out = Recovery.reconcile(g, fn _ -> :unknown end)
+      refute Enum.any?(Graph.running_nodes(out))
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/ir/run_notifier_test.exs b/packages/symphony/elixir/test/symphony_elixir/ir/run_notifier_test.exs
new file mode 100644
index 000000000..7eddf8d81
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/ir/run_notifier_test.exs
@@ -0,0 +1,157 @@
+defmodule SymphonyElixir.IR.RunNotifierTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.IR.Attempt
+  alias SymphonyElixir.IR.Node
+  alias SymphonyElixir.IR.RunGraph
+  alias SymphonyElixir.IR.RunNotifier
+
+  defp graph(attrs) do
+    base = struct(RunGraph, run_id: "triage-1780166452589-58", source_hash: "hash", status: :succeeded, nodes: %{})
+    struct(base, attrs)
+  end
+
+  # A succeeded agent node (empty inputs map, no deps) carrying one attempt with the
+  # given room-server thread id, so the run-details link can resolve a deep link.
+  defp agent_node(id, thread_id) do
+    %Node{
+      id: id,
+      ast_origin: {:agent, id},
+      kind: :agent,
+      inputs: %{},
+      deps: [],
+      state: :succeeded,
+      attempts: [%Attempt{n: 1, engine: :codex, thread_id: thread_id, state: :succeeded, started_at: ~U[2026-06-04 00:00:00Z]}]
+    }
+  end
+
+  # Only the two cron-policy fields matter to the notifier. The defaults mirror
+  # production (failures on, no success allowlist); attrs override them.
+  defp config(attrs \\ %{}) do
+    base = struct(Config, slack_notify_cron_failures: true, slack_notify_cron_workflows: [])
+    struct(base, attrs)
+  end
+
+  describe "notify?/2" do
+    test "skips non-terminal runs" do
+      refute RunNotifier.notify?(graph(status: :running, trigger: %{kind: :linear}), config())
+      refute RunNotifier.notify?(graph(status: :pending, trigger: %{kind: :linear}), config())
+    end
+
+    test "skips cancelled runs" do
+      refute RunNotifier.notify?(graph(status: :cancelled, trigger: %{kind: :linear}), config())
+    end
+
+    test "notifies on terminal non-cron runs" do
+      assert RunNotifier.notify?(graph(status: :succeeded, trigger: %{kind: :linear}), config())
+      assert RunNotifier.notify?(graph(status: :failed, trigger: %{kind: :manual}), config())
+      # Absent trigger is not cron, so it notifies.
+      assert RunNotifier.notify?(graph(status: :succeeded, trigger: nil), config())
+    end
+
+    test "suppresses cron successes unless the workflow is allowlisted" do
+      run = graph(run_id: "digest-100-2", status: :succeeded, trigger: %{kind: :cron})
+
+      refute RunNotifier.notify?(run, config())
+      assert RunNotifier.notify?(run, config(slack_notify_cron_workflows: ["digest"]))
+    end
+
+    test "notifies on cron failures by default and suppresses them when disabled" do
+      # A store round-trip leaves the kind string-keyed; it must still be
+      # treated as cron.
+      run = graph(run_id: "babysit-dispatch-100-2", status: :failed, trigger: %{"kind" => "cron"})
+
+      assert RunNotifier.notify?(run, config())
+      refute RunNotifier.notify?(run, config(slack_notify_cron_failures: false))
+    end
+
+    test "a tight-interval cron success stays quiet even when failures are enabled" do
+      run = graph(run_id: "babysit-dispatch-100-2", status: :succeeded, trigger: %{kind: :cron})
+
+      refute RunNotifier.notify?(run, config(slack_notify_cron_failures: true))
+    end
+
+    test "the wildcard allowlist notifies every cron success" do
+      run = graph(run_id: "babysit-dispatch-100-2", status: :succeeded, trigger: %{kind: :cron})
+
+      refute RunNotifier.notify?(run, config())
+      assert RunNotifier.notify?(run, config(slack_notify_cron_workflows: ["*"]))
+    end
+  end
+
+  describe "workflow_name/1" do
+    test "strips the numeric run-id suffix to recover the workflow slug" do
+      assert RunNotifier.workflow_name("babysit-dispatch-1780166452589-58") == "babysit-dispatch"
+      assert RunNotifier.workflow_name("triage-100-2") == "triage"
+    end
+  end
+
+  describe "build_payload/2" do
+    test "headers a succeeded run and links run details to the room root when no thread opened" do
+      payload =
+        RunNotifier.build_payload(
+          graph(run_id: "triage-100-2", status: :succeeded, trigger: %{kind: :manual}),
+          "https://room.ix.dev"
+        )
+
+      [header | _] = payload["blocks"]
+      assert header["type"] == "header"
+      assert header["text"]["text"] =~ "triage"
+      assert header["text"]["text"] =~ "finished"
+      assert payload["text"] =~ "Symphony: triage finished"
+
+      # No agent thread on the graph, so the link falls back to the room root.
+      run_button = button_with_text(payload, "Run details")
+      assert run_button["url"] == "https://room.ix.dev/"
+    end
+
+    test "deep-links run details to the run's room backend and latest thread" do
+      payload =
+        RunNotifier.build_payload(
+          graph(
+            run_id: "triage-100-2",
+            status: :succeeded,
+            trigger: %{kind: :manual},
+            nodes: %{"n0" => agent_node("n0", "thread_abc")}
+          ),
+          "https://room.ix.dev/"
+        )
+
+      run_button = button_with_text(payload, "Run details")
+
+      # server_id is the registered backend id (Provision.backend_id), encoded
+      # like the room client's encodeURIComponent links; the trailing slash on
+      # the base is trimmed.
+      assert run_button["url"] ==
+               "https://room.ix.dev/#/s/symphony%3Atriage-100-2%3Aroom/t/thread_abc"
+    end
+
+    test "adds a Linear button from the trigger and marks the run failed" do
+      payload =
+        RunNotifier.build_payload(
+          graph(
+            run_id: "triage-100-2",
+            status: :failed,
+            trigger: %{kind: :linear, identifier: "ENG-9", url: "https://linear.app/indexable/issue/ENG-9"}
+          ),
+          nil
+        )
+
+      [header | _] = payload["blocks"]
+      assert header["text"]["text"] =~ "failed"
+
+      linear_button = button_with_text(payload, "ENG-9")
+      assert linear_button["url"] == "https://linear.app/indexable/issue/ENG-9"
+      # No room url was given, so there is no run-details button.
+      assert is_nil(button_with_text(payload, "Run details"))
+    end
+  end
+
+  # Returns the button labelled `text` from the first "actions" block, or nil.
+  defp button_with_text(payload, text) do
+    actions = Enum.find(payload["blocks"], %{}, fn block -> block["type"] == "actions" end)
+    buttons = Map.get(actions, "elements", [])
+    Enum.find(buttons, &(&1["text"]["text"] == text))
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/ir/store_test.exs b/packages/symphony/elixir/test/symphony_elixir/ir/store_test.exs
new file mode 100644
index 000000000..ba1b5c518
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/ir/store_test.exs
@@ -0,0 +1,151 @@
+defmodule SymphonyElixir.IR.StoreTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Attempt, Node, RunGraph, Store}
+
+  setup do
+    dir = System.tmp_dir!() |> Path.join("ir_store_test_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(dir)
+    on_exit(fn -> File.rm_rf(dir) end)
+    %{dir: dir}
+  end
+
+  # Fixture: a running agent with one finished attempt, a pending exec, one gate expansion.
+  defp sample_graph do
+    envelope_attrs = %{"engine" => "codex", "model" => "gpt-5.3-codex", "effort" => "medium"}
+    {:ok, envelope} = Envelope.from_map(envelope_attrs)
+
+    writer =
+      Node.new(
+        id: "agent-1",
+        ast_origin: {:agent, "write"},
+        kind: :agent,
+        envelope: envelope,
+        prompt_ref: {:skill, "writer", %{"topic" => "hello"}},
+        inputs: %{"seed" => {:literal, 42}},
+        state: :running
+      )
+
+    attempt = Attempt.finish(Attempt.start(1, :codex, "thread-abc"), :succeeded, :ok, %{usd: 0.12, tokens_in: 100})
+
+    builder =
+      Node.new(
+        id: "exec-1",
+        ast_origin: {:exec, "build"},
+        kind: :exec,
+        inputs: %{"from" => {:node, "agent-1", [:output]}},
+        state: :pending
+      )
+
+    RunGraph.new("run-store-1", "deadbeef", {:ast, [:root]})
+    |> RunGraph.put_nodes([%{writer | attempts: [attempt]}, builder])
+    |> RunGraph.append_expansion({:gate, "g1"}, {:observed, true}, ["exec-1"])
+  end
+
+  test "round-trips a RunGraph with attempts and an expansion log", %{dir: dir} do
+    graph = sample_graph()
+
+    assert :ok = Store.persist(graph, dir: dir)
+    assert {:ok, loaded} = Store.load(graph.run_id, dir: dir)
+
+    assert loaded.run_id == graph.run_id
+    assert loaded.source_hash == graph.source_hash
+    assert loaded.ast == {:ast, [:root]}
+    assert loaded.status == graph.status
+
+    agent = loaded.nodes["agent-1"]
+    assert agent.kind == :agent
+    assert agent.state == :running
+    assert agent.envelope.engine == :codex
+    assert agent.envelope.model == "gpt-5.3-codex"
+    assert agent.prompt_ref == {:skill, "writer", %{"topic" => "hello"}}
+    assert agent.inputs == %{"seed" => {:literal, 42}}
+
+    [att] = agent.attempts
+    assert att.thread_id == "thread-abc"
+    assert att.state == :succeeded
+    assert att.outcome == :ok
+    assert att.cost == %{usd: 0.12, tokens_in: 100}
+
+    exec = loaded.nodes["exec-1"]
+    assert exec.inputs == %{"from" => {:node, "agent-1", [:output]}}
+    assert exec.deps == ["agent-1"]
+
+    [event] = loaded.expansion_log
+    assert event.origin == {:gate, "g1"}
+    assert event.observed == {:observed, true}
+    assert event.emitted == ["exec-1"]
+  end
+
+  test "load_all returns every decodable graph and quarantines a corrupt file", %{dir: dir} do
+    graph = sample_graph()
+    assert :ok = Store.persist(graph, dir: dir)
+
+    bad_path = Path.join(dir, "broken.json")
+    File.write!(bad_path, "{ not json")
+
+    loaded = Store.load_all(dir: dir)
+    assert Enum.map(loaded, & &1.run_id) == ["run-store-1"]
+
+    refute File.exists?(bad_path)
+    assert File.exists?(bad_path <> ".bad")
+  end
+
+  test "append_expansion persists the new event", %{dir: dir} do
+    graph = sample_graph()
+    assert :ok = Store.persist(graph, dir: dir)
+
+    assert {:ok, next} = Store.append_expansion(graph, {{:gate, "g2"}, {:observed, 7}, ["exec-1"]}, dir: dir)
+    assert length(next.expansion_log) == 2
+
+    assert {:ok, reloaded} = Store.load(graph.run_id, dir: dir)
+    assert length(reloaded.expansion_log) == 2
+  end
+
+  test "load returns :not_found for an unknown run", %{dir: dir} do
+    assert {:error, :not_found} = Store.load("nope", dir: dir)
+  end
+
+  test "round-trips a graph with a placement map (ixvm declared, host effective)", %{dir: dir} do
+    graph =
+      RunGraph.new("run-placement", "deadbeef", nil)
+      |> Map.put(:placement, %{declared: :ixvm, effective: :host})
+
+    assert :ok = Store.persist(graph, dir: dir)
+    assert {:ok, loaded} = Store.load("run-placement", dir: dir)
+
+    assert loaded.placement == %{declared: :ixvm, effective: :host}
+  end
+
+  test "round-trips a graph with a remote effective placement (ixvm -> remote fallback)", %{dir: dir} do
+    graph =
+      RunGraph.new("run-placement-remote", "deadbeef", nil)
+      |> Map.put(:placement, %{declared: :ixvm, effective: :remote})
+
+    assert :ok = Store.persist(graph, dir: dir)
+    assert {:ok, loaded} = Store.load("run-placement-remote", dir: dir)
+
+    assert loaded.placement == %{declared: :ixvm, effective: :remote}
+  end
+
+  test "round-trips a graph with a host-named declared placement", %{dir: dir} do
+    graph =
+      RunGraph.new("run-placement-host-named", "deadbeef", nil)
+      |> Map.put(:placement, %{declared: {:host, "box1"}, effective: :host})
+
+    assert :ok = Store.persist(graph, dir: dir)
+    assert {:ok, loaded} = Store.load("run-placement-host-named", dir: dir)
+
+    assert loaded.placement == %{declared: {:host, "box1"}, effective: :host}
+  end
+
+  test "round-trips a graph with nil placement (no placement acquired)", %{dir: dir} do
+    graph = RunGraph.new("run-no-placement", "deadbeef", nil)
+
+    assert :ok = Store.persist(graph, dir: dir)
+    assert {:ok, loaded} = Store.load("run-no-placement", dir: dir)
+
+    assert loaded.placement == nil
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/ir/view_test.exs b/packages/symphony/elixir/test/symphony_elixir/ir/view_test.exs
new file mode 100644
index 000000000..4874c086f
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/ir/view_test.exs
@@ -0,0 +1,204 @@
+defmodule SymphonyElixir.IR.ViewTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Attempt, Node, RunGraph, View}
+
+  # A succeeded agent node "a" with output %{"area" => 7} and a single
+  # succeeded attempt that reports a 0.42 USD cost.
+  defp agent_node do
+    raw = %Envelope{engine: :codex, model: "gpt-5.3-codex", effort: :high, location: :local}
+    {:ok, envelope} = Envelope.validate(raw)
+
+    started = Attempt.start(1, :codex, "thread-1")
+    finished = Attempt.finish(started, :succeeded, :ok)
+    # finish/3 is given no cost here, so it is set on the attempt afterwards.
+    costed = Map.put(finished, :cost, %{usd: 0.42, tokens_in: 100, tokens_out: 20})
+
+    node = Node.new(id: "a", ast_origin: {:agent, "skill"}, kind: :agent, envelope: envelope, inputs: %{})
+
+    %{node | state: :succeeded, output: %{"area" => 7}, attempts: [costed]}
+  end
+
+  # Succeeded run "run_v" holding the agent node and one retry_node audit entry.
+  defp graph do
+    base = RunGraph.put_nodes(RunGraph.new("run_v", "hash", nil), [agent_node()])
+    succeeded = Map.put(base, :status, :succeeded)
+    RunGraph.append_audit(succeeded, :retry_node, "a", "alice", %{})
+  end
+
+  test "summary/1 reports status, counts, and total cost" do
+    s = View.summary(graph())
+    assert s["run_id"] == "run_v"
+    assert s["status"] == "succeeded"
+    assert s["node_count"] == 1
+    assert s["states"] == %{"succeeded" => 1}
+    assert s["cost_usd"] == 0.42
+  end
+
+  test "summary cost is nil when no attempt reported a cost" do
+    g = RunGraph.new("r", "h", nil) |> RunGraph.put_nodes([Node.new(id: "x", ast_origin: {:exec, "x"}, kind: :exec, inputs: %{})])
+    assert View.summary(g)["cost_usd"] == nil
+  end
+
+  test "detail/1 renders nodes, attempts, envelope, and audit log as JSON-able facts" do
+    d = View.detail(graph())
+
+    assert [node] = d["nodes"]
+    assert node["id"] == "a"
+    assert node["kind"] == "agent"
+    assert node["state"] == "succeeded"
+    assert node["envelope"]["engine"] == "codex"
+    assert node["envelope"]["effort"] == "high"
+    assert node["envelope"]["location"] == "local"
+    assert node["output"] == %{"area" => 7}
+
+    assert [attempt] = node["attempts"]
+    assert attempt["n"] == 1
+    assert attempt["outcome"] == "ok"
+    assert attempt["cost"]["usd"] == 0.42
+
+    assert [audit] = d["audit_log"]
+    assert audit["action"] == "retry_node"
+    assert audit["target"] == "a"
+    assert audit["actor"] == "alice"
+  end
+
+  describe "render_node/1 label field" do
+    test "agent node with skill prompt_ref uses skill name as label" do
+      {:ok, env} = Envelope.validate(%Envelope{engine: :codex, model: "gpt-5", effort: :high, location: :local})
+
+      node =
+        Node.new(
+          id: "skill-node",
+          ast_origin: {:agent, "my_skill"},
+          kind: :agent,
+          envelope: env,
+          prompt_ref: {:skill, "my_skill", %{}},
+          inputs: %{}
+        )
+
+      assert View.render_node(node)["label"] == "my_skill"
+    end
+
+    test "agent node with inline prompt_ref uses 'inline' as label" do
+      {:ok, env} = Envelope.validate(%Envelope{engine: :codex, model: "gpt-5", effort: :high, location: :local})
+
+      node =
+        Node.new(
+          id: "inline-node",
+          ast_origin: {:agent, "inline"},
+          kind: :agent,
+          envelope: env,
+          prompt_ref: {:inline, "do something"},
+          inputs: %{}
+        )
+
+      assert View.render_node(node)["label"] == "inline"
+    end
+
+    test "exec node with literal script input uses script path as label" do
+      node =
+        Node.new(
+          id: "exec-node",
+          ast_origin: {:exec, "run"},
+          kind: :exec,
+          inputs: %{"script" => {:literal, "./scripts/deploy.sh"}}
+        )
+
+      assert View.render_node(node)["label"] == "./scripts/deploy.sh"
+    end
+
+    test "exec node without resolved script input uses 'exec' as label" do
+      node =
+        Node.new(
+          id: "exec-node",
+          ast_origin: {:exec, "run"},
+          kind: :exec,
+          inputs: %{}
+        )
+
+      assert View.render_node(node)["label"] == "exec"
+    end
+
+    test "gate node uses 'gate' as label" do
+      node =
+        Node.new(
+          id: "gate-node",
+          ast_origin: {:gate, "check"},
+          kind: :gate,
+          inputs: %{}
+        )
+
+      assert View.render_node(node)["label"] == "gate"
+    end
+
+    test "subrun node uses 'subrun' as label" do
+      node =
+        Node.new(
+          id: "sub-node",
+          ast_origin: {:subrun, "child"},
+          kind: :subrun,
+          inputs: %{}
+        )
+
+      assert View.render_node(node)["label"] == "subrun"
+    end
+  end
+
+  test "the rendered detail encodes to JSON without a custom encoder" do
+    assert {:ok, _json} = graph() |> View.detail() |> Jason.encode()
+  end
+
+  test "render_node stringifies a non-default location" do
+    {:ok, env} = Envelope.validate(%Envelope{engine: :claude, model: "haiku", location: {:room, "http://h:1"}})
+    node = Node.new(id: "n", ast_origin: {:agent, "s"}, kind: :agent, envelope: env, inputs: %{})
+    assert View.render_node(node)["envelope"]["location"] == "room:http://h:1"
+  end
+
+  describe "summary/1 trigger and placement fields" do
+    test "summary includes trigger as a string label for a manual trigger" do
+      g = graph() |> Map.put(:trigger, %{kind: :manual})
+      s = View.summary(g)
+      assert s["trigger"] == "manual"
+    end
+
+    test "summary includes trigger label for a cron trigger" do
+      g = graph() |> Map.put(:trigger, %{kind: :cron, schedule: "0 * * * *"})
+      s = View.summary(g)
+      assert s["trigger"] == "cron 0 * * * *"
+    end
+
+    test "summary defaults trigger to 'manual' when trigger is nil" do
+      g = RunGraph.new("r-nil-trigger", "h", nil)
+      assert View.summary(g)["trigger"] == "manual"
+    end
+
+    test "summary includes placement with declared and effective as strings" do
+      g = graph() |> Map.put(:placement, %{declared: :ixvm, effective: :host})
+      s = View.summary(g)
+      assert s["placement"] == %{"declared" => "ixvm", "effective" => "host"}
+    end
+
+    test "summary includes placement for an ixvm -> host fallback" do
+      g = graph() |> Map.put(:placement, %{declared: :ixvm, effective: :host})
+      s = View.summary(g)
+      # A consumer can detect a fallback by comparing declared != effective.
+      assert s["placement"]["declared"] == "ixvm"
+      assert s["placement"]["effective"] == "host"
+    end
+
+    test "summary placement is nil when no placement was acquired" do
+      g = RunGraph.new("r-no-placement", "h", nil)
+      assert View.summary(g)["placement"] == nil
+    end
+
+    test "trigger_label/1 is a public shared formatter" do
+      assert View.trigger_label(%{kind: :manual}) == "manual"
+      assert View.trigger_label(%{kind: :cron, schedule: "*/5 * * * *"}) == "cron */5 * * * *"
+      assert View.trigger_label(%{kind: :linear, label: "bug"}) == "linear: bug"
+      assert View.trigger_label(%{kind: :github_pr_label, label: "review"}) == "github: review"
+      assert View.trigger_label(nil) == "manual"
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/prompt_test.exs b/packages/symphony/elixir/test/symphony_elixir/prompt_test.exs
new file mode 100644
index 000000000..e53b18146
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/prompt_test.exs
@@ -0,0 +1,94 @@
+defmodule SymphonyElixir.PromptTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Prompt
+
+  describe "build/2 inline" do
+    test "returns inline text verbatim" do
+      assert {:ok, "do the thing"} = Prompt.build({:inline, "do the thing"})
+    end
+
+    test "an unresolved inline prompt (nil text) is an error" do
+      assert {:error, :unresolved_inline_prompt} = Prompt.build({:inline, nil})
+    end
+  end
+
+  describe "build/2 skill" do
+    test "loads the body through the resolver and interpolates bindings" do
+      resolver = fn "inspect" -> {:ok, "Inspect ${repo} on branch ${branch}."} end
+
+      assert {:ok, "Inspect symphony on branch main."} =
+               Prompt.build({:skill, "inspect", %{"repo" => "symphony", "branch" => "main"}}, resolver: resolver)
+    end
+
+    test "reads a dotted binding path" do
+      resolver = fn _ -> {:ok, "Ticket ${ticket.id}: ${ticket.title}"} end
+      bindings = %{"ticket" => %{"id" => "ABC-1", "title" => "Fix it"}}
+
+      assert {:ok, "Ticket ABC-1: Fix it"} = Prompt.build({:skill, "impl", bindings}, resolver: resolver)
+    end
+
+    test "a placeholder with no binding fails loudly" do
+      resolver = fn _ -> {:ok, "needs ${missing}"} end
+      assert {:error, {:unbound_placeholder, "missing"}} = Prompt.build({:skill, "x", %{}}, resolver: resolver)
+    end
+
+    test "a skill ref with no resolver is an error" do
+      assert {:error, :missing_skill_resolver} = Prompt.build({:skill, "x", %{}})
+    end
+
+    test "propagates a resolver failure" do
+      resolver = fn _ -> {:error, :enoent} end
+      assert {:error, :enoent} = Prompt.build({:skill, "missing", %{}}, resolver: resolver)
+    end
+
+    test "expands {{partial:name}} includes through the partial resolver" do
+      skill_ref = {:skill, "impl", %{"who" => "you"}}
+
+      # The skill body references both the "pr" partial and the ${who} binding.
+      opts = [
+        resolver: fn _ -> {:ok, "Start.\n{{partial:pr}}\nEnd ${who}."} end,
+        partial_resolver: fn "pr" -> {:ok, "Open a PR."} end
+      ]
+
+      assert {:ok, rendered} = Prompt.build(skill_ref, opts)
+      assert rendered == "Start.\nOpen a PR.\nEnd you."
+    end
+
+    test "a body that references a partial with no partial resolver fails" do
+      resolver = fn _ -> {:ok, "{{partial:pr}}"} end
+      assert {:error, {:missing_partial_resolver, ["pr"]}} = Prompt.build({:skill, "x", %{}}, resolver: resolver)
+    end
+  end
+
+  describe "render/2" do
+    test "leaves a bare dollar sign untouched" do
+      assert {:ok, "cost is $5 and ${x}"} = Prompt.render("cost is $5 and ${x}", %{"x" => "${x}"})
+    end
+
+    test "stringifies non-string bindings" do
+      assert {:ok, "count 3"} = Prompt.render("count ${n}", %{"n" => 3})
+    end
+
+    test "an escaped $${path} renders a literal ${path} with no binding" do
+      assert {:ok, "?pub_secret=${pub_secret}"} = Prompt.render("?pub_secret=$${pub_secret}", %{})
+    end
+
+    test "an escape and a real placeholder coexist in one body" do
+      assert {:ok, "url=${pub_secret} repo=symphony"} =
+               Prompt.render("url=$${pub_secret} repo=${repo}", %{"repo" => "symphony"})
+    end
+
+    test "an unescaped placeholder still fails loudly when an escape is present" do
+      assert {:error, {:unbound_placeholder, "missing"}} =
+               Prompt.render("keep $${literal} but ${missing}", %{})
+    end
+  end
+
+  describe "build/2 escape" do
+    test "a skill body with a shell $${var} reaches the engine as a literal" do
+      resolver = fn _ -> {:ok, "curl ...?pub_secret=$${pub_secret}"} end
+      assert {:ok, "curl ...?pub_secret=${pub_secret}"} = Prompt.build({:skill, "focus_route", %{}}, resolver: resolver)
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/dsl_wiring_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/dsl_wiring_test.exs
new file mode 100644
index 000000000..8390b0ddb
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/dsl_wiring_test.exs
@@ -0,0 +1,141 @@
+defmodule SymphonyElixir.Runtime.DSLWiringTest do
+  @moduledoc """
+  End-to-end proof that a parsed `.sym` workflow drives the IR runtime:
+  Parser -> Materializer -> Runtime -> a fake engine -> terminal nodes,
+  including the dynamic expansion of a `when` gate after its dependency
+  succeeds. This is the WS-5 seam (interpreter <-> runtime) under test
+  against a fake `EngineClient`, so no room-server is required.
+  """
+  use ExUnit.Case, async: false
+
+  @moduletag capture_log: true
+
+  alias SymphonyElixir.DSL.Parser
+  alias SymphonyElixir.IR.{Materializer, Node, Store}
+  alias SymphonyElixir.Runtime
+
+  # A fake engine that returns a per-node-id scripted output. The gate's
+  # dependency returns `%{"ok" => true}` so the gate opens; every other
+  # node returns a trivial success.
+  defmodule FakeEngine do
+    @behaviour SymphonyElixir.Runtime.EngineClient
+
+    @table :dsl_wiring_fake
+
+    # Creates the named table when it does not exist yet, then empties it.
+    def setup do
+      if :ets.whereis(@table) == :undefined, do: :ets.new(@table, [:named_table, :public, :set])
+      :ets.delete_all_objects(@table)
+      :ok
+    end
+
+    # Scripts the output that run_node/2 returns for `node_id`.
+    def program(node_id, output), do: :ets.insert(@table, {node_id, output})
+
+    @impl true
+    def run_node(%Node{id: id}, _opts) do
+      scripted = Map.new(:ets.lookup(@table, id))
+      {:ok, Map.get(scripted, id, %{default: id}), "thread-#{id}"}
+    end
+
+    @impl true
+    def status(_thread_id), do: :unknown
+  end
+
+  setup do
+    FakeEngine.setup()
+    start_supervised!({Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry})
+    start_supervised!({Task.Supervisor, name: SymphonyElixir.TaskSupervisor})
+    tmp = Path.join(System.tmp_dir!(), "dsl_wiring_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(tmp)
+    on_exit(fn -> File.rm_rf(tmp) end)
+    {:ok, store_opts: [dir: tmp]}
+  end
+
+  defp materialize!(source, run_id) do
+    {:ok, ast} = Parser.parse(source)
+    {:ok, graph} = Materializer.materialize(run_id, "hash-#{run_id}", ast)
+    graph
+  end
+
+  test "a two-node linear workflow runs both nodes to succeeded", %{store_opts: store_opts} do
+    source = """
+    workflow "w" {
+      a <- agent { engine: codex, model: "m", prompt: inline "first" }
+      b <- agent { engine: codex, model: "m", prompt: skill "next" { ctx: ${a.area} } }
+    }
+    """
+
+    graph = materialize!(source, "run_lin")
+    FakeEngine.program("agent-0", %{"area" => 7})
+
+    {:ok, pid} = Runtime.start_link(graph, engine: FakeEngine, store_opts: store_opts)
+    ref = Process.monitor(pid)
+    assert_receive {:DOWN, ^ref, :process, _, _}, 2_000
+
+    # Read the persisted final graph from the store.
+    {:ok, final} = Store.load("run_lin", store_opts)
+    assert final.status == :succeeded
+    assert final.nodes["agent-0"].state == :succeeded
+    assert final.nodes["agent-1"].state == :succeeded
+    # The edge held: agent-1 only ran after agent-0 succeeded.
+    assert "agent-0" in final.nodes["agent-1"].deps
+  end
+
+  test "a when-gate expands and runs its body after the dependency succeeds", %{store_opts: store_opts} do
+    source = """
+    workflow "w" {
+      a <- agent { engine: codex, model: "m", prompt: inline "first" }
+      when ${a.ok} {
+        b <- agent { engine: codex, model: "m", prompt: inline "gated" }
+      }
+    }
+    """
+
+    graph = materialize!(source, "run_gate")
+    FakeEngine.program("agent-0", %{"ok" => true})
+
+    {:ok, pid} = Runtime.start_link(graph, engine: FakeEngine, store_opts: store_opts)
+    ref = Process.monitor(pid)
+    assert_receive {:DOWN, ^ref, :process, _, _}, 2_000
+
+    {:ok, final} = Store.load("run_gate", store_opts)
+    assert final.status == :succeeded
+    assert final.nodes["agent-0"].state == :succeeded
+
+    # The gated body node was emitted dynamically and ran to success.
+    body = Enum.find(Map.values(final.nodes), fn n -> n.kind == :agent and n.id != "agent-0" end)
+    assert body, "gate body node was never materialized"
+    assert body.state == :succeeded
+
+    # The gate placeholder was retired, not left pending. Matching on the shape
+    # reports a missing gate (nil) as an assertion failure, not a crash on nil.
+    assert %{state: :skipped} = Enum.find(Map.values(final.nodes), &(&1.kind == :gate))
+  end
+
+  test "a falsey when-gate skips the body and the run still succeeds", %{store_opts: store_opts} do
+    source = """
+    workflow "w" {
+      a <- agent { engine: codex, model: "m", prompt: inline "first" }
+      when ${a.ok} {
+        b <- agent { engine: codex, model: "m", prompt: inline "gated" }
+      }
+    }
+    """
+
+    graph = materialize!(source, "run_skip")
+    FakeEngine.program("agent-0", %{"ok" => false})
+
+    {:ok, pid} = Runtime.start_link(graph, engine: FakeEngine, store_opts: store_opts)
+    ref = Process.monitor(pid)
+    assert_receive {:DOWN, ^ref, :process, _, _}, 2_000
+
+    {:ok, final} = Store.load("run_skip", store_opts)
+    assert final.status == :succeeded
+    assert final.nodes["agent-0"].state == :succeeded
+    # No body agent node was emitted.
+    refute Enum.any?(Map.values(final.nodes), fn n -> n.kind == :agent and n.id != "agent-0" end)
+    # The gate placeholder was retired to :skipped; a missing gate (nil) fails the match cleanly.
+    assert %{state: :skipped} = Enum.find(Map.values(final.nodes), &(&1.kind == :gate))
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/exec_runner_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/exec_runner_test.exs
new file mode 100644
index 000000000..ed0a4b278
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/exec_runner_test.exs
@@ -0,0 +1,85 @@
+defmodule SymphonyElixir.Runtime.ExecRunnerTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.IR.Node
+  alias SymphonyElixir.Runtime.ExecRunner
+
+  setup do
+    pack = Path.join(System.tmp_dir!(), "exec_runner_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(Path.join(pack, "scripts"))
+    on_exit(fn -> File.rm_rf(pack) end)
+    {:ok, pack: pack}
+  end
+
+  defp write_script!(pack, rel, body, mode \\ 0o755) do
+    path = Path.join(pack, rel)
+    File.mkdir_p!(Path.dirname(path))
+    File.write!(path, body)
+    File.chmod!(path, mode)
+    rel
+  end
+
+  # Builds the pending "exec-0" node for script `rel`; a non-nil `:timeout` option adds a literal "timeout" input.
+  defp exec_node(rel, opts \\ []) do
+    timeout_input =
+      case Keyword.get(opts, :timeout) do
+        nil -> %{}
+        seconds -> %{"timeout" => {:literal, seconds}}
+      end
+
+    inputs = Map.merge(%{"script" => {:literal, rel}}, timeout_input)
+    Node.new(id: "exec-0", ast_origin: "exec-0", kind: :exec, inputs: inputs, state: :pending)
+  end
+
+  test "a zero-exit script succeeds and captures output", %{pack: pack} do
+    rel = write_script!(pack, "scripts/ok.sh", "#!/bin/sh\necho hello world\n")
+
+    assert {:ok, %{kind: :exec, exit_code: 0, output: output}, nil} =
+             ExecRunner.run(exec_node(rel), %{run_id: "r", attempt: 1, pack_dir: pack})
+
+    assert output =~ "hello world"
+  end
+
+  test "a non-zero exit fails with the status and output tail", %{pack: pack} do
+    rel = write_script!(pack, "scripts/boom.sh", "#!/bin/sh\necho dying\nexit 3\n")
+
+    assert {:error, {:exec_failed, 3, output}, nil} =
+             ExecRunner.run(exec_node(rel), %{run_id: "r", attempt: 1, pack_dir: pack})
+
+    assert output =~ "dying"
+  end
+
+  test "the script path is resolved against the pack dir, not an absolute deploy path", %{pack: pack} do
+    rel = write_script!(pack, "scripts/cwd.sh", "#!/bin/sh\npwd\n")
+
+    assert {:ok, %{output: output}, nil} =
+             ExecRunner.run(exec_node(rel), %{run_id: "r", attempt: 1, pack_dir: pack})
+
+    # cwd is the pack dir. `pwd` may print a symlink-resolved path (macOS tmp), so compare the unique leaf.
+    assert Path.basename(String.trim(output)) == Path.basename(pack)
+  end
+
+  test "a missing script file fails loudly", %{pack: pack} do
+    assert {:error, {:exec_not_found, "scripts/ghost.sh"}, nil} =
+             ExecRunner.run(exec_node("scripts/ghost.sh"), %{run_id: "r", attempt: 1, pack_dir: pack})
+  end
+
+  test "a non-executable file fails loudly", %{pack: pack} do
+    rel = write_script!(pack, "scripts/plain.sh", "#!/bin/sh\ntrue\n", 0o644)
+
+    assert {:error, {:exec_not_executable, ^rel}, nil} =
+             ExecRunner.run(exec_node(rel), %{run_id: "r", attempt: 1, pack_dir: pack})
+  end
+
+  test "a node missing its script input fails rather than running an empty command", %{pack: pack} do
+    node = Node.new(id: "exec-0", ast_origin: "exec-0", kind: :exec, inputs: %{}, state: :pending)
+    assert {:error, :missing_exec_script, nil} = ExecRunner.run(node, %{run_id: "r", attempt: 1, pack_dir: pack})
+  end
+
+  test "a script that overruns its timeout is killed and reported", %{pack: pack} do
+    rel = write_script!(pack, "scripts/slow.sh", "#!/bin/sh\nsleep 30\n")
+
+    assert {:error, {:exec_timeout, 1, _output}, nil} =
+             ExecRunner.run(exec_node(rel, timeout: 1), %{run_id: "r", attempt: 1, pack_dir: pack})
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/ingress_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/ingress_test.exs
new file mode 100644
index 000000000..9c4e48909
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/ingress_test.exs
@@ -0,0 +1,160 @@
+defmodule SymphonyElixir.Runtime.IngressTest do
+  use ExUnit.Case, async: false
+
+  @moduletag capture_log: true
+
+  alias SymphonyElixir.DSL.Parser
+  alias SymphonyElixir.IR.{Node, Store}
+  alias SymphonyElixir.Runtime.Ingress
+  alias SymphonyElixir.WorkflowCatalog
+
+  defmodule FakeEngine do
+    @behaviour SymphonyElixir.Runtime.EngineClient
+
+    @impl true
+    def run_node(%Node{id: id}, _opts), do: {:ok, %{ran: id}, "thread-#{id}"}
+
+    @impl true
+    def status(_thread_id), do: :unknown
+  end
+
+  setup do
+    start_supervised!({Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry})
+    start_supervised!({Task.Supervisor, name: SymphonyElixir.TaskSupervisor})
+    start_supervised!(SymphonyElixir.Runtime.Supervisor)
+
+    tmp = Path.join(System.tmp_dir!(), "ingress_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(tmp)
+    on_exit(fn -> File.rm_rf(tmp) end)
+
+    # A catalog over an isolated workflows dir so `start_by_trigger/2`
+    # resolves against the .sym files this test wrote, not the bundled pack.
+    workflows_dir = Path.join(System.tmp_dir!(), "ingress_wf_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(workflows_dir)
+    on_exit(fn -> File.rm_rf(workflows_dir) end)
+    start_supervised!({WorkflowCatalog, workflows_dir: workflows_dir, poll_ms: 60_000})
+
+    {:ok, store_opts: [dir: tmp], workflows_dir: workflows_dir}
+  end
+
+  defp write_sym!(dir, name, body) do
+    File.write!(Path.join(dir, "#{name}.sym"), body)
+  end
+
+  defp entry(source) do
+    {:ok, ast} = Parser.parse(source)
+    %{name: ast.name, ast: ast, trigger: ast.trigger, source: source, hash: :crypto.hash(:sha256, source)}
+  end
+
+  # Tolerate the not-yet-persisted window: start_link returns before the
+  # :advance continuation writes the first snapshot, so the run file may be
+  # absent on the first poll.
+  defp wait_terminal(run_id, store_opts, attempts \\ 60) do
+    case Store.load(run_id, store_opts) do
+      {:ok, %{status: status} = graph} when status in [:succeeded, :failed, :cancelled] ->
+        graph
+
+      _ when attempts == 0 ->
+        flunk("run #{run_id} never terminal")
+
+      _ ->
+        Process.sleep(20)
+        wait_terminal(run_id, store_opts, attempts - 1)
+    end
+  end
+
+  test "materializes a workflow and runs it under supervision", %{store_opts: store_opts} do
+    e = entry(~s|workflow "demo" on manual { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+
+    assert {:ok, %{run_id: run_id, pid: pid}} =
+             Ingress.start_workflow(e, %{kind: :manual, input: %{}}, engine: FakeEngine, store_opts: store_opts)
+
+    assert is_pid(pid)
+    final = wait_terminal(run_id, store_opts)
+
+    assert final.status == :succeeded
+    assert final.source_hash == e.hash
+    # The trigger event is stamped on the run and survives the store round-trip.
+    assert final.trigger == %{kind: :manual, input: %{}}
+  end
+
+  test "the generated run id is slugged from the workflow name", %{store_opts: store_opts} do
+    e = entry(~s|workflow "Nightly GC" on manual { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+
+    assert {:ok, %{run_id: run_id}} =
+             Ingress.start_workflow(e, nil, engine: FakeEngine, store_opts: store_opts)
+
+    assert String.starts_with?(run_id, "nightly-gc-")
+  end
+
+  test "an explicit run_id is honored", %{store_opts: store_opts} do
+    e = entry(~s|workflow "w" on manual { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+
+    assert {:ok, %{run_id: "fixed-id"}} =
+             Ingress.start_workflow(e, nil, run_id: "fixed-id", engine: FakeEngine, store_opts: store_opts)
+
+    assert wait_terminal("fixed-id", store_opts).status == :succeeded
+  end
+
+  test "start_by_trigger fans out to every workflow matching the event", %{store_opts: store_opts, workflows_dir: dir} do
+    write_sym!(dir, "label-a", ~s|workflow "label-a" on github_pr_label repo "acme/app" label "ship" { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+    write_sym!(dir, "label-b", ~s|workflow "label-b" on github_pr_label repo "acme/app" label "ship" { b <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+    write_sym!(dir, "other-repo", ~s|workflow "other-repo" on github_pr_label repo "acme/other" label "ship" { c <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+    WorkflowCatalog.scan(dir)
+
+    event = %{kind: :github_pr_label, repo: "acme/app", label: "ship", pr_number: 7}
+
+    assert {:ok, started} = Ingress.start_by_trigger(event, engine: FakeEngine, store_opts: store_opts)
+    assert length(started) == 2
+
+    for %{run_id: run_id} <- started do
+      final = wait_terminal(run_id, store_opts)
+      assert final.status == :succeeded
+      # The inbound event is the run's trigger context.
+      assert final.trigger == event
+    end
+  end
+
+  test "start_by_trigger is a no-op when no workflow matches", %{store_opts: store_opts, workflows_dir: dir} do
+    write_sym!(dir, "label-a", ~s|workflow "label-a" on github_pr_label repo "acme/app" label "ship" { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+    WorkflowCatalog.scan(dir)
+
+    assert {:ok, []} =
+             Ingress.start_by_trigger(
+               %{kind: :github_pr_label, repo: "acme/app", label: "nope"},
+               engine: FakeEngine,
+               store_opts: store_opts
+             )
+  end
+
+  test "start_by_trigger matches a linear label against the event's labels", %{store_opts: store_opts, workflows_dir: dir} do
+    write_sym!(dir, "triage", ~s|workflow "triage" on linear label "[sym] triage" { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+    WorkflowCatalog.scan(dir)
+
+    event = %{kind: :linear, labels: ["other", "[sym] triage"], issue_id: "ISS-1"}
+
+    assert {:ok, [%{run_id: run_id}]} =
+             Ingress.start_by_trigger(event, engine: FakeEngine, store_opts: store_opts)
+
+    assert wait_terminal(run_id, store_opts).status == :succeeded
+  end
+
+  test "seen_trigger? is the producer dedup read over IR runs", %{store_opts: store_opts, workflows_dir: dir} do
+    write_sym!(dir, "triage", ~s|workflow "triage" on linear label "[sym] triage" { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+    WorkflowCatalog.scan(dir)
+
+    issue_match = fn
+      {_status, %{kind: :linear, issue_id: "ISS-7"}} -> true
+      {_status, _trigger} -> false
+    end
+
+    refute Ingress.seen_trigger?(issue_match, store_opts: store_opts)
+
+    event = %{kind: :linear, labels: ["[sym] triage"], issue_id: "ISS-7"}
+    assert {:ok, [%{run_id: run_id}]} = Ingress.start_by_trigger(event, engine: FakeEngine, store_opts: store_opts)
+    wait_terminal(run_id, store_opts)
+
+    # The run persisted its trigger, so the dedup read now sees the issue.
+    assert Ingress.seen_trigger?(issue_match, store_opts: store_opts)
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/operator_controls_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/operator_controls_test.exs
new file mode 100644
index 000000000..a1657d12b
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/operator_controls_test.exs
@@ -0,0 +1,180 @@
+defmodule SymphonyElixir.Runtime.OperatorControlsTest do
+  @moduledoc """
+  The #97 operator surface: cancel, retry, rerun, and clear-failed, each
+  recording a durable audit event. Driven against a fake engine so a node
+  can be made to fail on demand.
+  """
+  use ExUnit.Case, async: false
+
+  @moduletag capture_log: true
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Graph, Node, RunGraph, Store}
+  alias SymphonyElixir.Runtime
+
+  defmodule FakeEngine do
+    @behaviour SymphonyElixir.Runtime.EngineClient
+
+    @table :operator_controls_fake
+
+    def setup do
+      if :ets.whereis(@table) == :undefined, do: :ets.new(@table, [:named_table, :public, :set])
+      :ets.delete_all_objects(@table)
+      :ok
+    end
+
+    def program(node_id, instruction), do: :ets.insert(@table, {node_id, instruction})
+
+    @impl true
+    def run_node(%Node{id: id}, _opts) do
+      case :ets.lookup(@table, id) do
+        [{^id, {:error, reason}}] -> {:error, reason, nil}
+        [{^id, {:ok, output}}] -> {:ok, output, "thread-#{id}"}
+        [] -> {:ok, %{ran: id}, "thread-#{id}"}
+      end
+    end
+
+    @impl true
+    def status(_thread_id), do: :unknown
+  end
+
+  setup do
+    FakeEngine.setup()
+    start_supervised!({Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry})
+    start_supervised!({Task.Supervisor, name: SymphonyElixir.TaskSupervisor})
+
+    tmp = Path.join(System.tmp_dir!(), "op_ctrl_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(tmp)
+    on_exit(fn -> File.rm_rf(tmp) end)
+    {:ok, store_opts: [dir: tmp]}
+  end
+
+  # Agent nodes so each attempt routes through the injected engine. The
+  # operator surface is engine-agnostic; an agent node is the kind that
+  # actually consults the EngineClient (exec nodes run locally).
+  defp agent_node(id, inputs \\ %{}) do
+    Node.new(
+      id: id,
+      ast_origin: {:agent, id},
+      kind: :agent,
+      envelope: %Envelope{engine: :codex, model: "m"},
+      prompt_ref: {:inline, "go"},
+      inputs: inputs,
+      state: :pending
+    )
+  end
+
+  # Builds a :running two-node graph a -> b: "b" takes "a"'s output as input "x", so b only runs after a.
+  defp chain_graph(run_id) do
+    RunGraph.new(run_id, "hash", nil)
+    |> RunGraph.put_nodes([agent_node("a"), agent_node("b", %{"x" => {:node, "a", []}})])
+    |> Map.put(:status, :running)
+  end
+
+  # Re-reads the stored run every 25 ms until its status is terminal; flunks once `attempts` reaches 0.
+  defp wait_terminal(run_id, store_opts, attempts \\ 40) do
+    {:ok, %{status: status} = run} = Store.load(run_id, store_opts)
+    cond do
+      status in [:succeeded, :failed, :cancelled] -> run
+      attempts != 0 -> Process.sleep(25) && wait_terminal(run_id, store_opts, attempts - 1)
+      true -> flunk("run #{run_id} never terminal: #{status}")
+    end
+  end
+
+  test "clear_failed resets failed nodes and the rerun succeeds", %{store_opts: store_opts} do
+    FakeEngine.program("a", {:error, :boom})
+    graph = chain_graph("run_clear")
+
+    {:ok, pid} = Runtime.start_link(graph, engine: FakeEngine, store_opts: store_opts)
+
+    # Wait for the run to fail (a fails, b becomes upstream_failed).
+    failed = wait_for(pid, fn g -> Graph.all_terminal?(g) end)
+    assert failed.nodes["a"].state == :failed
+    assert failed.nodes["b"].state == :upstream_failed
+
+    # Fix the cause, then clear the failed nodes. They re-run and succeed,
+    # at which point the run reaches a terminal :succeeded and the GenServer
+    # stops, so read the recovered state from the store.
+    FakeEngine.program("a", {:ok, %{fixed: true}})
+    ref = Process.monitor(pid)
+    :ok = Runtime.clear_failed(pid, "alice")
+    assert_receive {:DOWN, ^ref, :process, _, _}, 2_000
+
+    recovered = wait_terminal("run_clear", store_opts)
+    assert recovered.status == :succeeded
+    assert recovered.nodes["a"].state == :succeeded
+    assert recovered.nodes["b"].state == :succeeded
+
+    # The clear_failed action is recorded with the actor and the cleared ids.
+    event = Enum.find(recovered.audit_log, &(&1.action == :clear_failed))
+    assert event.actor == "alice"
+    assert Enum.sort(event.detail.cleared) == ["a", "b"]
+  end
+
+  test "cancel records an audit event and stops the run", %{store_opts: store_opts} do
+    # NOTE(review): the fake returns {:ok, %{}} at once, so nothing holds `a` busy; cancel must win a race - confirm.
+    FakeEngine.program("a", {:ok, %{}})
+    graph = chain_graph("run_cancel")
+    {:ok, pid} = Runtime.start_link(graph, engine: FakeEngine, store_opts: store_opts)
+    ref = Process.monitor(pid)
+
+    :ok = Runtime.cancel(pid, "bob")
+    assert_receive {:DOWN, ^ref, :process, _, _}, 2_000
+
+    {:ok, final} = Store.load("run_cancel", store_opts)
+    assert final.status == :cancelled
+    event = Enum.find(final.audit_log, &(&1.action == :cancel))
+    assert event.actor == "bob"
+  end
+
+  test "retry_node re-runs only the target node and records the audit event", %{store_opts: store_opts} do
+    # A single independent node so the surgical retry can drive the run to a
+    # clean terminal without an upstream_failed dependent lingering.
+    node = agent_node("a")
+    graph = RunGraph.new("run_retry", "hash", nil) |> RunGraph.put_nodes([node]) |> Map.put(:status, :running)
+
+    FakeEngine.program("a", {:error, :nope})
+    {:ok, pid} = Runtime.start_link(graph, engine: FakeEngine, store_opts: store_opts)
+
+    wait_for(pid, fn g -> g.nodes["a"].state == :failed end)
+    FakeEngine.program("a", {:ok, %{}})
+    ref = Process.monitor(pid)
+    :ok = Runtime.retry_node(pid, "a", "carol")
+    assert_receive {:DOWN, ^ref, :process, _, _}, 2_000
+
+    final = wait_terminal("run_retry", store_opts)
+    assert final.nodes["a"].state == :succeeded
+    event = Enum.find(final.audit_log, &(&1.action == :retry_node))
+    assert event.target == "a"
+    assert event.actor == "carol"
+  end
+
+  test "audit log survives a store round-trip", %{store_opts: store_opts} do
+    graph =
+      chain_graph("run_audit_rt")
+      |> RunGraph.append_audit(:clear_failed, nil, "dave", %{cleared: ["a"]})
+      |> RunGraph.append_audit(:cancel, "b", :system, %{})
+
+    :ok = Store.persist(graph, store_opts)
+    {:ok, loaded} = Store.load("run_audit_rt", store_opts)
+
+    assert [first, second] = loaded.audit_log
+    assert first.action == :clear_failed
+    assert first.actor == "dave"
+    assert first.detail == %{cleared: ["a"]}
+    assert second.action == :cancel
+    assert second.target == "b"
+    assert second.actor == :system
+  end
+
+  # Polls `Runtime.graph/1` every 20 ms until `pred` accepts the snapshot; flunks once `attempts` reaches 0.
+  defp wait_for(pid, pred, attempts \\ 80) do
+    snapshot = Runtime.graph(pid)
+
+    cond do
+      pred.(snapshot) -> snapshot
+      attempts != 0 -> Process.sleep(20) && wait_for(pid, pred, attempts - 1)
+      true -> flunk("condition never held; last status=#{snapshot.status}")
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/placement_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/placement_test.exs
new file mode 100644
index 000000000..f4e3447f7
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/placement_test.exs
@@ -0,0 +1,590 @@
+defmodule SymphonyElixir.Runtime.PlacementTest do
+  use ExUnit.Case, async: false
+
+  alias SymphonyElixir.Config
+  alias SymphonyElixir.Runtime.Placement
+
+  # A direct-connect config so the lifecycle resolves a VM address rather
+  # than opening a real port-forward Port. `room: %{registry_url: nil}` keeps
+  # the room-registry calls inert (no HTTP). No real `ix` runs: every
+  # command goes through the injected stub driver below.
+  # The example pack's single-repo manifest, so the clone script the
+  # lifecycle builds has a real catalog to render without booting Config.
+  @repositories_file Path.expand("../../../../workflows/example/repositories.yaml", __DIR__)
+
+  defp config(overrides \\ %{}) do
+    base = %Config{
+      ix_command: "ix",
+      ix_image: "ix/symphony-codex:test",
+      ix_room_server_command: "room-server",
+      ix_region: nil,
+      ix_room_port: 8080,
+      ix_room_connect: "direct",
+      ix_local_port_base: 18_080,
+      ix_keep_vm?: false,
+      ix_create_timeout_ms: 120_000,
+      ix_env_passthrough: [],
+      github_token: nil,
+      github_app_bot_username: nil,
+      github_app_bot_email: nil,
+      repositories_file: @repositories_file,
+      room: %{server_url: nil, registry_url: nil, registry_token: nil, advertise_host: nil},
+      placement_fallback: :host,
+      host_user: "agentuser",
+      host_group: nil,
+      host_workspaces_dir: nil,
+      host_room_server_command: "room-server",
+      host_systemd_run_command: "systemd-run",
+      host_keep?: false
+    }
+    # struct!/2 (not struct/2): a misspelled override key raises instead of being silently dropped.
+    struct!(base, overrides)
+  end
+
+  # A driver that records each `ix` argv it is handed and answers from a
+  # fixed VM record, so the acquire/release path is exercised with no VM
+  # and no shell-out. `wait_for_room` always succeeds.
+  defp recording_driver(test_pid) do
+    %{
+      ix_cmd: fn _config, args, _timeout ->
+        send(test_pid, {:ix_cmd, args})
+        :ok
+      end,
+      ix_vm_by_name: fn _config, vm_name ->
+        {:ok, %{"name" => vm_name, "ipv4" => "10.0.0.5"}}
+      end,
+      wait_for_room: fn _url, _timeout -> :ok end,
+      port_forward: fn _config, _vm, _mapping -> {:error, :should_not_port_forward_in_direct_mode} end,
+      stop_port_forward: fn _port -> :ok end
+    }
+  end
+
+  # A driver that records each `systemd-run`/`systemctl` argv and answers
+  # the host lifecycle from fixed values: a `getent passwd` line with a
+  # home, a fixed port, and a healthy room. No real unit is ever started.
+  defp host_driver(test_pid) do
+    %{
+      ix_cmd: fn _config, args, _timeout ->
+        send(test_pid, {:ix_cmd, args})
+        :ok
+      end,
+      ix_vm_by_name: fn _config, vm_name -> {:ok, %{"name" => vm_name, "ipv4" => "10.0.0.5"}} end,
+      wait_for_room: fn _url, _timeout -> :ok end,
+      port_forward: fn _config, _vm, _mapping -> {:error, :unused} end,
+      stop_port_forward: fn _port -> :ok end,
+      host_passwd: fn _config, user -> {:ok, "#{user}:x:1000:1000::/home/#{user}:/bin/bash"} end,
+      systemd_run: fn _config, args, _timeout ->
+        send(test_pid, {:systemd_run, args})
+        :ok
+      end,
+      systemctl_stop: fn unit ->
+        send(test_pid, {:systemctl_stop, unit})
+        :ok
+      end,
+      pick_port: fn -> 41_234 end
+    }
+  end
+
+  setup do
+    # Fresh registry table per test; the supervised Placement process is
+    # not started here, so the module creates the table lazily on write.
+    if :ets.whereis(:symphony_placement) != :undefined do
+      :ets.delete(:symphony_placement)
+    end
+
+    :ok
+  end
+
+  test "acquire provisions a per-run room-server and resolves its base url" do
+    opts = [config: config(), driver: recording_driver(self())]
+
+    assert {:ok, "http://10.0.0.5:8080"} = Placement.acquire("run_alpha", :ixvm, opts)
+    assert {:ok, "http://10.0.0.5:8080"} = Placement.base_url("run_alpha")
+
+    # The first ix command is the create; it names the run's VM and image.
+    assert_received {:ix_cmd, ["new", "ix/symphony-codex:test", "--name", vm_name, "--l7-proxy-port", "8080", "--no-shell"]}
+    assert String.starts_with?(vm_name, "sym-run-alpha-")
+  end
+
+  test "create_vm is invoked with config.ix_create_timeout_ms, not a hardcoded constant" do
+    test_pid = self()
+    configured_timeout = 30_000
+
+    # The driver records every ix_cmd call with its timeout argument so we
+    # can assert the timeout threaded to the driver matches the config value.
+    timeout_recording_driver = %{
+      ix_cmd: fn _config, args, timeout ->
+        send(test_pid, {:ix_cmd, args, timeout})
+        :ok
+      end,
+      ix_vm_by_name: fn _config, vm_name -> {:ok, %{"name" => vm_name, "ipv4" => "10.0.0.5"}} end,
+      wait_for_room: fn _url, _timeout -> :ok end,
+      port_forward: fn _config, _vm, _mapping -> {:error, :unused} end,
+      stop_port_forward: fn _port -> :ok end
+    }
+
+    opts = [config: config(%{ix_create_timeout_ms: configured_timeout}), driver: timeout_recording_driver]
+
+    assert {:ok, _url} = Placement.acquire("run_timeout_check", :ixvm, opts)
+
+    # The first ix_cmd call is the `ix new` (create). Assert its timeout
+    # matches the config value, not the old 15-minute module constant.
+    assert_received {:ix_cmd, ["new" | _], ^configured_timeout}
+  end
+
+  test "acquire is idempotent: a second call returns the same url without re-provisioning" do
+    opts = [config: config(), driver: recording_driver(self())]
+
+    assert {:ok, url} = Placement.acquire("run_beta", :ixvm, opts)
+
+    # Drain the create/shell commands from the first acquire.
+    drain_ix_cmds()
+
+    assert {:ok, ^url} = Placement.acquire("run_beta", :ixvm, opts)
+
+    # No further ix commands on the second acquire.
+    refute_received {:ix_cmd, _args}
+  end
+
+  test "release tears the vm down and drops the per-run url" do
+    test_pid = self()
+    opts = [config: config(), driver: recording_driver(test_pid)]
+
+    assert {:ok, _url} = Placement.acquire("run_gamma", :ixvm, opts)
+    drain_ix_cmds()
+
+    assert :ok = Placement.release("run_gamma", opts)
+    assert :error = Placement.base_url("run_gamma")
+
+    # Release removes the VM by name.
+    assert_received {:ix_cmd, ["rm", "--force", vm_name]}
+    assert String.starts_with?(vm_name, "sym-run-gamma-")
+  end
+
+  test "release is a no-op for a run that never acquired a placement" do
+    assert :ok = Placement.release("run_never", config: config(), driver: recording_driver(self()))
+    refute_received {:ix_cmd, _args}
+  end
+
+  test "base_url is :error for an unknown run" do
+    assert :error = Placement.base_url("run_unknown")
+  end
+
+  test "a setup failure surfaces as ixvm_setup_failed and removes the partial vm" do
+    failing_driver = %{
+      ix_cmd: fn _config, args, _timeout ->
+        send(self(), {:ix_cmd, args})
+
+        case args do
+          ["new" | _] -> {:error, {:ix_cli_failed, args, 1, "boom"}}
+          _ -> :ok
+        end
+      end,
+      ix_vm_by_name: fn _config, vm_name -> {:ok, %{"name" => vm_name, "ipv4" => "10.0.0.5"}} end,
+      wait_for_room: fn _url, _timeout -> :ok end,
+      port_forward: fn _config, _vm, _mapping -> {:error, :unused} end,
+      stop_port_forward: fn _port -> :ok end
+    }
+
+    # placement_fallback: :none isolates the raw ixvm failure path; the
+    # ixvm -> host fallback is covered by its own describe block.
+    assert {:error, {:ixvm_setup_failed, _reason}} =
+             Placement.acquire("run_delta", :ixvm, config: config(placement_fallback: :none), driver: failing_driver)
+
+    assert :error = Placement.base_url("run_delta")
+  end
+
+  describe "host placement" do
+    test "acquire provisions a per-run systemd-run room-server and resolves its loopback url" do
+      opts = [config: config(), driver: host_driver(self())]
+
+      assert {:ok, "http://127.0.0.1:41234"} = Placement.acquire("run_host", {:host, "box"}, opts)
+      assert {:ok, "http://127.0.0.1:41234"} = Placement.base_url("run_host")
+
+      # The first systemd-run is the workspace clone, in a named "-setup" unit
+      # under the polkit-scoped prefix, dropping privileges to the host user.
+      assert_received {:systemd_run, setup_args}
+      assert "--uid=agentuser" in setup_args
+      assert Enum.any?(setup_args, &String.starts_with?(&1, "--unit=symphony-host-"))
+      assert Enum.any?(setup_args, &String.ends_with?(&1, "-setup.service"))
+
+      # The second is the long-lived room-server unit (no --wait).
+      assert_received {:systemd_run, room_args}
+      refute "--wait" in room_args
+      assert Enum.any?(room_args, &String.starts_with?(&1, "--unit=symphony-host-"))
+      assert "room-server" in room_args or Enum.any?(room_args, &String.ends_with?(&1, "room-server"))
+    end
+
+    test "an advertised host binds and resolves a reachable url instead of loopback" do
+      base = config()
+      cfg = %{base | room: %{base.room | advertise_host: "100.0.0.7"}}
+      opts = [config: cfg, driver: host_driver(self())]
+
+      # The registered/resolved url uses the advertised host so the central
+      # room.ix.dev can reach the per-run server (not 127.0.0.1).
+      assert {:ok, "http://100.0.0.7:41234"} = Placement.acquire("run_adv", {:host, "box"}, opts)
+      assert {:ok, "http://100.0.0.7:41234"} = Placement.base_url("run_adv")
+
+      # The room-server unit actually binds that host (--host 100.0.0.7), not
+      # only advertises it.
+      assert_received {:systemd_run, _setup_args}
+      assert_received {:systemd_run, room_args}
+      assert "100.0.0.7" in room_args
+    end
+
+    test "the minted bot token authors the clone auth and room-server env over the static host token" do
+      opts = [config: config(github_token: "human-token"), driver: host_driver(self()), bot_token: "app-token"]
+
+      assert {:ok, _url} = Placement.acquire("run_bot_token", :host, opts)
+
+      # The clone runs in the "-setup" unit; its script stamps the App token
+      # as the git auth header, never the static host token.
+      assert_received {:systemd_run, setup_args}
+      setup_script = List.last(setup_args)
+      assert setup_script =~ Base.encode64("x-access-token:app-token")
+      refute setup_script =~ Base.encode64("x-access-token:human-token")
+
+      # gh pr create authors as GH_TOKEN, so the long-lived room-server unit
+      # must carry the App token in both GitHub vars (ENG-2012).
+      assert_received {:systemd_run, room_args}
+      assert "--setenv=GITHUB_TOKEN=app-token" in room_args
+      assert "--setenv=GH_TOKEN=app-token" in room_args
+      refute Enum.any?(room_args, &(&1 =~ "human-token"))
+    end
+
+    test "release stops the unit and removes the checkout" do
+      opts = [config: config(), driver: host_driver(self())]
+
+      assert {:ok, _url} = Placement.acquire("run_host2", :host, opts)
+      drain_systemd_runs()
+
+      assert :ok = Placement.release("run_host2", opts)
+      assert :error = Placement.base_url("run_host2")
+
+      assert_received {:systemctl_stop, unit}
+      assert String.starts_with?(unit, "symphony-host-")
+      assert String.ends_with?(unit, ".service")
+
+      # Cleanup runs as a "-clean" sync unit under the same prefix.
+      assert_received {:systemd_run, clean_args}
+      assert Enum.any?(clean_args, &String.ends_with?(&1, "-clean.service"))
+    end
+
+    test "host_keep? leaves the unit and checkout in place on release" do
+      opts = [config: config(host_keep?: true), driver: host_driver(self())]
+
+      assert {:ok, _url} = Placement.acquire("run_keep", :host, opts)
+      drain_systemd_runs()
+
+      assert :ok = Placement.release("run_keep", opts)
+      refute_received {:systemctl_stop, _unit}
+      refute_received {:systemd_run, _args}
+    end
+
+    test "host setup fails fast when the host user is not configured" do
+      opts = [config: config(host_user: nil), driver: host_driver(self())]
+
+      assert {:error, {:host_setup_failed, :host_user_not_configured}} =
+               Placement.acquire("run_nouser", :host, opts)
+
+      assert :error = Placement.base_url("run_nouser")
+    end
+  end
+
+  describe "ixvm -> host fallback" do
+    # Host driver whose `ix new` always fails with `stderr`, so an ixvm acquire
+    # has to take the configured fallback; every other ix call succeeds. Each
+    # call is reported to `test_pid`, which the caller captures up front:
+    # `self()` evaluated inside the closure would name whichever process runs
+    # the driver, which need not be the test. Shared by all three tests so
+    # the failing driver is written once.
+    defp failing_ixvm_driver(test_pid, stderr) do
+      Map.merge(host_driver(test_pid), %{
+        ix_cmd: fn _config, args, _timeout ->
+          send(test_pid, {:ix_cmd, args})
+
+          case args do
+            ["new" | _] -> {:error, {:ix_cli_failed, args, 1, stderr}}
+            _ -> :ok
+          end
+        end
+      })
+    end
+
+    test "an ixvm setup failure falls back to a host room-server under the same run id" do
+      opts = [
+        config: config(placement_fallback: :host),
+        driver: failing_ixvm_driver(self(), "no capacity")
+      ]
+
+      # The node declared :ixvm; provisioning fails and the run completes on
+      # a host room-server resolved under the same run id, so the engine
+      # turn (which looks up by run id) never knows it fell back.
+      assert {:ok, "http://127.0.0.1:41234"} = Placement.acquire("run_fb", :ixvm, opts)
+      assert {:ok, "http://127.0.0.1:41234"} = Placement.base_url("run_fb")
+    end
+
+    test "fallback :local resolves to no per-run placement (the client uses the default url)" do
+      opts = [
+        config: config(placement_fallback: :local),
+        driver: failing_ixvm_driver(self(), "boom")
+      ]
+
+      # Acquire answers that no placement is needed, and nothing is recorded
+      # under the run id afterwards.
+      assert {:error, {:no_placement_needed, :local}} = Placement.acquire("run_fb_local", :ixvm, opts)
+      assert :error = Placement.base_url("run_fb_local")
+    end
+
+    test "fallback :none leaves the original ixvm setup failure standing" do
+      opts = [
+        config: config(placement_fallback: :none),
+        driver: failing_ixvm_driver(self(), "boom")
+      ]
+
+      # With no fallback to try, the ixvm setup error is what the caller
+      # sees, and the run id resolves to nothing.
+      assert {:error, {:ixvm_setup_failed, _reason}} = Placement.acquire("run_fb_none", :ixvm, opts)
+      assert :error = Placement.base_url("run_fb_none")
+    end
+  end
+
+  describe "ixvm -> remote fallback" do
+    # Driver for the remote-fallback tests: `ix new` always fails, and the worker
+    # seam is served by one fixed fake worker that reports select/provision/
+    # teardown calls to `test_pid`. `overrides` replaces individual callbacks.
+    defp remote_driver(test_pid, overrides \\ %{}) do
+      worker = %{worker_id: "w1", pid: test_pid, address: "100.0.0.9", labels: [], capacity: 0, registered_at: 0}
+
+      ix_cmd = fn
+        _config, ["new" | _] = args, _timeout -> {:error, {:ix_cli_failed, args, 1, "boom"}}
+        _config, _args, _timeout -> :ok
+      end
+
+      defaults = %{
+        ix_cmd: ix_cmd,
+        ix_vm_by_name: fn _config, vm_name -> {:ok, %{"name" => vm_name}} end,
+        wait_for_room: fn _url, _timeout -> :ok end,
+        worker_select: fn label ->
+          send(test_pid, {:worker_select, label})
+          {:ok, worker}
+        end,
+        worker_get: fn _id -> {:ok, worker} end,
+        worker_provision: fn ^worker, run_id, spec, _timeout ->
+          send(test_pid, {:worker_provision, run_id, spec})
+          {:ok, %{base_url: "http://100.0.0.9:9100", primary_workspace: "/home/hari/symphony-workspaces/#{run_id}/example"}}
+        end,
+        worker_teardown: fn ^worker, run_id, _timeout ->
+          send(test_pid, {:worker_teardown, run_id})
+          :ok
+        end
+      }
+
+      Map.merge(defaults, overrides)
+    end
+
+    test "an ixvm failure falls back to a remote worker's room-server" do
+      worker_url = "http://100.0.0.9:9100"
+      opts = [config: config(placement_fallback: :remote), driver: remote_driver(self())]
+      assert {:ok, ^worker_url} = Placement.acquire("run_rem", :ixvm, opts)
+      assert {:ok, %{location: :remote, base_url: ^worker_url}} = Placement.resolved("run_rem")
+      assert_received {:worker_select, nil}
+      assert_received {:worker_provision, "run_rem", %{env: _, bot_token: _}}
+    end
+
+    test "the dispatched spec carries the run's repository catalog so the worker clones the real repos" do
+      remote_config = config(placement_fallback: :remote)
+      opts = [config: remote_config, driver: remote_driver(self())]
+      assert {:ok, _url} = Placement.acquire("run_rem_repos", :ixvm, opts)
+
+      assert_received {:worker_provision, "run_rem_repos", %{repositories: dispatched}}
+      assert dispatched == SymphonyElixir.RepositoryCatalog.all(remote_config)
+      refute dispatched == []
+    end
+
+    test "the dispatched spec carries the bot commit identity so the worker clone authors as the App" do
+      bot_username = "ix-playbook-agent[bot]"
+      bot_email = "ix-playbook-agent[bot]@users.noreply.github.com"
+
+      # Configure the App's bot identity, then check that the spec handed to
+      # the worker carries the same username and email.
+      bot_config =
+        config(
+          placement_fallback: :remote,
+          github_app_bot_username: bot_username,
+          github_app_bot_email: bot_email
+        )
+
+      opts = [config: bot_config, driver: remote_driver(self())]
+
+      assert {:ok, _url} = Placement.acquire("run_rem_bot", :ixvm, opts)
+
+      assert_received {:worker_provision, "run_rem_bot", %{bot_username: ^bot_username, bot_email: ^bot_email}}
+    end
+
+    test "select uses the configured worker label" do
+      labelled = config(placement_fallback: :remote, worker_select_label: "hari")
+      driver = remote_driver(self())
+      assert {:ok, _url} = Placement.acquire("run_rem_lbl", :ixvm, config: labelled, driver: driver)
+      assert_received {:worker_select, "hari"}
+    end
+
+    test "a remote placement resolves the worker-side primary checkout as its cwd" do
+      run_id = "run_rem_cwd"
+      opts = [config: config(placement_fallback: :remote), driver: remote_driver(self())]
+      assert {:ok, _url} = Placement.acquire(run_id, :ixvm, opts)
+
+      assert Placement.workspace_cwd(run_id, opts) == {:ok, "/home/hari/symphony-workspaces/run_rem_cwd/example"}
+    end
+
+    test "release dispatches teardown to the worker" do
+      run_id = "run_rem_rel"
+      opts = [config: config(placement_fallback: :remote), driver: remote_driver(self())]
+      assert {:ok, _url} = Placement.acquire(run_id, :ixvm, opts)
+      assert Placement.release(run_id, opts) == :ok
+      assert_received {:worker_teardown, ^run_id}
+      assert Placement.base_url(run_id) == :error
+    end
+
+    test "no connected worker surfaces the original ixvm failure" do
+      no_worker = fn _label -> {:error, :no_worker} end
+      opts = [config: config(placement_fallback: :remote), driver: remote_driver(self(), %{worker_select: no_worker})]
+
+      assert {:error, {:ixvm_setup_failed, _reason}} = Placement.acquire("run_rem_none", :ixvm, opts)
+      assert Placement.base_url("run_rem_none") == :error
+    end
+  end
+
+  describe "workspace_cwd/2" do
+    test "a host placement resolves the primary-repo checkout under the host run root" do
+      run_id = "run_cwd_host"
+      opts = [config: config(), driver: host_driver(self())]
+      assert {:ok, _url} = Placement.acquire(run_id, :host, opts)
+
+      assert Placement.workspace_cwd(run_id, opts) == {:ok, "/home/agentuser/symphony-workspaces/run_cwd_host/example"}
+    end
+
+    test "an ixvm placement resolves the VM-internal primary-repo checkout" do
+      run_id = "run_cwd_ix"
+      opts = [config: config(), driver: recording_driver(self())]
+      assert {:ok, _url} = Placement.acquire(run_id, :ixvm, opts)
+
+      assert Placement.workspace_cwd(run_id, opts) == {:ok, "/workspace/symphony/run_cwd_ix/example"}
+    end
+
+    test "an ixvm node that fell back to host resolves the host checkout" do
+      # Only `ix new` is refused; every other ix invocation reports success,
+      # so provisioning the VM is the one driver call that fails here.
+      refuse_new = fn
+        _config, ["new" | _] = args, _timeout -> {:error, {:ix_cli_failed, args, 1, "no capacity"}}
+        _config, _args, _timeout -> :ok
+      end
+
+      failing_ixvm = Map.put(host_driver(self()), :ix_cmd, refuse_new)
+      opts = [config: config(placement_fallback: :host), driver: failing_ixvm]
+
+      assert {:ok, _url} = Placement.acquire("run_cwd_fb", :ixvm, opts)
+
+      # The node declared :ixvm, yet the cwd has to follow the placement that
+      # actually took effect (the host one), since that is where the clone
+      # landed and where the turn runs.
+      assert {:ok, "/home/agentuser/symphony-workspaces/run_cwd_fb/example"} =
+               Placement.workspace_cwd("run_cwd_fb", opts)
+    end
+
+    test "a run with no acquired placement has no cwd" do
+      assert Placement.workspace_cwd("run_cwd_none") == :error
+    end
+  end
+
+  # Non-blocking mailbox flushers: each drops its queued recorder messages, then returns :ok.
+  defp drain_ix_cmds do
+    receive do
+      {:ix_cmd, _args} -> drain_ix_cmds()
+    after
+      0 -> :ok
+    end
+  end
+
+  defp drain_systemd_runs do
+    receive do
+      {tag, _args} when tag in [:systemd_run, :ix_cmd] -> drain_systemd_runs()
+    after
+      0 -> :ok
+    end
+  end
+
+  describe "reconcile/2" do
+    test "reaps an orphaned host unit and re-attaches a live one" do
+      live_unit = "symphony-host-live.service"
+      dead_unit = "symphony-host-dead.service"
+      units = %{
+        live_unit => {"run_live", 1111},
+        dead_unit => {"run_dead", 2222}
+      }
+
+      graphs = [graph("run_live", :running), graph("run_dead", :succeeded)]
+      assert Placement.reconcile(graphs, config: config(), driver: reconcile_driver(self(), units)) == :ok
+
+      # Only the terminal run's server is stopped, with a clean-up unit
+      # launched for its checkout; the live run's server is left alone.
+      assert_received {:systemctl_stop, ^dead_unit}
+      refute_received {:systemctl_stop, ^live_unit}
+      assert_received {:systemd_run, clean_args}
+      assert "--unit=symphony-host-dead-clean.service" in clean_args
+
+      # Re-attaching the live run lets a resumed acquire resolve to the
+      # server that already exists rather than provisioning a duplicate.
+      assert Placement.base_url("run_live") == {:ok, "http://127.0.0.1:1111"}
+      # Nothing is held for the run that was reaped.
+      assert Placement.base_url("run_dead") == :error
+    end
+
+    test "reaps a unit whose run is absent from the store" do
+      ghost_unit = "symphony-host-ghost.service"
+      driver = reconcile_driver(self(), %{ghost_unit => {"run_ghost", 3333}})
+
+      assert Placement.reconcile([], config: config(), driver: driver) == :ok
+      assert_received {:systemctl_stop, ^ghost_unit}
+    end
+
+    test "is a no-op when the host user is unconfigured" do
+      units = %{"symphony-host-x.service" => {"run_x", 4444}}
+      opts = [config: config(host_user: nil), driver: reconcile_driver(self(), units)]
+      # run_x is terminal, so a reconcile that did run would stop its unit.
+      assert :ok = Placement.reconcile([graph("run_x", :succeeded)], opts)
+      refute_received {:systemctl_stop, _unit}
+    end
+  end
+
+  # RunGraph fixture: the given run id and status, a placeholder source hash,
+  # and no nodes.
+  defp graph(run_id, status), do: %SymphonyElixir.IR.RunGraph{run_id: run_id, status: status, source_hash: "hash", nodes: %{}}
+
+  # Driver for the reconcile path, answering from a fixed table that maps
+  # each unit name to its `{run_id, port}`. `systemctl_show_exec_start`
+  # renders the `ExecStart` shape systemd reports (the run id is the
+  # `--state-dir` basename); `systemctl_stop` and `systemd_run` report to
+  # `test_pid`, so a test can assert exactly which units were reaped.
+  defp reconcile_driver(test_pid, units) do
+    record = fn message ->
+      send(test_pid, message)
+      :ok
+    end
+
+    %{
+      host_passwd: fn _config, user -> {:ok, "#{user}:x:1000:1000::/home/#{user}:/bin/bash"} end,
+      systemctl_list_host_units: fn -> Map.keys(units) end,
+      systemctl_show_exec_start: fn unit ->
+        {run_id, port} = Map.fetch!(units, unit)
+
+        state_dir = "/home/agentuser/.local/state/symphony-room/#{run_id}"
+        argv = "/n/room-server --host 127.0.0.1 --port #{port} --state-dir #{state_dir}"
+
+        {:ok, "{ path=/n/room-server ; argv[]=#{argv} ; ignore_errors=no }"}
+      end,
+      systemctl_stop: fn unit -> record.({:systemctl_stop, unit}) end,
+      systemd_run: fn _config, args, _timeout -> record.({:systemd_run, args}) end
+    }
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/room_engine_client_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/room_engine_client_test.exs
new file mode 100644
index 000000000..a291360b8
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/room_engine_client_test.exs
@@ -0,0 +1,212 @@
+defmodule SymphonyElixir.Runtime.RoomEngineClientTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.Node
+  alias SymphonyElixir.Runtime.RoomEngineClient
+
+  # Fixture: the agent node (id "n0") that these tests run. Its codex envelope
+  # is passed through `Envelope.validate/1` first, and `location` defaults to
+  # :local.
+  defp agent_node(prompt_ref, location \\ :local) do
+    unchecked = %Envelope{engine: :codex, model: "gpt-5.3-codex", location: location}
+    {:ok, envelope} = Envelope.validate(unchecked)
+
+    identity = [id: "n0", ast_origin: {:agent, "skill"}, kind: :agent]
+    payload = [envelope: envelope, prompt_ref: prompt_ref, inputs: %{}]
+
+    Node.new(identity ++ payload)
+  end
+
+  # Builds a plug that answers any request with a 200 JSON "ok" outcome for `thread_id` (3 events).
+  defp ok_plug(thread_id) do
+    body = Jason.encode!(%{"threadId" => thread_id, "outcome" => %{"kind" => "ok"}, "eventCount" => 3})
+
+    fn conn ->
+      conn
+      |> Plug.Conn.put_resp_content_type("application/json")
+      |> Plug.Conn.send_resp(200, body)
+    end
+  end
+
+  test "runs an inline-prompt agent node and returns {:ok, output, thread_id}" do
+    thread_id = "thread_xyz"
+
+    run_opts = %{
+      run_id: "run_1",
+      attempt: 1,
+      cwd: "/workspace/run_1",
+      room_server_url: "http://room.test",
+      req_options: [plug: ok_plug(thread_id)]
+    }
+
+    result = RoomEngineClient.run_node(agent_node({:inline, "write FOO and stop"}), run_opts)
+    assert {:ok, %{thread_id: ^thread_id, event_count: 3}, ^thread_id} = result
+  end
+
+  test "forwards the node id and run id to the room-server payload" do
+    test_pid = self()
+    reply = Jason.encode!(%{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 0})
+
+    # Hands the decoded request body to the test before answering.
+    plug = fn conn ->
+      {:ok, raw, conn} = Plug.Conn.read_body(conn)
+      send(test_pid, {:payload, Jason.decode!(raw)})
+
+      conn
+      |> Plug.Conn.put_resp_content_type("application/json")
+      |> Plug.Conn.send_resp(200, reply)
+    end
+
+    run_opts = %{run_id: "run_42", attempt: 1, cwd: "/w", room_server_url: "http://room.test", req_options: [plug: plug]}
+    assert {:ok, _, _} = RoomEngineClient.run_node(agent_node({:inline, "do work"}), run_opts)
+    assert_received {:payload, payload}
+    assert payload["runId"] == "run_42"
+    assert payload["nodeId"] == "n0"
+    assert payload["prompt"] == "do work"
+    assert payload["cwd"] == "/w"
+    assert payload["engine"] == "codex"
+  end
+
+  test "an error outcome carries the thread id through for a later reattach probe" do
+    failed_turn = %{"threadId" => "thread_e", "outcome" => %{"kind" => "error", "message" => "boom"}, "eventCount" => 1}
+
+    # The response itself is a 200; the failure is carried in the outcome.
+    plug = fn conn ->
+      conn
+      |> Plug.Conn.put_resp_content_type("application/json")
+      |> Plug.Conn.send_resp(200, Jason.encode!(failed_turn))
+    end
+
+    run_opts = %{run_id: "r", attempt: 1, cwd: "/w", room_server_url: "http://room.test", req_options: [plug: plug]}
+    result = RoomEngineClient.run_node(agent_node({:inline, "do work"}), run_opts)
+
+    assert {:error, {:turn_error, "boom", "thread_e"}, "thread_e"} = result
+  end
+
+  test "a skill prompt is rendered from the resolved body and bindings" do
+    test_pid = self()
+
+    plug = fn conn ->
+      {:ok, raw, conn} = Plug.Conn.read_body(conn)
+      send(test_pid, {:payload, Jason.decode!(raw)})
+
+      conn
+      |> Plug.Conn.put_resp_content_type("application/json")
+      |> Plug.Conn.send_resp(200, Jason.encode!(%{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 1}))
+    end
+
+    # Supplying the skill body here means the test needs no running Catalog.
+    resolver = fn "inspect" -> {:ok, "inspect the ${repo} repo"} end
+
+    run_opts = %{
+      run_id: "r",
+      attempt: 1,
+      cwd: "/w",
+      room_server_url: "http://room.test",
+      req_options: [plug: plug],
+      skill_resolver: resolver
+    }
+
+    assert {:ok, _output, "t"} = RoomEngineClient.run_node(agent_node({:skill, "inspect", %{"repo" => "symphony"}}), run_opts)
+    assert_receive {:payload, payload}
+    assert payload["prompt"] == "inspect the symphony repo"
+  end
+
+  test "appends the run's trigger context as an <input> block on the agent prompt" do
+    test_pid = self()
+    reply = Jason.encode!(%{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 0})
+
+    plug = fn conn ->
+      {:ok, raw, conn} = Plug.Conn.read_body(conn)
+      send(test_pid, {:payload, Jason.decode!(raw)})
+
+      conn
+      |> Plug.Conn.put_resp_content_type("application/json")
+      |> Plug.Conn.send_resp(200, reply)
+    end
+
+    # A cron firing: when it was scheduled, when it fired, and the skill's input.
+    trigger = %{
+      kind: :cron,
+      scheduled_for: "2026-06-03T07:00:00Z",
+      fired_at: "2026-06-03T07:00:07Z",
+      input: %{lookback_hours: 5}
+    }
+
+    run_opts = %{
+      run_id: "r",
+      attempt: 1,
+      cwd: "/w",
+      trigger: trigger,
+      room_server_url: "http://room.test",
+      req_options: [plug: plug]
+    }
+
+    assert {:ok, _, _} = RoomEngineClient.run_node(agent_node({:inline, "digest the window"}), run_opts)
+    assert_receive {:payload, payload}
+
+    prompt = payload["prompt"]
+    assert String.starts_with?(prompt, "digest the window")
+    assert prompt =~ "<input>"
+    assert prompt =~ "</input>"
+    # The trigger envelope appears verbatim inside the block for the skill to read.
+    assert prompt =~ "\"scheduled_for\": \"2026-06-03T07:00:00Z\""
+    assert prompt =~ "\"lookback_hours\": 5"
+  end
+
+  test "omits the <input> block for an operator-started run with no trigger" do
+    test_pid = self()
+    reply = Jason.encode!(%{"threadId" => "t", "outcome" => %{"kind" => "ok"}, "eventCount" => 0})
+
+    plug = fn conn ->
+      {:ok, raw, conn} = Plug.Conn.read_body(conn)
+      send(test_pid, {:payload, Jason.decode!(raw)})
+
+      conn
+      |> Plug.Conn.put_resp_content_type("application/json")
+      |> Plug.Conn.send_resp(200, reply)
+    end
+
+    run_opts = %{run_id: "r", attempt: 1, cwd: "/w", trigger: nil, room_server_url: "http://room.test", req_options: [plug: plug]}
+    assert {:ok, _, _} = RoomEngineClient.run_node(agent_node({:inline, "do work"}), run_opts)
+
+    assert_receive {:payload, payload}
+    assert payload["prompt"] == "do work"
+    refute payload["prompt"] =~ "<input>"
+  end
+
+  test "a skill that names an unbound input fails loudly rather than half-rendering" do
+    resolver = fn "inspect" -> {:ok, "needs ${missing}"} end
+    unbound = agent_node({:skill, "inspect", %{}})
+    run_opts = %{
+      run_id: "r",
+      attempt: 1,
+      cwd: "/w",
+      room_server_url: "http://room.test",
+      skill_resolver: resolver
+    }
+
+    assert {:error, {:unbound_placeholder, "missing"}, nil} = RoomEngineClient.run_node(unbound, run_opts)
+  end
+
+  test "a missing cwd fails loudly before any request" do
+    opts_without_cwd = %{run_id: "r", attempt: 1}
+    assert RoomEngineClient.run_node(agent_node({:inline, "do work"}), opts_without_cwd) == {:error, :missing_cwd, nil}
+  end
+
+  test "an agent node with no envelope is a wiring error" do
+    bare = Map.replace!(agent_node({:inline, "x"}), :envelope, nil)
+    assert RoomEngineClient.run_node(bare, %{run_id: "r", attempt: 1, cwd: "/w"}) == {:error, {:missing_envelope, "n0"}, nil}
+  end
+
+  test "a non-agent node never reaches the engine host" do
+    exec_node = Node.new(id: "e0", ast_origin: {:exec, "build"}, kind: :exec, inputs: %{})
+    assert RoomEngineClient.run_node(exec_node, %{run_id: "r", cwd: "/w"}) == {:error, {:not_an_agent_node, :exec, "e0"}, nil}
+  end
+
+  test "status/1 is conservatively unknown on the synchronous path" do
+    # A concrete thread id and a missing one get the same answer.
+    assert Enum.map(["any-thread", nil], &RoomEngineClient.status/1) == [:unknown, :unknown]
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/runtime_registry_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/runtime_registry_test.exs
new file mode 100644
index 000000000..273f95d3c
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/runtime_registry_test.exs
@@ -0,0 +1,79 @@
+defmodule SymphonyElixir.Runtime.RuntimeRegistryTest do
+  use ExUnit.Case, async: false
+
+  alias SymphonyElixir.Runtime.RuntimeRegistry
+
+  # Every test gets its own RuntimeRegistry, started under the test supervisor.
+  setup do
+    start_supervised!(RuntimeRegistry)
+    :ok
+  end
+
+  # Registration params for worker `id`, owned by the calling process; `overrides` wins.
+  defp worker(id, overrides \\ %{}) do
+    defaults = %{worker_id: id, pid: self(), address: "100.0.0.1", labels: ["default"], capacity: 4}
+    Map.merge(defaults, overrides)
+  end
+
+  test "register makes a worker discoverable by get/list/select" do
+    assert RuntimeRegistry.register(worker("w1")) == :ok
+    # A single registration is visible through all three read paths.
+    assert {:ok, %{worker_id: "w1", address: "100.0.0.1", labels: ["default"]}} = RuntimeRegistry.get("w1")
+    assert [%{worker_id: "w1"}] = RuntimeRegistry.list()
+    assert {:ok, %{worker_id: "w1"}} = RuntimeRegistry.select()
+  end
+
+  test "get is :error for an unknown worker" do
+    assert RuntimeRegistry.get("nope") == :error
+  end
+
+  test "select filters by label and returns :no_worker when none match" do
+    assert RuntimeRegistry.register(worker("w1", %{labels: ["us-west"]})) == :ok
+    assert RuntimeRegistry.register(worker("w2", %{labels: ["hari"]})) == :ok
+
+    assert {:ok, %{worker_id: "w2"}} = RuntimeRegistry.select("hari")
+    assert RuntimeRegistry.select("nonexistent") == {:error, :no_worker}
+  end
+
+  test "select returns :no_worker when the registry is empty" do
+    assert RuntimeRegistry.select() == {:error, :no_worker}
+  end
+
+  test "re-registering the same id replaces the prior entry" do
+    assert RuntimeRegistry.register(worker("w1", %{address: "100.0.0.1"})) == :ok
+    assert RuntimeRegistry.register(worker("w1", %{address: "100.0.0.9"})) == :ok
+    # The later registration wins and leaves exactly one entry behind.
+    assert {:ok, %{address: "100.0.0.9"}} = RuntimeRegistry.get("w1")
+    assert length(RuntimeRegistry.list()) == 1
+  end
+
+  test "unregister drops a worker" do
+    assert RuntimeRegistry.register(worker("w1")) == :ok
+    assert RuntimeRegistry.unregister("w1") == :ok
+    assert RuntimeRegistry.get("w1") == :error
+  end
+
+  test "a worker whose channel process dies is dropped automatically" do
+    test_pid = self()
+    channel = spawn(fn -> receive do: (:stop -> send(test_pid, :stopped)) end)
+    assert RuntimeRegistry.register(worker("w1", %{pid: channel})) == :ok
+    assert {:ok, _} = RuntimeRegistry.get("w1")
+    # Kill the channel process, then poll until the registry has let go of the worker.
+    Process.exit(channel, :kill)
+    assert eventually(fn -> RuntimeRegistry.get("w1") == :error end)
+  end
+
+  # Polls `fun`, sleeping 10ms between calls. Returns true at the first truthy
+  # result and false once `retries` sleeps have been spent without one, so
+  # `fun` is called at most `retries + 1` times.
+  defp eventually(fun, retries \\ 50), do: poll(fun, retries, fun.())
+
+  defp poll(_fun, _retries, result) when result not in [nil, false], do: true
+
+  defp poll(_fun, 0, _falsy), do: false
+
+  defp poll(fun, retries, _falsy) do
+    Process.sleep(10)
+    eventually(fun, retries - 1)
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/supervisor_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/supervisor_test.exs
new file mode 100644
index 000000000..673b5ca57
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/supervisor_test.exs
@@ -0,0 +1,100 @@
+defmodule SymphonyElixir.Runtime.SupervisorTest do
+  use ExUnit.Case, async: false
+
+  @moduletag capture_log: true
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Node, RunGraph, Store}
+  alias SymphonyElixir.Runtime
+
+  # Engine stub: every node succeeds immediately and thread status is never known.
+  defmodule FakeEngine do
+    @behaviour SymphonyElixir.Runtime.EngineClient
+    @impl true
+    def run_node(%Node{id: node_id}, _opts), do: {:ok, %{ran: node_id}, "thread-#{node_id}"}
+
+    @impl true
+    def status(_thread_id), do: :unknown
+  end
+
+  setup do
+    start_supervised!({Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry})
+    start_supervised!({Task.Supervisor, name: SymphonyElixir.TaskSupervisor})
+    start_supervised!(SymphonyElixir.Runtime.Supervisor)
+    # Each test persists into its own scratch directory, removed again on exit.
+    store_dir = Path.join(System.tmp_dir!(), "rt_sup_#{System.unique_integer([:positive])}")
+    on_exit(fn -> File.rm_rf(store_dir) end)
+    File.mkdir_p!(store_dir)
+    {:ok, store_opts: [dir: store_dir]}
+  end
+
+  # Builds an :agent node; `overrides` is appended after the defaults. Agent
+  # nodes route through the injected FakeEngine, whereas exec nodes run locally.
+  defp agent_node(id, overrides \\ []) do
+    defaults = [
+      id: id,
+      ast_origin: {:agent, id},
+      kind: :agent,
+      envelope: %Envelope{engine: :codex, model: "m"},
+      prompt_ref: {:inline, "go"},
+      inputs: %{}
+    ]
+
+    Node.new(defaults ++ overrides)
+  end
+
+  # A :running graph holding the single agent node "n0".
+  defp one_node_graph(run_id) do
+    RunGraph.new(run_id, "hash", nil) |> RunGraph.put_nodes([agent_node("n0")]) |> Map.put(:status, :running)
+  end
+
+  test "start_run schedules a graph under supervision and it runs to terminal", %{store_opts: store_opts} do
+    run_opts = [engine: FakeEngine, store_opts: store_opts]
+    assert {:ok, run_pid} = Runtime.Supervisor.start_run(one_node_graph("run_sup_1"), run_opts)
+
+    # Wait for the run process to go down before reading the persisted graph.
+    monitor = Process.monitor(run_pid)
+    assert_receive {:DOWN, ^monitor, :process, _, _}, 2_000
+    assert {:ok, final} = Store.load("run_sup_1", store_opts)
+    assert final.status == :succeeded
+    assert final.nodes["n0"].state == :succeeded
+  end
+
+  test "resume_pending restarts a persisted non-terminal run with recovery", %{store_opts: store_opts} do
+    # Simulate a BEAM that died mid-flight: the store holds a :running run
+    # whose only node is still :running, and resume_pending must recover it.
+    orphan = agent_node("n0", state: :running)
+    orphaned_run = RunGraph.new("run_resume", "hash", nil) |> RunGraph.put_nodes([orphan]) |> Map.put(:status, :running)
+    assert Store.persist(orphaned_run, store_opts) == :ok
+
+    Runtime.Supervisor.resume_pending(engine: FakeEngine, store_opts: store_opts)
+
+    # FakeEngine answers :unknown for every thread, so the orphaned node is
+    # stranded (no opt-in retry) and the run resolves instead of hanging;
+    # poll the store until it is terminal.
+    final = wait_for_terminal("run_resume", store_opts)
+    assert final.status in [:failed, :succeeded]
+    assert final.nodes["n0"].state != :running
+  end
+
+  test "resume_pending skips terminal runs", %{store_opts: store_opts} do
+    finished = agent_node("n0", state: :succeeded)
+    done_run = RunGraph.new("run_done", "hash", nil) |> RunGraph.put_nodes([finished]) |> Map.put(:status, :succeeded)
+    assert Store.persist(done_run, store_opts) == :ok
+
+    Runtime.Supervisor.resume_pending(engine: FakeEngine, store_opts: store_opts)
+
+    # An already-terminal run must not get a child under the supervisor.
+    assert %{active: 0} = DynamicSupervisor.count_children(SymphonyElixir.Runtime.Supervisor)
+  end
+
+  # Polls the store every 25ms until the run is terminal; flunks once `attempts` are used up.
+  defp wait_for_terminal(run_id, store_opts, attempts \\ 40) do
+    {:ok, %{status: status} = graph} = Store.load(run_id, store_opts)
+    cond do
+      status in [:succeeded, :failed, :cancelled] -> graph
+      attempts == 0 -> flunk("run #{run_id} never reached terminal: #{status}")
+      true -> Process.sleep(25) && wait_for_terminal(run_id, store_opts, attempts - 1)
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime/trigger_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime/trigger_test.exs
new file mode 100644
index 000000000..ce944409a
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime/trigger_test.exs
@@ -0,0 +1,47 @@
+defmodule SymphonyElixir.Runtime.TriggerTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Runtime.Trigger
+
+  describe "matches?/2" do
+    test "cron matches on the declared schedule" do
+      nine_am = %{kind: :cron, schedule: "0 9 * * *", timezone: "UTC", input: %{}}
+      assert Trigger.matches?(nine_am, %{kind: :cron, schedule: nine_am.schedule})
+      refute Trigger.matches?(nine_am, %{kind: :cron, schedule: "@daily"})
+    end
+
+    test "linear matches when the declared label is on the event" do
+      triage = %{kind: :linear, label: "[sym] triage"}
+      assert Trigger.matches?(triage, %{kind: :linear, labels: ["a", triage.label]})
+      refute Trigger.matches?(triage, %{kind: :linear, labels: ["a", "b"]})
+      refute Trigger.matches?(triage, %{kind: :linear, labels: []})
+    end
+
+    test "github matches on repo and label together" do
+      ship = %{kind: :github_pr_label, repo: "acme/app", label: "ship"}
+      assert Trigger.matches?(ship, %{kind: :github_pr_label, repo: "acme/app", label: "ship"})
+      refute Trigger.matches?(ship, %{ship | repo: "acme/other"})
+      refute Trigger.matches?(ship, %{ship | label: "hold"})
+    end
+
+    test "slack matches the declared channel against name or resolved id" do
+      huddle = %{kind: :slack_huddle_completed, channel: "#general"}
+      assert Trigger.matches?(huddle, %{kind: :slack_huddle_completed, channel: "#general"})
+      assert Trigger.matches?(huddle, %{kind: :slack_huddle_completed, channel: "x", channel_id: "#general"})
+      refute Trigger.matches?(huddle, %{huddle | channel: "#random"})
+      # These events carry only a channel_id, matched against the declared channel.
+      mention = %{kind: :slack_app_mention, channel: "C123"}
+      assert Trigger.matches?(mention, %{kind: :slack_app_mention, channel_id: "C123"})
+      refute Trigger.matches?(mention, %{kind: :slack_app_mention, channel_id: "C999"})
+    end
+
+    test "manual always matches its kind" do
+      assert Trigger.matches?(%{kind: :manual}, %{kind: :manual, input: %{}})
+    end
+
+    test "a nil or mismatched declared trigger never matches" do
+      refute Trigger.matches?(nil, %{kind: :manual})
+      refute Trigger.matches?(%{kind: :cron, schedule: "x"}, %{kind: :cron})
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/runtime_test.exs b/packages/symphony/elixir/test/symphony_elixir/runtime_test.exs
new file mode 100644
index 000000000..bc8e51a3e
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/runtime_test.exs
@@ -0,0 +1,808 @@
+defmodule SymphonyElixir.RuntimeTest do
+  use ExUnit.Case, async: false
+
+  # The #90 crash tests deliberately kill executor tasks, which logs the
+  # crash and the deadlock-guard error. Capture it so a passing run stays
+  # quiet; a real regression still surfaces through the assertions.
+  @moduletag capture_log: true
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Materializer, Node, RunGraph, Store}
+  alias SymphonyElixir.Runtime
+
+  # A fake EngineClient driven by a per-test ETS table mapping a node id
+  # to an instruction. The table name is fixed but rows are cleared in
+  # setup, so `async: false` keeps tests from racing each other.
+  defmodule FakeEngine do
+    @behaviour SymphonyElixir.Runtime.EngineClient
+
+    @table :runtime_test_fake
+
+    def setup do
+      if :ets.whereis(@table) == :undefined do
+        :ets.new(@table, [:named_table, :public, :set])
+      end
+
+      :ets.delete_all_objects(@table)
+      :ok
+    end
+
+    # `instruction` is one of:
+    #   {:ok, output}        -> succeed with output
+    #   {:error, reason}     -> fail
+    #   {:ok, output, tid}   -> succeed and report thread id
+    #   :crash               -> raise, so the task dies without :node_done
+    #   {:sleep_then, instr} -> sleep 50 ms, store `instr` for the node, then act on it
+    def program(node_id, instruction), do: :ets.insert(@table, {node_id, instruction})
+    def set_status(thread_id, status), do: :ets.insert(@table, {{:status, thread_id}, status})
+
+    # The run_opts a node's turn was invoked with, so a test can assert the
+    # runtime threaded the resolved working directory in. `nil` if it never ran.
+    def opts_for(node_id) do
+      case :ets.lookup(@table, {:opts, node_id}) do
+        [{_, opts}] -> opts
+        [] -> nil
+      end
+    end
+
+    @impl true
+    def run_node(%Node{id: id} = node, opts) do
+      :ets.insert(@table, {{:opts, id}, opts})
+
+      case lookup(id) do
+        {:ok, output} -> {:ok, output, nil}
+        {:ok, output, tid} -> {:ok, output, tid}
+        {:error, reason} -> {:error, reason, nil}
+        :crash -> raise "fake engine crash for #{id}"
+        {:sleep_then, instr} -> sleep_then(node, instr, opts)
+        nil -> {:ok, %{default: id}, nil}
+      end
+    end
+
+    @impl true
+    def status(thread_id) do
+      case :ets.lookup(@table, {:status, thread_id}) do
+        [{_, status}] -> status
+        [] -> :unknown
+      end
+    end
+
+    # Re-enters run_node/2 with the caller's node and opts so `opts_for/1` keeps the real run_opts.
+    defp sleep_then(%Node{id: id} = node, instr, opts) do
+      Process.sleep(50)
+      :ets.insert(@table, {id, instr})
+      run_node(node, opts)
+    end
+
+    defp lookup(id) do
+      case :ets.lookup(@table, id) do
+        [{^id, instruction}] -> instruction
+        [] -> nil
+      end
+    end
+  end
+
+  # Placement double with a fixed checkout path: lets a test assert the runtime
+  # threads the working directory into an agent turn without a real room-server.
+  defmodule CwdPlacement do
+    @base_url "http://stub.test"
+    def acquire(_run_id, _location, _opts), do: {:ok, @base_url}
+    def resolved(_run_id), do: {:ok, %{location: :host, base_url: @base_url}}
+    def workspace_cwd(_run_id, _opts), do: {:ok, "/checkout/run/example"}
+    def release(_run_id), do: :ok
+  end
+
+  # Placement double that echoes the opts `acquire/3` received to the `:test_pid`
+  # threaded through `placement_opts`, so a test can assert a `:bot_token` was passed.
+  defmodule RecordingPlacement do
+    def acquire(_run_id, _location, opts) do
+      observer = Keyword.get(opts, :test_pid)
+      observer && send(observer, {:acquire_opts, opts})
+      {:ok, "http://stub.test"}
+    end
+
+    def resolved(_run_id), do: {:ok, %{location: :host, base_url: "http://stub.test"}}
+    def workspace_cwd(_run_id, _opts), do: {:ok, "/checkout/run/example"}
+    def release(_run_id), do: :ok
+  end
+
+  setup do
+    # Each test gets cleared fake-engine rows and its own throwaway store directory.
+    FakeEngine.setup()
+    start_supervised!({Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry})
+    start_supervised!({Task.Supervisor, name: SymphonyElixir.TaskSupervisor})
+    store_dir = Path.join(System.tmp_dir!(), "runtime_test_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(store_dir)
+    on_exit(fn -> File.rm_rf(store_dir) end)
+    %{dir: store_dir}
+  end
+
+  # Subrun tests launch a nested run through Runtime.Ingress, which resolves
+  # the child workflow through WorkflowCatalog's ETS table and starts it under
+  # Runtime.Supervisor. Both are set up lazily, only by the tests that need
+  # them, so the rest of the suite stays untouched.
+  defp ensure_subrun_substrate do
+    catalog = :symphony_workflows
+
+    # Reuse an existing catalog table after emptying it; otherwise create it.
+    case :ets.whereis(catalog) do
+      :undefined -> :ets.new(catalog, [:named_table, :public, read_concurrency: true])
+      _tid -> :ets.delete_all_objects(catalog)
+    end
+
+    if is_nil(Process.whereis(SymphonyElixir.Runtime.Supervisor)) do
+      start_supervised!(SymphonyElixir.Runtime.Supervisor)
+    end
+
+    :ok
+  end
+
+  defp put_workflow(name, source) do
+    {:ok, %{name: own_name, trigger: trigger} = ast} = SymphonyElixir.DSL.Parser.parse(source)
+    entry = %{name: own_name || name, ast: ast, trigger: trigger, source: source, hash: :crypto.hash(:sha256, source)}
+    :ets.insert(:symphony_workflows, {name, entry})
+  end
+
+  # Builds a test node. It is an agent node unless overridden, so each attempt
+  # routes through the injected FakeEngine; an exec node would run locally and
+  # bypass it. `kind:`, `envelope:` and `inputs:` in `opts` replace the
+  # defaults, and `state:`/`attempts:` are forwarded when present.
+  defp node(id, opts) do
+    overridable = [
+      kind: :agent,
+      envelope: %Envelope{engine: :codex, model: "m"},
+      inputs: %{}
+    ]
+
+    chosen = for {key, default} <- overridable, do: {key, Keyword.get(opts, key, default)}
+    Node.new([id: id, ast_origin: {:t, id}] ++ chosen ++ Keyword.take(opts, [:state, :attempts]))
+  end
+
+  defp graph(run_id, nodes), do: RunGraph.put_nodes(RunGraph.new(run_id, "h", {:ast, []}), nodes)
+
+  # Parses a `.sym` source and materializes it into a real RunGraph, so the
+  # runtime can drive the AST through `Materializer.expand_dynamic/1` on each
+  # success. Gate tests need this: the hand-built `graph/2` carries only a
+  # placeholder `{:ast, []}`, which re-expands to nothing.
+  defp materialized(run_id, source) do
+    {:ok, parsed} = SymphonyElixir.DSL.Parser.parse(source)
+    {:ok, run_graph} = Materializer.materialize(run_id, "h", parsed)
+
+    run_graph
+  end
+
+  defp opts(store_dir), do: [engine: FakeEngine, store_opts: [dir: store_dir]]
+
+  # Blocks until the run settles: either the GenServer goes down
+  # (succeeded/cancelled) or it stays alive and idle on a terminal :failed
+  # status (WS-6 keeps a failed run alive so the operator surface can reach it).
+  defp wait_for_exit(pid) do
+    monitor = Process.monitor(pid)
+
+    receive do
+      {:DOWN, ^monitor, :process, ^pid, _reason} -> :ok
+    after
+      0 -> wait_for_settled(pid, monitor)
+    end
+  end
+
+  # Waits 20 ms at a time for the monitor's :DOWN; after each quiet interval it
+  # checks for a settled-failed run and flunks once `attempts` has reached zero.
+  defp wait_for_settled(pid, ref, attempts \\ 100) do
+    receive do
+      {:DOWN, ^ref, :process, ^pid, _reason} -> :ok
+    after
+      20 -> poll_settled(pid, ref, attempts, settled_failed?(pid))
+    end
+  end
+
+  # A settled-failed run may still be alive, so the monitor is dropped and flushed.
+  defp poll_settled(_pid, ref, _attempts, true) do
+    Process.demonitor(ref, [:flush])
+    :ok
+  end
+
+  defp poll_settled(_pid, _ref, 0, false), do: flunk("runtime did not settle in time")
+  defp poll_settled(pid, ref, attempts, false), do: wait_for_settled(pid, ref, attempts - 1)
+
+  defp settled_failed?(runtime) do
+    Process.alive?(runtime) and Runtime.graph(runtime).status == :failed
+  catch
+    :exit, _reason -> true
+  end
+
+  test "runs a linear two-node graph to success", %{dir: dir} do
+    nodes = [
+      node("a", state: :pending),
+      node("b", state: :pending, inputs: %{"x" => {:node, "a", []}})
+    ]
+
+    run_graph = graph("run-linear", nodes)
+    FakeEngine.program("a", {:ok, %{v: 1}})
+    FakeEngine.program("b", {:ok, %{v: 2}})
+
+    {:ok, runtime} = Runtime.start_link(run_graph, opts(dir))
+    wait_for_exit(runtime)
+
+    {:ok, stored} = Store.load("run-linear", dir: dir)
+    assert stored.status == :succeeded
+    assert stored.nodes["a"].state == :succeeded
+    assert stored.nodes["b"].state == :succeeded
+  end
+
+  test "threads the resolved placement cwd into an agent turn", %{dir: dir} do
+    # The `{:host, _}` location is what makes the runtime acquire a placement;
+    # the agent's run_opts must then carry the checkout cwd the engine turn needs.
+    hosted = %Envelope{engine: :codex, model: "m", location: {:host, "box"}}
+    run_graph = graph("run-cwd", [node("a", state: :pending, envelope: hosted)])
+    FakeEngine.program("a", {:ok, %{v: 1}})
+
+    start_opts = [engine: FakeEngine, placement: CwdPlacement, store_opts: [dir: dir]]
+    {:ok, runtime} = Runtime.start_link(run_graph, start_opts)
+    wait_for_exit(runtime)
+
+    assert FakeEngine.opts_for("a")[:cwd] == "/checkout/run/example"
+  end
+
+  test "mints a GitHub App token and threads it into placement acquire", %{dir: dir} do
+    # With a GitHub App configured, the runtime must pass an installation token
+    # as `:bot_token`, so the workspace clone auth and the room-server
+    # GITHUB_TOKEN/GH_TOKEN author agent PRs under the App's bot identity rather
+    # than the static host token (ENG-2012, indexable-inc/symphony#242).
+    snapshot = SymphonyElixir.Config.get()
+
+    :ets.insert(
+      :symphony_config,
+      {:snapshot, %{snapshot | github_app_id: "123", github_app_private_key_pem: "PEM"}}
+    )
+
+    on_exit(fn -> :ets.insert(:symphony_config, {:snapshot, snapshot}) end)
+
+    # Seed the installation-token cache so `GithubApp.installation_token/0`
+    # answers without the GenServer (unstarted in this test) or a real mint.
+    if :ets.whereis(:symphony_github_app_token) == :undefined do
+      :ets.new(:symphony_github_app_token, [:named_table, :public, read_concurrency: true])
+    end
+
+    :ets.insert(
+      :symphony_github_app_token,
+      {:current, %{token: "app-token", expires_at: DateTime.add(DateTime.utc_now(), 3600, :second), installation_id: 1}}
+    )
+
+    # A table created above is owned by this test process and vanishes with it;
+    # a longer-lived table has the seed dropped so it cannot leak into other tests.
+    on_exit(fn ->
+      if :ets.whereis(:symphony_github_app_token) != :undefined do
+        :ets.delete(:symphony_github_app_token, :current)
+      end
+    end)
+
+    envelope = %Envelope{engine: :codex, model: "m", location: {:host, "box"}}
+    g = graph("run-bot-token", [node("a", state: :pending, envelope: envelope)])
+
+    FakeEngine.program("a", {:ok, %{v: 1}})
+
+    # NOTE(review): `placement_opts` sits inside `store_opts` here; confirm that is
+    # where the runtime reads the opts it forwards to `acquire/3`.
+    {:ok, pid} =
+      Runtime.start_link(g,
+        engine: FakeEngine,
+        placement: RecordingPlacement,
+        store_opts: [dir: dir, placement_opts: [test_pid: self()]]
+      )
+
+    wait_for_exit(pid)
+
+    assert_received {:acquire_opts, opts}
+    assert Keyword.get(opts, :bot_token) == "app-token"
+  end
+
+  test "threads a successful turn's cost onto the recorded attempt", %{dir: dir} do
+    run_graph = graph("run-cost", [node("a", state: :pending)])
+    usage = %{usd: 0.0123, tokens_in: 1200, tokens_out: 340, cache_read: 800, cache_creation: 64}
+    turn_output = %{thread_id: "thread_abc", event_count: 4, cost: usage}
+    FakeEngine.program("a", {:ok, turn_output, "thread_abc"})
+
+    {:ok, runtime} = Runtime.start_link(run_graph, opts(dir))
+    wait_for_exit(runtime)
+
+    {:ok, stored} = Store.load("run-cost", dir: dir)
+    assert stored.status == :succeeded
+    assert [recorded] = stored.nodes["a"].attempts
+    assert recorded.state == :succeeded
+    assert recorded.cost == usage
+  end
+
+  test "runs parallel-ready siblings concurrently", %{dir: dir} do
+    # Two nodes with no inputs, so neither reads the other's output.
+    # NOTE(review): only the final run status is asserted. Nothing here observes
+    # that `a` and `b` overlapped in time, so a serial scheduler would pass too.
+    siblings = [node("a", state: :pending), node("b", state: :pending)]
+    run_graph = graph("run-parallel", siblings)
+
+    FakeEngine.program("a", {:ok, :ok})
+    FakeEngine.program("b", {:ok, :ok})
+
+    {:ok, runtime} = Runtime.start_link(run_graph, opts(dir))
+    wait_for_exit(runtime)
+
+    {:ok, stored} = Store.load("run-parallel", dir: dir)
+    assert stored.status == :succeeded
+  end
+
+  test "a node failure propagates upstream_failed and the run fails", %{dir: dir} do
+    nodes = [
+      node("a", state: :pending),
+      node("b", state: :pending, inputs: %{"x" => {:node, "a", []}})
+    ]
+
+    run_graph = graph("run-fail", nodes)
+    FakeEngine.program("a", {:error, :boom})
+
+    {:ok, runtime} = Runtime.start_link(run_graph, opts(dir))
+    wait_for_exit(runtime)
+
+    {:ok, stored} = Store.load("run-fail", dir: dir)
+    assert stored.status == :failed
+    assert stored.nodes["a"].state == :failed
+    assert stored.nodes["b"].state == :upstream_failed
+  end
+
+  describe "#90: executor task dies without :node_done" do
+    test "a crashing task strands the node and the run resolves (no opt-in retry)", %{dir: dir} do
+      g = graph("run-crash", [node("a", state: :pending)])
+      FakeEngine.program("a", :crash)
+
+      {:ok, pid} = Runtime.start_link(g, opts(dir))
+      wait_for_exit(pid)
+
+      {:ok, final} = Store.load("run-crash", dir: dir)
+      # The node cannot run again without operator action; the run does not
+      # hang. With no remaining ready work the deadlock guard resolves it.
+      assert final.nodes["a"].state == :stranded
+      assert final.status == :failed
+      [att] = final.nodes["a"].attempts
+      assert att.state == :stranded
+    end
+
+    test "an opted-in node with no side effect auto-retries after a crash", %{dir: dir} do
+      g = graph("run-retry", [node("a", state: :pending, inputs: %{"__retry__" => {:literal, true}})])
+
+      # The first attempt crashes. A helper process (not the fake) swaps the
+      # instruction for a success 80 ms later, hence the loose assertion below.
+      FakeEngine.program("a", :crash)
+      test_pid = self()
+
+      # The helper reports back so the test can wait for it before the ETS table's owner exits.
+      spawn(fn ->
+        Process.sleep(80)
+        FakeEngine.program("a", {:ok, :recovered})
+        send(test_pid, :reprogrammed)
+      end)
+
+      {:ok, pid} = Runtime.start_link(g, opts(dir))
+      wait_for_exit(pid)
+      assert_receive :reprogrammed, 1_000
+
+      {:ok, final} = Store.load("run-retry", dir: dir)
+      assert final.nodes["a"].state in [:succeeded, :stranded]
+    end
+  end
+
+  describe "#90: deadlock guard" do
+    test "a graph with no ready nodes and no tasks fails instead of hanging", %{dir: dir} do
+      # `a`'s only input reads from node id "ghost", which is not in the graph,
+      # so that dependency can never be satisfied and no node is ever ready.
+      g =
+        graph("run-deadlock", [
+          node("a", state: :pending, inputs: %{"x" => {:node, "ghost", []}})
+        ])
+
+      {:ok, pid} = Runtime.start_link(g, opts(dir))
+      wait_for_exit(pid)
+
+      {:ok, final} = Store.load("run-deadlock", dir: dir)
+      assert final.status == :failed
+    end
+  end
+
+  describe "#90: BEAM restart reconciliation" do
+    test "a persisted :running node makes progress after a simulated restart", %{dir: dir} do
+      # Store a graph that looks like the BEAM died mid-turn: `a` is :running
+      # on an attempt that never opened a thread, and `b` reads from `a`.
+      threadless = SymphonyElixir.IR.Attempt.start(1, :codex, nil)
+
+      interrupted =
+        graph("run-restart", [
+          node("a", state: :running, attempts: [threadless], inputs: %{"__retry__" => {:literal, true}}),
+          node("b", state: :pending, inputs: %{"x" => {:node, "a", []}})
+        ])
+
+      :ok = Store.persist(interrupted, dir: dir)
+
+      # With no thread id the engine cannot account for the turn, so
+      # reconcile auto-retries `a` (opted in, no side effect). The rerun
+      # succeeds and unblocks `b`.
+      FakeEngine.program("a", {:ok, :ok})
+      FakeEngine.program("b", {:ok, :ok})
+
+      {:ok, restored} = Store.load("run-restart", dir: dir)
+      {:ok, runtime} = Runtime.start_link(restored, [{:recover, true} | opts(dir)])
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-restart", dir: dir)
+      assert stored.nodes["a"].state == :succeeded
+      assert stored.nodes["b"].state == :succeeded
+      assert stored.status == :succeeded
+    end
+
+    test "a persisted :running node with an opened thread strands on restart", %{dir: dir} do
+      threaded = SymphonyElixir.IR.Attempt.start(1, :codex, "thread-x")
+      interrupted = graph("run-restart-strand", [node("a", state: :running, attempts: [threaded])])
+      :ok = Store.persist(interrupted, dir: dir)
+
+      # The fake reports :unknown for an unprogrammed thread, and a recorded
+      # thread id means a side effect may have happened, so the node strands.
+      {:ok, restored} = Store.load("run-restart-strand", dir: dir)
+      {:ok, runtime} = Runtime.start_link(restored, [{:recover, true} | opts(dir)])
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-restart-strand", dir: dir)
+      assert stored.nodes["a"].state == :stranded
+      assert stored.status == :failed
+    end
+  end
+
+  describe "PubSub: live transitions broadcast" do
+    alias SymphonyElixir.Runtime.Events
+
+    # The app PubSub (`SymphonyElixir.PubSub`) is started once in
+    # `test_helper.exs`, so a subscriber here receives the runtime's
+    # broadcasts without booting any extra process.
+
+    test "a subscriber receives an event for each persisted transition", %{dir: dir} do
+      g =
+        graph("run-pubsub", [
+          node("a", state: :pending),
+          node("b", state: :pending, inputs: %{"x" => {:node, "a", []}})
+        ])
+
+      FakeEngine.program("a", {:ok, %{v: 1}})
+      FakeEngine.program("b", {:ok, %{v: 2}})
+
+      :ok = Events.subscribe_run("run-pubsub")
+      :ok = Events.subscribe_index()
+
+      {:ok, pid} = Runtime.start_link(g, opts(dir))
+      wait_for_exit(pid)
+
+      summaries = drain_events("run-pubsub")
+
+      # Each persisted transition announces, so a two-node run that marks
+      # each node running then succeeded fans out several events, not one.
+      assert length(summaries) > 1
+
+      # The run resolves succeeded, so the last announced summary carries
+      # the terminal status and both nodes counted as succeeded.
+      last = List.last(summaries)
+      assert last["status"] == "succeeded"
+      assert last["states"] == %{"succeeded" => 2}
+
+      # An intermediate transition is observable: at least one summary shows
+      # exactly one node succeeded, i.e. it was announced before the run
+      # finished, proving the page would update before the run completes.
+      assert Enum.any?(summaries, fn s -> s["states"]["succeeded"] == 1 end)
+
+      # The per-run and index topics carry the same message, so the
+      # subscriber sees each transition twice (once per topic). Both shapes
+      # are the `IR.View.summary/1` map keyed on this run.
+      assert Enum.all?(summaries, &match?(%{"run_id" => "run-pubsub"}, &1))
+    end
+
+    # Collects, in arrival order, every `{:ir_run_event, run_id, summary}` for
+    # one run, including the duplicate index + per-run deliveries, and
+    # returns once the mailbox has had no such message for 50 ms.
+    defp drain_events(run_id, acc \\ []) do
+      receive do
+        {:ir_run_event, ^run_id, summary} -> drain_events(run_id, [summary | acc])
+      after
+        50 -> Enum.reverse(acc)
+      end
+    end
+  end
+
+  describe "subrun: nested child runs" do
+    # A child workflow with a single agent node. Its node id is
+    # content-derived, so the test does not program the FakeEngine for it;
+    # the fake's default branch succeeds any unprogrammed node, which is
+    # enough to drive the child to a :succeeded terminal status.
+    @child_sym ~s|workflow "child" on manual { c <- agent { engine: codex, model: "m", prompt: inline "do" } }|
+
+    test "a subrun starts a child run and its terminal output flows to the parent", %{dir: dir} do
+      ensure_subrun_substrate()
+      put_workflow("child", @child_sym)
+
+      parent =
+        graph("run-subrun-ok", [
+          Node.new(
+            id: "s",
+            ast_origin: {:t, "s"},
+            kind: :subrun,
+            inputs: %{"source" => {:literal, "child.sym"}},
+            state: :pending
+          )
+        ])
+
+      {:ok, runtime} = Runtime.start_link(parent, opts(dir))
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-subrun-ok", dir: dir)
+      assert stored.status == :succeeded
+      assert stored.nodes["s"].state == :succeeded
+
+      # The subrun node's output identifies the child run and repeats its
+      # status, which is what a downstream node would read through its inputs.
+      result = stored.nodes["s"].output
+      assert result.kind == :subrun
+      assert result.status == :succeeded
+      assert is_binary(result.run_id)
+
+      # The attempt is attributed to the subrun executor, not a sham engine.
+      [recorded] = stored.nodes["s"].attempts
+      assert recorded.engine == :subrun
+      assert recorded.state == :succeeded
+
+      # The child run is persisted under its own id in the same store directory.
+      assert {:ok, child_run} = Store.load(result.run_id, dir: dir)
+      assert child_run.status == :succeeded
+    end
+
+    test "a self-referential subrun is rejected as a cycle without spawning a child", %{dir: dir} do
+      ensure_subrun_substrate()
+      put_workflow("child", @child_sym)
+
+      parent =
+        graph("run-subrun-cycle", [
+          Node.new(
+            id: "s",
+            ast_origin: {:t, "s"},
+            kind: :subrun,
+            inputs: %{"source" => {:literal, "child.sym"}},
+            state: :pending
+          )
+        ])
+
+      # "child" is already on the parent's ancestor chain, as if the parent
+      # were itself a "child" run, so a subrun back to "child" closes a cycle.
+      ancestry = [subrun_ancestors: ["child"]]
+      {:ok, runtime} = Runtime.start_link(parent, opts(dir) ++ ancestry)
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-subrun-cycle", dir: dir)
+      assert stored.status == :failed
+      assert stored.nodes["s"].state == :failed
+      assert {:error, {:subrun_cycle, "child", ["child"]}} = stored.nodes["s"].output
+    end
+
+    test "a subrun over the depth ceiling is rejected", %{dir: dir} do
+      ensure_subrun_substrate()
+      put_workflow("child", @child_sym)
+
+      parent =
+        graph("run-subrun-depth", [
+          Node.new(
+            id: "s",
+            ast_origin: {:t, "s"},
+            kind: :subrun,
+            inputs: %{"source" => {:literal, "child.sym"}},
+            state: :pending
+          )
+        ])
+
+      # The parent starts at the configured ceiling, so the child (depth + 1) trips the cap.
+      max_depth = SymphonyElixir.Config.get().subrun_max_depth
+      at_ceiling = [subrun_depth: max_depth]
+      {:ok, runtime} = Runtime.start_link(parent, opts(dir) ++ at_ceiling)
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-subrun-depth", dir: dir)
+      assert stored.status == :failed
+      assert stored.nodes["s"].state == :failed
+      assert {:error, {:subrun_depth_exceeded, _depth, ^max_depth}} = stored.nodes["s"].output
+    end
+  end
+
+  describe "when/every gate execution (Phase 7)" do
+    # A gating agent followed by a `when ${a.changed}` body agent. The
+    # interpreter ids are content-derived: the gating agent is `agent-0`,
+    # the gate placeholder is `when-1`, and the body agent that the firing
+    # pass emits is `agent-2`. The supervised run must drive `agent-0` to
+    # success, re-expand on its output, then schedule (or skip) `agent-2`.
+    @when_sym ~s|workflow "gate" on manual { a <- agent { engine: codex, model: "m", prompt: inline "decide" } when ${a.changed} { b <- agent { engine: codex, model: "m", prompt: inline "act" } } }|
+
+    test "a when gate that resolves true runs the gated body under a supervised run", %{dir: dir} do
+      gated = materialized("run-when-true", @when_sym)
+
+      # Only the gating agent is programmed; the gate reads `${a.changed}` from
+      # its output. The body agent falls through the fake's default success.
+      # Atom keys are fine: the interpreter's field read digs string or atom keys.
+      FakeEngine.program("agent-0", {:ok, %{changed: true}})
+
+      {:ok, runtime} = Runtime.start_link(gated, opts(dir))
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-when-true", dir: dir)
+      assert stored.status == :succeeded
+      assert stored.nodes["agent-0"].state == :succeeded
+      # The body node exists only after agent-0 succeeded, and it ran to success.
+      assert stored.nodes["agent-2"].state == :succeeded
+      # The resolved gate placeholder was retired, so it could not deadlock the run.
+      assert stored.nodes["when-1"].state == :skipped
+    end
+
+    test "a when gate that resolves false skips the body and the run still succeeds", %{dir: dir} do
+      gated = materialized("run-when-false", @when_sym)
+
+      FakeEngine.program("agent-0", {:ok, %{changed: false}})
+
+      {:ok, runtime} = Runtime.start_link(gated, opts(dir))
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-when-false", dir: dir)
+      assert stored.status == :succeeded
+      assert stored.nodes["agent-0"].state == :succeeded
+      # A falsy gate emits no child node, so the body id is absent altogether.
+      refute Map.has_key?(stored.nodes, "agent-2")
+      # Retiring the placeholder to :skipped is the load-bearing pair with the
+      # deadlock guard: a gate that never fired must not stall the run.
+      assert stored.nodes["when-1"].state == :skipped
+    end
+
+    # `every n of c { ... }` is an interpreter gate keyed on the persisted
+    # expansion log, not a wall-clock schedule. In a single run the gate is
+    # evaluated once at materialize time (tick 1): `every 1` fires its body,
+    # `every 2+` skips it. The skip case materializes to zero nodes, which
+    # must resolve as a no-op success, not trip the deadlock guard.
+    @every_one_sym ~s|workflow "tick" on manual { every 1 of gc { b <- agent { engine: codex, model: "m", prompt: inline "act" } } }|
+    @every_two_sym ~s|workflow "tick" on manual { every 2 of gc { b <- agent { engine: codex, model: "m", prompt: inline "act" } } }|
+
+    test "every 1 fires its body on the first tick of a supervised run", %{dir: dir} do
+      ticking = materialized("run-every-fire", @every_one_sym)
+
+      # The gate fires at materialize time (tick 1), so the body agent is in
+      # the graph from the start and there is no placeholder to resolve.
+      assert Map.has_key?(ticking.nodes, "agent-1")
+
+      {:ok, runtime} = Runtime.start_link(ticking, opts(dir))
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-every-fire", dir: dir)
+      assert stored.status == :succeeded
+      assert stored.nodes["agent-1"].state == :succeeded
+    end
+
+    test "every 2 skips on the first tick and the no-op run succeeds without deadlock", %{dir: dir} do
+      idle = materialized("run-every-skip", @every_two_sym)
+
+      # On tick 1 the gate does not fire, so the graph materializes empty. A
+      # run with nothing to schedule is a no-op success, not a deadlock.
+      assert idle.nodes == %{}
+
+      {:ok, runtime} = Runtime.start_link(idle, opts(dir))
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-every-skip", dir: dir)
+      assert stored.status == :succeeded
+      assert stored.nodes == %{}
+    end
+  end
+
+  describe "map fan-out execution (Phase 8)" do
+    # A seed agent whose output is a list, then a `map ${seed.repos} as repo`
+    # body that fans out one child agent per element. The interpreter ids are
+    # content-derived: the seed is `agent-0`, the unresolved fan-out is the
+    # `map-1` placeholder, and each child is `agent-2-<digest>` keyed on the
+    # element index. The supervised run drives `agent-0` to success, re-expands
+    # on its list output, then schedules every child.
+    @map_sym ~s|workflow "fan" on manual { seed <- agent { engine: codex, model: "m", prompt: inline "list" } map ${seed.repos} as repo { child <- agent { engine: codex, model: "m", prompt: inline "audit ${repo}" } } }|
+
+    test "a map over a dependency's list fans out one child per element and collects every output", %{dir: dir} do
+      g = materialized("run-map-fanout", @map_sym)
+
+      # Before the seed succeeds the body is a single placeholder, not work.
+      assert g.nodes["map-1"].kind == :map_fanout
+      refute Enum.any?(Map.values(g.nodes), &(&1.kind == :agent and &1.id != "agent-0"))
+
+      # The seed yields three repos. No child is programmed, so each falls
+      # through the fake's default success and the run drives all three to
+      # :succeeded without per-child setup.
+      FakeEngine.program("agent-0", {:ok, %{repos: ["alpha", "beta", "gamma"]}})
+
+      {:ok, pid} = Runtime.start_link(g, opts(dir))
+      wait_for_exit(pid)
+
+      {:ok, final} = Store.load("run-map-fanout", dir: dir)
+      assert final.status == :succeeded
+      assert final.nodes["agent-0"].state == :succeeded
+
+      # One child node per element, each terminal succeeded. Children are picked
+      # out by their shared `ast_origin` ("agent-2") and checked by count rather
+      # than by spelling each digest, so a stable-id change does not break the test.
+      children = for {_id, %Node{ast_origin: "agent-2"} = n} <- final.nodes, do: n
+      assert length(children) == 3
+      assert Enum.all?(children, &(&1.state == :succeeded))
+
+      # Every child's output collects back into the graph (here the fake's
+      # default `%{default: id}`), so a downstream node could read any one.
+      assert Enum.all?(children, fn n -> n.output == %{default: n.id} end)
+
+      # The resolved fan-out placeholder is retired to :skipped, the
+      # load-bearing pair with the deadlock guard: a fanned-out placeholder
+      # must not sit :pending and stall the run.
+      assert final.nodes["map-1"].state == :skipped
+    end
+
+    # Mapping over an empty list emits zero children. The placeholder retires
+    # to :skipped and only the succeeded seed remains, so the run completes as
+    # a no-op success instead of tripping the deadlock guard.
+    test "a map over an empty list emits no children and the run still succeeds", %{dir: dir} do
+      fan = materialized("run-map-empty", @map_sym)
+
+      FakeEngine.program("agent-0", {:ok, %{repos: []}})
+
+      {:ok, runtime} = Runtime.start_link(fan, opts(dir))
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-map-empty", dir: dir)
+      assert stored.status == :succeeded
+      assert stored.nodes["agent-0"].state == :succeeded
+      # An empty fan-out leaves no node with the body's `ast_origin`.
+      refute stored.nodes |> Map.values() |> Enum.any?(&(&1.ast_origin == "agent-2"))
+      # The placeholder is retired, so the empty fan-out cannot stall the run.
+      assert stored.nodes["map-1"].state == :skipped
+    end
+  end
+
+  describe "run visibility at creation" do
+    test "a freshly started run is present in the store before any node finishes", %{dir: dir} do
+      run_id = "run-visible-at-creation"
+
+      # Use a slow node so the run is in-flight when we check the store.
+      g = materialized(run_id, ~s|workflow "vis" on manual { a <- agent { engine: codex, model: "m", prompt: inline "x" } }|)
+      # The fake sleeps 50 ms before answering for `agent-0`, which leaves time
+      # to load from the store before the node can finish.
+      FakeEngine.program("agent-0", {:sleep_then, {:ok, :done}})
+
+      {:ok, _pid} = Runtime.start_link(g, opts(dir))
+
+      # Load the store immediately after start_link returns. The run must
+      # already be on disk; presumably init/1 persists before the first
+      # scheduling pass (confirm in Runtime), so a slow placement acquire or,
+      # as here, a sleeping fake engine cannot delay its visibility.
+      assert {:ok, visible} = Store.load(run_id, dir: dir)
+      assert visible.status == :running
+      assert map_size(visible.nodes) == 1
+    end
+  end
+
+  describe "operator hooks" do
+    test "cancel stops the run and marks non-terminal nodes cancelled", %{dir: dir} do
+      nodes = [
+        node("a", state: :pending, inputs: %{"x" => {:node, "slow", []}}),
+        node("slow", state: :pending)
+      ]
+
+      in_flight = graph("run-cancel", nodes)
+
+      # `slow` sleeps before answering, so the run is still in flight at cancel time.
+      FakeEngine.program("slow", {:sleep_then, {:ok, :late}})
+
+      {:ok, runtime} = Runtime.start_link(in_flight, opts(dir))
+      :ok = Runtime.cancel(runtime)
+      wait_for_exit(runtime)
+
+      {:ok, stored} = Store.load("run-cancel", dir: dir)
+      assert %{status: :cancelled} = stored
+      assert stored.nodes["a"].state == :cancelled
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/skill_test.exs b/packages/symphony/elixir/test/symphony_elixir/skill_test.exs
new file mode 100644
index 000000000..c5537ca40
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/skill_test.exs
@@ -0,0 +1,117 @@
+defmodule SymphonyElixir.SkillTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixir.Skill
+
+  # Minimal valid YAML frontmatter shared by all fixture skills.
+  @frontmatter """
+  ---
+  codex_model: gpt-5-codex
+  reasoning_effort: medium
+  sandbox: workspace-write
+  approval_policy: never
+  tools: []
+  ---
+  """
+
+  defp setup_skill_dir do
+    suffix = System.unique_integer([:positive])
+    root = Path.join(System.tmp_dir!(), "skill_test_#{suffix}")
+    partials = Path.join(root, "_partials")
+
+    # mkdir_p! on the nested directory creates `root` on the way.
+    File.mkdir_p!(partials)
+    on_exit(fn -> File.rm_rf!(root) end)
+    {root, partials}
+  end
+
+  defp write_skill!(dir, name, body) do
+    dir
+    |> Path.join("#{name}.md")
+    |> tap(&File.write!(&1, @frontmatter <> body))
+  end
+
+  defp write_partial!(partials_dir, name, body) do
+    partials_dir |> Path.join("#{name}.md") |> File.write!(body)
+  end
+
+  describe "expand_partials: self-referential partial" do
+    # Regression guard for the prod outage described in the plan. A partial
+    # file may name its own token in a prose header (e.g. "any skill that
+    # references `{{partial:graphite_sop}}` gets this content inlined"); the
+    # old single-pass implementation left that token behind in the catalog
+    # body. The fixpoint + seen-set must drop the self-reference so the
+    # stored body is token-free.
+    test "a partial whose body contains its own token loads cleanly" do
+      {skills, partials} = setup_skill_dir()
+      self_ref = "This file is referenced via `{{partial:policy}}`.\nActual policy content here.\n"
+      write_partial!(partials, "policy", self_ref)
+
+      loaded =
+        skills
+        |> write_skill!("my_skill", "Use this:\n{{partial:policy}}\nDone.\n")
+        |> Skill.load()
+
+      assert {:ok, %{body: body}} = loaded
+      refute body =~ "{{partial:"
+      assert body =~ "Actual policy content here."
+    end
+  end
+
+  describe "expand_partials: nested partials" do
+    # Partial A pulls in partial B. Expanding A on the first fixpoint pass
+    # puts {{partial:b}} into the body, and the second pass expands B. The
+    # final body must carry B's text with no tokens left behind.
+    test "partial A inlining partial B both expand into the final body" do
+      {skills, partials} = setup_skill_dir()
+
+      write_partial!(partials, "a", "Content from A.\n{{partial:b}}\n")
+      write_partial!(partials, "b", "Content from B.")
+
+      skill_file = write_skill!(skills, "nested_skill", "Start.\n{{partial:a}}\nEnd.\n")
+      assert {:ok, %{body: body}} = Skill.load(skill_file)
+
+      refute body =~ "{{partial:"
+      assert body =~ "Content from A."
+      assert body =~ "Content from B."
+    end
+  end
+
+  describe "expand_partials: missing partial" do
+    # When the partial file for a token is truly absent, loading must still
+    # fail hard. The seen-set may only drop names it has already seen; a name
+    # it has not seen and that has no file on disk stays an error.
+    test "a reference to a nonexistent partial returns a missing_partial error" do
+      {skills, _partials} = setup_skill_dir()
+
+      result = skills |> write_skill!("broken_skill", "{{partial:does_not_exist}}\n") |> Skill.load()
+
+      assert {:error, {:missing_partial, "does_not_exist", _reason}} = result
+    end
+  end
+
+  describe "expand_partials: repeated include" do
+    # A partial is a named shared contract: a skill body naming the same
+    # partial twice gets its content inlined a single time. This keeps the
+    # catalog body deterministic and is the "inline each named partial at most
+    # once" half of the fixpoint behavior (the other half drops self-references).
+    test "the same partial referenced twice is inlined once" do
+      marker = "SHARED-CONTRACT-TEXT"
+      {skills, partials} = setup_skill_dir()
+      write_partial!(partials, "contract", marker)
+
+      skill_file =
+        write_skill!(
+          skills,
+          "repeat_skill",
+          "First:\n{{partial:contract}}\nSecond:\n{{partial:contract}}\n"
+        )
+
+      assert {:ok, skill} = Skill.load(skill_file)
+      refute skill.body =~ "{{partial:"
+
+      copies = length(String.split(skill.body, marker)) - 1
+      assert copies == 1
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir/workflow_catalog_test.exs b/packages/symphony/elixir/test/symphony_elixir/workflow_catalog_test.exs
new file mode 100644
index 000000000..9cb05c536
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir/workflow_catalog_test.exs
@@ -0,0 +1,109 @@
+defmodule SymphonyElixir.WorkflowCatalogTest do
+  use ExUnit.Case, async: false
+
+  @moduletag capture_log: true
+
+  alias SymphonyElixir.WorkflowCatalog
+
+  setup do
+    workflows_dir = Path.join(System.tmp_dir!(), "wf_catalog_#{System.unique_integer([:positive])}")
+    File.mkdir_p!(workflows_dir)
+    on_exit(fn -> File.rm_rf(workflows_dir) end)
+    # With a long poll interval, the boot scan and the scans a test triggers
+    # explicitly are the only ones that run, so assertions stay deterministic.
+    start_supervised!({WorkflowCatalog, workflows_dir: workflows_dir, poll_ms: 60_000})
+    %{dir: workflows_dir}
+  end
+
+  defp write_sym!(dir, name, body) do
+    dir |> Path.join("#{name}.sym") |> File.write!(body)
+  end
+
+  test "parses .sym files and indexes them by name and trigger", %{dir: dir} do
+    write_sym!(dir, "implement", ~s|workflow "implement" on linear label "[sym] implement" { a <- agent { engine: codex, model: "m", prompt: skill "implement" {} } }|)
+    write_sym!(dir, "nightly", ~s|workflow "nightly" on cron "0 9 * * *" tz "UTC" { gc <- exec "./gc.sh" }|)
+
+    WorkflowCatalog.scan(dir)
+
+    assert {:ok, %{name: "implement", trigger: trigger, hash: hash}} = WorkflowCatalog.workflow("implement")
+    assert trigger == %{kind: :linear, label: "[sym] implement"}
+    assert is_binary(hash)
+
+    names = WorkflowCatalog.workflows() |> Enum.map(& &1.name) |> Enum.sort()
+    assert names == ["implement", "nightly"]
+    assert [%{name: "implement"}] = WorkflowCatalog.for_trigger_kind(:linear)
+    assert [%{name: "nightly"}] = WorkflowCatalog.for_trigger_kind(:cron)
+  end
+
+  test "hot-reloads changed bytes and drops deleted files", %{dir: dir} do
+    sym_file = Path.join(dir, "w.sym")
+    write_sym!(dir, "w", ~s|workflow "w" on manual { a <- exec "./x.sh" }|)
+    WorkflowCatalog.scan(dir)
+    assert {:ok, original} = WorkflowCatalog.workflow("w")
+
+    write_sym!(dir, "w", ~s|workflow "w" on cron "* * * * *" { a <- exec "./x.sh" }|)
+    WorkflowCatalog.scan(dir)
+    assert {:ok, %{hash: new_hash, trigger: %{kind: :cron}}} = WorkflowCatalog.workflow("w")
+    assert new_hash != original.hash
+
+    File.rm!(sym_file)
+    WorkflowCatalog.scan(dir)
+    assert {:error, :not_found} == WorkflowCatalog.workflow("w")
+  end
+
+  test "a parse error keeps the last good version in place", %{dir: dir} do
+    write_sym!(dir, "w", ~s|workflow "w" on manual { a <- exec "./x.sh" }|)
+    WorkflowCatalog.scan(dir)
+    assert {:ok, good} = WorkflowCatalog.workflow("w")
+
+    # Unparseable bytes are rejected by the rescan; the earlier parse stays published.
+    write_sym!(dir, "w", ~s|workflow "w" on manual { this is not valid |)
+    WorkflowCatalog.scan(dir)
+    assert WorkflowCatalog.workflow("w") === {:ok, good}
+  end
+
+  test "a parse error is recorded with a located, file-stamped diagnostic", %{dir: dir} do
+    write_sym!(dir, "w", ~s|workflow "w" on manual { a <- exec "./x.sh" }|)
+    write_sym!(dir, "broken", "workflow \"broken\" {\n  oops\n}\n")
+    WorkflowCatalog.scan(dir)
+
+    # Only the file that parsed is published; the broken one is missing from
+    # the published set and shows up in the error set instead.
+    assert {:ok, _workflow} = WorkflowCatalog.workflow("w")
+    assert {:error, :not_found} == WorkflowCatalog.workflow("broken")
+
+    assert {:ok, %{name: "broken", file: "broken.sym"} = diagnostic} = WorkflowCatalog.error("broken")
+    for field <- [:line, :column] do
+      position = Map.fetch!(diagnostic, field)
+      assert is_integer(position) and position >= 1
+    end
+    assert is_binary(diagnostic.message)
+
+    # No error is recorded for the healthy file, so `errors/0` lists just the
+    # broken one.
+    assert {:error, :not_found} == WorkflowCatalog.error("w")
+    assert ["broken"] == Enum.map(WorkflowCatalog.errors(), & &1.name)
+  end
+
+  test "a recorded error clears when the file parses again", %{dir: dir} do
+    write_sym!(dir, "w", "workflow \"w\" {\n  oops\n}\n")
+    WorkflowCatalog.scan(dir)
+    assert {:ok, _diagnostic} = WorkflowCatalog.error("w")
+
+    write_sym!(dir, "w", ~s|workflow "w" on manual { a <- exec "./x.sh" }|)
+    WorkflowCatalog.scan(dir)
+    assert {:error, :not_found} == WorkflowCatalog.error("w")
+    assert {:ok, _workflow} = WorkflowCatalog.workflow("w")
+  end
+
+  test "deleting a broken file retires its recorded error", %{dir: dir} do
+    write_sym!(dir, "broken", "workflow \"broken\" {\n  oops\n}\n")
+    WorkflowCatalog.scan(dir)
+    assert {:ok, _diagnostic} = WorkflowCatalog.error("broken")
+
+    dir |> Path.join("broken.sym") |> File.rm!()
+    WorkflowCatalog.scan(dir)
+    assert {:error, :not_found} == WorkflowCatalog.error("broken")
+    assert [] == WorkflowCatalog.errors()
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir_web/components/ir_graph_test.exs b/packages/symphony/elixir/test/symphony_elixir_web/components/ir_graph_test.exs
new file mode 100644
index 000000000..c0dd27424
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir_web/components/ir_graph_test.exs
@@ -0,0 +1,393 @@
+defmodule SymphonyElixirWeb.Components.IRGraphTest do
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixirWeb.Components.IRGraph
+
+  # Build a minimal node map matching the shape IR.View.render_node/1 produces.
+  # Named mk_node to avoid conflicting with Kernel.node/1.
+  defp mk_node(id, opts \\ []) do
+    # Overridable fields and their defaults; every other key in `opts` is
+    # ignored, and the label defaults to the node id.
+    defaults = [kind: "exec", state: "pending", deps: [], label: id]
+    fields = Keyword.merge(defaults, Keyword.take(opts, Keyword.keys(defaults)))
+
+    %{
+      "id" => id,
+      "kind" => fields[:kind],
+      "state" => fields[:state],
+      "deps" => fields[:deps],
+      "label" => fields[:label],
+      "envelope" => nil,
+      "attempts" => [],
+      "output" => nil,
+      "updated_at" => nil
+    }
+  end
+
+  # Builds an agent node on top of mk_node/2: the label defaults to the skill
+  # name (itself defaulting to the id) and "envelope" holds the engine settings.
+  defp mk_agent(id, engine, opts \\ []) do
+    label = Keyword.get(opts, :skill, id)
+    envelope_keys = [:model, :effort, :permissions, :location]
+
+    # Envelope keys are copied from `opts` one by one; options that are
+    # missing or nil are left out of the envelope altogether.
+    envelope =
+      Enum.reduce(envelope_keys, %{"engine" => engine}, fn key, acc ->
+        maybe_put(acc, Atom.to_string(key), Keyword.get(opts, key))
+      end)
+
+    id
+    |> mk_node(Keyword.merge([kind: "agent", label: label], opts))
+    |> Map.put("envelope", envelope)
+  end
+
+  # Stores `value` under `key` unless it is nil.
+  defp maybe_put(map, _key, value) when is_nil(value), do: map
+  defp maybe_put(map, key, value), do: Map.put(map, key, value)
+
+  describe "layout/1 layer assignment" do
+    test "a root node with no deps is in layer 0" do
+      rendered = IRGraph.layout([mk_node("a")]).nodes
+      [root] = Enum.reject(rendered, fn n -> n.state_class == "gtrigger" end)
+      assert root.id == "a"
+      # pad_x (30) is the x position given to layer 0 nodes.
+      assert root.x == 30
+    end
+
+    test "a -> b places a in layer 0 and b in layer 1" do
+      %{nodes: rendered} = IRGraph.layout([mk_node("a"), mk_node("b", deps: ["a"])])
+      placed = Map.new(rendered, fn n -> {n.id, n} end)
+
+      assert placed["a"].x < placed["b"].x
+    end
+
+    test "a -> b, a -> c, b -> d places roots in layer 0 and d in the last layer" do
+      graph = [
+        mk_node("a"),
+        mk_node("b", deps: ["a"]),
+        mk_node("c", deps: ["a"]),
+        mk_node("d", deps: ["b"])
+      ]
+
+      %{nodes: rendered} = IRGraph.layout(graph)
+      placed = Map.new(rendered, fn n -> {n.id, n} end)
+
+      # Layer 0: a is the only root.
+      root_x = placed["a"].x
+      # Layer 1: b and c both depend on a.
+      b_x = placed["b"].x
+      c_x = placed["c"].x
+      # Layer 2: d depends on b.
+      d_x = placed["d"].x
+
+      assert root_x < b_x
+      assert c_x == b_x
+      assert b_x < d_x
+    end
+
+    test "emits one edge per dep" do
+      graph = [
+        mk_node("a"),
+        mk_node("b", deps: ["a"]),
+        mk_node("c", deps: ["a"]),
+        mk_node("d", deps: ["b"])
+      ]
+
+      %{edges: edges} = IRGraph.layout(graph)
+      # One edge each for a->b, a->c and b->d.
+      assert length(edges) == 3
+    end
+
+    test "parallel independent roots all land in layer 0" do
+      roots = Enum.map(["x", "y", "z"], &mk_node/1)
+      %{nodes: rendered} = IRGraph.layout(roots)
+      placed = Map.new(rendered, fn n -> {n.id, n} end)
+
+      # Every root shares one x position.
+      assert placed["x"].x == placed["y"].x
+      assert placed["y"].x == placed["z"].x
+    end
+
+    test "an empty list with no trigger returns a minimal viewbox and no nodes or edges" do
+      empty = IRGraph.layout([])
+      assert String.contains?(empty.viewbox, "0 0")
+      assert empty.nodes == []
+      assert empty.edges == []
+    end
+
+    test "an empty list with a trigger returns a single trigger node" do
+      trigger_only = IRGraph.layout([], "manual")
+      assert [trigger] = trigger_only.nodes
+      assert trigger.state_class == "gtrigger"
+      assert trigger.label == "manual"
+      assert trigger_only.edges == []
+    end
+
+    test "dangling dep edges (dep not in graph) are silently skipped" do
+      orphan = mk_node("b", deps: ["ghost"])
+      %{nodes: rendered, edges: edges} = IRGraph.layout([orphan])
+      # "ghost" is not in the graph, so b has no known deps and is a root.
+      assert length(rendered) == 1
+      assert edges == []
+    end
+  end
+
+  describe "layout/1 state classes" do
+    test "succeeded state produces succeeded class" do
+      layout = IRGraph.layout([mk_node("a", state: "succeeded")])
+      assert [rendered] = layout.nodes
+      assert rendered.state_class == "succeeded"
+    end
+
+    test "running state produces running class" do
+      layout = IRGraph.layout([mk_node("a", state: "running")])
+      assert [rendered] = layout.nodes
+      assert rendered.state_class == "running"
+    end
+
+    test "gate kind gets gate prefix in state class" do
+      layout = IRGraph.layout([mk_node("g", kind: "gate", state: "pending")])
+      assert [rendered] = layout.nodes
+      assert rendered.state_class == "gate pending"
+    end
+
+    test "unknown state falls back to pending class" do
+      layout = IRGraph.layout([mk_node("a", state: "upstream_failed")])
+      assert [rendered] = layout.nodes
+      assert rendered.state_class == "pending"
+    end
+  end
+
+  describe "layout/1 labels" do
+    test "node label comes from the label field" do
+      layout = IRGraph.layout([mk_node("agent-0", label: "my_skill")])
+      assert [rendered] = layout.nodes
+      assert rendered.label == "my_skill"
+    end
+
+    test "node id is exposed separately from label" do
+      layout = IRGraph.layout([mk_node("agent-0", label: "my_skill")])
+      assert [rendered] = layout.nodes
+      assert rendered.id == "agent-0"
+    end
+
+    test "node without label field falls back to the id" do
+      unlabeled = Map.delete(mk_node("fallback-id"), "label")
+      layout = IRGraph.layout([unlabeled])
+      assert [rendered] = layout.nodes
+      assert rendered.label == "fallback-id"
+    end
+  end
+
+  describe "layout/1 detail lines for agent nodes" do
+    test "agent node with full envelope produces engine/model, effort, permissions, location lines" do
+      envelope_opts = [
+        model: "gpt-5.5",
+        effort: "high",
+        permissions: "danger_full_access",
+        location: "ixvm",
+        skill: "my_skill"
+      ]
+
+      layout = IRGraph.layout([mk_agent("agent-0", "codex", envelope_opts)])
+      assert [%{detail_lines: lines}] = layout.nodes
+
+      # Each envelope field must show up as its own detail line.
+      for expected <- ["codex gpt-5.5", "high", "danger_full_access", "ixvm"] do
+        assert expected in lines
+      end
+    end
+
+    test "agent node without model shows engine only in first detail line" do
+      bare_agent = mk_agent("agent-0", "codex", skill: "s")
+      layout = IRGraph.layout([bare_agent])
+      assert [rendered] = layout.nodes
+      assert "codex" in rendered.detail_lines
+    end
+
+    test "exec node detail shows exec kind" do
+      layout = IRGraph.layout([mk_node("e", kind: "exec", label: "./run.sh")])
+      assert [rendered] = layout.nodes
+      assert rendered.detail_lines == ["exec"]
+    end
+
+    test "gate node detail shows gate" do
+      layout = IRGraph.layout([mk_node("g", kind: "gate")])
+      assert [rendered] = layout.nodes
+      assert rendered.detail_lines == ["gate"]
+    end
+
+    test "agent location annotates the fallback when effective placement differs" do
+      agent = mk_agent("agent-0", "codex", location: "ixvm", skill: "s")
+      fallback = %{"declared" => "ixvm", "effective" => "host"}
+      layout = IRGraph.layout([agent], "manual", fallback)
+      rendered = Enum.find(layout.nodes, fn n -> n.id == "agent-0" end)
+      assert "ixvm (fallback host)" in rendered.detail_lines
+      refute "ixvm" in rendered.detail_lines
+    end
+
+    test "agent location shows no fallback when effective matches the declared type" do
+      agent = mk_agent("agent-0", "codex", location: "host:hil-compute-2", skill: "s")
+      same_type = %{"declared" => "host:hil-compute-2", "effective" => "host"}
+      layout = IRGraph.layout([agent], "manual", same_type)
+      rendered = Enum.find(layout.nodes, fn n -> n.id == "agent-0" end)
+      assert "host:hil-compute-2" in rendered.detail_lines
+    end
+  end
+
+  describe "layout/1 trigger node" do
+    test "trigger produces a gtrigger node in the output" do
+      layout = IRGraph.layout([mk_node("a")], "cron 30 * * * *")
+      triggers = Enum.filter(layout.nodes, fn n -> n.state_class == "gtrigger" end)
+
+      assert [trigger] = triggers
+      assert trigger.label == "cron 30 * * * *"
+    end
+
+    test "trigger node is positioned to the left of root real nodes" do
+      %{nodes: rendered} = IRGraph.layout([mk_node("a")], "manual")
+      placed = Map.new(rendered, fn n -> {n.id, n} end)
+
+      assert placed["__trigger__"].x < placed["a"].x
+    end
+
+    test "trigger produces edges to each root node" do
+      independent = [mk_node("a"), mk_node("b")]
+      %{edges: edges} = IRGraph.layout(independent, "manual")
+      # Neither a nor b declares a dep, so both are roots: 2 roots => 2 trigger edges.
+      assert length(edges) == 2
+    end
+
+    test "trigger does not add extra edges to non-root nodes" do
+      # b depends on a, so a is the only root: one trigger edge to a plus the
+      # dep edge a->b makes 2 in total.
+      chain = [mk_node("a"), mk_node("b", deps: ["a"])]
+      %{edges: edges} = IRGraph.layout(chain, "cron 0 * * * *")
+      assert length(edges) == 2
+    end
+
+    test "layout without trigger has no gtrigger nodes" do
+      chain = [mk_node("a"), mk_node("b", deps: ["a"])]
+      %{nodes: rendered} = IRGraph.layout(chain)
+      triggers = Enum.filter(rendered, fn n -> n.state_class == "gtrigger" end)
+      assert triggers == []
+    end
+  end
+
+  describe "layout box sizing" do
+    test "node width grows to fit a long label so it does not spill" do
+      long_trigger = "cron 0 0,5,10,15,20 * * *"
+      %{node_w: node_w} = IRGraph.layout([mk_node("a")], long_trigger)
+      # Regression for the graph-spillage bug: the rect has to be at least as
+      # wide as the long trigger label plus padding, so the text stays inside.
+      assert node_w >= String.length(long_trigger) * 7 + 20
+    end
+
+    test "node height grows to fit the full envelope block" do
+      full_agent =
+        mk_agent("agent-0", "codex",
+          model: "gpt-5.5",
+          effort: "high",
+          permissions: "danger_full_access",
+          location: "ixvm",
+          skill: "idiomatic"
+        )
+
+      %{node_h: node_h} = IRGraph.layout([full_agent])
+      # The box has to hold the label, the id and four envelope detail lines.
+      assert node_h >= 44 + 3 * 13 + 6
+    end
+  end
+
+  describe "layout/1 single-node no-stretch" do
+    test "single node layout natural_width is bounded (not stretched to fill)" do
+      %{natural_width: width} = IRGraph.layout([mk_node("a")])
+      # Expected natural width: two pad_x margins plus one node width, far
+      # below a typical screen width. Staying under 400 shows the layout is
+      # not stretched to fill its card.
+      assert width < 400
+    end
+
+    test "single node with trigger natural_width is bounded" do
+      %{natural_width: width} = IRGraph.layout([mk_node("a")], "manual")
+      assert width < 600
+    end
+
+    test "viewBox width equals natural_width for single-node layout" do
+      %{viewbox: "0 0 " <> size, natural_width: natural_width} = IRGraph.layout([mk_node("a")])
+      # The first field after the "0 0 " origin is the viewBox width.
+      [width_text | _] = String.split(size, " ")
+      {viewbox_width, _} = Integer.parse(width_text)
+      assert viewbox_width == natural_width
+    end
+  end
+
+  describe "layout/1 multi-node trigger -> route -> skill" do
+    test "three-layer trigger-route-skill graph lays out left-to-right" do
+      # route-0 has no deps (a root); skill-0 depends on route-0.
+      route = mk_agent("route-0", "codex", skill: "route", deps: [])
+      skill = mk_agent("skill-0", "codex", skill: "idiomatic", deps: ["route-0"])
+
+      %{nodes: rendered} = IRGraph.layout([route, skill], "cron 30 * * * *")
+      placed = Map.new(rendered, fn n -> {n.id, n} end)
+
+      # x must strictly increase along the chain
+      # trigger -> route-0 -> skill-0.
+      assert placed["__trigger__"].x < placed["route-0"].x
+      assert placed["route-0"].x < placed["skill-0"].x
+    end
+
+    test "three-layer graph has trigger edge plus dep edge (2 total)" do
+      route = mk_agent("route-0", "codex", skill: "route")
+      skill = mk_agent("skill-0", "codex", skill: "idiomatic", deps: ["route-0"])
+
+      %{edges: edges} = IRGraph.layout([route, skill], "cron 30 * * * *")
+
+      # Expected edges: one from the trigger to route-0 and the dep edge
+      # route-0->skill-0.
+      assert length(edges) == 2
+    end
+  end
+
+  describe "layout/1 edge path format" do
+    test "each edge has a non-empty d attribute starting with M" do
+      %{edges: edges} = IRGraph.layout([mk_node("a"), mk_node("b", deps: ["a"])])
+      assert [%{d: path}] = edges
+      assert String.starts_with?(path, "M")
+    end
+  end
+
+  describe "single cron-triggered agent with full envelope" do
+    test "layout contains trigger label, skill name, engine+model, effort, permissions, location" do
+      cron = "cron 30 * * * *"
+
+      full_agent =
+        mk_agent("agent-0", "codex",
+          model: "gpt-5.5",
+          effort: "high",
+          permissions: "danger_full_access",
+          location: "ixvm",
+          skill: "idiomatic"
+        )
+
+      %{nodes: rendered} = IRGraph.layout([full_agent], cron)
+      placed = Map.new(rendered, fn n -> {n.id, n} end)
+
+      # The trigger node is labelled with the cron expression.
+      assert placed["__trigger__"].label == cron
+
+      # The agent's primary label is the skill name, while its id (the
+      # secondary line) stays distinct from that label.
+      agent = placed["agent-0"]
+      assert agent.label == "idiomatic"
+      assert agent.id == "agent-0"
+
+      # The envelope shows up as engine+model, effort, permissions, location.
+      for expected <- ["codex gpt-5.5", "high", "danger_full_access", "ixvm"] do
+        assert expected in agent.detail_lines
+      end
+    end
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir_web/ir_run_controller_test.exs b/packages/symphony/elixir/test/symphony_elixir_web/ir_run_controller_test.exs
new file mode 100644
index 000000000..8eac8b670
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir_web/ir_run_controller_test.exs
@@ -0,0 +1,234 @@
+defmodule SymphonyElixirWeb.IRRunControllerTest do
+  use ExUnit.Case, async: false
+  import Plug.Test
+  import Plug.Conn
+
+  alias SymphonyElixir.DSL.{Parser, Schema}
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Node, RunGraph, Store}
+
+  @opts SymphonyElixirWeb.Endpoint.init([])
+
+  # The controller reads the IR store at its default dir
+  # (Config.get().runs_dir/ir). Clean it between tests so listings are
+  # deterministic.
+  setup do
+    # Operator routes resolve a run name through Runtime.Registry, so it has
+    # to exist; a run that is not registered then yields the :noproc the
+    # controller translates to 409. Start it if the Application is not up.
+    if is_nil(Process.whereis(SymphonyElixir.Runtime.Registry)) do
+      start_supervised!({Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry})
+    end
+
+    # The create route looks a workflow up in WorkflowCatalog's ETS table and
+    # starts it under Runtime.Supervisor. Bring these up when the Application
+    # is not running (auto_start: false in test).
+    ensure_workflow_catalog_table()
+
+    if is_nil(Process.whereis(SymphonyElixir.TaskSupervisor)) do
+      start_supervised!({Task.Supervisor, name: SymphonyElixir.TaskSupervisor})
+    end
+
+    if is_nil(Process.whereis(SymphonyElixir.Runtime.Supervisor)) do
+      start_supervised!(SymphonyElixir.Runtime.Supervisor)
+    end
+
+    ir_dir = Path.join(SymphonyElixir.Config.get().runs_dir, "ir")
+    File.rm_rf(ir_dir)
+    File.mkdir_p!(ir_dir)
+    :ok
+  end
+
+  # The catalog table is created by the WorkflowCatalog GenServer at boot,
+  # which test_helper does not start. Create it here so put_workflow/1 and
+  # the create route can read it, and reset its rows each test.
+  defp ensure_workflow_catalog_table do
+    table = :symphony_workflows
+
+    # Absent table: create it. Existing table: drop the rows an earlier test left.
+    case :ets.whereis(table) do
+      :undefined -> :ets.new(table, [:named_table, :public, read_concurrency: true])
+      _tid -> :ets.delete_all_objects(table)
+    end
+  end
+
+  defp put_workflow(name, source) do
+    {:ok, %{name: parsed_name, trigger: trigger} = ast} = Parser.parse(source)
+    row = %{name: parsed_name || name, ast: ast, trigger: trigger, source: source, hash: :crypto.hash(:sha256, source)}
+    :ets.insert(:symphony_workflows, {name, row})
+  end
+
+  defp persist_run(run_id, status) do
+    base = Node.new(id: "a", ast_origin: {:exec, "a"}, kind: :exec, inputs: %{})
+    finished = %{base | state: :succeeded, output: %{"v" => 1}}
+    :ok = run_id |> RunGraph.new("hash", nil) |> RunGraph.put_nodes([finished]) |> Map.put(:status, status) |> Store.persist()
+  end
+
+  defp get(path) do
+    SymphonyElixirWeb.Endpoint.call(conn(:get, path), @opts)
+  end
+
+  defp post(path) do
+    SymphonyElixirWeb.Endpoint.call(put_req_header(conn(:post, path), "content-type", "application/json"), @opts)
+  end
+
+  defp post(path, body) do
+    encoded = Jason.encode!(body)
+    request = conn(:post, path, encoded)
+    json_request = put_req_header(request, "content-type", "application/json")
+    SymphonyElixirWeb.Endpoint.call(json_request, @opts)
+  end
+
+  test "GET /api/v1/ir/schema returns the runtime enum vocabulary" do
+    assert %{status: 200, resp_body: raw} = get("/api/v1/ir/schema")
+    schema = Jason.decode!(raw)
+
+    # The endpoint serves the runtime's accessors verbatim, with atoms
+    # rendered as strings, so the form's option lists match what a turn
+    # accepts. Expected values come from the accessors rather than a second
+    # hardcoded list, which keeps this test from becoming one more place
+    # where the vocabulary can drift.
+    assert schema["engines"] == strings(Envelope.engines())
+    assert schema["permissions"] == strings(Envelope.permission_levels())
+    assert "agent" in schema["node_kinds"]
+    assert "manual" in schema["trigger_kinds"]
+  end
+
+  test "schema enums, struct-accepted values, and the API payload do not drift" do
+    # ENG-1825's "the UI cannot drift from the runtime" pillar. Three sources
+    # must name the same vocabulary or the form offers options a turn rejects:
+    #   1. the accessors the schema map reads (what the form renders),
+    #   2. the values Envelope.from_map/1 actually accepts (what a turn takes),
+    #   3. the JSON the /schema endpoint serves (what ships over the wire).
+    # A value added to one but not another turns this red. The generated
+    # @type unions keep Dialyzer in agreement with leg 2 at compile time;
+    # this test covers the runtime legs Dialyzer cannot see.
+    schema = Schema.to_map()
+    api = "/api/v1/ir/schema" |> get() |> Map.fetch!(:resp_body) |> Jason.decode!()
+
+    # engines: every listed engine is accepted with an engine-agreeing model; an off-list value is rejected.
+    assert schema.engines == Envelope.engines()
+    assert api["engines"] == strings(Envelope.engines())
+
+    for engine <- Envelope.engines() do
+      assert {:ok, %{engine: ^engine}} =
+               Envelope.from_map(%{"engine" => engine, "model" => model_for(engine)})
+    end
+
+    assert {:error, {:invalid_engine, _}} =
+             Envelope.from_map(%{"engine" => :nonsense, "model" => "m"})
+
+    # efforts: every listed effort is accepted under :codex; an off-list value is rejected.
+    assert schema.efforts == Envelope.efforts()
+    assert api["efforts"] == strings(Envelope.efforts())
+
+    for effort <- Envelope.efforts() do
+      assert {:ok, %{effort: ^effort}} =
+               Envelope.from_map(%{"engine" => :codex, "model" => "m", "effort" => effort})
+    end
+
+    assert {:error, {:invalid_effort, _}} =
+             Envelope.from_map(%{"engine" => :codex, "model" => "m", "effort" => :nope})
+
+    # permissions: every listed level is accepted under :codex; an off-list value is rejected.
+    assert schema.permissions == Envelope.permission_levels()
+    assert api["permissions"] == strings(Envelope.permission_levels())
+
+    for perm <- Envelope.permission_levels() do
+      assert {:ok, %{permissions: ^perm}} =
+               Envelope.from_map(%{"engine" => :codex, "model" => "m", "permissions" => perm})
+    end
+
+    assert {:error, {:invalid_permissions, _}} =
+             Envelope.from_map(%{"engine" => :codex, "model" => "m", "permissions" => :nope})
+
+    # locations: the bare placement tags the form offers (payload-carriers
+    # supply their payload separately, so only the tag list is the shared axis).
+    assert schema.locations == Envelope.locations()
+    assert api["locations"] == strings(Envelope.locations())
+  end
+
+  defp strings(atoms), do: for(atom <- atoms, do: Atom.to_string(atom))
+
+  # Returns a model name that agrees with the given engine: check_engine_model_agree
+  # rejects a Claude model under :codex and a non-Claude model under :claude.
+  defp model_for(:codex), do: "gpt-5.3-codex"
+  defp model_for(:claude), do: "claude-opus-4-8"
+
+  test "GET /api/v1/ir/runs lists persisted run summaries" do
+    persist_run("run_a", :succeeded)
+    persist_run("run_b", :failed)
+
+    assert %{status: 200, resp_body: raw} = get("/api/v1/ir/runs")
+    %{"runs" => runs} = Jason.decode!(raw)
+
+    assert Enum.map(runs, & &1["run_id"]) == ["run_a", "run_b"]
+    failed = Enum.find(runs, fn run -> run["run_id"] == "run_b" end)
+    assert failed["status"] == "failed"
+  end
+
+  test "GET /api/v1/ir/runs/:id returns the full detail" do
+    persist_run("run_detail", :succeeded)
+
+    assert %{status: 200, resp_body: raw} = get("/api/v1/ir/runs/run_detail")
+    detail = Jason.decode!(raw)
+
+    assert detail["run_id"] == "run_detail"
+    assert [only_node] = detail["nodes"]
+    assert only_node["id"] == "a"
+    assert only_node["output"] == %{"v" => 1}
+  end
+
+  test "GET an unknown run returns 404" do
+    response = get("/api/v1/ir/runs/nope")
+    assert response.status == 404
+    assert %{"error" => "run not found"} == Jason.decode!(response.resp_body)
+  end
+
+  test "POST /api/v1/ir/runs starts a run from a workflow name" do
+    put_workflow("demo", ~s|workflow "demo" on manual { a <- agent { engine: codex, model: "m", prompt: inline "go" } }|)
+
+    created = post("/api/v1/ir/runs", %{"workflow" => "demo"})
+    assert created.status == 201
+
+    body = Jason.decode!(created.resp_body)
+    run_id = body["run_id"]
+    assert is_binary(run_id)
+    assert String.starts_with?(run_id, "demo-")
+
+    # The run is materialized and persisted, so the store must be able to
+    # load it; poll until it shows up.
+    persisted? = fn -> match?({:ok, _}, Store.load(run_id)) end
+    assert eventually(persisted?)
+  end
+
+  test "POST /api/v1/ir/runs for an unknown workflow returns 404" do
+    assert %{status: 404, resp_body: raw} = post("/api/v1/ir/runs", %{"workflow" => "nope"})
+    %{"error" => message} = Jason.decode!(raw)
+    assert message =~ "workflow_not_found"
+  end
+
+  test "POST /api/v1/ir/runs without a workflow field returns 422" do
+    assert %{status: 422, resp_body: raw} = post("/api/v1/ir/runs", %{})
+    %{"error" => message} = Jason.decode!(raw)
+    assert message =~ "workflow"
+  end
+
+  defp eventually(fun, attempts \\ 50) do
+    Enum.any?(0..attempts, fn attempt ->
+      # Sleep 20 ms between polls, but not before the first one.
+      if attempt > 0, do: Process.sleep(20)
+      fun.()
+    end)
+  end
+
+  test "operator action on a run with no live process returns 409" do
+    # Only the persisted record exists: no Runtime GenServer is alive for this
+    # run, so cancel has no process to reach and must answer 409, not 500.
+    persist_run("run_dead", :failed)
+
+    assert %{status: 409, resp_body: raw} = post("/api/v1/ir/runs/run_dead/cancel")
+    %{"error" => message} = Jason.decode!(raw)
+    assert message =~ "no live process"
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir_web/ir_runs_live_test.exs b/packages/symphony/elixir/test/symphony_elixir_web/ir_runs_live_test.exs
new file mode 100644
index 000000000..41e0768da
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir_web/ir_runs_live_test.exs
@@ -0,0 +1,294 @@
+defmodule SymphonyElixirWeb.IRRunsLiveTest do
+  @moduledoc """
+  Phase 5 tests: the :show LiveView renders the graph SVG, the summary dl,
+  and action buttons that drive Runtime operator calls.
+  """
+
+  use ExUnit.Case, async: false
+
+  import Phoenix.ConnTest
+  import Phoenix.LiveViewTest
+
+  @endpoint SymphonyElixirWeb.Endpoint
+
+  alias SymphonyElixir.Engine.Envelope
+  alias SymphonyElixir.IR.{Node, RunGraph, Store}
+  alias SymphonyElixir.Runtime
+
+  # A fake EngineClient whose `:block` instruction sleeps for 30 s, keeping the
+  # run :running while the test exercises operator actions. async: false and a
+  # suite-specific named table keep concurrently running suites from interfering.
+  defmodule FakeEngine do
+    @behaviour SymphonyElixir.Runtime.EngineClient
+
+    @table :ir_runs_live_fake
+
+    def setup do
+      if :ets.whereis(@table) == :undefined do
+        :ets.new(@table, [:named_table, :public, :set])
+      end
+
+      :ets.delete_all_objects(@table)
+      :ok
+    end
+
+    def program(node_id, instruction), do: :ets.insert(@table, {node_id, instruction})
+
+    @impl true
+    def run_node(%Node{id: id}, _opts) do
+      case :ets.lookup(@table, id) do
+        [{^id, :block}] ->
+          # Sleep 30 s so the node outlasts the test and the run stays
+          # :running; the task is expected to die when the runtime stops.
+          Process.sleep(30_000)
+          {:ok, %{}, nil}
+
+        [{^id, {:ok, out}}] ->
+          {:ok, out, nil}
+
+        [{^id, {:error, reason}}] ->
+          {:error, reason, nil}
+
+        [] ->
+          {:ok, %{default: id}, nil}
+      end
+    end
+
+    @impl true
+    def status(_thread_id), do: :unknown
+  end
+
+  setup do
+    FakeEngine.setup()
+
+    unless Process.whereis(SymphonyElixir.Runtime.Registry) do
+      start_supervised!({Registry, keys: :unique, name: SymphonyElixir.Runtime.Registry})
+    end
+
+    unless Process.whereis(SymphonyElixir.TaskSupervisor) do
+      start_supervised!({Task.Supervisor, name: SymphonyElixir.TaskSupervisor})
+    end
+
+    # The LiveView mount calls WorkflowCatalog.workflows/0 and errors/0,
+    # which read two ETS tables. Create both if not present, mirroring the
+    # pattern used in IRRunControllerTest.
+    for table <- [:symphony_workflows, :symphony_workflow_errors] do
+      if :ets.whereis(table) == :undefined do
+        :ets.new(table, [:named_table, :public, read_concurrency: true])
+      else
+        :ets.delete_all_objects(table)
+      end
+    end
+
+    :ok
+  end
+
+  defp agent_node(id, opts \\ []) do
+    Node.new(
+      id: id,
+      ast_origin: {:agent, id},
+      kind: :agent,
+      envelope: %Envelope{engine: :codex, model: "gpt-5.3-codex"},
+      inputs: Keyword.get(opts, :inputs, %{}),
+      state: :pending
+    )
+  end
+
+  defp persist_graph(graph, store_opts \\ []) do
+    :ok = Store.persist(graph, store_opts)
+  end
+
+  defp build_graph(run_id, nodes) do
+    RunGraph.new(run_id, "hash", nil)
+    |> RunGraph.put_nodes(nodes)
+    |> Map.put(:status, :running)
+  end
+
+  test "show page renders the summary dl with trigger and placement" do
+    run_id = "live-show-#{System.unique_integer([:positive])}"
+
+    graph =
+      build_graph(run_id, [agent_node("a"), agent_node("b", inputs: %{"x" => {:node, "a", []}})])
+      |> Map.put(:trigger, %{kind: :manual})
+
+    persist_graph(graph)
+
+    {:ok, view, html} = live(build_conn(), "/ir/" <> run_id)
+
+    # The summary dl should be present.
+    assert html =~ "<dl"
+    assert html =~ "kv"
+    # Trigger is shown.
+    assert html =~ "trigger"
+    assert html =~ "manual"
+    # Placement label is shown (nil placement renders as "-").
+    assert html =~ "placement"
+    # Node counts are shown.
+    assert html =~ "nodes"
+
+    # Verify the LiveView is alive.
+    assert render(view) =~ run_id
+  end
+
+  test "show page renders the graph svg element" do
+    run_id = "live-graph-#{System.unique_integer([:positive])}"
+    graph = build_graph(run_id, [agent_node("inspect"), agent_node("draft", inputs: %{"x" => {:node, "inspect", []}})])
+    persist_graph(graph)
+
+    {:ok, _view, html} = live(build_conn(), "/ir/" <> run_id)
+
+    # The SVG graph component must be present.
+    assert html =~ "<svg"
+    assert html =~ "IR graph"
+    # Node ids appear in the SVG.
+    assert html =~ "inspect"
+    assert html =~ "draft"
+  end
+
+  test "show page renders cancel button for a running run" do
+    run_id = "live-cancel-btn-#{System.unique_integer([:positive])}"
+    graph = build_graph(run_id, [agent_node("a")])
+    persist_graph(graph)
+
+    {:ok, _view, html} = live(build_conn(), "/ir/" <> run_id)
+    assert html =~ "cancel run"
+  end
+
+  test "show page does not render cancel button for a succeeded run" do
+    run_id = "live-no-cancel-#{System.unique_integer([:positive])}"
+
+    graph =
+      build_graph(run_id, [agent_node("a")])
+      |> Map.put(:status, :succeeded)
+
+    persist_graph(graph)
+
+    {:ok, _view, html} = live(build_conn(), "/ir/" <> run_id)
+    refute html =~ "cancel run"
+  end
+
+  test "show page renders retry_failed and rerun buttons for a failed run" do
+    run_id = "live-failed-btns-#{System.unique_integer([:positive])}"
+
+    node = %{agent_node("a") | state: :failed}
+
+    graph =
+      build_graph(run_id, [node])
+      |> Map.put(:status, :failed)
+
+    persist_graph(graph)
+
+    {:ok, _view, html} = live(build_conn(), "/ir/" <> run_id)
+    assert html =~ "retry failed"
+    assert html =~ "rerun"
+  end
+
+  test "cancel button calls Runtime.cancel and run transitions to cancelled" do
+    run_id = "live-cancel-action-#{System.unique_integer([:positive])}"
+
+    # Use the default store dir so the Runtime, the LiveView, and the
+    # assertion all read/write the same location. Cleanup is best-effort
+    # (File.rm): the file may not exist if the test failed before persisting.
+    default_ir_dir = Store.dir()
+    File.mkdir_p!(default_ir_dir)
+    on_exit(fn -> File.rm(Path.join(default_ir_dir, run_id <> ".json")) end)
+
+    # Build a graph with a blocking node so the run stays :running while we cancel.
+    graph = build_graph(run_id, [agent_node("slow")])
+    FakeEngine.program("slow", :block)
+
+    # Start a real runtime using the default store so cancel has a live
+    # process to reach and the store transition is visible.
+    {:ok, _pid} = Runtime.start_link(graph, engine: FakeEngine)
+
+    # Wait briefly for the runtime to persist the initial graph, then load
+    # the LiveView and click cancel.
+    assert eventually(fn ->
+             match?({:ok, _}, Store.load(run_id))
+           end),
+           "run was not persisted by the runtime in time"
+
+    {:ok, view, _html} = live(build_conn(), "/ir/" <> run_id)
+
+    # Click cancel.
+    render_click(view, "cancel")
+
+    # The Runtime should now be cancelled. Poll the store until it reflects it.
+    assert eventually(fn ->
+             case Store.load(run_id) do
+               {:ok, g} -> g.status == :cancelled
+               _ -> false
+             end
+           end),
+           "run #{run_id} did not become cancelled"
+  end
+
+  test "show page renders not-found message for an unknown run" do
+    {:ok, _view, html} = live(build_conn(), "/ir/nonexistent-run-xyz")
+    assert html =~ "run not found"
+  end
+
+  test "index paginates the runs table at 50 rows per page" do
+    # Persist 51 runs into the default store the LiveView reads. They are
+    # created now, so the latest-first sort floats all of them above any
+    # leftover runs: page 1 is exactly the per-page cap and a 51st run spills
+    # onto page 2.
+    default_ir_dir = Store.dir()
+    File.mkdir_p!(default_ir_dir)
+    prefix = "live-page-#{System.unique_integer([:positive])}-"
+
+    run_ids = for i <- 1..51, do: prefix <> String.pad_leading(Integer.to_string(i), 3, "0")
+
+    # Register cleanup before persisting so a failure part-way through the
+    # batch does not leave run files behind in the default store.
+    on_exit(fn ->
+      for run_id <- run_ids, do: File.rm(Path.join(default_ir_dir, run_id <> ".json"))
+    end)
+
+    # Persist in id order (001..051).
+    for run_id <- run_ids, do: persist_graph(build_graph(run_id, [agent_node("a")]))
+
+    {:ok, _view, html} = live(build_conn(), "/")
+    # The pager renders and offers a second page once the cap is exceeded.
+    assert html =~ ~s(class="pager")
+    assert html =~ "page=2"
+    # Page 1 shows exactly the per-page cap, never the full 51.
+    assert count_run_rows(html) == 50
+
+    {:ok, _view2, html2} = live(build_conn(), "/ir?page=2")
+    # Page 2 carries the spillover and stays under the cap.
+    rows2 = count_run_rows(html2)
+    assert rows2 >= 1
+    assert rows2 <= 50
+  end
+
+  # Counts rendered run rows. Every row links to its run under `/ir/<id>`,
+  # while pager links are `?page=N` on the bare path, so occurrences of the
+  # row-link prefix equal the number of rows.
+  defp count_run_rows(html) do
+    length(String.split(html, ~s(href="/ir/))) - 1
+  end
+
+  test "placement_label renders fallback notation when declared != effective" do
+    run_id = "live-placement-#{System.unique_integer([:positive])}"
+
+    graph =
+      build_graph(run_id, [agent_node("a")])
+      |> Map.put(:placement, %{declared: :ixvm, effective: :host})
+
+    persist_graph(graph)
+
+    {:ok, _view, html} = live(build_conn(), "/ir/" <> run_id)
+    assert html =~ "ixvm"
+    assert html =~ "fallback"
+    assert html =~ "host"
+  end
+
+  # Polls `fun` every 20 ms: true as soon as it returns a truthy value, false
+  # once the retry budget is spent, which allows up to `attempts + 1` calls
+  # of `fun` in total.
+  defp eventually(fun, attempts \\ 50) do
+    retry = fn -> Process.sleep(20) && eventually(fun, attempts - 1) end
+    if fun.(), do: true, else: attempts != 0 && retry.()
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir_web/markdown_test.exs b/packages/symphony/elixir/test/symphony_elixir_web/markdown_test.exs
new file mode 100644
index 000000000..9c46d0aa4
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir_web/markdown_test.exs
@@ -0,0 +1,64 @@
+defmodule SymphonyElixirWeb.MarkdownTest do
+  @moduledoc """
+  The dashboard lowers skill bodies and codex transcript text from
+  markdown to sanitized HTML. These guard the render-and-sanitize
+  contract: structural markdown becomes HTML, blank input stays empty,
+  and script injection is scrubbed before it reaches a `{:safe, _}`.
+  """
+
+  use ExUnit.Case, async: true
+
+  alias SymphonyElixirWeb.Markdown
+
+  defp render(source) do
+    {:safe, iodata} = Markdown.to_html(source)
+    IO.iodata_to_binary(iodata)
+  end
+
+  test "renders headings, emphasis, lists, and inline code" do
+    html =
+      render("""
+      # Sub tickets
+
+      Split **the work** into `tasks`:
+
+      - first
+      - second
+      """)
+
+    assert html =~ "<h1>"
+    assert html =~ "Sub tickets"
+    assert html =~ "<strong>the work</strong>"
+    assert html =~ ~r{<code[^>]*>tasks</code>}
+    assert html =~ "<li>first</li>"
+  end
+
+  test "renders fenced code blocks" do
+    html =
+      render("""
+      ```
+      mix deps.get
+      ```
+      """)
+
+    assert html =~ "<pre>"
+    assert html =~ "mix deps.get"
+  end
+
+  test "blank and nil input render as empty safe html" do
+    assert Markdown.to_html(nil) == {:safe, ""}
+    assert Markdown.to_html("") == {:safe, ""}
+    assert Markdown.to_html("   \n  ") == {:safe, ""}
+  end
+
+  test "neutralizes raw html so transcript text cannot inject" do
+    html = render("hello <script>alert('x')</script> world")
+
+    # Earmark escapes raw html by default and the sanitizer is a second
+    # line of defense, so no executable script element survives.
+    refute html =~ "<script"
+    assert html =~ "&lt;script&gt;"
+    assert html =~ "hello"
+    assert html =~ "world"
+  end
+end
diff --git a/packages/symphony/elixir/test/symphony_elixir_web/workflows_live_test.exs b/packages/symphony/elixir/test/symphony_elixir_web/workflows_live_test.exs
new file mode 100644
index 000000000..8b808573b
--- /dev/null
+++ b/packages/symphony/elixir/test/symphony_elixir_web/workflows_live_test.exs
@@ -0,0 +1,122 @@
+defmodule SymphonyElixirWeb.WorkflowsLiveTest do
+  @moduledoc """
+  Phase 6 tests: the :index page lists loaded fixture workflows and surfaces
+  broken-.sym diagnostics; the :show page renders the graph SVG for a named
+  workflow.
+  """
+
+  use ExUnit.Case, async: false
+
+  import Phoenix.ConnTest
+  import Phoenix.LiveViewTest
+
+  @endpoint SymphonyElixirWeb.Endpoint
+
+  # Each test seeds the ETS tables WorkflowCatalog exposes so we can test the
+  # LiveView in isolation without starting the GenServer or touching the disk.
+  setup do
+    for table <- [:symphony_workflows, :symphony_workflow_errors] do
+      if :ets.whereis(table) == :undefined do
+        :ets.new(table, [:named_table, :public, read_concurrency: true])
+      else
+        :ets.delete_all_objects(table)
+      end
+    end
+
+    :ok
+  end
+
+  # Minimal valid .sym source for a manual workflow with one exec node.
+  @simple_sym ~s|workflow "inspect" on manual { a <- exec "./run.sh" }|
+
+  # Parses `sym_source`, stores the catalog entry under `name`, and returns it.
+  defp insert_workflow(name, sym_source) do
+    {:ok, ast} = SymphonyElixir.DSL.Parser.parse(sym_source, file: "#{name}.sym")
+    digest = :crypto.hash(:sha256, sym_source)
+    entry = %{name: name, ast: ast, trigger: ast.trigger, source: sym_source, hash: digest}
+    :ets.insert(:symphony_workflows, {name, entry})
+    entry
+  end
+
+  defp insert_error(name) do
+    err = %{name: name, message: "unexpected token", line: 2, column: 5, file: "#{name}.sym"}
+    :ets.insert(:symphony_workflow_errors, {name, err})
+    err
+  end
+
+  test "index page lists a loaded workflow by name and trigger" do
+    insert_workflow("inspect", @simple_sym)
+
+    {:ok, _view, html} = live(build_conn(), "/workflows")
+
+    assert html =~ "inspect"
+    assert html =~ "manual"
+  end
+
+  test "index page links each workflow to its show page" do
+    insert_workflow("inspect", @simple_sym)
+
+    {:ok, _view, html} = live(build_conn(), "/workflows")
+
+    assert html =~ ~s|href="/workflows/inspect"|
+  end
+
+  test "index page shows the empty state when no workflows are loaded" do
+    {:ok, _view, html} = live(build_conn(), "/workflows")
+
+    assert html =~ "no workflows loaded"
+  end
+
+  test "index page shows broken workflows panel when parse errors are present" do
+    insert_workflow("inspect", @simple_sym)
+    insert_error("broken")
+
+    {:ok, _view, html} = live(build_conn(), "/workflows")
+
+    assert html =~ "broken workflows"
+    assert html =~ "broken.sym"
+    assert html =~ "parse error"
+    assert html =~ "unexpected token"
+    # The healthy workflow must still appear.
+    assert html =~ "inspect"
+  end
+
+  test "index page does not show broken panel when there are no errors" do
+    insert_workflow("inspect", @simple_sym)
+
+    {:ok, _view, html} = live(build_conn(), "/workflows")
+
+    refute html =~ "broken workflows"
+  end
+
+  test "show page renders the graph svg for a loaded workflow" do
+    insert_workflow("inspect", @simple_sym)
+
+    {:ok, _view, html} = live(build_conn(), "/workflows/inspect")
+
+    assert html =~ "<svg"
+    assert html =~ "IR graph"
+    # "inspect" is the workflow name; the exec node id in @simple_sym is `a`.
+    assert html =~ "inspect"
+  end
+
+  test "show page renders not-found message for an unknown workflow" do
+    {:ok, _view, html} = live(build_conn(), "/workflows/no-such-workflow")
+
+    assert html =~ "no workflow named"
+    assert html =~ "no-such-workflow"
+    assert html =~ "back to workflows"
+  end
+
+  test "workflows tab is active on index and show pages" do
+    insert_workflow("inspect", @simple_sym)
+
+    {:ok, _view, index_html} = live(build_conn(), "/workflows")
+    assert index_html =~ ~s|class="active"|
+    assert index_html =~ ~s|href="/workflows"|
+
+    {:ok, _view, show_html} = live(build_conn(), "/workflows/inspect")
+    assert show_html =~ ~s|class="active"|
+    assert show_html =~ ~s|href="/workflows"|
+  end
+end
diff --git a/packages/symphony/elixir/test/test_helper.exs b/packages/symphony/elixir/test/test_helper.exs
new file mode 100644
index 000000000..d130199e8
--- /dev/null
+++ b/packages/symphony/elixir/test/test_helper.exs
@@ -0,0 +1,26 @@
+ExUnit.start()
+
+# Boot a Config snapshot with sensible test defaults so any unit test touching
+# Config.get() works without the full Application supervisor running. Tests
+# that need different values can inspect/override the ETS table directly. The
+# scratch root is unique per run and is deleted again when the suite finishes.
+test_root = Path.join(System.tmp_dir!(), "symphony_test_root_#{System.unique_integer([:positive])}")
+File.mkdir_p!(Path.join([test_root, "workflows", "example", "workflows"]))
+File.mkdir_p!(Path.join([test_root, "workflows", "example", "skills"]))
+ExUnit.after_suite(fn _results -> File.rm_rf(test_root) end)
+
+File.write!(Path.join([test_root, "workflows", "example", "repositories.yaml"]), """
+repositories:
+  - name: example
+    owner_repo: example/example
+    default_branch: main
+    primary: true
+""")
+
+System.put_env("SYMPHONY_ROOT", test_root)
+System.put_env("SYMPHONY_WORKFLOW_PACK", "example")
+System.put_env("LINEAR_WORKSPACE_SLUG", "example-org")
+
+{:ok, _config} = SymphonyElixir.Config.start_link([])
+{:ok, _phx_pubsub} = Phoenix.PubSub.Supervisor.start_link(name: SymphonyElixir.PubSub)
+{:ok, _endpoint} = SymphonyElixirWeb.Endpoint.start_link()
diff --git a/packages/symphony/elixir/test/workspace_test.exs b/packages/symphony/elixir/test/workspace_test.exs
new file mode 100644
index 000000000..bddd385fc
--- /dev/null
+++ b/packages/symphony/elixir/test/workspace_test.exs
@@ -0,0 +1,89 @@
+defmodule SymphonyElixir.WorkspaceTest do
+  use ExUnit.Case, async: false
+
+  alias SymphonyElixir.{Config, RepositoryCatalog, Workspace.RepoCloner}
+
+  setup do
+    tmp_root = Path.join(System.tmp_dir!(), "symphony_workspace_test_#{System.unique_integer([:positive])}")
+    source_root = Path.join(tmp_root, "sources")
+    workspaces_dir = Path.join(tmp_root, "workspaces")
+    repositories_file = Path.join(tmp_root, "repositories.yaml")
+
+    File.mkdir_p!(source_root)
+    File.mkdir_p!(workspaces_dir)
+
+    File.write!(repositories_file, """
+    repositories:
+      - name: primary-app
+        owner_repo: example/primary-app
+        default_branch: main
+        primary: true
+      - name: docs
+        owner_repo: example/docs
+        default_branch: main
+        primary: false
+    """)
+
+    local_repos =
+      %Config{repositories_file: repositories_file}
+      |> RepositoryCatalog.all()
+      |> Map.new(fn repo ->
+        {repo.name, init_repo!(Path.join(source_root, repo.name), repo.default_branch)}
+      end)
+
+    config = %Config{
+      primary_repo: Map.fetch!(local_repos, "primary-app"),
+      repo_root: source_root,
+      repositories_file: repositories_file
+    }
+
+    on_exit(fn -> File.rm_rf!(tmp_root) end)
+
+    %{config: config, local_repos: local_repos, workspaces_dir: workspaces_dir}
+  end
+
+  test "creates primary workspace with writable sibling repos", %{
+    config: config,
+    local_repos: local_repos,
+    workspaces_dir: workspaces_dir
+  } do
+    run_root = Path.join(workspaces_dir, "run-1")
+    assert {:ok, workspace} = RepoCloner.clone_all(config, run_root, "run-1")
+
+    assert workspace == Path.join([workspaces_dir, "run-1", "primary-app"])
+    assert File.exists?(Path.join(workspace, "README.md"))
+
+    docs_repo = Path.join([workspaces_dir, "run-1", "docs"])
+    assert File.exists?(Path.join(docs_repo, "README.md"))
+    assert {"symphony/run-1\n", 0} = System.cmd("git", ["-C", docs_repo, "branch", "--show-current"])
+
+    assert {alternate, 0} = System.cmd("git", ["-C", docs_repo, "rev-parse", "--git-path", "objects/info/alternates"])
+    alternate_path = Path.expand(String.trim(alternate), docs_repo)
+    assert File.read!(alternate_path) =~ Path.join(Map.fetch!(local_repos, "docs"), ".git/objects")
+  end
+
+  test "primary repo declares main as default", %{config: config} do
+    assert %{default_branch: "main", primary?: true} =
+             Enum.find(RepositoryCatalog.all(config), & &1.primary?)
+  end
+
+  defp init_repo!(path, branch) do
+    File.mkdir_p!(path)
+    File.write!(Path.join(path, "README.md"), "# #{Path.basename(path)}\n")
+    # Set identity and disable signing explicitly so the host's git config cannot break the commit.
+    git!(path, ["init", "--initial-branch=#{branch}"])
+    git!(path, ["config", "user.name", "Symphony Test"])
+    git!(path, ["config", "user.email", "symphony-test@example.com"])
+    git!(path, ["add", "README.md"])
+    git!(path, ["-c", "commit.gpgsign=false", "commit", "-m", "init"])
+
+    path
+  end
+
+  defp git!(path, args) do
+    case System.cmd("git", ["-C", path] ++ args, stderr_to_stdout: true) do
+      {_output, 0} -> :ok
+      {output, status} -> flunk("git #{Enum.join(args, " ")} failed with #{status}: #{output}")
+    end
+  end
+end
diff --git a/packages/symphony/package.nix b/packages/symphony/package.nix
new file mode 100644
index 000000000..708ac9750
--- /dev/null
+++ b/packages/symphony/package.nix
@@ -0,0 +1,11 @@
+# Registry metadata. The launcher is a flake output (`nix run .#symphony`,
+# `index.packages.<sys>.symphony`, the attr ix's symphony host modules
+# consume) and deliberately not an overlay: nothing inside an image
+# evaluation needs `pkgs.symphony`, and the room-server the symphony-codex
+# image embeds is a separate package (`pkgs.symphony-room-server`, still
+# provided by the pinned `symphony` flake input).
+{
+  id = "symphony";
+  packageSet = true;
+  flake = true;
+}
diff --git a/packages/symphony/workflows/example/repositories.yaml b/packages/symphony/workflows/example/repositories.yaml
new file mode 100644
index 000000000..b060cd22f
--- /dev/null
+++ b/packages/symphony/workflows/example/repositories.yaml
@@ -0,0 +1,5 @@
+repositories:
+  - name: example
+    owner_repo: example/example
+    default_branch: main
+    primary: true
diff --git a/packages/symphony/workflows/example/skills/inspect.md b/packages/symphony/workflows/example/skills/inspect.md
new file mode 100644
index 000000000..4fb274741
--- /dev/null
+++ b/packages/symphony/workflows/example/skills/inspect.md
@@ -0,0 +1,14 @@
+---
+codex_model: gpt-5.3-codex
+reasoning_effort: medium
+sandbox: workspace-write
+approval_policy: never
+tools: []
+---
+
+You are running inside a sample Symphony workflow.
+
+Read the input and inspect the checked-out workspace. Do not push branches,
+open pull requests, mutate external services, or assume any Indexable-specific
+infrastructure exists. Return a concise summary of what you found and what a
+human could do next.
diff --git a/packages/symphony/workflows/example/workflows/inspect.sym b/packages/symphony/workflows/example/workflows/inspect.sym
new file mode 100644
index 000000000..7262fdef3
--- /dev/null
+++ b/packages/symphony/workflows/example/workflows/inspect.sym
@@ -0,0 +1,10 @@
+# A minimal manual-trigger workflow: inspect the workspace and report.
+workflow "inspect" on manual {
+  inspect <- agent {
+    engine: codex
+    model: "gpt-5.3-codex"
+    effort: medium
+    permissions: workspace_write
+    prompt: skill "inspect"
+  }
+}
diff --git a/tests/default.nix b/tests/default.nix
index 38a91810b..0ff72c47b 100644
--- a/tests/default.nix
+++ b/tests/default.nix
@@ -542,6 +542,31 @@ let
       packageNames = map lib.getName config.environment.systemPackages;
     };
 
+  # The symphony control-plane module (modules/services/symphony) evaluated
+  # standalone, the way ix's host modules consume it. `package` only needs a
+  # /bin path shape at eval, so hello stands in for the launcher.
+  symphonyService =
+    let
+      config = evalConfig [
+        {
+          ix.image = {
+            name = "test/symphony-module";
+            tag = "test";
+          };
+          services.symphony = {
+            enable = true;
+            package = pkgs.hello;
+            primaryRepo = "/srv/checkouts/index";
+            environmentFile = "/run/secrets/symphony.env";
+          };
+        }
+      ];
+    in
+    {
+      inherit config;
+      unit = config.systemd.services.symphony;
+    };
+
   pythonAppClosureProbe = ix.writePythonApplication pkgs {
     name = "python-app-closure-probe";
     src = pkgs.writeText "python-app-closure-probe.py" ''
@@ -2987,6 +3012,34 @@ let
       }
     ];
 
+    # The control-plane runtime module that moved in-tree with
+    # packages/symphony. These pin the env contract ix's hil deployment and
+    # the worker module read off the unit, so a refactor that renames an
+    # option or drops the EnvironmentFile pass-through fails here instead of
+    # on a host switch.
+    symphony = [
+      {
+        assertion = symphonyService.unit.environment.SYMPHONY_WORKFLOW_PACK == "example";
+        message = "symphony module should default to the bundled example workflow pack";
+      }
+      {
+        assertion = symphonyService.unit.environment.SYMPHONY_PRIMARY_REPO == "/srv/checkouts/index";
+        message = "symphony module should export the primary repo checkout to the runtime";
+      }
+      {
+        assertion = lib.hasSuffix "/bin/symphony" symphonyService.unit.serviceConfig.ExecStart;
+        message = "symphony module should exec /bin/symphony from the configured package";
+      }
+      {
+        assertion = symphonyService.unit.serviceConfig.EnvironmentFile == "/run/secrets/symphony.env";
+        message = "symphony module should pass the secrets EnvironmentFile through to systemd";
+      }
+      {
+        assertion = !(symphonyService.unit.environment ? SYMPHONY_HOST_USER);
+        message = "symphony module should keep host-placement env unset until hostRuntime.enable";
+      }
+    ];
+
     minecraft = [
       {
         assertion = minecraft.config.ix.image.tag == defaultMinecraftVersion;