coleam00
diff --git a/‎.archon/maintainer-standup/direction.md‎
Lines changed: 18 additions & 0 deletions b/‎.archon/maintainer-standup/direction.md‎
Lines changed: 18 additions & 0 deletions
diff --git a/‎.archon/workflows/defaults/archon-refactor-safely.yaml‎
Lines changed: 2 additions & 2 deletions b/‎.archon/workflows/defaults/archon-refactor-safely.yaml‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎.archon/workflows/maintainer/marketplace-pr-review-and-merge.yaml‎
Lines changed: 28 additions & 2 deletions b/‎.archon/workflows/maintainer/marketplace-pr-review-and-merge.yaml‎
Lines changed: 28 additions & 2 deletions
diff --git a/‎.archon/workflows/test-workflows/e2e-copilot-abort.yaml‎
Lines changed: 14 additions & 0 deletions b/‎.archon/workflows/test-workflows/e2e-copilot-abort.yaml‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎.archon/workflows/test-workflows/e2e-copilot-all-nodes-smoke.yaml‎
Lines changed: 147 additions & 0 deletions b/‎.archon/workflows/test-workflows/e2e-copilot-all-nodes-smoke.yaml‎
Lines changed: 147 additions & 0 deletions
diff --git a/‎.env.example‎
Lines changed: 14 additions & 1 deletion b/‎.env.example‎
Lines changed: 14 additions & 1 deletion
diff --git a/‎CHANGELOG.md‎
Lines changed: 4 additions & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎CLAUDE.md‎
Lines changed: 14 additions & 1 deletion b/‎CLAUDE.md‎
Lines changed: 14 additions & 1 deletion
@@ -26,6 +26,24 @@ This file is **committed and shared by all maintainers**. Edit deliberately —
 - **Not opinionated about the dev environment.** No mandatory editor integrations, framework lock-in, or Docker requirement beyond what users opt into.
 - **Not a workflow marketplace.** Bundled workflows are reference patterns; Archon is not aiming to be a hub for third-party workflow distribution.
 
+## Community providers
+
+Archon ships built-in providers for Claude (`@anthropic-ai/claude-agent-sdk`) and Codex (`@openai/codex-sdk`). Pi (`@mariozechner/pi-coding-agent`) is the reference community provider and sets the pattern others should follow.
+
+**Acceptance criteria** for new community providers:
+
+- **Coding-agent SDK only.** The provider must wrap an existing coding-agent SDK — one that handles file edits, tool use, multi-turn sessions, and planning. Raw LLM API integrations (`chat.completions`-style) are out of scope. Pi already covers ~20 LLM backends via one harness, so single-model wrappers duplicate work that is already done.
+- **Match the Pi pattern.** Structure mirrors `packages/providers/src/community/pi/` — provider class implementing `IAgentProvider`, options translator, event bridge, capability matrix, registered with `builtIn: false`. Tests at parity with the Pi suite (config, options-translator, event-bridge, provider, session-resolver as the baseline).
+- **Docs page.** Add the provider to `packages/docs-web/src/content/docs/getting-started/ai-assistants.md` with setup, capability matrix, and supported config keys.
+
+**Maintenance policy:**
+
+- We accept any provider that meets the criteria above. There is no cap.
+- The contributor and the community maintain the provider. Archon maintainers do not own upstream-SDK breaks for community providers.
+- A community provider that goes non-functional — CI broken, upstream SDK gone, no maintainer response — is marked deprecated and removed in the next minor release unless someone from the community submits a fix.
+
+When citing this policy in a PR comment: `direction.md §community-providers`.
+
 ## Open questions (no stance yet)
 
 These are direction calls we haven't made. PRs that touch these areas should surface the question for explicit decision rather than be silently accepted or rejected. The workflow may add to this list as new questions appear.
 
@@ -117,7 +117,7 @@ nodes:
       - Rationale for each grouping (cohesion, shared dependencies)
     depends_on: [scan-scope]
     context: fresh
-    denied_tools: [Write, Edit, Bash]
+    denied_tools: [Edit, Bash]
 
   # ═══════════════════════════════════════════════════════════════
   # PHASE 3: PLAN REFACTOR — Ordered task list with rollback strategy
@@ -199,7 +199,7 @@ nodes:
       - Format: `bun run format:check`
     depends_on: [analyze-impact]
     context: fresh
-    denied_tools: [Write, Edit, Bash]
+    denied_tools: [Edit, Bash]
 
   # ═══════════════════════════════════════════════════════════════
   # PHASE 4: EXECUTE REFACTOR — Implements the plan with guardrails
 
@@ -276,10 +276,19 @@ nodes:
   # NODE 8: DECIDE — deterministic decision logic (inline Bun script)
   # ═══════════════════════════════════════════════════════════════
 
+  - id: persist-ai-review
+    # bash bridge: in a bash node $ai-review.output is shell-quoted, so a failed
+    # or non-JSON AI verdict (e.g. provider/API error) is written verbatim to a
+    # file instead of being injected raw into the decide script — where it would
+    # otherwise be invalid JS and crash the run at parse time.
+    # The decide node reads the result back from ai-review.json in the
+    # artifacts directory and validates it there.
+    depends_on: [ai-review]
+    # The reference below is deliberately NOT wrapped in extra quotes: the
+    # substituted value is already shell-quoted, so the shell sees one literal
+    # word, and printf '%s' writes it without appending a newline.
+    bash: |
+      printf '%s' $ai-review.output > "$ARTIFACTS_DIR/ai-review.json"
+
   - id: decide
     runtime: bun
     timeout: 10000
-    depends_on: [ai-review, fetch-pr-metadata]
+    depends_on: [persist-ai-review, fetch-pr-metadata]
     script: |
       import { readFileSync, writeFileSync } from 'node:fs';
       import { resolve } from 'node:path';
@@ -292,9 +301,26 @@ nodes:
       const scopeResult = readFileSync(resolve(artifactsDir, '.scope-result'), 'utf8').trim();
 
       const scanResult = $security-scan.output;
-      const aiReview = $ai-review.output;
       const schemaResult = $validate-schema.output;
 
+      // ai-review verdict is read from a file (written by the persist-ai-review
+      // bash bridge) so a failed or non-JSON AI output can't crash this script.
+      let aiReview: { recommendation?: string; reasoning?: string };
+      try {
+        const aiReviewRaw = readFileSync(resolve(artifactsDir, 'ai-review.json'), 'utf8').trim();
+        aiReview = JSON.parse(aiReviewRaw) as { recommendation?: string; reasoning?: string };
+        if (typeof aiReview.recommendation !== 'string') {
+          throw new Error('missing "recommendation" field');
+        }
+      } catch (err) {
+        console.error(
+          `decide: ai-review did not produce a valid structured verdict (${(err as Error).message}). ` +
+            `The AI review step likely failed or was unavailable (e.g. provider/API quota). ` +
+            `Failing safe — not auto-merging. Re-run the marketplace auto-review once the provider is available.`,
+        );
+        process.exit(1);
+      }
+
       const author = prMeta.author.login;
       const isDraft = prMeta.isDraft;
 
 
@@ -0,0 +1,14 @@
+# E2E manual abort test for the GitHub Copilot community provider.
+# What it checks: Ctrl-C propagates through the bridge to session.abort(), and
+#   sendAndWait unwinds cleanly without dangling listeners.
+# How to run (manual only, not for CI): start the workflow, wait for streaming
+#   to begin, then press Ctrl-C.
+name: e2e-copilot-abort
+description: "Manual test: start, then Ctrl-C. Verifies abort wiring."
+provider: copilot
+model: gpt-5-mini
+
+nodes:
+  - id: long
+    prompt: >-
+      Count slowly from 1 to 200, one number per line, with a brief phrase
+      after each number explaining its mathematical significance. Do not skip
+      any numbers.
+    effort: low
+    idle_timeout: 120000
@@ -0,0 +1,147 @@
+# E2E smoke test for the Copilot provider — one node per CI-compatible node type.
+# Coverage:
+#   - AI node types: prompt, command, loop
+#   - deterministic node types: bash, script (bun and uv runtimes)
+#   - DAG features: depends_on / when / trigger_rule / $nodeId.output
+#   - Copilot-specific options: effort, allowed_tools, output_format
+#     (best-effort JSON via prompt augment + 2-tier parser)
+# Not covered: `approval:` — it pauses for human input, which CI cannot give.
+# Auth: `gh auth login` OR `COPILOT_GITHUB_TOKEN`.
+#   `GH_TOKEN` / `GITHUB_TOKEN` additionally need
+#   `assistantConfig.useLoggedInUser: false` to be set.
+#   An active GitHub Copilot subscription is required.
+name: e2e-copilot-all-nodes-smoke
+description: "Copilot provider smoke across every CI-compatible node type plus Copilot-specific options."
+provider: copilot
+model: gpt-5-mini
+
+nodes:
+  # ─── AI node types ──────────────────────────────────────────────────────
+
+  # 1. prompt node — an inline prompt combined with effort and allowed_tools
+  #    (no tool calls). Confirms that reasoningEffort and availableTools=[]
+  #    reach the SDK.
+  - id: prompt-node
+    prompt: >-
+      Reply with exactly the single word 'ok' and nothing else.
+    allowed_tools: []
+    effort: low
+    idle_timeout: 30000
+
+  # 2. command node — runs the named command file
+  #    .archon/commands/e2e-echo-command.md, which echoes $ARGUMENTS (the
+  #    workflow invocation message) back.
+  - id: command-node
+    command: 'e2e-echo-command'
+    idle_timeout: 30000
+    allowed_tools: []
+
+  # 3. loop node — repeats an AI prompt until the completion signal appears.
+  #    max_iterations: 2 caps the loop so a misbehaving model can't hang CI.
+  - id: loop-node
+    loop:
+      prompt: >-
+        Reply with exactly 'DONE' and nothing else.
+      until: DONE
+      max_iterations: 2
+    allowed_tools: []
+    effort: low
+    idle_timeout: 60000
+
+  # 4. output_format — exercises Copilot's best-effort structured output path:
+  #    the prompt is augmented with the schema and the result text goes
+  #    through a 2-tier JSON parser. Copilot/Pi differ here from the native
+  #    JSON mode of Claude/Codex, so only an E2E test catches
+  #    "real model drifted around the schema".
+  - id: structured-node
+    prompt: |
+      Return a JSON object with two fields, no fences and no prose:
+        - "status": always "ok" (string)
+        - "value":  always 42 (number)
+    output_format:
+      type: object
+      properties:
+        status:
+          type: string
+        value:
+          type: number
+      required:
+        - status
+        - value
+    allowed_tools: []
+    effort: low
+    idle_timeout: 30000
+
+  # ─── Deterministic node types (no AI) ───────────────────────────────────
+
+  # 5. bash node — a shell command that prints JSON, which is what enables
+  #    $nodeId.output.status dot-access downstream.
+  - id: bash-json-node
+    bash: |-
+      echo '{"status":"ok"}'
+
+  # 6. script node on the bun runtime (TypeScript/JavaScript).
+  - id: script-bun-node
+    runtime: bun
+    script: echo-args
+    timeout: 30000
+
+  # 7. script node on the uv runtime (Python).
+  - id: script-python-node
+    runtime: uv
+    script: echo-py
+    timeout: 30000
+
+  # ─── DAG features ───────────────────────────────────────────────────────
+
+  # 8. depends_on + $nodeId.output substitution.
+  #    The reference sits outside any surrounding quotes on purpose: in a bash
+  #    node the substituted value is already wrapped in single quotes by
+  #    shellQuote(). Nesting it inside another '...' string would close the
+  #    outer quote early and leave the model's text to be parsed as shell.
+  - id: downstream
+    bash: 'echo "downstream got:" $prompt-node.output'
+    depends_on: [prompt-node]
+
+  # 9. when — conditional gate using JSON dot-access on the bash node's JSON
+  #    output.
+  - id: gated
+    depends_on: [bash-json-node]
+    when: "$bash-json-node.output.status == 'ok'"
+    bash: echo 'gated-ok'
+
+  # 10. when — the same kind of gate, this time on AI structured output;
+  #     proves output_format parsed and dot-access works on the resulting
+  #     object.
+  - id: structured-check
+    depends_on: [structured-node]
+    when: "$structured-node.output.status == 'ok'"
+    bash: 'echo "structured.status=$structured-node.output.status"'
+
+  # 11. trigger_rule — joins several dependencies with all_success semantics.
+  - id: merge
+    bash: echo 'merge-ok'
+    depends_on:
+      - downstream
+      - gated
+      - structured-check
+      - script-bun-node
+      - script-python-node
+    trigger_rule: all_success
+
+  # ─── Final assertion ────────────────────────────────────────────────────
+
+  # 12. Verify every upstream node produced non-empty output, including
+  #     dot-access on the structured-output node (proves output_format
+  #     parsed and downstream consumers can index into it).
+  #     Note: each output reference is handed to check() WITHOUT surrounding
+  #     double quotes. shellQuote() already wraps string values in literal
+  #     single quotes, so the shell reads each reference as exactly one
+  #     word. Wrapping a reference in "..." would keep those single quotes
+  #     as part of the value: an empty output would arrive as the two
+  #     characters '' and the -z test below could never fire.
+  #     Non-emptiness is the right bar for a smoke; the `when:` gate on
+  #     structured-check already proved the value matched 'ok' to reach
+  #     this node.
+  - id: assert
+    bash: |
+      fail=0
+      check() {
+        local name="$1"
+        # A reference that expands to nothing leaves $2 unset; default it to
+        # empty so it is reported as a failure like any other empty output.
+        local value="${2-}"
+        if [ -z "$value" ]; then
+          echo "FAIL: $name produced empty output"
+          fail=1
+        fi
+      }
+      check prompt-node       $prompt-node.output
+      check command-node      $command-node.output
+      check loop-node         $loop-node.output
+      check bash-json-node    $bash-json-node.output
+      check script-bun-node   $script-bun-node.output
+      check script-python-node $script-python-node.output
+      check downstream        $downstream.output
+      check gated             $gated.output
+      check merge             $merge.output
+      check structured.status $structured-node.output.status
+      check structured.value  $structured-node.output.value
+
+      if [ "$fail" -eq 1 ]; then exit 1; fi
+      echo "PASS: all node types + structured output verified"
+    depends_on: [merge, loop-node, command-node]
+    trigger_rule: all_success
@@ -26,6 +26,7 @@ CLAUDE_USE_GLOBAL_AUTH=true
 # Then:
 #   CLAUDE_BIN_PATH=$HOME/.local/bin/claude       (native installer)
 #   CLAUDE_BIN_PATH=$(npm root -g)/@anthropic-ai/claude-code/cli.js  (npm alternative)
+#   CLAUDE_BIN_PATH=$(npm root -g)/@anthropic-ai/claude-code-win32-x64  (Windows npm platform dir — auto-expanded to claude.exe)
 # CLAUDE_BIN_PATH=
 
 # Codex Authentication (get from ~/.codex/auth.json after running 'codex login')
@@ -38,6 +39,18 @@ CODEX_REFRESH_TOKEN=
 CODEX_ACCOUNT_ID=
 # CODEX_BIN_PATH=  # Optional: path to Codex native binary (binary builds only)
 
+# GitHub Copilot (community provider — @github/copilot-sdk)
+# Requires an active GitHub Copilot subscription. By default, Archon uses
+# the credentials you configured via the Copilot CLI (`copilot login`).
+# Generic GH_TOKEN / GITHUB_TOKEN (declared below) are intentionally NOT
+# picked up — classic PATs lack Copilot entitlement and would fail. To
+# opt back into env-token auth, set `useLoggedInUser: false` in
+# `.archon/config.yaml`. Setting COPILOT_GITHUB_TOKEN is treated as
+# explicit Copilot intent and always wins.
+#
+# COPILOT_GITHUB_TOKEN=        # Copilot-scoped PAT (always wins when set)
+# COPILOT_BIN_PATH=            # Optional: path to Copilot CLI binary (binary builds only)
+
 # Pi (community provider — @mariozechner/pi-coding-agent)
 # One adapter, ~20 LLM backends. Archon's Pi adapter picks up credentials
 # you've already configured via the Pi CLI (`pi /login` writes to
@@ -63,7 +76,7 @@ CODEX_ACCOUNT_ID=
 # before the container starts (Pi reads it on each file path lookup).
 # PI_CODING_AGENT_DIR=/.archon/pi
 
-# Default AI Assistant (must match a registered provider, e.g. claude, codex, pi)
+# Default AI Assistant (must match a registered provider, e.g. claude, codex, copilot, pi)
 # Used for new conversations when no codebase specified — errors on unknown values
 DEFAULT_AI_ASSISTANT=claude
 
 
@@ -12,6 +12,10 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - **`assistants.opencode` provider**: community provider that runs OpenCode as an embedded runtime, with per-node agent materialization, multi-agent sessions, structured output, token usage, and multi-agent MCP tool execution (#1703).
 - MCP server support for Codex workflow nodes via the shared `loadMcpConfig` module — pass `mcp: <path>` on a Codex node and the config is translated to Codex's `mcp_servers` overrides at runtime. MCP client errors are surfaced to the workflow author as `system` chunks when MCP is explicitly configured for the node (#1459).
 
+### Fixed
+
+- **`workflow approve/resume/reject` no longer fail with "Workflow not found" when the run's working path is a worktree or workspace clone.** Resume, approve, and reject now use `codebase.default_cwd` for workflow YAML discovery, falling back to `working_path` when no codebase record is found. Fixes #1663 (#1743).
+
 ## [0.3.12] - 2026-05-14
 
 Orchestrator prompt-cache fix, SDK termination edge cases, marketplace expansion, and broad workflow fixes.
 
@@ -488,7 +488,10 @@ assistants:
       - user         # User-level ~/.claude/ (included in default; omit both to restrict to project-only)
     claudeBinaryPath: /absolute/path/to/claude  # Optional: Claude Code executable.
                                                 # Native binary (curl installer at
-                                                # ~/.local/bin/claude) or npm cli.js.
+                                                # ~/.local/bin/claude), npm cli.js, or
+                                                # the npm platform-package directory
+                                                # (e.g. @anthropic-ai/claude-code-win32-x64)
+                                                # which is auto-expanded to claude/claude.exe.
                                                 # Required in compiled binaries if
                                                 # CLAUDE_BIN_PATH env var is not set.
   codex:
@@ -585,13 +588,23 @@ curl http://localhost:3637/api/conversations/<conversationId>/messages
 
 ## Development Guidelines
 
+### UI and Visual Design
+
+All UI changes — production web (`packages/web/`), experiments (`packages/web/src/experiments/`), the docs site, marketing surfaces, and any future visual surface — must align with the Archon brand foundation.
+
+- **Canonical brand guide:** https://archon.diy/brand/ (source: `packages/docs-web/src/content/docs/brand/index.md` + `packages/docs-web/public/brand/foundation.html`).
+- **Use brand tokens, not ad-hoc values.** Colors, gradients, surfaces, and typography must come from the established design tokens (`packages/web/src/index.css`) or the brand guide. Don't hard-code hex values that aren't in the system.
+- **Introducing a new visual token** (color, font, radius, spacing) means updating both the token source and the brand guide. Don't fork the palette per package.
+- **When in doubt, consult the brand guide first** before inventing new visual treatments. Open a discussion if the guide doesn't cover your case.
+
 ### When Creating New Features
 
 **Quick reference:**
 - **Platform Adapters**: Implement `IPlatformAdapter`, handle auth, polling/webhooks
 - **AI Providers**: Implement `IAgentProvider`, session management, streaming
 - **Slash Commands**: Add to command-handler.ts, update database, no AI
 - **Database Operations**: Use `IDatabase` interface (supports PostgreSQL and SQLite via adapters)
+- **Plan insertion points**: Use stable text anchors (e.g., "after the `it('throws on ...')` test block"), never raw line numbers — line numbers drift on every preceding edit.
 
 ### SDK Type Patterns