pydantic · DouweM · Apr 2, 2026 · Apr 2, 2026 · Apr 2, 2026
diff --git a/PLAN.md b/PLAN.md
@@ -0,0 +1,36 @@
+# SubAgent Capability
+
+## Problem
+
+When building multi-agent systems with Pydantic AI, there's no reusable capability for delegating tasks from a parent (orchestrator) agent to specialized sub-agents. Users currently have to manually wire up tool functions that call `agent.run()`, duplicate boilerplate for description injection, and handle error cases like unknown agent names.
+
+## Solution
+
+A `SubAgent` capability (implementing `AbstractCapability`) that:
+
+1. Accepts a dict of named `Agent` instances
+2. Provides a `delegate_task(agent_name, task)` tool to the parent agent, plus a `delegate_tasks(tasks)` tool that runs several delegations in parallel
+3. Injects sub-agent descriptions into the system prompt so the parent knows what's available
+4. Forwards the parent's `deps` to sub-agents (configurable via `pass_deps`)
+5. Returns sub-agent output as a string tool result
+6. Raises `ModelRetry` for unknown agent names (self-correcting)
+
+## Design decisions
+
+- **Synchronous delegation only** (for now): the `delegate_task` tool blocks until the sub-agent finishes. This is the simplest correct behavior and matches the "Agent-as-Tool" pattern from OpenAI Agents SDK. Async background tasks (#32 scope expansion) and full handoffs (#44) are left for follow-up.
+- **Descriptions from agent metadata**: falls back through `agent.description`, `agent.name`, then a default. Users can also pass explicit `descriptions` dict.
+- **Not spec-serializable**: since it takes `Agent` instances, YAML/JSON serialization is not supported (`get_serialization_name()` returns `None`).
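+- **String conversion of output**: all sub-agent outputs are converted to a string for the tool result, regardless of the sub-agent's `output_type`. Strings pass through unchanged; Pydantic models, dicts, and lists are JSON-serialized; anything else falls back to `repr()`.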
+
+## Files
+
+- `src/pydantic_harness/subagent.py` — the `SubAgent` capability
+- `src/pydantic_harness/__init__.py` — re-exports `SubAgent`
+- `tests/test_subagent.py` — 19 tests covering construction, instructions, toolset, end-to-end delegation (deps forwarding, unknown agent retry, multiple agents), and imports
+- `pyproject.toml` — added `pytest-asyncio` dev dependency
+
+## References
+
+- Issue #32: SubAgent / Agent-as-Tool capability
+- Issue #44: Handoff / Agent Transfer (follow-up, blocked by this)
+- Prior art: [vstorm-co/subagents-pydantic-ai](https://github.com/vstorm-co/subagents-pydantic-ai), OpenAI Agents SDK handoffs, Google ADK sub_agents, Pydantic AI's `ImageGeneration` capability subagent pattern
diff --git a/pyproject.toml b/pyproject.toml
@@ -100,3 +100,4 @@ exclude_lines = [
     'assert_never',
     'if TYPE_CHECKING:',
 ]
+
diff --git a/src/pydantic_harness/__init__.py b/src/pydantic_harness/__init__.py
@@ -7,4 +7,8 @@
 # Each capability module is imported and re-exported here.
 # Capabilities are listed alphabetically.
 
-__all__: list[str] = []
+from .subagent import SubAgent
+
+__all__: list[str] = [
+    'SubAgent',
+]
diff --git a/src/pydantic_harness/subagent.py b/src/pydantic_harness/subagent.py
@@ -0,0 +1,219 @@
+"""SubAgent capability: delegate tasks from a parent agent to specialized sub-agents."""
+
+from __future__ import annotations
+
+import asyncio
+import json
+from dataclasses import dataclass, field
+from typing import Any
+
+from pydantic import BaseModel
+from pydantic_ai import Agent
+from pydantic_ai.capabilities import AbstractCapability
+from pydantic_ai.exceptions import ModelRetry
+from pydantic_ai.messages import ModelMessage, ModelResponse, ToolCallPart
+from pydantic_ai.tools import AgentDepsT, RunContext, Tool
+from pydantic_ai.toolsets import AgentToolset
+from pydantic_ai.toolsets.function import FunctionToolset
+
+__all__ = ('SubAgent',)
+
+
+def _resolve_description(name: str, agent: Agent[Any, Any]) -> str:
+    """Pick the text used to describe a sub-agent to the parent agent.
+
+    The first truthy value among ``agent.description`` and ``agent.name`` wins.
+    When both are empty or unset, a generic label built from the registry key
+    ``name`` is returned instead.
+    """
+    return agent.description or agent.name or f'Sub-agent: {name}'
+
+
+def _shareable_history(messages: list[ModelMessage]) -> list[ModelMessage]:
+    """Build a copy of the parent's history that a sub-agent can start from.
+
+    While a tool is executing, the parent's ``ctx.messages`` may end with a
+    ``ModelResponse`` holding the ``ToolCallPart`` that is being run right now.
+    A sub-agent cannot process that dangling call (it would conflict with its
+    own user prompt), so every trailing ``ModelResponse`` that contains a
+    ``ToolCallPart`` is left out of the returned list. The input list itself
+    is never modified.
+    """
+    keep = len(messages)
+    while keep:
+        tail = messages[keep - 1]
+        if not isinstance(tail, ModelResponse):
+            break
+        if not any(isinstance(part, ToolCallPart) for part in tail.parts):
+            break
+        # Trailing response carries a tool call: exclude it and look further back.
+        keep -= 1
+    return list(messages[:keep])
+
+
+def _json_fallback(value: Any) -> Any:
+    """``json.dumps`` hook for values the JSON encoder cannot handle natively.
+
+    Pydantic models nested inside a container are dumped to JSON-compatible
+    data; every other unsupported value is represented by its ``repr()``.
+    """
+    if isinstance(value, BaseModel):
+        return value.model_dump(mode='json')
+    return repr(value)
+
+
+def _format_output(output: Any) -> str:
+    """Format a sub-agent's output as a string for the parent agent.
+
+    Strings are returned unchanged. Dicts and lists are JSON-serialized, with
+    nested Pydantic models dumped as JSON data and other non-JSON values
+    replaced by their `repr()`. Pydantic models are serialized with
+    `model_dump_json()`. Any other type is formatted with `repr()`.
+
+    This function never raises for a dict or list that `json.dumps` rejects
+    (for example tuple keys or circular references): the sub-agent has already
+    done its work at this point, so the container's `repr()` is returned
+    rather than failing the tool call.
+
+    Args:
+        output: The value produced by the sub-agent run.
+
+    Returns:
+        A string representation suitable for use as a tool result.
+    """
+    if isinstance(output, str):
+        return output
+    if isinstance(output, (dict, list)):
+        try:
+            return json.dumps(output, default=_json_fallback)
+        except (TypeError, ValueError):
+            # TypeError: keys that are not str/int/float/bool/None.
+            # ValueError: circular reference detected by the encoder.
+            return repr(output)
+    if isinstance(output, BaseModel):
+        return output.model_dump_json()
+    return repr(output)
+
+
+@dataclass
+class SubAgent(AbstractCapability[AgentDepsT]):
+    """Capability that lets a parent agent delegate tasks to named sub-agents.
+
+    Each sub-agent is an independent `Agent` instance. The parent agent receives
+    a `delegate_task` tool that runs one named sub-agent with a given prompt,
+    and a `delegate_tasks` tool that runs several delegations concurrently.
+    Sub-agent output is returned to the parent as a string tool result.
+
+    Example:
+    ```python
+    from pydantic_ai import Agent
+    from pydantic_harness.subagent import SubAgent
+
+    researcher = Agent('openai:gpt-4o', description='Researches topics thoroughly.')
+    coder = Agent('openai:gpt-4o', description='Writes and reviews code.')
+
+    orchestrator = Agent(
+        'openai:gpt-4o',
+        capabilities=[
+            SubAgent(agents={'researcher': researcher, 'coder': coder}),
+        ],
+    )
+    ```
+    """
+
+    agents: dict[str, Agent[Any, Any]]
+    """Mapping of agent name to `Agent` instance.
+
+    Sub-agents may have any output type; structured outputs are automatically
+    serialized to strings for the parent agent.
+
+    Names are used by the parent agent in the `delegate_task` tool to select
+    which sub-agent to run.
+    """
+
+    descriptions: dict[str, str] = field(default_factory=dict[str, str])
+    """Optional explicit descriptions for each sub-agent.
+
+    These are included in the system prompt and in the `delegate_task` tool
+    description so the parent agent knows what each sub-agent does.
+
+    When a name is not present in this dict, the description is derived from
+    `agent.description`, `agent.name`, or a default.
+    """
+
+    pass_deps: bool = True
+    """Whether to forward the parent agent's `deps` to sub-agents.
+
+    When True (the default), sub-agents receive the same dependency object
+    as the parent. Set to False if sub-agents use incompatible dependency types.
+    """
+
+    share_history: bool = False
+    """Whether to pass the parent agent's message history to sub-agents.
+
+    When True, the parent's conversation history is forwarded as
+    ``message_history`` to each sub-agent run, giving it access to the
+    full conversation context. When False (the default), sub-agents start
+    with a fresh conversation.
+    """
+
+    _resolved_descriptions: dict[str, str] = field(default_factory=dict[str, str], init=False, repr=False)
+
+    def __post_init__(self) -> None:
+        """Resolve descriptions for all registered sub-agents.
+
+        An explicit entry in `descriptions` takes precedence; otherwise the
+        description is derived from the agent's own metadata.
+        """
+        for name, agent in self.agents.items():
+            if name in self.descriptions:
+                self._resolved_descriptions[name] = self.descriptions[name]
+            else:
+                self._resolved_descriptions[name] = _resolve_description(name, agent)
+
+    @classmethod
+    def get_serialization_name(cls) -> str | None:
+        """Not spec-serializable (takes Agent instances)."""
+        return None
+
+    def get_instructions(self) -> str | None:
+        """Inject descriptions of available sub-agents into the system prompt.
+
+        Returns:
+            A bulleted list of sub-agent names and descriptions, or `None`
+            when no sub-agents are registered.
+        """
+        if not self.agents:
+            return None
+
+        lines = [
+            'You can delegate tasks to the following sub-agents using the '
+            '`delegate_task` tool (one at a time) or the `delegate_tasks` tool (multiple in parallel):'
+        ]
+        for name in self.agents:
+            desc = self._resolved_descriptions[name]
+            lines.append(f'- **{name}**: {desc}')
+        return '\n'.join(lines)
+
+    def get_toolset(self) -> AgentToolset[AgentDepsT] | None:
+        """Provide the `delegate_task` and `delegate_tasks` tools.
+
+        Returns:
+            A `FunctionToolset` holding both tools, or `None` when no
+            sub-agents are registered.
+        """
+        if not self.agents:
+            return None
+
+        # Capture configuration in locals so the tool closures do not hold `self`.
+        agents = self.agents
+        pass_deps = self.pass_deps
+        share_history = self.share_history
+
+        def _lookup_agent(agent_name: str) -> Agent[Any, Any]:
+            """Return the registered sub-agent, or ask the model to retry with a valid name."""
+            agent = agents.get(agent_name)
+            if agent is None:
+                available = ', '.join(sorted(agents))
+                raise ModelRetry(f'Unknown agent {agent_name!r}. Available agents: {available}')
+            return agent
+
+        async def _run_sub_agent(ctx: RunContext[AgentDepsT], agent_name: str, task: str) -> str:
+            """Run a single sub-agent, returning its formatted output."""
+            agent = _lookup_agent(agent_name)
+
+            deps = ctx.deps if pass_deps else None
+            message_history = _shareable_history(ctx.messages) if share_history else None
+            # Forward the parent's usage accumulator so the tokens and requests
+            # spent by the sub-agent count toward the parent run.
+            result = await agent.run(task, deps=deps, message_history=message_history, usage=ctx.usage)
+            return _format_output(result.output)
+
+        async def delegate_task(ctx: RunContext[AgentDepsT], agent_name: str, task: str) -> str:
+            """Delegate a task to a named sub-agent and return its output.
+
+            Args:
+                ctx: The run context from the parent agent.
+                agent_name: The name of the sub-agent to run. Must be one of the registered agent names.
+                task: The prompt describing the task to delegate.
+            """
+            return await _run_sub_agent(ctx, agent_name, task)
+
+        async def delegate_tasks(
+            ctx: RunContext[AgentDepsT],
+            tasks: list[dict[str, str]],
+        ) -> list[str]:
+            """Delegate multiple tasks to sub-agents in parallel and return their outputs.
+
+            Args:
+                ctx: The run context from the parent agent.
+                tasks: A list of task objects, each with ``agent`` (sub-agent name) and ``task`` (prompt).
+            """
+            # Validate the whole batch before starting any run: `asyncio.gather`
+            # does not cancel sibling runs when one raises, so a malformed item
+            # discovered late would waste the sub-agent calls already in flight.
+            for index, item in enumerate(tasks):
+                missing = [key for key in ('agent', 'task') if key not in item]
+                if missing:
+                    missing_keys = ', '.join(missing)
+                    raise ModelRetry(
+                        f'Task at index {index} is missing required key(s): {missing_keys}. '
+                        'Each task needs "agent" and "task" keys.'
+                    )
+                _lookup_agent(item['agent'])
+
+            coros = [_run_sub_agent(ctx, t['agent'], t['task']) for t in tasks]
+            return list(await asyncio.gather(*coros))
+
+        agent_desc = self._delegate_task_description()
+        tools: list[Tool[AgentDepsT]] = [
+            Tool[AgentDepsT](
+                delegate_task,
+                name='delegate_task',
+                description=agent_desc,
+            ),
+            Tool[AgentDepsT](
+                delegate_tasks,
+                name='delegate_tasks',
+                description=f'Delegate multiple tasks in parallel. Each item needs "agent" and "task" keys. {agent_desc}',
+            ),
+        ]
+        return FunctionToolset[AgentDepsT](tools)
+
+    def _delegate_task_description(self) -> str:
+        """Build a description for the delegate_task tool including available agent names."""
+        parts = [f'{name} ({self._resolved_descriptions[name]})' for name in self.agents]
+        agent_list = ', '.join(parts)
+        return f'Delegate a task to a sub-agent. Available agents: {agent_list}'
diff --git a/tests/conftest.py b/tests/conftest.py
@@ -35,3 +35,13 @@ def allow_model_requests() -> Iterator[None]:
     """Temporarily allow real model requests within a test."""
     with pydantic_ai.models.override_allow_model_requests(True):
         yield
+
+
+@pytest.fixture(scope='module', params=['asyncio'])
+def anyio_backend(request: pytest.FixtureRequest) -> str:
+    """Override anyio backend to asyncio-only.
+
+    The fixture is module-scoped and parametrized with the single value
+    ``'asyncio'``, which it returns unchanged.
+
+    Pydantic AI uses ``asyncio.gather`` internally (e.g. in capabilities/combined.py)
+    which is incompatible with the Trio event loop.
+
+    Args:
+        request: Pytest's fixture request; ``request.param`` carries the backend name.
+
+    Returns:
+        The backend name taken from the fixture parameters.
+    """
+    return request.param  # type: ignore[return-value]
Original file line number	Diff line number	Diff line change
Expand Up		@@ -100,3 +100,4 @@ exclude_lines = [
		'assert_never',
		'if TYPE_CHECKING:',
		]