pydantic
diff --git a/.gitignore b/.gitignore
Lines changed: 2 additions & 0 deletions
diff --git a/pydantic_ai_harness/__init__.py b/pydantic_ai_harness/__init__.py
Lines changed: 7 additions & 2 deletions
diff --git a/pydantic_ai_harness/experimental/_warn.py b/pydantic_ai_harness/experimental/_warn.py
Lines changed: 1 addition & 1 deletion
diff --git a/pydantic_ai_harness/experimental/compaction/README.md b/pydantic_ai_harness/experimental/compaction/README.md
Lines changed: 9 additions & 9 deletions
diff --git a/pydantic_ai_harness/experimental/compaction/_clear_tool_results.py b/pydantic_ai_harness/experimental/compaction/_clear_tool_results.py
Lines changed: 2 additions & 2 deletions
diff --git a/pydantic_ai_harness/experimental/compaction/_deduplicate_file_reads.py b/pydantic_ai_harness/experimental/compaction/_deduplicate_file_reads.py
Lines changed: 2 additions & 2 deletions
diff --git a/pydantic_ai_harness/experimental/compaction/_limit_warner.py b/pydantic_ai_harness/experimental/compaction/_limit_warner.py
Lines changed: 1 addition & 1 deletion
diff --git a/pydantic_ai_harness/experimental/compaction/_shared.py b/pydantic_ai_harness/experimental/compaction/_shared.py
Lines changed: 2 additions & 2 deletions
diff --git a/pydantic_ai_harness/experimental/compaction/_sliding_window.py b/pydantic_ai_harness/experimental/compaction/_sliding_window.py
Lines changed: 1 addition & 1 deletion
diff --git a/pydantic_ai_harness/experimental/compaction/_summarizing_compaction.py b/pydantic_ai_harness/experimental/compaction/_summarizing_compaction.py
Lines changed: 5 additions & 5 deletions
@@ -2,6 +2,8 @@
 .mcp.json
 .DS_Store
 .agents/settings.local.json
+.agents/skills/branch-context/
+AGENTS.local.md
 CLAUDE.local.md
 LOCAL_WORKTREES.md
 
 
@@ -1,4 +1,4 @@
-"""Pydantic AI capability library."""
+"""The batteries for your Pydantic AI agent -- the official capability library."""
 
 from typing import TYPE_CHECKING
 
@@ -8,7 +8,12 @@
     from .logfire import ManagedPrompt
     from .shell import Shell
 
-__all__ = ['CodeMode', 'FileSystem', 'ManagedPrompt', 'Shell']
+__all__ = [
+    'CodeMode',
+    'FileSystem',
+    'ManagedPrompt',
+    'Shell',
+]
 
 
 def __getattr__(name: str) -> object:
 
@@ -28,7 +28,7 @@ class HarnessExperimentalWarning(UserWarning):
 def warn_experimental(feature: str) -> None:
     """Emit a `HarnessExperimentalWarning` for *feature*, including how to silence all of them.
 
-    One filter silences the whole category — every experimental capability — so users never
+    One filter silences the whole category (every experimental capability), so users never
     need a suppression line per capability.
     """
     warnings.warn(
 
@@ -3,7 +3,7 @@
 > [!WARNING]
 > **Experimental.** These capabilities live under `pydantic_ai_harness.experimental` and may
 > change or be removed in any release, without a deprecation period. Import them from the
-> experimental path — there is no top-level export:
+> experimental path -- there is no top-level export:
 >
 > ```python
 > from pydantic_ai_harness.experimental.compaction import TieredCompaction
@@ -24,7 +24,7 @@ window. Each is a Pydantic AI `Capability` that runs in the `before_model_reques
 **persist** into the run's message history, so a trim/clear/summary carries forward to later
 steps (it is not recomputed from the full history every turn).
 
-All strategies preserve tool-call / tool-return **pairing** — core does not validate this, and a
+All strategies preserve tool-call / tool-return **pairing** -- core does not validate this, and a
 provider rejects an orphaned pair. The zero-LLM strategies never call a model.
 
 ## The menu
@@ -48,9 +48,9 @@ near-lossless). `TieredCompaction` triggers and stops on a single `target_tokens
 ## Cost: why summarization is the last resort
 
 Summarization turns input tokens into output tokens, which are billed at a premium and generated
-serially — so it is genuinely expensive. The zero-LLM strategies touch only the cheaper input side.
+serially -- so it is genuinely expensive. The zero-LLM strategies touch only the cheaper input side.
 The field consensus (Anthropic, OpenCode, Letta) is to clear/dedupe first and summarize only when
-that is not enough — which is exactly what `TieredCompaction` encodes:
+that is not enough -- which is exactly what `TieredCompaction` encodes:
 
 ```python
 from pydantic_ai import Agent
@@ -77,14 +77,14 @@ agent = Agent(
 ```
 
 A tier inside `TieredCompaction` is driven directly by the orchestrator, which re-measures after each
-and stops once under `target_tokens` — so a tier's own `max_*` trigger is irrelevant there (set it to
+and stops once under `target_tokens` -- so a tier's own `max_*` trigger is irrelevant there (set it to
 anything valid). Any object with `async def compact(messages, ctx) -> list[ModelMessage]`
 (`CompactionStrategy`) can be a tier, so you can plug in your own.
 
 ## Cache tradeoff (read before using `ClearToolResults`)
 
 Clearing or deduplicating rewrites message content, which invalidates the provider's prompt cache
-from the edit point onward — the next request pays a cache-write. Use `ClearToolResults`'
+from the edit point onward -- the next request pays a cache-write. Use `ClearToolResults`'
 `min_clear_tokens` to skip clearing that reclaims too little to be worth busting the cache.
 
 ## Model inheritance
@@ -94,8 +94,8 @@ running agent's model. No token caps are imposed on the summary call.
 
 ## Usage accounting
 
-The summary call is a real request to the model, so its full usage — tokens **and** the request
-itself — is folded into the run's `ctx.usage`. This is deliberate: it keeps cost honest, keeps the
+The summary call is a real request to the model, so its full usage -- tokens **and** the request
+itself -- is folded into the run's `ctx.usage`. This is deliberate: it keeps cost honest, keeps the
 request count consistent (a model request that didn't count as one would be the surprise), and lets a
 `UsageLimits` request limit catch a runaway compaction. A run-request / iteration limiter will
 therefore see compaction calls among its requests.
@@ -120,5 +120,5 @@ def my_file_key(call: ToolCallPart) -> str | None:
 ## Out of scope
 
 These strategies compress or drop context *inside* the window. Moving large tool outputs *out* of the
-window — overflowing them to a file the agent (or a subagent) can query on demand — is a separate
+window -- overflowing them to a file the agent (or a subagent) can query on demand -- is a separate
 capability, not lossy truncation. Prefer it over capping individual tool outputs.
@@ -1,4 +1,4 @@
-"""`ClearToolResults` — zero-cost in-place clearing of old tool results."""
+"""`ClearToolResults` -- zero-cost in-place clearing of old tool results."""
 
 from __future__ import annotations
 
@@ -31,7 +31,7 @@ class ClearToolResults(AbstractCapability[AgentDepsT]):
     calls remain paired with their (now-blanked) results, so the history stays valid.
     No LLM calls are made.
 
-    This is the cheap first tier of compaction — tool results typically dominate
+    This is the cheap first tier of compaction -- tool results typically dominate
     context, and the agent can re-run a tool if it needs the data again.
 
     Cache tradeoff: clearing rewrites message content, which invalidates the provider's
 
@@ -1,4 +1,4 @@
-"""`DeduplicateFileReads` — zero-cost in-place clearing of superseded file reads."""
+"""`DeduplicateFileReads` -- zero-cost in-place clearing of superseded file reads."""
 
 from __future__ import annotations
 
@@ -25,7 +25,7 @@ class DeduplicateFileReads(AbstractCapability[AgentDepsT]):
     earlier reads are blanked with a placeholder.  Tool-call pairing is preserved.  No LLM
     calls are made.
 
-    File identity is supplied by the ``file_key`` seam — given a ``ToolCallPart`` it returns
+    File identity is supplied by the ``file_key`` seam -- given a ``ToolCallPart`` it returns
     a stable key for the file being read, or ``None`` if the call is not a file read.  There
     is no default: file-read identification is agent-specific, and a wrong guess would drop
     live data.
 
@@ -1,4 +1,4 @@
-"""`LimitWarner` — injects warnings as the run approaches configured limits."""
+"""`LimitWarner` -- injects warnings as the run approaches configured limits."""
 
 from __future__ import annotations
 
 
@@ -1,7 +1,7 @@
 """Shared utilities for the compaction capabilities.
 
 Token estimation, the `CompactionStrategy` protocol, tool-pair-safe cutoff logic, first-user
-preservation, and in-place tool-result clearing — anything used by more than one capability.
+preservation, and in-place tool-result clearing -- anything used by more than one capability.
 """
 
 from __future__ import annotations
@@ -121,7 +121,7 @@ async def compact(
 
 
 # ---------------------------------------------------------------------------
-# Safe cutoff logic — preserves tool-call / tool-return pairs
+# Safe cutoff logic -- preserves tool-call / tool-return pairs
 # ---------------------------------------------------------------------------
 
 _TOOL_PAIR_SEARCH_RANGE = 5
 
@@ -1,4 +1,4 @@
-"""`SlidingWindow` — zero-cost trimming of the oldest messages."""
+"""`SlidingWindow` -- zero-cost trimming of the oldest messages."""
 
 from __future__ import annotations
 
 
@@ -1,4 +1,4 @@
-"""`SummarizingCompaction` — LLM-powered summarization of older messages."""
+"""`SummarizingCompaction` -- LLM-powered summarization of older messages."""
 
 from __future__ import annotations
 
@@ -44,7 +44,7 @@
 Choices made and the reasoning, so they are not relitigated.
 
 ## Artifacts
-Files, paths, identifiers, commands, and APIs touched — quote exact names.
+Files, paths, identifiers, commands, and APIs touched -- quote exact names.
 
 ## Current state
 What is done and what is in progress right now.
@@ -55,7 +55,7 @@
 ## Open questions
 Unresolved questions or blockers.
 
-Focus on results, not a replay of completed actions.  Respond ONLY with the summary — no \
+Focus on results, not a replay of completed actions.  Respond ONLY with the summary -- no \
 preamble, no markdown fences.
 
 <messages>
@@ -140,8 +140,8 @@ class SummarizingCompaction(AbstractCapability[AgentDepsT]):
     summarized using a dedicated model call and replaced with a compact, structured
     summary message, preserving recent context and tool-call integrity.
 
-    This is the expensive tier — summarization turns input tokens into (pricier) output
-    tokens — so it is best used behind cheaper passes (see `TieredCompaction`).
+    This is the expensive tier -- summarization turns input tokens into (pricier) output
+    tokens -- so it is best used behind cheaper passes (see `TieredCompaction`).
 
     The summary call's usage is folded into the parent run's usage (it counts as a real
     request), so cost accounting stays honest; note this also increments the run's request
@@ -1,4 +1,4 @@
-"""`LimitWarner` — injects warnings as the run approaches configured limits."""
+"""`LimitWarner` -- injects warnings as the run approaches configured limits."""
 
 from __future__ import annotations
 
@@ -1,4 +1,4 @@
-"""`SlidingWindow` — zero-cost trimming of the oldest messages."""
+"""`SlidingWindow` -- zero-cost trimming of the oldest messages."""
 
 from __future__ import annotations
 