strands-agents
diff --git a/‎strands-py/src/strands/injection/__init__.py‎
Lines changed: 15 additions & 0 deletions b/‎strands-py/src/strands/injection/__init__.py‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎strands-py/src/strands/injection/message_injection.py‎
Lines changed: 190 additions & 0 deletions b/‎strands-py/src/strands/injection/message_injection.py‎
Lines changed: 190 additions & 0 deletions
diff --git a/‎strands-py/src/strands/injection/types.py‎
Lines changed: 80 additions & 0 deletions b/‎strands-py/src/strands/injection/types.py‎
Lines changed: 80 additions & 0 deletions
diff --git a/‎strands-py/src/strands/injection/xml.py‎
Lines changed: 37 additions & 0 deletions b/‎strands-py/src/strands/injection/xml.py‎
Lines changed: 37 additions & 0 deletions
diff --git a/‎strands-py/src/strands/memory/__init__.py‎
Lines changed: 10 additions & 0 deletions b/‎strands-py/src/strands/memory/__init__.py‎
Lines changed: 10 additions & 0 deletions
@@ -0,0 +1,15 @@
+"""Context injection for Strands Agents.
+
+This package provides the configuration types for context injection — folding just-in-time text
+into the model input before a call without touching durable history. The delivery primitives
+(in ``message_injection``) are internal; reach injection through the ``ContextInjector`` plugin
+or the ``MemoryManager`` rather than using them directly.
+"""
+
+from .types import InjectionConfig, InjectionContext, InjectionTrigger
+
+__all__ = [
+    "InjectionConfig",
+    "InjectionContext",
+    "InjectionTrigger",
+]
@@ -0,0 +1,190 @@
+"""Delivery primitives for context injection.
+
+These fold just-in-time text into the latest user message *ephemerally* — the model sees the
+augmented input for one call while the agent's durable history is never touched. Reach injection
+through the ``ContextInjector`` plugin or the ``MemoryManager`` rather than these primitives
+directly.
+"""
+
+from __future__ import annotations
+
+import inspect
+import logging
+from collections.abc import Awaitable, Callable
+from dataclasses import replace
+from typing import TYPE_CHECKING, Any, Protocol
+
+from .types import InjectionContext, InjectionTriggerPredicate
+
+if TYPE_CHECKING:
+    from .._middleware.stages import InvokeModelContext
+    from ..types.content import ContentBlock, Message, Messages
+
+logger = logging.getLogger(__name__)
+
+
+class RenderContentCallback(Protocol):
+    """Renders the text to fold into the latest user message for a model call.
+
+    Implemented by a plain function as well — the ``**kwargs`` tail lets the calling convention
+    grow new keyword arguments without breaking existing callbacks.
+    """
+
+    def __call__(self, context: InjectionContext, **kwargs: Any) -> str | None | Awaitable[str | None]:
+        """Return the text to inject, ``None``/``""`` to skip, or an awaitable of either."""
+        ...
+
+
+# The text-rendering callback. The bare ``Callable`` arm keeps the happy path
+# (``lambda context: ...``) ergonomic; the ``RenderContentCallback`` arm is the forward-compatible
+# Protocol for callers that opt into future keyword arguments. A callback that raises fails open
+# (injection is skipped, the model call proceeds).
+RenderContent = Callable[[InjectionContext], "str | None | Awaitable[str | None]"] | RenderContentCallback
+
+
+def create_injection_middleware(
+    render_content: RenderContent,
+    *,
+    trigger: InjectionTriggerPredicate | None = None,
+) -> Callable[[InvokeModelContext], Awaitable[InvokeModelContext]]:
+    """Build an ``InvokeModelStage.Input`` handler that folds injected text into the conversation.
+
+    The handler folds ``render_content``'s text into the latest user message, ephemerally: the
+    model sees the augmented input for this one call while the agent's durable history is
+    never touched. The handler gates on the resolved trigger, asks ``render_content`` for the
+    text, and returns a context with the folded messages. Anything that skips — the trigger
+    not firing, ``render_content`` returning empty, or any callback raising — returns the
+    context unchanged so the model call proceeds (fail open). The injected text never enters
+    durable history because the input phase only rewrites the per-call context, not the
+    agent's stored messages.
+
+    Args:
+        render_content: Renders the text to inject for this call. Sync or async.
+        trigger: When to inject. An ``InjectionTrigger`` name selects a built-in policy
+            (``"userTurn"`` — default — or ``"everyTurn"``); a predicate over the
+            ``InjectionContext`` is the escape hatch. Defaults to ``"userTurn"``.
+
+    Returns:
+        An ``InvokeModelStage.Input`` handler that returns a (possibly) folded context.
+    """
+    resolved_trigger = resolve_trigger(trigger)
+
+    async def handler(context: InvokeModelContext) -> InvokeModelContext:
+        agent = context.agent
+        # Hand the callback its own list, so a callback that reorders/appends cannot perturb the
+        # per-call context. The message dicts are shared, but the upstream InvokeModelContext is
+        # already a defensive copy of agent state, so durable history is safe regardless.
+        injection_context = InjectionContext(messages=list(context.messages), state=agent.state, agent=agent)
+
+        if not resolved_trigger(injection_context):
+            return context
+
+        try:
+            text = render_content(injection_context)
+            if inspect.isawaitable(text):
+                text = await text
+        except Exception as error:  # noqa: BLE001 - fail open: a bad callback must not abort the model call.
+            logger.warning("reason=<%s> | injection render_content raised | skipping injection", error)
+            return context
+
+        if text is None or not text.strip():
+            return context
+
+        return replace(context, messages=fold_into_last_user_message(context.messages, text))
+
+    return handler
+
+
+def resolve_trigger(trigger: InjectionTriggerPredicate | None) -> Callable[[InjectionContext], bool]:
+    """Resolve an ``InjectionTrigger`` name or predicate into a single gate predicate.
+
+    ``"userTurn"`` maps to ``is_user_turn`` (over ``context.messages``); ``"everyTurn"`` to an
+    always-true gate; a user-supplied predicate is wrapped so that a raise fails open (logs and
+    skips injection rather than aborting the model call).
+
+    Args:
+        trigger: An ``InjectionTrigger`` name, a predicate, or ``None`` (defaults to ``"userTurn"``).
+
+    Returns:
+        A predicate that, given the ``InjectionContext``, returns whether to inject this call.
+    """
+    if trigger is None or trigger == "userTurn":
+        return lambda context: is_user_turn(context.messages)
+    if trigger == "everyTurn":
+        return lambda context: True
+
+    predicate = trigger
+
+    def guarded(context: InjectionContext) -> bool:
+        try:
+            return predicate(context)
+        except Exception as error:  # noqa: BLE001 - fail open: a bad predicate must not abort the model call.
+            logger.warning("reason=<%s> | injection trigger raised | skipping injection", error)
+            return False
+
+    return guarded
+
+
+def is_user_turn(messages: Messages) -> bool:
+    """Whether the latest message is a fresh user ask: a ``user`` message carrying no tool result.
+
+    This is the ``"userTurn"`` policy — it distinguishes a new chat ask from an autonomous
+    tool-result turn.
+
+    Args:
+        messages: The current conversation, as data.
+
+    Returns:
+        ``True`` when the latest message is a plain user ask, otherwise ``False``.
+    """
+    if not messages:
+        return False
+    last = messages[-1]
+    return last["role"] == "user" and not any("toolResult" in block for block in last["content"])
+
+
+def fold_into_last_user_message(messages: Messages, text: str) -> Messages:
+    """Fold ``text`` into the most recent ``user`` message as a text block, returning a NEW list.
+
+    Folding into the existing user message (rather than inserting a standalone message) keeps
+    role alternation valid in both chat and the autonomous tool loop. The block is placed to
+    keep the message valid for the model:
+
+    - A plain user ask: the text is **prepended**, leaving the user's own ask in the recency
+      slot — the last thing the model reads.
+    - A tool-result turn (the message carries a tool result block): the text is **appended**,
+      because providers require the tool result to be the first content block in the turn that
+      answers a tool use.
+
+    The input list and its messages are never mutated. When there is no ``user`` message, the
+    input list is returned unchanged.
+
+    Args:
+        messages: The conversation to fold into.
+        text: The text to fold into the most recent user message.
+
+    Returns:
+        A new list with the folded message, or the input list when there is no user message.
+    """
+    target_index = -1
+    for index in range(len(messages) - 1, -1, -1):
+        if messages[index]["role"] == "user":
+            target_index = index
+            break
+    if target_index < 0:
+        return messages
+
+    target = messages[target_index]
+    injected: ContentBlock = {"text": text}
+    # A tool result must stay the first block in the turn that answers a tool use, so append
+    # rather than prepend when the target carries one.
+    has_tool_result = any("toolResult" in block for block in target["content"])
+    content = [*target["content"], injected] if has_tool_result else [injected, *target["content"]]
+
+    folded: Message = {"role": target["role"], "content": content}
+    if "metadata" in target:
+        folded["metadata"] = target["metadata"]
+
+    result = list(messages)
+    result[target_index] = folded
+    return result
@@ -0,0 +1,80 @@
+"""Configuration types shared by injection consumers.
+
+Consumed by the ``ContextInjector`` plugin and the ``MemoryManager``.
+"""
+
+from __future__ import annotations
+
+from collections.abc import Callable
+from dataclasses import dataclass
+from typing import TYPE_CHECKING, Any, Literal, Protocol
+
+if TYPE_CHECKING:
+    from ..agent.agent import Agent
+    from ..agent.state import AgentState
+    from ..types.content import Messages
+
+InjectionTrigger = Literal["userTurn", "everyTurn"]
+"""Determines when injection runs before a model call.
+
+- ``"userTurn"``: only when the latest message is a fresh user ask (a ``user`` message with
+  no tool result) — the common case for chat agents, where it keeps the user's ask the final
+  message the model sees.
+- ``"everyTurn"``: before every model call, including mid-task tool-result turns — for
+  autonomous agents that should consult injected context at each step.
+
+For finer control, pass a predicate instead of a trigger name.
+"""
+
+
+@dataclass
+class InjectionContext:
+    """The context an injection consumer receives on each model call.
+
+    Passed to the ``render_content`` callback and to a predicate trigger.
+
+    Attributes:
+        messages: The current conversation, as data.
+        state: Durable agent state shared across calls, hooks, and tools — read what a tool
+            stashed last turn.
+        agent: The agent the injection is attached to (escape hatch for advanced consumers).
+    """
+
+    messages: Messages
+    state: AgentState
+    agent: Agent
+
+
+class TriggerCallback(Protocol):
+    """A predicate that decides whether to inject on a given model call.
+
+    Implemented by a plain function as well — the ``**kwargs`` tail lets the calling
+    convention grow new keyword arguments without breaking existing predicates.
+    """
+
+    def __call__(self, context: InjectionContext, **kwargs: Any) -> bool:
+        """Return whether to inject this call, given the injection context."""
+        ...
+
+
+# A trigger name, or a predicate over the injection context. The bare ``Callable`` arm keeps the
+# happy path (``lambda context: ...``) ergonomic; the ``TriggerCallback`` arm is the forward-
+# compatible Protocol for callers that opt into future keyword arguments.
+InjectionTriggerPredicate = InjectionTrigger | Callable[[InjectionContext], bool] | TriggerCallback
+
+
+@dataclass
+class InjectionConfig:
+    """Configuration common to every injection consumer: when to inject.
+
+    What text to inject is a consumer concern, added by the configs that extend this one
+    (e.g. ``MemoryInjectionConfig``).
+
+    Attributes:
+        trigger: When injection runs. An ``InjectionTrigger`` name selects a built-in policy;
+            a predicate is the escape hatch — it receives the ``InjectionContext`` and returns
+            whether to inject this call. A predicate that raises fails open (injection is
+            skipped, the model call proceeds). Defaults to ``"userTurn"``.
+    """
+
+    trigger: InjectionTriggerPredicate | None = None
@@ -0,0 +1,37 @@
+"""Minimal XML escaping for folding untrusted text into an XML-shaped block.
+
+Memory entries and other injected content are frequently user-derived, so interpolating them
+raw into ``<entry>…</entry>`` both breaks the block structurally (a stray ``</entry>`` or
+``"``) and opens a stored-prompt-injection surface. These helpers are deliberately tiny —
+enough to keep a ``<memory>`` block well-formed, not a general-purpose serializer.
+"""
+
+from __future__ import annotations
+
+
+def escape_xml_text(value: str) -> str:
+    """Escape text content for placement between XML tags.
+
+    Escapes ``&`` first (so later replacements are not double-escaped), then ``<`` and ``>``.
+
+    Args:
+        value: The raw text to escape.
+
+    Returns:
+        The escaped text, safe to place in element content.
+    """
+    return value.replace("&", "&amp;").replace("<", "&lt;").replace(">", "&gt;")
+
+
+def escape_xml_attr(value: str) -> str:
+    """Escape a value for placement inside a double-quoted XML attribute.
+
+    Applies the :func:`escape_xml_text` rules plus ``"`` and ``'``.
+
+    Args:
+        value: The raw attribute value to escape.
+
+    Returns:
+        The escaped value, safe to place inside a quoted attribute.
+    """
+    return escape_xml_text(value).replace('"', "&quot;").replace("'", "&#39;")
@@ -5,6 +5,7 @@
 tools, and runs automatic background extraction.
 """
 
+from ..injection import InjectionConfig, InjectionContext, InjectionTrigger
 from ..types.exceptions import AggregateMemoryError
 from .extraction.model_extractor import ModelExtractor
 from .extraction.triggers import IntervalTrigger, InvocationTrigger
@@ -21,9 +22,12 @@
 from .memory_manager import MemoryManager
 from .types import (
     AddMessagesContext,
+    InjectionFormatContext,
+    InjectionQueryContext,
     MemoryAddOptions,
     MemoryAddToolConfig,
     MemoryEntry,
+    MemoryInjectionConfig,
     MemoryManagerConfig,
     MemorySearchOptions,
     MemoryStore,
@@ -41,12 +45,18 @@
     "ExtractionTriggerContext",
     "Extractor",
     "ExtractorContext",
+    "InjectionConfig",
+    "InjectionContext",
+    "InjectionFormatContext",
+    "InjectionQueryContext",
+    "InjectionTrigger",
     "IntervalTrigger",
     "InvocationTrigger",
     "MemoryAddOptions",
     "MemoryAddToolConfig",
     "MemoryContentBlockType",
     "MemoryEntry",
+    "MemoryInjectionConfig",
     "MemoryManager",
     "MemoryManagerConfig",
     "MemoryMessageFilter",