srtab
diff --git a/‎daiv/activity/static/activity/js/activity-stream.js‎
Lines changed: 15 additions & 4 deletions b/‎daiv/activity/static/activity/js/activity-stream.js‎
Lines changed: 15 additions & 4 deletions
diff --git a/‎daiv/automation/agent/middlewares/git.py‎
Lines changed: 28 additions & 2 deletions b/‎daiv/automation/agent/middlewares/git.py‎
Lines changed: 28 additions & 2 deletions
diff --git a/‎daiv/automation/agent/middlewares/git_platform.py‎
Lines changed: 27 additions & 4 deletions b/‎daiv/automation/agent/middlewares/git_platform.py‎
Lines changed: 27 additions & 4 deletions
diff --git a/‎daiv/automation/agent/middlewares/web_fetch.py‎
Lines changed: 3 additions & 3 deletions b/‎daiv/automation/agent/middlewares/web_fetch.py‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎daiv/automation/agent/middlewares/web_search.py‎
Lines changed: 12 additions & 15 deletions b/‎daiv/automation/agent/middlewares/web_search.py‎
Lines changed: 12 additions & 15 deletions
diff --git a/‎daiv/chat/api/event_filter.py‎
Lines changed: 146 additions & 0 deletions b/‎daiv/chat/api/event_filter.py‎
Lines changed: 146 additions & 0 deletions
@@ -2,15 +2,22 @@
  * Alpine.js components for real-time activity status updates via SSE.
  *
  * activityStream (list page) — tracks multiple activities in place:
- *   dotClass(id, fallback)    → "status-dot-{variant}" CSS class
- *   statusClass(id, fallback) → "status-badge-{variant}" CSS class
+ *   dotClass(id, fallback)    → object toggling status-dot-{variant} classes
+ *   statusClass(id, fallback) → object toggling status-badge-{variant} classes
  *   statusLabel(id, fallback) → human-readable label
  *
+ * Object class maps (rather than a single string) are required so Alpine
+ * removes the previously rendered variant class when the status transitions —
+ * otherwise the static server-rendered class lingers alongside the new one
+ * and the later CSS rule wins.
+ *
  * activityDetail (detail page) — subscribes to one activity and reloads the
  * page on any state change so server-rendered fields (started_at, finished_at,
  * elapsed counter, duration, timeline dots) reflect the new state.
  */
 document.addEventListener("alpine:init", () => {
+    const VARIANTS = ["success", "failed", "running", "pending"];
+
     function statusVariantFor(status) {
         if (status === "SUCCESSFUL") return "success";
         if (status === "FAILED") return "failed";
@@ -25,6 +32,10 @@ document.addEventListener("alpine:init", () => {
         return "Pending";
     }
 
+    function variantClassMap(prefix, active) {
+        return Object.fromEntries(VARIANTS.map((variant) => [`${prefix}${variant}`, variant === active]));
+    }
+
     Alpine.data("activityStream", (streamUrl, inFlightIds) => ({
         updates: {},
         init() {
@@ -42,10 +53,10 @@ document.addEventListener("alpine:init", () => {
             source.onerror = () => source.close();
         },
         statusClass(id, fallback) {
-            return "status-badge-" + statusVariantFor(this.updates[id]?.status || fallback);
+            return variantClassMap("status-badge-", statusVariantFor(this.updates[id]?.status || fallback));
         },
         dotClass(id, fallback) {
-            return "status-dot-" + statusVariantFor(this.updates[id]?.status || fallback);
+            return variantClassMap("status-dot-", statusVariantFor(this.updates[id]?.status || fallback));
         },
         statusLabel(id, fallback) {
             const update = this.updates[id];
 
@@ -3,6 +3,7 @@
 import logging
 from typing import TYPE_CHECKING, Annotated, Any, cast
 
+from asgiref.sync import sync_to_async
 from langchain.agents import AgentState
 from langchain.agents.middleware import AgentMiddleware, ModelRequest, ModelResponse
 from langchain.agents.middleware.types import PrivateStateAttr
@@ -11,6 +12,7 @@
 
 from automation.agent.publishers import GitChangePublisher
 from codebase.base import MergeRequest, Scope
+from codebase.clients import RepoClient
 from codebase.context import RuntimeCtx  # noqa: TC001
 from codebase.utils import GitManager, get_repo_ref
 
@@ -59,9 +61,11 @@ class GitState(AgentState):
     State for the git middleware.
     """
 
-    merge_request: Annotated[MergeRequest | None, PrivateStateAttr]
+    merge_request: MergeRequest | None
     """
-    The merge request used to commit the changes.
+    The merge request used to commit the changes. Public on the output schema so
+    it streams in AG-UI ``STATE_SNAPSHOT`` events — the chat UI's MR pill is wired
+    directly to this field instead of a custom post-run event.
     """
 
     code_changes: Annotated[bool, PrivateStateAttr]
@@ -116,6 +120,11 @@ async def abefore_agent(self, state: GitState, runtime: Runtime[RuntimeCtx]) ->
             # In this case, ignore the branch name and merge request ID from the state,
             # and use the source branch and merge request ID from the merge request.
             merge_request = runtime.context.merge_request
+        elif merge_request is None:
+            # Surface any pre-existing open MR on the current branch so the chat
+            # composer pill reflects reality from the very first turn. Issue-scope
+            # runs always start on the default branch, where this lookup short-circuits.
+            merge_request = await self._alookup_open_mr(runtime.context)
 
         if merge_request and merge_request.source_branch != get_repo_ref(runtime.context.gitrepo):
             git_manager = GitManager(runtime.context.gitrepo)
@@ -131,6 +140,23 @@ async def abefore_agent(self, state: GitState, runtime: Runtime[RuntimeCtx]) ->
 
         return {"merge_request": merge_request, "code_changes": False}
 
+    @staticmethod
+    async def _alookup_open_mr(context: RuntimeCtx) -> MergeRequest | None:
+        """Find the open MR sourced from the checked-out branch; ``None`` if absent or on failure."""
+        branch = get_repo_ref(context.gitrepo)
+        if not branch or branch == context.config.default_branch:
+            return None
+        try:
+            # ``sync_to_async`` keeps the client call from running directly on the event loop.
+            find_merge_request = sync_to_async(RepoClient.create_instance().get_merge_request_by_branches)
+            return await find_merge_request(
+                context.repository.slug, branch, context.config.default_branch
+            )
+        except Exception:
+            # Best effort only: log with traceback and report "no MR" instead of failing the run.
+            logger.exception("Failed to look up open merge request for %s on %s", context.repository.slug, branch)
+            return None
+
     async def awrap_model_call(
         self, request: ModelRequest[RuntimeCtx], handler: Callable[[ModelRequest[RuntimeCtx]], Awaitable[ModelResponse]]
     ) -> ModelResponse:
 
@@ -36,6 +36,29 @@
 DEFAULT_MAX_OUTPUT_LINES = 2_000
 DEFAULT_CLI_TIMEOUT = 30
 
+
+def _truncate_cli_output(output: str, *, keep: Literal["head", "tail"]) -> str:
+    """
+    Cap CLI output to ``DEFAULT_MAX_OUTPUT_LINES``, appending a sentinel when
+    truncation occurs so the agent and the chat UI both know the slice is
+    partial. ``keep="tail"`` is for job traces / run logs where the failing
+    tail is the interesting part; ``keep="head"`` keeps the first lines.
+
+    Returns ``output`` unchanged when it already fits within the cap.
+    """
+    # Count with ``splitlines`` itself: a ``count("\n")`` shortcut under-counts the
+    # "\r", "\f", U+2028, ... breaks it also splits on, and would skip the cap.
+    lines = output.splitlines(keepends=True)
+    if len(lines) <= DEFAULT_MAX_OUTPUT_LINES:
+        return output
+
+    omitted = len(lines) - DEFAULT_MAX_OUTPUT_LINES
+    sentinel = f"... (truncated, {omitted} lines omitted)\n"
+    if keep == "tail":
+        return sentinel + "".join(lines[-DEFAULT_MAX_OUTPUT_LINES:])
+    return "".join(lines[:DEFAULT_MAX_OUTPUT_LINES]) + sentinel
+
+
 GITLAB_REQUESTS_TIMEOUT = 15
 GITLAB_PER_PAGE = "5"
 GITLAB_TOOL_NAME = "gitlab"
@@ -607,9 +630,9 @@ async def gitlab_tool(
     if resource == "project-job" and splitted_subcommand[1] == "trace":
         # TODO: evict the output to the file system if it's too long
         output = clean_job_logs(output, runtime.context.git_platform)
-        return "".join(output.splitlines(keepends=True)[-DEFAULT_MAX_OUTPUT_LINES:])
+        return _truncate_cli_output(output, keep="tail")
 
-    return "".join(output.splitlines(keepends=True)[:DEFAULT_MAX_OUTPUT_LINES])
+    return _truncate_cli_output(output, keep="head")
 
 
 def _get_cached_github_cli_token(runtime: ToolRuntime[RuntimeCtx]) -> tuple[str, dict[str, str | float] | None]:
@@ -753,9 +776,9 @@ async def github_tool(
     elif resource == "run" and action == "view" and "--log" in splitted_subcommand:
         # TODO: evict the output to the file system if it's too long
         output = clean_job_logs(output, runtime.context.git_platform)
-        output = "".join(output.splitlines(keepends=True)[-DEFAULT_MAX_OUTPUT_LINES:])
+        output = _truncate_cli_output(output, keep="tail")
     else:
-        output = "".join(output.splitlines(keepends=True)[:DEFAULT_MAX_OUTPUT_LINES])
+        output = _truncate_cli_output(output, keep="head")
 
     # Return Command with state update if token was cached/refreshed
     if state_update:
 
@@ -204,7 +204,7 @@ async def web_fetch_tool(
     """
     url = _upgrade_http_to_https(url.strip())
     if not _is_valid_http_url(url):
-        return "Invalid URL. Provide a fully-formed http(s) URL (e.g., https://example.com)."
+        return "error: Invalid URL. Provide a fully-formed http(s) URL (e.g., https://example.com)."
 
     prompt = prompt or ""
 
@@ -218,12 +218,12 @@ async def web_fetch_tool(
         # Used for special redirect signaling.
         return str(e)
     except Exception as e:
-        return f"Failed to fetch URL: {e}"
+        return f"error: Failed to fetch URL: {e}"
 
     # Safety guard: avoid silently truncating; ask for a narrower URL/prompt instead.
     if len(content) > site_settings.web_fetch_max_content_chars:
         return (
-            "Page content is too large to safely analyze in one pass.\n"
+            "error: Page content is too large to safely analyze in one pass.\n"
             "Provide a more specific URL (e.g. a specific section/anchor) or narrow the prompt."
         )
 
 
@@ -1,7 +1,7 @@
 from __future__ import annotations
 
+import json
 import logging
-import textwrap
 from typing import TYPE_CHECKING, Annotated
 
 from django.utils import timezone
@@ -45,13 +45,18 @@
  - Access up-to-date information for current events and recent data
  - Access information beyond your knowledge cutoff
 
+Result format:
+  - The tool returns a JSON array of objects with `title`, `link`, and `content` fields.
+  - An empty array (`[]`) means no relevant results were found — broaden the query and retry, or tell the user no results exist.
+  - Tavily may prepend a synthesized summary as the first entry with `title="Suggested answer"` and `link=""`. Treat it as a hint, not a citable source.
+
 IMPORTANT - Use the correct year in search queries:
   - You MUST use this year when searching for recent information, documentation, or current events.
   - Example: If today is {{current_year}}-07-15 and the user asks for "latest React docs", search for "React documentation {{current_year}}", NOT "React documentation {{previous_year}}".
 
 CRITICAL REQUIREMENT - You MUST follow this when using web search:
   - After answering the user's question using web search results, you MUST include a "Sources:" section at the end of your response when the answer primarily derives from search results.
-  - In the Sources section, list all relevant URLs from the search results as markdown hyperlinks: [Title](URL)
+  - In the Sources section, list each relevant entry's `link` as a markdown hyperlink using its `title`: `[<title>](<link>)`. Skip entries with an empty `link` (the "Suggested answer" hint).
   - This is MANDATORY - never skip including sources in your response
   - Example format:
 
@@ -129,19 +134,11 @@ async def web_search_tool(query: Annotated[str, "The search query."]) -> str:
     Tool to search the web and use the results to inform responses.
     """  # noqa: E501
 
-    if not (results := await _get_web_search_results(query)):
-        return "No relevant results found for the given search query."
-
-    return "\n".join([
-        textwrap.dedent(
-            """\
-            <web_search_result title="{title}" link="{link}">
-            {body}
-            </web_search_result>
-            """
-        ).format(title=result["title"], link=result["link"], body=result["content"])
-        for result in results
-    ])
+    results = await _get_web_search_results(query)
+    # `ensure_ascii=False` keeps non-ASCII titles/snippets readable for the model
+    # (and saves tokens vs. \uXXXX escapes). An empty array is a real, valid
+    # outcome the model is told how to handle in the system prompt.
+    return json.dumps(results, ensure_ascii=False)
 
 
 class WebSearchMiddleware(AgentMiddleware):
 
@@ -0,0 +1,146 @@
+import json
+from typing import TYPE_CHECKING, Any
+
+from ag_ui.core.events import EventType, ToolCallArgsEvent, ToolCallEndEvent, ToolCallStartEvent
+
+if TYPE_CHECKING:
+    from collections.abc import AsyncIterator, Iterable
+
+    from ag_ui.core.events import BaseEvent
+
+
+class SubagentEventFilter:
+    """Reorder/suppress AGUI events so subagent frames don't leak into the parent turn.
+
+    Two upstream behaviors collide on ``task``-tool turns:
+
+    1. ag_ui_langgraph drops the parent's ``task`` TOOL_CALL_START on the
+       text→tool_call transition chunk (the chunk that ends the parent's text
+       stream also carries the new tool_call name, but the handler returns
+       after emitting TEXT_MESSAGE_END). Subsequent chunks only have args, so
+       OnChatModelStream never reaches ``is_tool_call_start_event``. The
+       ``task`` TOOL_CALL_START finally arrives from the OnToolEnd re-emit —
+       *after* the subagent has already streamed text/tool calls to the
+       client.
+
+    2. With ``stream_subgraphs=True``, every chunk emitted from inside
+       ``subagent.ainvoke()`` flows through the parent's stream with a
+       nested ``langgraph_checkpoint_ns`` (``"tools:UUID|model:UUID"``).
+       Without (1)'s TOOL_CALL_START there is no ``task`` segment to
+       suppress them against.
+
+    This filter:
+
+    * captures ``task`` tool_call ids from top-level STATE_SNAPSHOT events,
+    * synthesizes TOOL_CALL_START + ARGS + END for each on the first nested
+      event so the chat creates the segment *before* the subagent runs,
+    * drops every nested event (``|`` in ns),
+    * drops the LATE OnToolEnd re-emitted START/ARGS/END for tool_calls we
+      already synthesized (deduping by tool_call_id).
+
+    The parent's TOOL_CALL_RESULT for the task tool still flows through
+    untouched — it's a top-level event with the same ``tool_call_id``, so the
+    chat UI flips the synthesized segment to ``done`` exactly like a normal
+    tool call.
+    """
+
+    # Tool name used by deepagents' SubAgentMiddleware to invoke a subagent.
+    TASK_TOOL_NAME = "task"
+
+    def __init__(self) -> None:
+        # Two-state lifecycle: a tool_call_id starts in ``_pending`` (synthesize
+        # on next nested event), then moves to ``_emitted`` (drop the late
+        # re-emit). Membership in either is enough to dedup a STATE_SNAPSHOT
+        # rebroadcast; ``_emitted`` alone gates the late TOOL_CALL_*
+        # re-emit drop.
+        self._pending: dict[str, tuple[str, Any]] = {}
+        self._emitted: set[str] = set()
+
+    async def apply(self, stream: AsyncIterator[BaseEvent]) -> AsyncIterator[BaseEvent]:
+        async for event in stream:
+            ns = self._checkpoint_ns(event)
+            is_nested = "|" in ns
+
+            if not is_nested and event.type == EventType.STATE_SNAPSHOT:
+                for tcid, name, args in self._iter_latest_task_calls(event):
+                    if tcid not in self._pending and tcid not in self._emitted:
+                        self._pending[tcid] = (name, args)
+
+            if is_nested:
+                for tcid, (name, args) in self._pending.items():
+                    yield ToolCallStartEvent(type=EventType.TOOL_CALL_START, tool_call_id=tcid, tool_call_name=name)
+                    if args:
+                        # ``default=str`` so a Pydantic model / datetime / other
+                        # non-JSON-native object in args doesn't kill the entire
+                        # chat stream — better a stringified field than RUN_ERROR.
+                        delta = args if isinstance(args, str) else json.dumps(args, default=str)
+                        yield ToolCallArgsEvent(type=EventType.TOOL_CALL_ARGS, tool_call_id=tcid, delta=delta)
+                    yield ToolCallEndEvent(type=EventType.TOOL_CALL_END, tool_call_id=tcid)
+                    self._emitted.add(tcid)
+                self._pending.clear()
+                continue
+
+            if event.type in (EventType.TOOL_CALL_START, EventType.TOOL_CALL_ARGS, EventType.TOOL_CALL_END):
+                tcid = getattr(event, "tool_call_id", None)
+                if isinstance(tcid, str) and tcid in self._emitted:
+                    continue
+
+            yield event
+
+    @staticmethod
+    def _checkpoint_ns(event: BaseEvent) -> str:
+        """Extract the LangGraph checkpoint namespace from an AGUI event's raw_event.
+
+        A ``|`` in the namespace means the event was emitted from a *nested*
+        LangGraph execution — i.e. from inside a subagent invoked by the parent's
+        ``task`` tool. Top-level events have an empty ns or a single
+        ``"<node>:UUID"`` segment (e.g. ``"model:..."``, ``"tools:..."``) with no
+        pipe.
+        """
+        raw = getattr(event, "raw_event", None)
+        if not isinstance(raw, dict):
+            return ""
+        md = raw.get("metadata") or {}
+        return str(md.get("langgraph_checkpoint_ns", "") or "")
+
+    @classmethod
+    def _iter_latest_task_calls(cls, event: BaseEvent) -> Iterable[tuple[str, str, Any]]:
+        """Yield ``(tool_call_id, name, args)`` for every ``task`` tool_call on the
+        snapshot's latest AIMessage. Caller is responsible for dedup against
+        already-emitted ids — this is just the per-snapshot scan.
+        """
+        snap = getattr(event, "snapshot", None)
+        if not isinstance(snap, dict):
+            return
+        msgs = snap.get("messages")
+        if not isinstance(msgs, list):
+            return
+        # Only the latest AIMessage matters — older AIMessages were emitted on
+        # earlier snapshots, so the caller already tracks their task ids in
+        # ``_pending`` / ``_emitted``. Walking past the latest is just wasted
+        # work; that call-site dedup is what guarantees no double-synthesis.
+        for m in reversed(msgs):
+            if cls._msg_role(m) not in ("ai", "assistant"):
+                continue
+            for tc in cls._msg_field(m, "tool_calls") or []:
+                tcid = cls._msg_field(tc, "id")
+                name = cls._msg_field(tc, "name")
+                if name == cls.TASK_TOOL_NAME and isinstance(tcid, str):
+                    yield tcid, name, cls._msg_field(tc, "args")
+            return
+
+    @staticmethod
+    def _msg_field(message: Any, name: str, default: Any = None) -> Any:
+        """Read a field from a LangChain message or its dict-encoded form.
+
+        STATE_SNAPSHOT can carry either shape depending on whether the snapshot
+        has been serialized yet — running through the AGUI encoder turns objects
+        into dicts, but the filter here sits *before* the encoder.
+        """
+        if isinstance(message, dict):
+            return message.get(name, default)
+        return getattr(message, name, default)
+
+    @classmethod
+    def _msg_role(cls, message: Any) -> str:
+        return str(cls._msg_field(message, "type", "") or cls._msg_field(message, "role", "") or "").lower()