From 0c702d441c72fe0ae5c27327a332fd3554f67e11 Mon Sep 17 00:00:00 2001
From: Anirudh Reddy Malgari <anirudh.malgari@datahub.com>
Date: Thu, 23 Apr 2026 17:34:22 -0700
Subject: [PATCH 1/3] loads mcp app for get_context

---
 backend/src/analytics_agent/agent/graph.py    |  15 +-
 .../src/analytics_agent/agent/mcp_app_tool.py |  37 ++
 .../src/analytics_agent/agent/streaming.py    |  61 +-
 backend/src/analytics_agent/api/__init__.py   |   3 +-
 backend/src/analytics_agent/api/chat.py       |  68 ++-
 backend/src/analytics_agent/api/mcp_apps.py   | 279 +++++++++
 .../analytics_agent/context/mcp_platform.py   |   8 +
 .../analytics_agent/context/mcp_resources.py  | 240 ++++++++
 backend/src/analytics_agent/context/mcp_ui.py | 220 +++++++
 backend/src/analytics_agent/db/repository.py  |   3 +
 .../src/analytics_agent/engines/mcp/engine.py |   9 +
 backend/src/analytics_agent/prompts/system.py |   7 +-
 .../analytics_agent/prompts/system_prompt.md  |   4 +-
 frontend/src/api/mcpApp.ts                    |  62 ++
 frontend/src/api/stream.ts                    |   6 +-
 frontend/src/components/Chat/ChatView.tsx     |   1 +
 frontend/src/components/Chat/MessageList.tsx  |  85 +--
 .../Chat/messages/AgentWorkBlock.tsx          |  11 +
 .../Chat/messages/MCPAppMessage.tsx           | 123 ++++
 .../Chat/messages/SelectionChip.tsx           |  39 ++
 frontend/src/lib/buildUiMessages.ts           |   1 +
 frontend/src/lib/groupMessages.ts             |   2 +-
 frontend/src/lib/mcpApps/MCPAppFrame.tsx      | 137 +++++
 frontend/src/lib/mcpApps/protocol.ts          | 184 ++++++
 frontend/src/lib/mcpApps/useMcpAppBridge.ts   | 542 ++++++++++++++++++
 frontend/src/types/index.ts                   |  18 +
 .../unit/test_business_context_suppression.py | 131 +++++
 27 files changed, 2245 insertions(+), 51 deletions(-)
 create mode 100644 backend/src/analytics_agent/agent/mcp_app_tool.py
 create mode 100644 backend/src/analytics_agent/api/mcp_apps.py
 create mode 100644 backend/src/analytics_agent/context/mcp_resources.py
 create mode 100644 backend/src/analytics_agent/context/mcp_ui.py
 create mode 100644 frontend/src/api/mcpApp.ts
 create mode 100644 frontend/src/components/Chat/messages/MCPAppMessage.tsx
 create mode 100644 frontend/src/components/Chat/messages/SelectionChip.tsx
 create mode 100644 frontend/src/lib/mcpApps/MCPAppFrame.tsx
 create mode 100644 frontend/src/lib/mcpApps/protocol.ts
 create mode 100644 frontend/src/lib/mcpApps/useMcpAppBridge.ts
 create mode 100644 tests/unit/test_business_context_suppression.py

diff --git a/backend/src/analytics_agent/agent/graph.py b/backend/src/analytics_agent/agent/graph.py
index 3f48ca1..55e40a1 100644
--- a/backend/src/analytics_agent/agent/graph.py
+++ b/backend/src/analytics_agent/agent/graph.py
@@ -43,6 +43,7 @@ def build_graph(
     enabled_mutations: set[str] | None = None,
     context_tools: list | None = None,  # pre-built from DB context platforms at request time
     engine_tools: list | None = None,  # pre-built for MCP data sources (bypasses QueryEngine)
+    suppress_business_context_skill: bool = False,
 ):
     from analytics_agent.agent.chart_generator import chart_node
     from analytics_agent.engines.factory import get_registry
@@ -64,7 +65,10 @@ def build_graph(
     # Always-on skills (context search etc.) + opt-in write-back skills
     from analytics_agent.skills.loader import build_always_on_skill_tools, build_skill_tools
 
-    skill_tools = build_always_on_skill_tools() + build_skill_tools(enabled_mutations or set())
+    always_on_skills = build_always_on_skill_tools()
+    if suppress_business_context_skill:
+        always_on_skills = [t for t in always_on_skills if t.name != "search_business_context"]
+    skill_tools = always_on_skills + build_skill_tools(enabled_mutations or set())
 
     # Engine tools — MCP data sources supply pre-built tools; native engines use QueryEngine
     if engine_tools is not None:
@@ -87,12 +91,17 @@ def build_graph(
         )
 
         system_prompt = system_prompt_override.format(engine_name=engine_name)
-        system_prompt += get_search_business_context_section()
+        if not suppress_business_context_skill:
+            system_prompt += get_search_business_context_section()
         system_prompt += get_improve_context_prompt_section()
         if enabled_mutations:
             system_prompt += get_skill_system_prompt_section(enabled_mutations)
     else:
-        system_prompt = build_system_prompt(engine_name, enabled_skills=enabled_mutations)
+        system_prompt = build_system_prompt(
+            engine_name,
+            enabled_skills=enabled_mutations,
+            include_business_context=not suppress_business_context_skill,
+        )
 
     # Enable per-tool error handling so validation errors (e.g. hallucinated
     # arguments like filter= on get_entities) are returned as tool messages
diff --git a/backend/src/analytics_agent/agent/mcp_app_tool.py b/backend/src/analytics_agent/agent/mcp_app_tool.py
new file mode 100644
index 0000000..d18833a
--- /dev/null
+++ b/backend/src/analytics_agent/agent/mcp_app_tool.py
@@ -0,0 +1,37 @@
+"""Side-channel for MCP App tool results.
+
+Mirrors the _pending_charts pattern in chart_tool.py:
+- The wrapped tool returns a short marker string (MCP_APP_READY:<app_id>).
+- The actual structured payload lives here, keyed by app_id.
+- streaming.py pops from this dict when it sees the marker in on_tool_end.
+"""
+
+from __future__ import annotations
+
+from dataclasses import dataclass, field
+from typing import Any
+
+
+@dataclass
+class PendingApp:
+    app_id: str
+    connection_key: str
+    server_name: str
+    tool_name: str
+    tool_input: dict
+    # Structured CallToolResult content (list of content blocks), preserved so
+    # the frontend can forward it verbatim as `ui/notifications/tool-result`
+    # params per the MCP Apps spec.
+    tool_result: Any
+    resource_uri: str
+    csp: str | None = None
+    permissions: list[str] = field(default_factory=list)
+    # Tool names scoped to this app's connection that the iframe is allowed to
+    # call via the Phase 2 tool-proxy endpoint. Populated at wrap time from the
+    # full tool list for the originating connection_key. Persisted in the MCP_APP
+    # SSE payload so the endpoint can rehydrate it from the DB row.
+    allowed_tools: list[str] = field(default_factory=list)
+
+
+# Keyed by app_id; popped once streaming.py emits the MCP_APP SSE event.
+_pending_apps: dict[str, PendingApp] = {}
diff --git a/backend/src/analytics_agent/agent/streaming.py b/backend/src/analytics_agent/agent/streaming.py
index da01197..d2ff6c6 100644
--- a/backend/src/analytics_agent/agent/streaming.py
+++ b/backend/src/analytics_agent/agent/streaming.py
@@ -68,6 +68,14 @@ async def stream_graph_events(
     final_state: dict[str, Any] = {}
     chart_emitted = False  # guard against double-emitting CHART
 
+    # Track active tool runs by run_id -> tool_name so we can detect when a
+    # wrapped tool (e.g. MCP UI wrapper) invokes an inner tool of the same name.
+    # LangGraph v2 fires on_tool_start/on_tool_end for both the outer StructuredTool
+    # and the inner delegated tool, which would otherwise double-record TOOL_CALL
+    # and emit a redundant TOOL_RESULT alongside the MCP_APP bubble.
+    active_tool_runs: dict[str, str] = {}
+    suppressed_tool_runs: set[str] = set()
+
     try:
         from analytics_agent.config import settings as _settings
 
@@ -78,6 +86,7 @@ async def stream_graph_events(
             data: dict[str, Any] = event.get("data", {})
             name: str = event.get("name", "")
             run_id: str = event.get("run_id", "")
+            parent_ids: list[str] = event.get("parent_ids", []) or []
             node: str = event.get("metadata", {}).get("langgraph_node", "")
 
             # ── TEXT ──
@@ -88,12 +97,16 @@ async def stream_graph_events(
                 if getattr(chunk, "tool_call_chunks", None):
                     continue
                 content = chunk.content if hasattr(chunk, "content") else ""
+                # Each chunk gets its own unique message_id. All other event
+                # types already do this (uuid4). Sharing run_id across chunks
+                # collides on the Message.id primary key in persistence and
+                # silently drops every chunk after the first (see chat.py).
                 if isinstance(content, str) and content:
                     final_text_parts.append(content)
                     yield {
                         "event": "TEXT",
                         "conversation_id": conversation_id,
-                        "message_id": run_id,
+                        "message_id": str(uuid.uuid4()),
                         "payload": {"text": content},
                     }
                 elif isinstance(content, list):
@@ -105,13 +118,19 @@ async def stream_graph_events(
                                 yield {
                                     "event": "TEXT",
                                     "conversation_id": conversation_id,
-                                    "message_id": run_id,
+                                    "message_id": str(uuid.uuid4()),
                                     "payload": {"text": text},
                                 }
 
             # ── TOOL_CALL ──
             elif event_type == "on_tool_start":
                 tool_input = data.get("input", {})
+                # Suppress inner tool calls nested under a same-named outer tool
+                # (MCP UI wrapper pattern) so the bubble/history isn't duplicated.
+                if any(active_tool_runs.get(pid) == name for pid in parent_ids):
+                    suppressed_tool_runs.add(run_id)
+                    continue
+                active_tool_runs[run_id] = name
                 if name == "execute_sql":
                     pending_sql[run_id] = tool_input.get("sql", "")
                 # create_chart renders as a CHART event — don't show a tool call bubble
@@ -126,6 +145,11 @@ async def stream_graph_events(
 
             # ── TOOL_ERROR (unhandled exception from tool) ──
             elif event_type == "on_tool_error":
+                if run_id in suppressed_tool_runs:
+                    suppressed_tool_runs.discard(run_id)
+                    active_tool_runs.pop(run_id, None)
+                    pending_sql.pop(run_id, None)
+                    continue
                 error_msg = str(data.get("error", "Tool failed"))
                 yield {
                     "event": "TOOL_RESULT",
@@ -138,9 +162,16 @@ async def stream_graph_events(
                     },
                 }
                 pending_sql.pop(run_id, None)
+                active_tool_runs.pop(run_id, None)
 
             # ── SQL / TOOL_RESULT / CHART ──
             elif event_type == "on_tool_end":
+                if run_id in suppressed_tool_runs:
+                    suppressed_tool_runs.discard(run_id)
+                    active_tool_runs.pop(run_id, None)
+                    pending_sql.pop(run_id, None)
+                    continue
+                active_tool_runs.pop(run_id, None)
                 output = data.get("output", "")
                 if hasattr(output, "content"):
                     output = output.content
@@ -184,6 +215,32 @@ async def stream_graph_events(
                                 "is_error": True,
                             },
                         }
+                elif output_str.startswith("MCP_APP_READY:"):
+                    # Pop the PendingApp from the side-channel and emit an MCP_APP event.
+                    # HTML is never included in the SSE payload — the frontend fetches
+                    # it via GET .../mcp-app/{message_id}/ui (prefetch warms the cache).
+                    app_id = output_str.split(":", 1)[1].split()[0].strip()
+                    from analytics_agent.agent.mcp_app_tool import _pending_apps
+
+                    pending_app = _pending_apps.pop(app_id, None)
+                    if pending_app:
+                        yield {
+                            "event": "MCP_APP",
+                            "conversation_id": conversation_id,
+                            "message_id": str(uuid.uuid4()),
+                            "payload": {
+                                "app_id": app_id,
+                                "connection_key": pending_app.connection_key,
+                                "server_name": pending_app.server_name,
+                                "tool_name": pending_app.tool_name,
+                                "tool_input": pending_app.tool_input,
+                                "tool_result": pending_app.tool_result,
+                                "resource_uri": pending_app.resource_uri,
+                                "csp": pending_app.csp,
+                                "permissions": pending_app.permissions,
+                                "allowed_tools": pending_app.allowed_tools,
+                            },
+                        }
                 elif name == "create_chart":
                     # Fetch chart spec from side-channel (tool returns only a short marker)
                     if output_str.startswith("CHART_READY:"):
diff --git a/backend/src/analytics_agent/api/__init__.py b/backend/src/analytics_agent/api/__init__.py
index c96a525..fdd148f 100644
--- a/backend/src/analytics_agent/api/__init__.py
+++ b/backend/src/analytics_agent/api/__init__.py
@@ -2,11 +2,12 @@
 
 from fastapi import APIRouter
 
-from analytics_agent.api import chat, conversations, oauth, settings
+from analytics_agent.api import chat, conversations, mcp_apps, oauth, settings
 
 api_router = APIRouter()
 api_router.include_router(conversations.router)
 api_router.include_router(chat.router)
+api_router.include_router(mcp_apps.router)
 api_router.include_router(settings.router)
 api_router.include_router(oauth.router)
 
diff --git a/backend/src/analytics_agent/api/chat.py b/backend/src/analytics_agent/api/chat.py
index d4dad54..ace4c1f 100644
--- a/backend/src/analytics_agent/api/chat.py
+++ b/backend/src/analytics_agent/api/chat.py
@@ -74,6 +74,16 @@ async def _compute_quality_background(conv_id: str, factory) -> None:
 
 class ChatMessageRequest(BaseModel):
     text: str
+    # Phase 2: MCP App iframe-originated turns include these for auditing and
+    # frontend rendering (source="mcp_app" rows render as SelectionChip, not a
+    # user bubble; origin_message_id anchors the chip under its selector iframe).
+    source: str | None = None  # e.g. "mcp_app"
+    app_id: str | None = None
+    origin_message_id: str | None = None
+    # Short human-readable label shown on the SelectionChip; `text` may be a
+    # richer agent-facing message (e.g. includes URN + instruction to prevent
+    # redundant disambiguation tool calls).
+    display_text: str | None = None
 
 
 async def _persist_message(
@@ -83,9 +93,10 @@ async def _persist_message(
     role: str,
     payload: dict,
     sequence: int,
+    message_id: str | None = None,
 ) -> None:
     msg = Message(
-        id=str(uuid.uuid4()),
+        id=message_id or str(uuid.uuid4()),
         conversation_id=conversation_id,
         event_type=event_type,
         role=role,
@@ -103,6 +114,10 @@ async def _run_and_broadcast(
     user_text: str,
     engine_name: str,
     keepalive_interval: int,
+    source: str | None = None,
+    app_id: str | None = None,
+    origin_message_id: str | None = None,
+    display_text: str | None = None,
 ) -> None:
     """
     Background task: runs the full agent pipeline independently of the HTTP
@@ -123,8 +138,17 @@ def _broadcast(evt: dict) -> None:
             msg_repo = MessageRepo(session)
             sequence = await msg_repo.next_sequence(conversation_id)
 
+            user_payload: dict = {"text": user_text}
+            if source:
+                user_payload["source"] = source
+            if app_id:
+                user_payload["app_id"] = app_id
+            if origin_message_id:
+                user_payload["origin_message_id"] = origin_message_id
+            if display_text:
+                user_payload["display_text"] = display_text
             await _persist_message(
-                session, conversation_id, "TEXT", "user", {"text": user_text}, sequence
+                session, conversation_id, "TEXT", "user", user_payload, sequence
             )
             await session.commit()
             sequence += 1
@@ -238,6 +262,10 @@ def _broadcast(evt: dict) -> None:
             try:
                 context_tools: list = []
                 include_mutations = bool(enabled_mutations)
+                suppress_business_context_skill = False
+
+                # Each platform owns its disabled_tools and include_mutations state.
+                # build_platform() reads from DB config; get_tools() filters internally.
                 for row in all_cp_rows:
                     platform = build_platform(
                         row,
@@ -248,6 +276,12 @@ def _broadcast(evt: dict) -> None:
                         continue
                     tools = await platform.get_tools()
                     context_tools.extend(tools)
+                    # If a datahub-mcp server advertises `get_context`, it supersedes
+                    # the packaged `search_business_context` skill. Check post-filter
+                    # so an operator who explicitly disabled `get_context` keeps the
+                    # packaged skill active.
+                    if row.type == "datahub-mcp" and any(t.name == "get_context" for t in tools):
+                        suppress_business_context_skill = True
 
                 logger.info(
                     "Total context_tools=%d for conversation %s",
@@ -268,6 +302,7 @@ def _broadcast(evt: dict) -> None:
                     enabled_mutations=enabled_mutations,
                     context_tools=context_tools,
                     engine_tools=engine_tools,
+                    suppress_business_context_skill=suppress_business_context_skill,
                 )
             except Exception as exc:
                 for _evt in cast(
@@ -310,7 +345,7 @@ def _broadcast(evt: dict) -> None:
                 history=history,
             ):
                 if evt.get("event") not in (None, "KEEPALIVE"):
-                    with contextlib.suppress(Exception):
+                    try:
                         await _persist_message(
                             session,
                             conversation_id,
@@ -318,9 +353,24 @@ def _broadcast(evt: dict) -> None:
                             "assistant",
                             evt.get("payload", {}),
                             sequence,
+                            message_id=evt.get("message_id"),
                         )
                         await session.commit()
                         sequence += 1
+                    except Exception as persist_exc:
+                        # A failed commit (e.g. duplicate PK) leaves the async
+                        # session in a doomed transaction — every subsequent
+                        # commit on it would also fail until we rollback.
+                        # Without this, one bad insert silently drops every
+                        # later event in the same turn (incl. COMPLETE).
+                        logger.warning(
+                            "Persist failed for %s event in conv %s: %s",
+                            evt.get("event"),
+                            conversation_id,
+                            persist_exc,
+                        )
+                        with contextlib.suppress(Exception):
+                            await session.rollback()
 
                     if evt.get("event") == "TOOL_RESULT":
                         tool_name = evt.get("payload", {}).get("tool_name", "")
@@ -405,6 +455,14 @@ async def send_message(
     if not body.text.strip():
         raise HTTPException(status_code=422, detail="Message text cannot be empty")
 
+    if body.source:
+        logger.info(
+            "Message in conv %s sourced from %s (app_id=%s)",
+            conversation_id,
+            body.source,
+            body.app_id,
+        )
+
     stream = ConvStream(task=None)
     _active_streams[conversation_id] = stream
     stream.task = asyncio.create_task(
@@ -414,6 +472,10 @@ async def send_message(
             body.text.strip(),
             conv.engine_name,
             settings.sse_keepalive_interval,
+            source=body.source,
+            app_id=body.app_id,
+            origin_message_id=body.origin_message_id,
+            display_text=body.display_text,
         )
     )
 
diff --git a/backend/src/analytics_agent/api/mcp_apps.py b/backend/src/analytics_agent/api/mcp_apps.py
new file mode 100644
index 0000000..619fcd2
--- /dev/null
+++ b/backend/src/analytics_agent/api/mcp_apps.py
@@ -0,0 +1,279 @@
+"""MCP App endpoints.
+
+Phase 1: GET /api/conversations/{conversation_id}/mcp-app/{message_id}/ui
+
+Resolves the persisted {connection_key, resource_uri} from the MCP_APP message
+row, fetches HTML via MCPResourceClient (cache-first, live-server fallback), and
+returns {html, csp, permissions}.
+
+Returns HTTP 404 when both the cache and the live MCP server are unavailable.
+
+Phase 2: POST /api/conversations/{conversation_id}/mcp-app/{app_id}/tool-call
+
+Scoped MCP tool proxy. The iframe sends {tool_name, arguments}; this endpoint:
+  1. Loads the PendingApp from the in-memory side-channel (fast path, live
+     during streaming) or rehydrates from the persisted MCP_APP message row.
+  2. Validates that (connection_key, tool_name) is in the per-app allow-list
+     so the iframe can never reach engine tools, other MCP servers, or
+     create_chart.
+  3. Dispatches tools/call on the originating MCP client session.
+  4. Returns the CallToolResult as JSON.
+"""
+
+from __future__ import annotations
+
+import logging
+from typing import Any
+
+import orjson
+from fastapi import APIRouter, Depends, HTTPException
+from pydantic import BaseModel
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from analytics_agent.db.base import get_session
+from analytics_agent.db.repository import ConversationRepo, MessageRepo
+
+logger = logging.getLogger(__name__)
+
+router = APIRouter(prefix="/api/conversations", tags=["mcp-apps"])
+
+
+# ── Phase 2 helpers ───────────────────────────────────────────────────────────
+
+
+class _AppContext:
+    """Minimal info needed to authorise and dispatch a scoped tool call."""
+
+    def __init__(self, connection_key: str, server_name: str, allowed_tools: list[str]) -> None:
+        self.connection_key = connection_key
+        self.server_name = server_name
+        self.allowed_tools = allowed_tools
+
+
+async def _load_app_context(
+    conversation_id: str,
+    app_id: str,
+    session: AsyncSession,
+) -> _AppContext:
+    """Return app context from the in-memory side-channel or the DB row.
+
+    Prefers the in-memory PendingApp (available while streaming is active or
+    before it was popped by on_tool_end). Falls back to scanning the
+    conversation's MCP_APP message rows when the in-memory entry is gone
+    (replay / post-stream calls).
+
+    Raises HTTPException 404 if neither source has a record for this app_id.
+    """
+    from analytics_agent.agent.mcp_app_tool import _pending_apps
+
+    pending = _pending_apps.get(app_id)
+    if pending is not None:
+        return _AppContext(
+            connection_key=pending.connection_key,
+            server_name=pending.server_name,
+            allowed_tools=pending.allowed_tools,
+        )
+
+    # Rehydrate from persisted message rows.
+    msg_repo = MessageRepo(session)
+    messages = await msg_repo.list_for_conversation(conversation_id)
+    for msg in messages:
+        if msg.event_type != "MCP_APP" or not msg.payload:
+            continue
+        try:
+            payload: dict = orjson.loads(msg.payload)
+        except Exception:
+            continue
+        if payload.get("app_id") == app_id:
+            connection_key = payload.get("connection_key", "")
+            server_name = payload.get("server_name", "")
+            allowed_tools: list[str] = payload.get("allowed_tools") or []
+            if not connection_key:
+                break
+            return _AppContext(
+                connection_key=connection_key,
+                server_name=server_name,
+                allowed_tools=allowed_tools,
+            )
+
+    raise HTTPException(status_code=404, detail=f"MCP App not found: app_id={app_id!r}")
+
+
+async def _dispatch_tool_call(
+    connection_key: str,
+    server_name: str,
+    tool_name: str,
+    arguments: dict[str, Any],
+) -> dict:
+    """Call tool_name on the originating MCP client; return the CallToolResult dict."""
+    from analytics_agent.context.mcp_resources import _mcp_clients
+
+    if connection_key not in _mcp_clients:
+        raise HTTPException(
+            status_code=503,
+            detail=f"MCP client for connection {connection_key!r} is not available — "
+            "the server may have restarted. Reload the page to reconnect.",
+        )
+
+    client, _sname = _mcp_clients[connection_key]
+    if server_name and _sname != server_name:
+        # server_name mismatch — use the one from the registry to be safe
+        logger.warning(
+            "server_name mismatch for connection_key=%s: stored=%s registry=%s",
+            connection_key,
+            server_name,
+            _sname,
+        )
+        server_name = _sname
+
+    try:
+        async with client.session(server_name) as mcp_session:
+            result = await mcp_session.call_tool(tool_name, arguments)
+    except Exception as exc:
+        logger.error(
+            "MCP tool call failed: connection=%s server=%s tool=%s: %s",
+            connection_key,
+            server_name,
+            tool_name,
+            exc,
+        )
+        raise HTTPException(
+            status_code=502,
+            detail=f"MCP tool call failed: {exc}",
+        ) from exc
+
+    # Serialise the result into a plain dict (content blocks list).
+    content: list[dict] = []
+    for block in result.content or []:
+        if hasattr(block, "model_dump"):
+            content.append(block.model_dump())
+        elif isinstance(block, dict):
+            content.append(block)
+        else:
+            content.append({"type": "text", "text": str(block)})
+
+    return {
+        "content": content,
+        "isError": getattr(result, "isError", False) or False,
+    }
+
+
+class ToolCallRequest(BaseModel):
+    tool_name: str
+    arguments: dict[str, Any] = {}
+
+
+# ── Endpoints ─────────────────────────────────────────────────────────────────
+
+
+@router.get("/{conversation_id}/mcp-app/{message_id}/ui")
+async def get_mcp_app_ui(
+    conversation_id: str,
+    message_id: str,
+    session: AsyncSession = Depends(get_session),
+):
+    """Return the HTML, CSP, and permissions for a persisted MCP App message.
+
+    Cache-first: serves from disk cache within TTL.  Falls back to a live
+    resources/read call when the cache is stale or missing.  Returns 404 with
+    a structured placeholder when both the cache and the live server are
+    unavailable.
+    """
+    conv_repo = ConversationRepo(session)
+    conv = await conv_repo.get(conversation_id)
+    if not conv:
+        raise HTTPException(status_code=404, detail="Conversation not found")
+
+    msg_repo = MessageRepo(session)
+    message = await msg_repo.get_by_id(message_id)
+
+    if message is None or message.conversation_id != conversation_id:
+        raise HTTPException(status_code=404, detail="Message not found")
+
+    if message.event_type != "MCP_APP":
+        raise HTTPException(status_code=404, detail="Message is not an MCP App event")
+
+    try:
+        payload: dict = orjson.loads(message.payload)
+    except Exception:
+        raise HTTPException(status_code=500, detail="Corrupt message payload")
+
+    connection_key: str | None = payload.get("connection_key")
+    resource_uri: str | None = payload.get("resource_uri")
+
+    if not connection_key or not resource_uri:
+        raise HTTPException(
+            status_code=404,
+            detail="Message payload missing connection_key or resource_uri",
+        )
+
+    from analytics_agent.context.mcp_resources import resource_client
+
+    try:
+        result = await resource_client.read_ui_resource(connection_key, resource_uri)
+    except RuntimeError as exc:
+        logger.warning(
+            "MCP app UI unavailable for message_id=%s connection_key=%s uri=%s: %s",
+            message_id,
+            connection_key,
+            resource_uri,
+            exc,
+        )
+        raise HTTPException(
+            status_code=404,
+            detail={
+                "message": "MCP app HTML unavailable — server offline and no cache",
+                "connection_key": connection_key,
+                "resource_uri": resource_uri,
+            },
+        )
+
+    return {
+        "html": result["html"],
+        "csp": result.get("csp"),
+        "permissions": result.get("permissions", []),
+        "is_stale": result.get("is_stale", False),
+    }
+
+
+@router.post("/{conversation_id}/mcp-app/{app_id}/tool-call")
+async def mcp_app_tool_call(
+    conversation_id: str,
+    app_id: str,
+    body: ToolCallRequest,
+    session: AsyncSession = Depends(get_session),
+):
+    """Phase 2: scoped MCP tool proxy for iframe apps.
+
+    Validates the requested (connection_key, tool_name) pair against the
+    per-app allow-list, then dispatches tools/call on the originating MCP
+    client session. Never routes to engine tools, other connections, or
+    create_chart.
+    """
+    conv_repo = ConversationRepo(session)
+    conv = await conv_repo.get(conversation_id)
+    if not conv:
+        raise HTTPException(status_code=404, detail="Conversation not found")
+
+    app_ctx = await _load_app_context(conversation_id, app_id, session)
+
+    # Security: ensure the requested tool is in the per-app allow-list.
+    if app_ctx.allowed_tools and body.tool_name not in app_ctx.allowed_tools:
+        logger.warning(
+            "Blocked tool call from iframe: app_id=%s tool=%s allowed=%s",
+            app_id,
+            body.tool_name,
+            app_ctx.allowed_tools,
+        )
+        raise HTTPException(
+            status_code=403,
+            detail=f"Tool {body.tool_name!r} is not in the allow-list for this app.",
+        )
+
+    result = await _dispatch_tool_call(
+        connection_key=app_ctx.connection_key,
+        server_name=app_ctx.server_name,
+        tool_name=body.tool_name,
+        arguments=body.arguments,
+    )
+    return result
diff --git a/backend/src/analytics_agent/context/mcp_platform.py b/backend/src/analytics_agent/context/mcp_platform.py
index 81223bc..eb3d192 100644
--- a/backend/src/analytics_agent/context/mcp_platform.py
+++ b/backend/src/analytics_agent/context/mcp_platform.py
@@ -110,6 +110,14 @@ async def get_tools(self) -> list[BaseTool]:
 
         client = MultiServerMCPClient({self.name: conn})  # type: ignore[dict-item]
         all_tools = await client.get_tools()
+
+        from analytics_agent.context.mcp_ui import wrap_tools_with_ui_resources
+
+        connection_key = f"ctx:{self.name}"
+        all_tools = await wrap_tools_with_ui_resources(
+            connection_key, client, self.name, all_tools
+        )
+
         self._tools_cache = all_tools
         result = [t for t in all_tools if t.name not in self.disabled_tools]
         logger.info(
diff --git a/backend/src/analytics_agent/context/mcp_resources.py b/backend/src/analytics_agent/context/mcp_resources.py
new file mode 100644
index 0000000..8634f04
--- /dev/null
+++ b/backend/src/analytics_agent/context/mcp_resources.py
@@ -0,0 +1,240 @@
+"""MCPResourceClient — reads ui:// resources from MCP servers.
+
+Reuses the MultiServerMCPClient instances in the _mcp_clients registry so we
+open a fresh session (per resources/read call) without duplicating connection
+config or spinning up a second stdio process.
+
+Disk cache layout::
+
+    ./data/mcp-app-cache/<sha256(connection_key + uri)>.html
+    ./data/mcp-app-cache/<sha256(connection_key + uri)>.meta.json
+
+The .meta.json sidecar holds {etag, last_modified, fetched_at, content_hash}.
+Cache policy:
+  - Within TTL (default 1 h): serve from disk without contacting the server.
+  - Past TTL: re-validate using resources/read; compare content_hash if the
+    server doesn't return ETag/Last-Modified.
+  - Server offline past TTL: return stale cache (HTTP 200) with
+    is_stale=True; 404 only when both cache and live server are unavailable.
+"""
+
+from __future__ import annotations
+
+import hashlib
+import logging
+import time
+from pathlib import Path
+from typing import TYPE_CHECKING, Any
+
+import orjson
+
+if TYPE_CHECKING:
+    from langchain_mcp_adapters.client import MultiServerMCPClient
+
+logger = logging.getLogger(__name__)
+
+# Process-local registry populated by mcp_ui.register_mcp_client().
+# Maps connection_key -> (MultiServerMCPClient, server_name).
+_mcp_clients: dict[str, tuple[Any, str]] = {}
+
+# Default disk-cache TTL in seconds (1 hour).
+_DEFAULT_TTL = 3600
+
+_CACHE_DIR: Path | None = None
+
+
+def _get_cache_dir() -> Path:
+    global _CACHE_DIR  # noqa: PLW0603
+    if _CACHE_DIR is None:
+        from analytics_agent.config import settings
+
+        db_path = Path(settings.database_url.split("///")[-1])
+        data_dir = db_path.parent if db_path.parent.exists() else Path("data")
+        _CACHE_DIR = data_dir / "mcp-app-cache"
+        _CACHE_DIR.mkdir(parents=True, exist_ok=True)
+    return _CACHE_DIR
+
+
+def _cache_key(connection_key: str, uri: str) -> str:
+    return hashlib.sha256(f"{connection_key}\x00{uri}".encode()).hexdigest()
+
+
+def _html_path(key: str) -> Path:
+    return _get_cache_dir() / f"{key}.html"
+
+
+def _meta_path(key: str) -> Path:
+    return _get_cache_dir() / f"{key}.meta.json"
+
+
+def _read_cache(key: str) -> tuple[str | None, dict]:
+    """Return (html, meta) from disk; html is None on miss."""
+    html_file = _html_path(key)
+    meta_file = _meta_path(key)
+    if not html_file.exists() or not meta_file.exists():
+        return None, {}
+    try:
+        html = html_file.read_text(encoding="utf-8")
+        meta = orjson.loads(meta_file.read_bytes())
+        return html, meta
+    except Exception:
+        return None, {}
+
+
+def _write_cache(key: str, html: str, meta: dict) -> None:
+    try:
+        _html_path(key).write_text(html, encoding="utf-8")
+        _meta_path(key).write_bytes(orjson.dumps(meta))
+    except Exception:
+        logger.warning("MCP app cache write failed for key=%s", key)
+
+
+def _is_fresh(meta: dict, ttl: int) -> bool:
+    fetched_at = meta.get("fetched_at", 0)
+    return (time.time() - fetched_at) < ttl
+
+
+class MCPResourceClient:
+    """Reads ui:// resources from MCP servers with disk caching.
+
+    Instantiate once per process; the underlying MultiServerMCPClient instances
+    are shared via the _mcp_clients registry.
+    """
+
+    def __init__(self, ttl: int = _DEFAULT_TTL) -> None:
+        self.ttl = ttl
+
+    async def read_ui_resource(
+        self,
+        connection_key: str,
+        uri: str,
+        *,
+        use_cache: bool = True,
+    ) -> dict:
+        """Fetch a ui:// resource.
+
+        Returns a dict with keys: html, csp, permissions, etag, last_modified,
+        is_stale (True when falling back to a stale cache entry).
+
+        Raises RuntimeError if both cache and live server are unavailable.
+        """
+        key = _cache_key(connection_key, uri)
+        cached_html, cached_meta = _read_cache(key)
+
+        if use_cache and cached_html is not None and _is_fresh(cached_meta, self.ttl):
+            logger.debug("MCP app cache hit (fresh) for uri=%s", uri)
+            return {
+                "html": cached_html,
+                "csp": cached_meta.get("csp"),
+                "permissions": cached_meta.get("permissions", []),
+                "etag": cached_meta.get("etag"),
+                "last_modified": cached_meta.get("last_modified"),
+                "is_stale": False,
+            }
+
+        # Need to fetch / re-validate from the server.
+        try:
+            result = await self._fetch_from_server(connection_key, uri, cached_meta)
+        except Exception as exc:
+            if cached_html is not None:
+                logger.warning(
+                    "MCP server unavailable for uri=%s; serving stale cache: %s",
+                    uri,
+                    exc,
+                )
+                return {
+                    "html": cached_html,
+                    "csp": cached_meta.get("csp"),
+                    "permissions": cached_meta.get("permissions", []),
+                    "etag": cached_meta.get("etag"),
+                    "last_modified": cached_meta.get("last_modified"),
+                    "is_stale": True,
+                }
+            raise RuntimeError(
+                f"MCP resource unavailable and no cache for uri={uri!r}: {exc}"
+            ) from exc
+
+        if result is None:
+            # Server said "not modified" (304-style).
+            assert cached_html is not None
+            new_meta = {**cached_meta, "fetched_at": time.time()}
+            _write_cache(key, cached_html, new_meta)
+            return {
+                "html": cached_html,
+                "csp": cached_meta.get("csp"),
+                "permissions": cached_meta.get("permissions", []),
+                "etag": cached_meta.get("etag"),
+                "last_modified": cached_meta.get("last_modified"),
+                "is_stale": False,
+            }
+
+        html, new_meta = result
+        _write_cache(key, html, new_meta)
+        return {
+            "html": html,
+            "csp": new_meta.get("csp"),
+            "permissions": new_meta.get("permissions", []),
+            "etag": new_meta.get("etag"),
+            "last_modified": new_meta.get("last_modified"),
+            "is_stale": False,
+        }
+
+    async def _fetch_from_server(
+        self,
+        connection_key: str,
+        uri: str,
+        cached_meta: dict,
+    ) -> tuple[str, dict] | None:
+        """Fetch resource from the MCP server.
+
+        Returns (html, new_meta) on success, None if content is unchanged.
+        Raises on failure.
+        """
+        if connection_key not in _mcp_clients:
+            raise RuntimeError(
+                f"No MCP client registered for connection_key={connection_key!r}"
+            )
+
+        client, server_name = _mcp_clients[connection_key]
+
+        from pydantic import AnyUrl
+
+        async with client.session(server_name) as session:
+            result = await session.read_resource(AnyUrl(uri))
+
+        if not result.contents:
+            raise RuntimeError(f"Empty resource response for uri={uri!r}")
+
+        first = result.contents[0]
+        if not hasattr(first, "text"):
+            raise RuntimeError(
+                f"Resource {uri!r} returned non-text content (type={type(first).__name__})"
+            )
+        html: str = first.text
+
+        # Compare content hash for change detection when server doesn't send ETags.
+        content_hash = hashlib.sha256(html.encode()).hexdigest()
+        if cached_meta.get("content_hash") == content_hash:
+            return None  # unchanged
+
+        new_meta: dict = {
+            "fetched_at": time.time(),
+            "content_hash": content_hash,
+            "etag": None,
+            "last_modified": None,
+            "csp": None,
+            "permissions": [],
+        }
+
+        # Extract optional csp/permissions from resource metadata (if exposed).
+        meta_obj = getattr(result, "meta", None) or {}
+        if isinstance(meta_obj, dict):
+            ui = meta_obj.get("ui") or {}
+            new_meta["csp"] = ui.get("csp")
+            new_meta["permissions"] = ui.get("permissions") or []
+
+        return html, new_meta
+
+
+# Module-level singleton shared across call sites.
+resource_client = MCPResourceClient()
diff --git a/backend/src/analytics_agent/context/mcp_ui.py b/backend/src/analytics_agent/context/mcp_ui.py
new file mode 100644
index 0000000..f1912b6
--- /dev/null
+++ b/backend/src/analytics_agent/context/mcp_ui.py
@@ -0,0 +1,220 @@
+"""MCP UI helpers — client registry + tool wrapping.
+
+Two responsibilities:
+1. _mcp_clients registry: populated when a platform/engine is built; provides
+   the MultiServerMCPClient reference that MCPResourceClient uses for
+   resources/read calls.
+2. wrap_tools_with_ui_resources(): called from both MCPContextPlatform.get_tools()
+   and MCPQueryEngine.get_tools_async().  For every tool that advertises a
+   _meta.ui.resourceUri, it:
+     a. Kicks off an asyncio.create_task() prefetch of the resource into the disk
+        cache so the cache is warm by the time the agent calls the tool.
+     b. Replaces the tool with a wrapper that, after the underlying MCP tool/call
+        returns, stuffs {tool_result, connection_key, tool_name, tool_input,
+        resource_uri, csp, permissions} into _pending_apps and returns the short
+        marker MCP_APP_READY:<app_id>.
+"""
+
+from __future__ import annotations
+
+import asyncio
+import logging
+import uuid
+from typing import TYPE_CHECKING, Any
+
+import orjson
+
+if TYPE_CHECKING:
+    from langchain_core.tools import BaseTool
+
+logger = logging.getLogger(__name__)
+
+
+_DEFAULT_UI_AGENT_INSTRUCTIONS = (
+    "An interactive UI card has been rendered inline in the chat for the user to "
+    "act on. Do not restate the options, do not call any other tools, and do not "
+    "answer the user's question yet. Stop and wait for the user's next message."
+)
+
+
+def _extract_agent_instructions(content_blocks: list[dict]) -> str | None:
+    """Return the `_agent_instructions` string from any JSON-bearing text block.
+
+    MCP servers that render UI can embed `_agent_instructions` in their tool
+    output so the host model knows to stop and wait for user interaction. Our
+    wrapper previously swallowed the entire payload by returning only a marker,
+    which meant the LLM never saw this directive and would happily call more
+    tools. Surface it back into the tool's return value so it lands in the
+    ToolMessage the agent reads.
+    """
+    for block in content_blocks:
+        if not isinstance(block, dict) or block.get("type") != "text":
+            continue
+        text = block.get("text", "")
+        if not isinstance(text, str) or "_agent_instructions" not in text:
+            continue
+        try:
+            data = orjson.loads(text)
+        except Exception:
+            continue
+        if isinstance(data, dict):
+            instructions = data.get("_agent_instructions")
+            if isinstance(instructions, str) and instructions.strip():
+                return instructions.strip()
+    return None
+
+
+def register_mcp_client(
+    connection_key: str,
+    client: Any,
+    server_name: str,
+) -> None:
+    """Register a MultiServerMCPClient in the shared registry (mcp_resources._mcp_clients)."""
+    from analytics_agent.context.mcp_resources import _mcp_clients
+
+    _mcp_clients[connection_key] = (client, server_name)
+    logger.debug("Registered MCP client for connection_key=%s", connection_key)
+
+
+def _get_ui_meta(tool: BaseTool) -> dict:
+    """Extract _meta.ui from a LangChain tool's metadata (may be empty)."""
+    meta = (tool.metadata or {}).get("_meta") or {}
+    if isinstance(meta, dict):
+        return meta.get("ui") or {}
+    return {}
+
+
+async def _prefetch_resource(connection_key: str, uri: str) -> None:
+    """Best-effort prefetch of a ui:// resource into the disk cache."""
+    try:
+        from analytics_agent.context.mcp_resources import resource_client
+
+        await resource_client.read_ui_resource(connection_key, uri, use_cache=False)
+        logger.debug("Prefetched MCP ui resource: connection=%s uri=%s", connection_key, uri)
+    except Exception as exc:
+        logger.warning(
+            "MCP ui resource prefetch failed (connection=%s uri=%s): %s",
+            connection_key,
+            uri,
+            exc,
+        )
+
+
+def _make_content_blocks(raw: Any) -> list[dict]:
+    """Coerce an ainvoke() return value into standard MCP content blocks.
+
+    The MCP Apps spec requires `ui/notifications/tool-result` params to be a
+    CallToolResult (`{content: [{type, text, ...}, ...]}`). Preserve structured
+    content so the iframe app can parse it; wrap plain strings as a single
+    text block.
+    """
+    if isinstance(raw, list):
+        blocks: list[dict] = []
+        for block in raw:
+            if isinstance(block, dict):
+                blocks.append(block)
+            elif isinstance(block, str):
+                blocks.append({"type": "text", "text": block})
+        return blocks
+    if isinstance(raw, str):
+        return [{"type": "text", "text": raw}]
+    return [{"type": "text", "text": str(raw)}]
+
+
+def _wrap_tool(
+    original: BaseTool,
+    connection_key: str,
+    server_name: str,
+    resource_uri: str,
+    csp: str | None,
+    permissions: list[str],
+    allowed_tools: list[str],
+) -> BaseTool:
+    """Return a new StructuredTool that calls original then stuffs _pending_apps."""
+    from langchain_core.tools import StructuredTool
+
+    from analytics_agent.agent.mcp_app_tool import PendingApp, _pending_apps
+
+    tool_name = original.name
+
+    async def _wrapper(**kwargs: Any) -> str:
+        raw = await original.ainvoke(kwargs)
+        content_blocks = _make_content_blocks(raw)
+
+        app_id = str(uuid.uuid4())
+        _pending_apps[app_id] = PendingApp(
+            app_id=app_id,
+            connection_key=connection_key,
+            server_name=server_name,
+            tool_name=tool_name,
+            tool_input=dict(kwargs),
+            tool_result=content_blocks,
+            resource_uri=resource_uri,
+            csp=csp,
+            permissions=list(permissions),
+            allowed_tools=list(allowed_tools),
+        )
+        # Preserve the server-provided `_agent_instructions` (or fall back to a
+        # sensible default) so the LLM actually receives a directive to stop
+        # and wait for the user. streaming.py still parses the leading
+        # `MCP_APP_READY:<app_id>` marker on the first line.
+        instructions = (
+            _extract_agent_instructions(content_blocks)
+            or _DEFAULT_UI_AGENT_INSTRUCTIONS
+        )
+        return f"MCP_APP_READY:{app_id} ({tool_name})\n{instructions}"
+
+    return StructuredTool(
+        name=original.name,
+        description=original.description,
+        args_schema=original.args_schema,
+        coroutine=_wrapper,
+        metadata=original.metadata,
+    )
+
+
+async def wrap_tools_with_ui_resources(
+    connection_key: str,
+    client: Any,
+    server_name: str,
+    tools: list[BaseTool],
+) -> list[BaseTool]:
+    """Register the client and wrap any UI-bearing tools.
+
+    For each tool whose MCP descriptor carries _meta.ui.resourceUri:
+      - Kick off an asyncio.create_task() prefetch into the disk cache.
+      - Replace the tool with a wrapper that emits MCP_APP_READY:<app_id>.
+
+    Tools without a resourceUri are returned unchanged.
+    """
+    register_mcp_client(connection_key, client, server_name)
+
+    # Collect all tool names on this connection for the Phase 2 allow-list.
+    all_tool_names = [t.name for t in tools]
+
+    result: list[BaseTool] = []
+    for tool in tools:
+        ui_meta = _get_ui_meta(tool)
+        resource_uri: str | None = ui_meta.get("resourceUri")
+        if not resource_uri:
+            result.append(tool)
+            continue
+
+        csp: str | None = ui_meta.get("csp")
+        permissions: list[str] = ui_meta.get("permissions") or []
+
+        # Fire-and-forget prefetch so the cache is warm before the agent calls the tool.
+        asyncio.create_task(
+            _prefetch_resource(connection_key, resource_uri),
+            name=f"mcp-prefetch-{connection_key}-{tool.name}",
+        )
+
+        wrapped = _wrap_tool(
+            tool, connection_key, server_name, resource_uri, csp, permissions, all_tool_names
+        )
+        result.append(wrapped)
+        logger.info(
+            "MCP tool '%s' wrapped with UI resource: %s", tool.name, resource_uri
+        )
+
+    return result
diff --git a/backend/src/analytics_agent/db/repository.py b/backend/src/analytics_agent/db/repository.py
index 3487f5f..9439b36 100644
--- a/backend/src/analytics_agent/db/repository.py
+++ b/backend/src/analytics_agent/db/repository.py
@@ -90,6 +90,9 @@ async def create(self, message: Message) -> Message:
         await self._session.commit()
         return message
 
+    async def get_by_id(self, message_id: str) -> Message | None:
+        return await self._session.get(Message, message_id)
+
     async def list_for_conversation(self, conversation_id: str) -> list[Message]:
         result = await self._session.execute(
             select(Message)
diff --git a/backend/src/analytics_agent/engines/mcp/engine.py b/backend/src/analytics_agent/engines/mcp/engine.py
index b0ab318..9ba25a4 100644
--- a/backend/src/analytics_agent/engines/mcp/engine.py
+++ b/backend/src/analytics_agent/engines/mcp/engine.py
@@ -70,6 +70,15 @@ async def get_tools_async(self) -> list[BaseTool]:
 
         client = MultiServerMCPClient({"engine": conn})  # type: ignore[dict-item]
         tools = await client.get_tools()
+
+        from analytics_agent.context.mcp_ui import wrap_tools_with_ui_resources
+
+        # Use a stable key derived from the MCP config so multiple MCP engines
+        # can coexist in the same process without registry collisions.
+        engine_label = self._mcp_cfg.get("name") or self._mcp_cfg.get("url", "engine")
+        connection_key = f"engine:{engine_label}"
+        tools = await wrap_tools_with_ui_resources(connection_key, client, "engine", tools)
+
         logger.info("MCP engine provided %d tools", len(tools))
         return tools
 
diff --git a/backend/src/analytics_agent/prompts/system.py b/backend/src/analytics_agent/prompts/system.py
index c925791..7c194fe 100644
--- a/backend/src/analytics_agent/prompts/system.py
+++ b/backend/src/analytics_agent/prompts/system.py
@@ -11,6 +11,7 @@ def get_prompt_template() -> str:
 def build_system_prompt(
     engine_name: str,
     enabled_skills: set[str] | None = None,
+    include_business_context: bool = True,
 ) -> str:
     from analytics_agent.skills.loader import (
         get_improve_context_prompt_section,
@@ -21,8 +22,10 @@ def build_system_prompt(
     today = date.today().strftime("%B %d, %Y")
     base = get_prompt_template().format(engine_name=engine_name, today=today)
 
-    # Always inject always-on meta-skills
-    base = base + get_search_business_context_section()
+    # Always inject always-on meta-skills. `search_business_context` is skipped
+    # when a richer `get_context` tool is in play (see build_graph).
+    if include_business_context:
+        base = base + get_search_business_context_section()
     base = base + get_improve_context_prompt_section()
 
     if enabled_skills:
diff --git a/backend/src/analytics_agent/prompts/system_prompt.md b/backend/src/analytics_agent/prompts/system_prompt.md
index 02e6af7..2927fe8 100644
--- a/backend/src/analytics_agent/prompts/system_prompt.md
+++ b/backend/src/analytics_agent/prompts/system_prompt.md
@@ -11,7 +11,7 @@ Your goal is to answer the user's data questions by:
 ## Available tool groups
 
 **DataHub (catalog & context)**
-- search_documents: search business documentation, metric definitions, and domain knowledge — USE THIS FIRST
+- search_documents: search business documentation, metric definitions, and domain knowledge
 - grep_documents: search document content for specific terms or patterns
 - search: find datasets, dashboards, and other data assets by keyword
 - get_entities: get detailed metadata (schema, description, owners) for specific assets — takes a LIST OF URNs only (no filters); call search() first to get URNs, then pass them here
@@ -124,7 +124,7 @@ me about whether I'm querying the right table?*
 
 ## Workflow
 
-For every data question, follow this order:
+For every data question, follow this order only if "get_context" tool is unavailable:
 
 **Step 1 — Understand the business context first**
 Always call search_documents before doing anything else. Search for:
diff --git a/frontend/src/api/mcpApp.ts b/frontend/src/api/mcpApp.ts
new file mode 100644
index 0000000..ec8e667
--- /dev/null
+++ b/frontend/src/api/mcpApp.ts
@@ -0,0 +1,62 @@
+const BASE = "/api";
+
+export interface McpAppUi {
+  html: string;
+  csp: string | null;
+  permissions: string[];
+}
+
+/**
+ * Fetch the HTML for an MCP App by message ID.
+ *
+ * The backend serves this from the disk cache (warmed by the prefetch
+ * at tool-discovery time) or falls back to a live resources/read.
+ * Returns null if both cache and server are unavailable (404).
+ */
+export async function fetchMcpAppUi(
+  conversationId: string,
+  messageId: string
+): Promise<McpAppUi | null> {
+  const res = await fetch(
+    `${BASE}/conversations/${conversationId}/mcp-app/${messageId}/ui`
+  );
+  if (res.status === 404) return null;
+  if (!res.ok) throw new Error(`Failed to fetch MCP App UI: ${res.status}`);
+  return res.json();
+}
+
+export interface McpToolCallResult {
+  content: Array<{ type: string; text?: string; [k: string]: unknown }>;
+  isError?: boolean;
+}
+
+/**
+ * Phase 2: scoped MCP tool proxy.
+ *
+ * Called by useMcpAppBridge when the iframe sends a `tools/call` JSON-RPC
+ * request. The backend validates the (connection_key, tool_name) allow-list
+ * before dispatching to the originating MCP server.
+ *
+ * Throws on network / HTTP errors; the hook re-raises as a JSON-RPC error
+ * reply to the iframe.
+ */
+export async function callMcpAppTool(
+  conversationId: string,
+  appId: string,
+  toolName: string,
+  args: Record<string, unknown> = {}
+): Promise<McpToolCallResult> {
+  const res = await fetch(
+    `${BASE}/conversations/${conversationId}/mcp-app/${appId}/tool-call`,
+    {
+      method: "POST",
+      headers: { "Content-Type": "application/json" },
+      body: JSON.stringify({ tool_name: toolName, arguments: args }),
+    }
+  );
+  if (!res.ok) {
+    const detail = await res.text().catch(() => res.statusText);
+    throw new Error(`MCP tool call failed (${res.status}): ${detail}`);
+  }
+  return res.json();
+}
diff --git a/frontend/src/api/stream.ts b/frontend/src/api/stream.ts
index 9bda768..e103f3d 100644
--- a/frontend/src/api/stream.ts
+++ b/frontend/src/api/stream.ts
@@ -33,12 +33,14 @@ export async function* reattachStream(
 export async function* streamMessage(
   conversationId: string,
   text: string,
-  signal?: AbortSignal
+  signal?: AbortSignal,
+  /** Extra body fields forwarded verbatim (e.g. source, app_id for auditing). */
+  extraBody?: Record<string, unknown>
 ): AsyncIterator<SSEEvent> {
   const res = await fetch(`/api/conversations/${conversationId}/messages`, {
     method: "POST",
     headers: { "Content-Type": "application/json" },
-    body: JSON.stringify({ text }),
+    body: JSON.stringify({ text, ...extraBody }),
     signal,
   });
 
diff --git a/frontend/src/components/Chat/ChatView.tsx b/frontend/src/components/Chat/ChatView.tsx
index f911085..f58f11a 100644
--- a/frontend/src/components/Chat/ChatView.tsx
+++ b/frontend/src/components/Chat/ChatView.tsx
@@ -351,6 +351,7 @@ export function ChatView() {
       <MessageList
         messages={messages}
         isStreaming={isStreaming}
+        conversationId={activeId}
         showReasoning={showReasoning}
         onChartError={(error) => {
           if (chartErrorRetried.current || isStreaming) return;
diff --git a/frontend/src/components/Chat/MessageList.tsx b/frontend/src/components/Chat/MessageList.tsx
index 072f438..175a6e5 100644
--- a/frontend/src/components/Chat/MessageList.tsx
+++ b/frontend/src/components/Chat/MessageList.tsx
@@ -2,16 +2,18 @@ import { Fragment, useEffect, useRef } from "react";
 import type { UIMessage } from "@/types";
 import { TextMessage } from "./messages/TextMessage";
 import { AgentWorkBlock } from "./messages/AgentWorkBlock";
+import { SelectionChip, type SelectionChipPayload } from "./messages/SelectionChip";
 import { groupIntoTurns } from "@/lib/groupMessages";
 
 interface Props {
   messages: UIMessage[];
   isStreaming?: boolean;
+  conversationId?: string;
   showReasoning?: boolean;
   onChartError?: (error: string) => void;
 }
 
-export function MessageList({ messages, isStreaming = false, showReasoning = true, onChartError }: Props) {
+export function MessageList({ messages, isStreaming = false, conversationId, showReasoning = true, onChartError }: Props) {
   const bottomRef = useRef<HTMLDivElement>(null);
 
   useEffect(() => {
@@ -30,42 +32,55 @@ export function MessageList({ messages, isStreaming = false, showReasoning = tru
 
   return (
     <div id="chat-messages" className="flex-1 overflow-y-auto px-4 py-4 space-y-3">
-      {groups.map((group) => (
-        <Fragment key={group.key}>
-          {/* User message */}
-          {group.userMsg && (
-            <div className="flex flex-col items-end" data-print-role="user">
-              <TextMessage
-                payload={group.userMsg.payload as never}
-                role="user"
-                isStreaming={false}
-              />
-            </div>
-          )}
-
-          {/* Agent work block — only shown when there are intermediate steps */}
-          {group.workMsgs.length > 0 && (
-            <AgentWorkBlock
-              workMessages={group.workMsgs}
-              turnUsage={group.finalMsg?.turnUsage}
-              isStreaming={group.isActivelyStreaming}
-              showReasoning={showReasoning}
-              onChartError={onChartError}
-            />
-          )}
+      {groups.map((group) => {
+        // MCP App iframe-originated user turns render as a compact selection
+        // chip (flavor C) — not a full user bubble.
+        const isMcpAppSelection =
+          group.userMsg?.event_type === "TEXT" &&
+          (group.userMsg.payload as Record<string, unknown>).source === "mcp_app";
+        return (
+          <Fragment key={group.key}>
+            {/* User message */}
+            {group.userMsg && isMcpAppSelection && (
+              <div className="flex flex-col items-start" data-print-role="user">
+                <SelectionChip payload={group.userMsg.payload as unknown as SelectionChipPayload} />
+              </div>
+            )}
+            {group.userMsg && !isMcpAppSelection && (
+              <div className="flex flex-col items-end" data-print-role="user">
+                <TextMessage
+                  payload={group.userMsg.payload as never}
+                  role="user"
+                  isStreaming={false}
+                />
+              </div>
+            )}
 
-          {/* Final visible response */}
-          {group.finalMsg && (group.finalMsg.payload as { text?: string }).text?.trim() && (
-            <div className="flex flex-col items-start" data-print-role="assistant">
-              <TextMessage
-                payload={group.finalMsg.payload as never}
-                role="assistant"
-                isStreaming={group.finalMsg.isStreaming}
+            {/* Agent work block — only shown when there are intermediate steps */}
+            {group.workMsgs.length > 0 && (
+              <AgentWorkBlock
+                workMessages={group.workMsgs}
+                turnUsage={group.finalMsg?.turnUsage}
+                isStreaming={group.isActivelyStreaming}
+                showReasoning={showReasoning}
+                conversationId={conversationId}
+                onChartError={onChartError}
               />
-            </div>
-          )}
-        </Fragment>
-      ))}
+            )}
+
+            {/* Final visible response */}
+            {group.finalMsg && (group.finalMsg.payload as { text?: string }).text?.trim() && (
+              <div className="flex flex-col items-start" data-print-role="assistant">
+                <TextMessage
+                  payload={group.finalMsg.payload as never}
+                  role="assistant"
+                  isStreaming={group.finalMsg.isStreaming}
+                />
+              </div>
+            )}
+          </Fragment>
+        );
+      })}
       <div ref={bottomRef} />
     </div>
   );
diff --git a/frontend/src/components/Chat/messages/AgentWorkBlock.tsx b/frontend/src/components/Chat/messages/AgentWorkBlock.tsx
index 23f8c98..20534cf 100644
--- a/frontend/src/components/Chat/messages/AgentWorkBlock.tsx
+++ b/frontend/src/components/Chat/messages/AgentWorkBlock.tsx
@@ -7,6 +7,8 @@ import { ToolCallMessage, ToolResultMessage } from "./ToolCallMessage";
 import { SqlMessage } from "./SqlMessage";
 import { ChartMessage } from "./ChartMessage";
 import { ErrorMessage } from "./ErrorMessage";
+import { MCPAppMessage } from "./MCPAppMessage";
+import type { MCPAppPayload } from "@/types";
 
 function fmt(n: number): string {
   if (n < 1000) return String(n);
@@ -19,6 +21,7 @@ interface Props {
   turnUsage?: TurnUsage;
   isStreaming?: boolean;
   showReasoning?: boolean;
+  conversationId?: string;
   onChartError?: (error: string) => void;
 }
 
@@ -27,6 +30,7 @@ export function AgentWorkBlock({
   turnUsage,
   isStreaming = false,
   showReasoning = true,
+  conversationId,
   onChartError,
 }: Props) {
   const [expanded, setExpanded] = useState(isStreaming);
@@ -197,6 +201,13 @@ export function AgentWorkBlock({
                 {msg.event_type === "CHART" && (
                   <ChartMessage payload={msg.payload as never} onRenderError={onChartError} />
                 )}
+                {msg.event_type === "MCP_APP" && conversationId && (
+                  <MCPAppMessage
+                    messageId={msg.id}
+                    conversationId={conversationId}
+                    payload={msg.payload as unknown as MCPAppPayload}
+                  />
+                )}
                 {msg.event_type === "ERROR" && (
                   <ErrorMessage payload={msg.payload as never} />
                 )}
diff --git a/frontend/src/components/Chat/messages/MCPAppMessage.tsx b/frontend/src/components/Chat/messages/MCPAppMessage.tsx
new file mode 100644
index 0000000..e5f7056
--- /dev/null
+++ b/frontend/src/components/Chat/messages/MCPAppMessage.tsx
@@ -0,0 +1,123 @@
+/**
+ * MCPAppMessage — adapter between an MCP_APP SSE payload and MCPAppFrame.
+ *
+ * On mount, always fetches HTML via GET .../mcp-app/{message_id}/ui.
+ * The prefetched disk cache on the backend makes this fast for first render;
+ * the same code path handles replay when the conversation is reloaded.
+ *
+ * Shows a skeleton while the fetch is in flight, a graceful placeholder on
+ * 404 (both cache and server unavailable), and the sandboxed iframe once ready.
+ */
+
+import { useEffect, useState } from "react";
+import { Loader2, AppWindow } from "lucide-react";
+import type { MCPAppPayload } from "@/types";
+import { fetchMcpAppUi } from "@/api/mcpApp";
+import { MCPAppFrame } from "@/lib/mcpApps/MCPAppFrame";
+
+interface Props {
+  messageId: string;
+  conversationId: string;
+  payload: MCPAppPayload;
+}
+
+type FetchState =
+  | { status: "loading" }
+  | { status: "ready"; html: string; csp: string | null; permissions: string[] }
+  | { status: "unavailable" }
+  | { status: "error"; message: string };
+
+export function MCPAppMessage({ messageId, conversationId, payload }: Props) {
+  const [fetchState, setFetchState] = useState<FetchState>({ status: "loading" });
+  const [appReady, setAppReady] = useState(false);
+
+  useEffect(() => {
+    let cancelled = false;
+    setFetchState({ status: "loading" });
+    setAppReady(false);
+
+    fetchMcpAppUi(conversationId, messageId)
+      .then((ui) => {
+        if (cancelled) return;
+        if (ui === null) {
+          setFetchState({ status: "unavailable" });
+        } else {
+          setFetchState({
+            status: "ready",
+            html: ui.html,
+            csp: ui.csp,
+            permissions: ui.permissions,
+          });
+        }
+      })
+      .catch((err: unknown) => {
+        if (cancelled) return;
+        setFetchState({
+          status: "error",
+          message: err instanceof Error ? err.message : String(err),
+        });
+      });
+
+    return () => {
+      cancelled = true;
+    };
+  }, [conversationId, messageId]);
+
+  return (
+    <div className="w-full rounded-lg border border-border overflow-hidden bg-background">
+      {/* Header strip */}
+      <div className="flex items-center gap-2 px-3 py-2 bg-muted/40 border-b border-border text-xs text-muted-foreground">
+        <AppWindow className="w-3.5 h-3.5 shrink-0" />
+        <span className="font-mono truncate">{payload.tool_name}</span>
+        {payload.server_name && (
+          <span className="ml-auto shrink-0 opacity-60">{payload.server_name}</span>
+        )}
+      </div>
+
+      {/* Content area */}
+      {fetchState.status === "loading" && (
+        <div className="flex items-center justify-center gap-2 py-10 text-muted-foreground text-sm">
+          <Loader2 className="w-4 h-4 animate-spin" />
+          Loading app…
+        </div>
+      )}
+
+      {fetchState.status === "unavailable" && (
+        <div className="px-4 py-6 text-sm text-muted-foreground text-center">
+          <p className="font-medium">App unavailable</p>
+          <p className="mt-1 text-xs opacity-70">
+            The MCP server is offline and no cached version is available.
+          </p>
+        </div>
+      )}
+
+      {fetchState.status === "error" && (
+        <div className="px-4 py-4 text-xs text-red-500 bg-red-50 border-t border-red-100 font-mono">
+          {fetchState.message}
+        </div>
+      )}
+
+      {fetchState.status === "ready" && (
+        <div className="relative">
+          {!appReady && (
+            <div className="absolute inset-0 flex items-center justify-center bg-background/80 z-10">
+              <Loader2 className="w-4 h-4 animate-spin text-muted-foreground" />
+            </div>
+          )}
+          <MCPAppFrame
+            html={fetchState.html}
+            toolInput={payload.tool_input}
+            toolResult={payload.tool_result}
+            csp={fetchState.csp}
+            permissions={fetchState.permissions}
+            onReady={() => setAppReady(true)}
+            className="w-full border-0 block"
+            conversationId={conversationId}
+            appId={payload.app_id}
+            originMessageId={messageId}
+          />
+        </div>
+      )}
+    </div>
+  );
+}
diff --git a/frontend/src/components/Chat/messages/SelectionChip.tsx b/frontend/src/components/Chat/messages/SelectionChip.tsx
new file mode 100644
index 0000000..11127bd
--- /dev/null
+++ b/frontend/src/components/Chat/messages/SelectionChip.tsx
@@ -0,0 +1,39 @@
+/**
+ * SelectionChip — compact pill rendered when an MCP App iframe posts a
+ * `ui/message` on behalf of the user (flavor C).
+ *
+ * Appears anchored under the selector iframe that originated the turn
+ * (referenced by origin_message_id in the persisted payload) instead of
+ * rendering a full user-bubble. Keeps the transcript auditable without a
+ * phantom "I picked X" user turn cluttering the conversation.
+ */
+
+import { MousePointerClick } from "lucide-react";
+
+export interface SelectionChipPayload {
+  /** Agent-facing text (may be verbose to prevent LLM re-disambiguation). */
+  text: string;
+  /** Optional short label for display; falls back to `text` if absent. */
+  display_text?: string;
+  source: "mcp_app";
+  app_id?: string;
+  origin_message_id?: string;
+}
+
+interface Props {
+  payload: SelectionChipPayload;
+}
+
+export function SelectionChip({ payload }: Props) {
+  const label = payload.display_text?.trim() || payload.text;
+  return (
+    <div
+      className="inline-flex items-center gap-1.5 px-3 py-1 rounded-full border border-border bg-muted/60 text-sm text-foreground/80 max-w-xs truncate"
+      title={label}
+      data-origin-message-id={payload.origin_message_id}
+    >
+      <MousePointerClick className="w-3.5 h-3.5 shrink-0 text-muted-foreground" />
+      <span className="truncate">{label}</span>
+    </div>
+  );
+}
diff --git a/frontend/src/lib/buildUiMessages.ts b/frontend/src/lib/buildUiMessages.ts
index 3de3426..88be52c 100644
--- a/frontend/src/lib/buildUiMessages.ts
+++ b/frontend/src/lib/buildUiMessages.ts
@@ -91,6 +91,7 @@ export function buildUiMessages(records: MessageRecord[]): {
       case "TOOL_RESULT":
       case "SQL":
       case "CHART":
+      case "MCP_APP":
       case "ERROR":
         result.push({ id: m.id, event_type: m.event_type, role: "assistant", payload: m.payload, created_at: m.created_at });
         break;
diff --git a/frontend/src/lib/groupMessages.ts b/frontend/src/lib/groupMessages.ts
index aa3a76f..ef34836 100644
--- a/frontend/src/lib/groupMessages.ts
+++ b/frontend/src/lib/groupMessages.ts
@@ -1,6 +1,6 @@
 import type { UIMessage, TurnUsage } from "@/types";
 
-const WORK_TYPES = new Set(["TOOL_CALL", "TOOL_RESULT", "SQL", "CHART", "ERROR", "THINKING"]);
+const WORK_TYPES = new Set(["TOOL_CALL", "TOOL_RESULT", "SQL", "CHART", "MCP_APP", "ERROR", "THINKING"]);
 
 export interface TurnGroup {
   key: string;
diff --git a/frontend/src/lib/mcpApps/MCPAppFrame.tsx b/frontend/src/lib/mcpApps/MCPAppFrame.tsx
new file mode 100644
index 0000000..c87d4bd
--- /dev/null
+++ b/frontend/src/lib/mcpApps/MCPAppFrame.tsx
@@ -0,0 +1,137 @@
+/**
+ * MCPAppFrame — sandboxed iframe wrapper for MCP App HTML.
+ *
+ * Security posture:
+ *   - sandbox="allow-scripts"  (no allow-same-origin, no allow-forms, etc.)
+ *   - csp attribute on the iframe element (W3C, Chromium-enforced before any
+ *     script runs; stronger than meta CSP because it supports frame-ancestors).
+ *   - When csp is provided and the browser doesn't support the iframe csp
+ *     attribute (non-Chromium), we inject a <meta http-equiv=CSP> into
+ *     the HTML before setting srcDoc as a documented weaker fallback.
+ *
+ * Wires up useMcpAppBridge so the app receives ui/initialize ack +
+ * ui/toolResult push as soon as it loads.
+ *
+ * Height: starts at MIN_FRAME_HEIGHT_PX and grows via
+ * `ui/notifications/size-changed` from the app. We never shrink below
+ * the min, and we ignore non-finite or non-positive values from the
+ * app (defensive — a buggy app shouldn't collapse the frame to 0).
+ */
+
+import { useCallback, useEffect, useRef, useState } from "react";
+import { useMcpAppBridge } from "./useMcpAppBridge";
+
+const MIN_FRAME_HEIGHT_PX = 120;
+
+export interface MCPAppFrameProps {
+  /** Raw HTML to render inside the iframe. */
+  html: string;
+  /** Tool input arguments (what the agent called the tool with). */
+  toolInput: Record<string, unknown>;
+  /** Tool result to push to the app after ui/initialize. */
+  toolResult: unknown;
+  /** CSP string from the MCP server's _meta.ui.csp field. */
+  csp?: string | null;
+  /** permissions from the MCP server's _meta.ui.permissions field. */
+  permissions?: string[];
+  /** Called when the app sends ui/notifications/initialized. */
+  onReady?: () => void;
+  className?: string;
+  /**
+   * Phase 2: conversation the frame lives in. Passed to useMcpAppBridge so
+   * tools/call requests can be routed to the correct backend endpoint.
+   */
+  conversationId?: string;
+  /**
+   * Phase 2: the app_id for this MCP App instance — used as the path segment
+   * in POST .../mcp-app/{app_id}/tool-call.
+   */
+  appId?: string;
+  /**
+   * Phase 2: the message ID of the MCP_APP message that created this frame.
+   * Forwarded to useMcpAppBridge so `ui/message` posts include it as
+   * `origin_message_id`, enabling the SelectionChip to be anchored under this
+   * selector on replay.
+   */
+  originMessageId?: string;
+}
+
+/** Returns true if the browser supports the iframe `csp` attribute. */
+function supportsCspAttribute(): boolean {
+  return "csp" in HTMLIFrameElement.prototype;
+}
+
+/** Inject a <meta http-equiv=CSP> as a documented weaker fallback. */
+function injectMetaCsp(html: string, csp: string): string {
+  const metaTag = `<meta http-equiv="Content-Security-Policy" content="${csp.replace(/"/g, "&quot;")}">`;
+  if (/<head[^>]*>/i.test(html)) {
+    return html.replace(/(<head[^>]*>)/i, `$1\n  ${metaTag}`);
+  }
+  // No <head> — prepend before everything
+  return `${metaTag}\n${html}`;
+}
+
+export function MCPAppFrame({
+  html,
+  toolInput,
+  toolResult,
+  csp,
+  onReady,
+  className,
+  conversationId,
+  appId,
+  originMessageId,
+}: MCPAppFrameProps) {
+  const iframeRef = useRef<HTMLIFrameElement>(null);
+  const [iframeWindow, setIframeWindow] = useState<Window | null>(null);
+  const [frameHeight, setFrameHeight] = useState<number>(MIN_FRAME_HEIGHT_PX);
+
+  // Resolve srcDoc: inject meta CSP fallback for non-Chromium if needed
+  const srcDoc = (() => {
+    if (csp && !supportsCspAttribute()) {
+      return injectMetaCsp(html, csp);
+    }
+    return html;
+  })();
+
+  const handleSizeChanged = useCallback((height: number) => {
+    setFrameHeight(Math.max(MIN_FRAME_HEIGHT_PX, Math.ceil(height)));
+  }, []);
+
+  useMcpAppBridge({
+    iframeWindow,
+    toolInput,
+    toolResult,
+    onReady,
+    onSizeChanged: handleSizeChanged,
+    conversationId,
+    appId,
+    originMessageId,
+  });
+
+  const handleLoad = useCallback(() => {
+    setIframeWindow(iframeRef.current?.contentWindow ?? null);
+  }, []);
+
+  useEffect(() => {
+    setIframeWindow(null);
+    setFrameHeight(MIN_FRAME_HEIGHT_PX);
+  }, [srcDoc]);
+
+  return (
+    <iframe
+      ref={iframeRef}
+      title="MCP App"
+      srcDoc={srcDoc}
+      sandbox="allow-scripts"
+      // csp attribute: Chromium enforces this before any script runs.
+      // TypeScript's lib.dom.d.ts doesn't include this attribute yet, so we
+      // spread it as a plain object to avoid a type error.
+      {...(csp ? { csp } : {})}
+      onLoad={handleLoad}
+      className={className}
+      style={{ height: `${frameHeight}px` }}
+      referrerPolicy="no-referrer"
+    />
+  );
+}
diff --git a/frontend/src/lib/mcpApps/protocol.ts b/frontend/src/lib/mcpApps/protocol.ts
new file mode 100644
index 0000000..8ffada4
--- /dev/null
+++ b/frontend/src/lib/mcpApps/protocol.ts
@@ -0,0 +1,184 @@
+/**
+ * JSON-RPC 2.0 message types for the MCP Apps postMessage protocol.
+ *
+ * Phase 1 surface (implemented):
+ *   ui/initialize  — app → host: SDK App.connect() handshake request
+ *   ui/toolResult  — host → app: push original tool result after initialize ack
+ *   ui/ready       — app → host: app has rendered, host hides loading skeleton
+ *
+ * Phase 2 surface (typed here for forward-compat, not yet wired):
+ *   tools/call         — app → host: execute a scoped MCP tool
+ *   ui/message         — app → host: send a user turn to the conversation
+ *   ui/context/update  — app → host: inject context for the next agent turn
+ *   sendOpenLink       — app → host: open an external URL
+ */
+
+export const PROTOCOL_VERSION = "2026-01-26";
+
+// ── Base JSON-RPC shapes ────────────────────────────────────────────────────
+
+export interface JsonRpcRequest<P = unknown> {
+  jsonrpc: "2.0";
+  id: string | number;
+  method: string;
+  params?: P;
+}
+
+export interface JsonRpcNotification<P = unknown> {
+  jsonrpc: "2.0";
+  method: string;
+  params?: P;
+}
+
+export interface JsonRpcResponse<R = unknown> {
+  jsonrpc: "2.0";
+  id: string | number;
+  result: R;
+}
+
+export interface JsonRpcError {
+  jsonrpc: "2.0";
+  id: string | number | null;
+  error: { code: number; message: string; data?: unknown };
+}
+
+export type JsonRpcMessage =
+  | JsonRpcRequest
+  | JsonRpcNotification
+  | JsonRpcResponse
+  | JsonRpcError;
+
+// ── Phase 1 ─────────────────────────────────────────────────────────────────
+
+/** app → host: App.connect() sends this; host must ack or app hangs. */
+export interface UiInitializeRequest
+  extends JsonRpcRequest<{ protocolVersion?: string }> {
+  method: "ui/initialize";
+}
+
+export interface HostCapabilities {
+  tools?: Record<string, unknown>;
+  context?: Record<string, unknown>;
+  message?: Record<string, unknown>;
+  openLink?: Record<string, unknown>;
+}
+
+export interface HostInfo {
+  name: string;
+  version: string;
+}
+
+/**
+ * Shape of the `ui/initialize` result the host sends back to the app.
+ * Mirrors the app-side request shape ({appInfo, appCapabilities, protocolVersion})
+ * with host-prefixed names — the MCP Apps SDK's Zod schema on the app side
+ * requires all three object fields; omitting any of them causes the SDK to
+ * reject App.connect() with `invalid_type` errors.
+ */
+export interface UiInitializeResult {
+  protocolVersion: string;
+  hostInfo: HostInfo;
+  hostCapabilities: HostCapabilities;
+  hostContext: Record<string, unknown>;
+}
+
+export interface UiInitializeResponse extends JsonRpcResponse<UiInitializeResult> {}
+
+/**
+ * host → app: structured CallToolResult.
+ * Per MCP Apps spec §"Notifications (Host → View)" the method name is
+ * `ui/notifications/tool-result` and params is the full CallToolResult
+ * (with `content: ContentBlock[]`). NOT `ui/toolResult` and NOT `{content: string}`.
+ */
+export interface McpContentBlock {
+  type: string;
+  text?: string;
+  data?: unknown;
+  [k: string]: unknown;
+}
+
+export interface CallToolResult {
+  content: McpContentBlock[];
+  isError?: boolean;
+  structuredContent?: Record<string, unknown>;
+  _meta?: Record<string, unknown>;
+}
+
+export interface UiToolInputNotification
+  extends JsonRpcNotification<{ arguments: Record<string, unknown> }> {
+  method: "ui/notifications/tool-input";
+}
+
+export interface UiToolResultNotification
+  extends JsonRpcNotification<CallToolResult> {
+  method: "ui/notifications/tool-result";
+}
+
+/**
+ * app → host notification: handshake complete.
+ * Spec §"Lifecycle" uses `ui/notifications/initialized` (mirrors MCP's
+ * notifications/initialized). `ui/ready` is our legacy name — kept as alias.
+ */
+export interface UiInitializedNotification extends JsonRpcNotification {
+  method: "ui/notifications/initialized";
+}
+
+/**
+ * app → host notification: publish the current content size so the host
+ * can auto-resize its iframe to fit. Only `height` is honoured — hosts
+ * own width and constrain it to the chat column.
+ */
+export interface UiSizeChangedNotification
+  extends JsonRpcNotification<{ height?: number; width?: number }> {
+  method: "ui/notifications/size-changed";
+}
+
+// ── Phase 2 (typed, not yet wired) ──────────────────────────────────────────
+
+export interface ToolsCallRequest
+  extends JsonRpcRequest<{ name: string; arguments?: Record<string, unknown> }> {
+  method: "tools/call";
+}
+
+/**
+ * app → host: send a user turn to the conversation.
+ * Per spec §"ui/message": params.content is a content block object
+ * `{ type: "text", text: string }`, NOT a plain string.
+ */
+export interface UiMessageContentBlock {
+  type: string;
+  text: string;
+}
+
+export interface UiMessageRequest
+  extends JsonRpcRequest<{ role?: string; content: UiMessageContentBlock }> {
+  method: "ui/message";
+}
+
+export interface UiContextUpdateNotification
+  extends JsonRpcNotification<{ content: unknown }> {
+  method: "ui/context/update";
+}
+
+export interface SendOpenLinkRequest
+  extends JsonRpcRequest<{ url: string }> {
+  method: "sendOpenLink";
+}
+
+// ── Type guards ──────────────────────────────────────────────────────────────
+
+export function isJsonRpc(msg: unknown): msg is JsonRpcMessage {
+  return (
+    typeof msg === "object" &&
+    msg !== null &&
+    (msg as Record<string, unknown>)["jsonrpc"] === "2.0"
+  );
+}
+
+export function isRequest(msg: JsonRpcMessage): msg is JsonRpcRequest {
+  return "method" in msg && "id" in msg;
+}
+
+export function isNotification(msg: JsonRpcMessage): msg is JsonRpcNotification {
+  return "method" in msg && !("id" in msg);
+}
diff --git a/frontend/src/lib/mcpApps/useMcpAppBridge.ts b/frontend/src/lib/mcpApps/useMcpAppBridge.ts
new file mode 100644
index 0000000..b487dde
--- /dev/null
+++ b/frontend/src/lib/mcpApps/useMcpAppBridge.ts
@@ -0,0 +1,542 @@
+/**
+ * useMcpAppBridge — React hook that implements the host-side AppBridge.
+ *
+ * Attaches a window `message` listener scoped to the given iframe window.
+ * Matches JSON-RPC 2.0 requests by method and id, then:
+ *   1. Answers `ui/initialize` with `hostInfo` / `hostCapabilities` / `hostContext`.
+ *   2. Waits for the app's `ui/notifications/initialized` handshake-complete
+ *      signal, then pushes `ui/toolResult`. Pushing earlier drops the
+ *      notification because the SDK only wires up its listener *after*
+ *      validating the init response.
+ *   3. Treats `ui/notifications/initialized` as the "app is live" signal for
+ *      onReady() (the spec name; some older plans referenced `ui/ready`).
+ *   4. Forwards `ui/notifications/size-changed` (app → host) to the caller so
+ *      the wrapping iframe element can be resized to fit the app's content.
+ *      Spec §"Notifications (View → Host)": params `{ height?, width? }` —
+ *      only `height` is acted on; width is owned by the host layout.
+ *   5. (Phase 2) Handles `tools/call` from the iframe: calls the scoped backend
+ *      proxy endpoint and relays the CallToolResult back via postMessage.
+ *   6. (Phase 2) Handles `ui/message` from the iframe: posts the text to
+ *      POST /api/conversations/{id}/messages as a visible user turn and streams
+ *      the agent response back through the normal SSE pipeline.
+ */
+
+import { useEffect, useRef } from "react";
+import {
+  PROTOCOL_VERSION,
+  isJsonRpc,
+  isRequest,
+  isNotification,
+  type JsonRpcRequest,
+  type JsonRpcResponse,
+  type JsonRpcError,
+  type JsonRpcNotification,
+  type UiInitializeResult,
+  type UiToolInputNotification,
+  type UiToolResultNotification,
+  type CallToolResult,
+  type McpContentBlock,
+  type UiMessageContentBlock,
+} from "./protocol";
+import { callMcpAppTool } from "@/api/mcpApp";
+import { streamMessage } from "@/api/stream";
+import { generateTitle } from "@/api/conversations";
+import { useConversationsStore } from "@/store/conversations";
+
+export interface McpAppBridgeOptions {
+  /** The iframe's contentWindow — set once the element mounts. */
+  iframeWindow: Window | null;
+  /** Tool input arguments (the kwargs the agent called the tool with). */
+  toolInput: Record<string, unknown>;
+  /**
+   * Structured CallToolResult content. Either an array of content blocks
+   * (preferred; matches MCP CallToolResult.content) or a string / object which
+   * we wrap as a single text block for spec compliance.
+   */
+  toolResult: unknown;
+  /** Called when the app sends ui/notifications/initialized (handshake done). */
+  onReady?: () => void;
+  /**
+   * Called when the app publishes `ui/notifications/size-changed`.
+   * Only invoked when `height` is a finite positive number; width is ignored.
+   */
+  onSizeChanged?: (height: number) => void;
+  /**
+   * Phase 2: conversation ID, needed to route `tools/call` to the correct
+   * scoped proxy endpoint.  When absent, `tools/call` requests are rejected
+   * with a JSON-RPC error instead of silently dropped.
+   */
+  conversationId?: string;
+  /**
+   * Phase 2: the app_id that identifies this specific MCP App instance.
+   * Used as the path segment in `POST .../mcp-app/{app_id}/tool-call`.
+   */
+  appId?: string;
+  /**
+   * Phase 2: the message ID of the MCP_APP message that spawned this iframe.
+   * Passed as `origin_message_id` when posting a `ui/message` so the backend
+   * persists it in the payload and the frontend can anchor the SelectionChip
+   * beneath the correct selector iframe on replay.
+   */
+  originMessageId?: string;
+}
+
+/**
+ * Resolves once `isStreaming` is false. If the store is already idle it
+ * resolves on the next microtask. Safe to call from any context because it
+ * only reads/subscribes to the Zustand store.
+ */
+function waitForStreamingToEnd(): Promise<void> {
+  if (!useConversationsStore.getState().isStreaming) {
+    return Promise.resolve();
+  }
+  return new Promise<void>((resolve) => {
+    const unsub = useConversationsStore.subscribe((state) => {
+      if (!state.isStreaming) {
+        unsub();
+        resolve();
+      }
+    });
+  });
+}
+
+/** Coerce whatever we got into a spec-compliant CallToolResult. */
+function toCallToolResult(raw: unknown): CallToolResult {
+  if (Array.isArray(raw)) {
+    return { content: raw as McpContentBlock[] };
+  }
+  if (raw && typeof raw === "object" && Array.isArray((raw as { content?: unknown }).content)) {
+    return raw as CallToolResult;
+  }
+  const text = typeof raw === "string" ? raw : JSON.stringify(raw);
+  return { content: [{ type: "text", text }] };
+}
+
+function reply<R>(
+  target: Window,
+  req: JsonRpcRequest,
+  result: R
+): void {
+  const response: JsonRpcResponse<R> = {
+    jsonrpc: "2.0",
+    id: req.id,
+    result,
+  };
+  target.postMessage(response, "*");
+}
+
+function push<P>(target: Window, notification: JsonRpcNotification<P>): void {
+  target.postMessage(notification, "*");
+}
+
+function replyError(
+  target: Window,
+  req: JsonRpcRequest,
+  code: number,
+  message: string,
+  data?: unknown
+): void {
+  const err: JsonRpcError = {
+    jsonrpc: "2.0",
+    id: req.id,
+    error: { code, message, ...(data !== undefined ? { data } : {}) },
+  };
+  target.postMessage(err, "*");
+}
+
+export function useMcpAppBridge({
+  iframeWindow,
+  toolInput,
+  toolResult,
+  onReady,
+  onSizeChanged,
+  conversationId,
+  appId,
+  originMessageId,
+}: McpAppBridgeOptions): void {
+  // Keep stable refs so the effect doesn't re-run on every render
+  const toolInputRef = useRef(toolInput);
+  const toolResultRef = useRef(toolResult);
+  const onReadyRef = useRef(onReady);
+  const onSizeChangedRef = useRef(onSizeChanged);
+  const conversationIdRef = useRef(conversationId);
+  const appIdRef = useRef(appId);
+  const originMessageIdRef = useRef(originMessageId);
+  useEffect(() => {
+    toolInputRef.current = toolInput;
+  }, [toolInput]);
+  useEffect(() => {
+    toolResultRef.current = toolResult;
+  }, [toolResult]);
+  useEffect(() => {
+    onReadyRef.current = onReady;
+  }, [onReady]);
+  useEffect(() => {
+    onSizeChangedRef.current = onSizeChanged;
+  }, [onSizeChanged]);
+  useEffect(() => {
+    conversationIdRef.current = conversationId;
+  }, [conversationId]);
+  useEffect(() => {
+    appIdRef.current = appId;
+  }, [appId]);
+  useEffect(() => {
+    originMessageIdRef.current = originMessageId;
+  }, [originMessageId]);
+
+  useEffect(() => {
+    if (!iframeWindow) return;
+
+    /**
+     * Submit an iframe-authored selection through the flavor-C pipeline:
+     * appends a SelectionChip locally, then streams the agent response
+     * via the existing SSE endpoint tagged with source="mcp_app".
+     *
+     * `agentText` is what the agent sees in its conversation history — it
+     * should be rich enough to prevent redundant follow-up tool calls (e.g.
+     * re-running `get_context` for an already-disambiguated selection).
+     * `displayText` is what the SelectionChip renders in the UI.
+     *
+     * Used by both `ui/message` and `ui/update-model-context` handlers.
+     */
+    function submitMcpAppTurn(
+      agentText: string,
+      displayText: string = agentText
+    ): void {
+      const convId = conversationIdRef.current;
+      const aid = appIdRef.current;
+      const oid = originMessageIdRef.current;
+      if (!convId || !agentText) return;
+
+      (async () => {
+        await waitForStreamingToEnd();
+
+        const store = useConversationsStore.getState();
+
+        store.appendMessage({
+          id: crypto.randomUUID(),
+          event_type: "TEXT",
+          role: "user",
+          payload: {
+            text: agentText,
+            display_text: displayText,
+            source: "mcp_app",
+            ...(aid ? { app_id: aid } : {}),
+            ...(oid ? { origin_message_id: oid } : {}),
+          },
+        });
+
+        store.setStreaming(true);
+        store.resetStreamingText();
+
+        try {
+          const stream = streamMessage(convId, agentText, undefined, {
+            source: "mcp_app",
+            display_text: displayText,
+            ...(aid ? { app_id: aid } : {}),
+            ...(oid ? { origin_message_id: oid } : {}),
+          });
+          let result = await stream.next();
+          while (!result.done) {
+            const event = result.value;
+            const s = useConversationsStore.getState();
+            if (event.event === "TEXT") {
+              s.appendStreamingText(
+                (event.payload as { text: string }).text
+              );
+            } else if (event.event === "TOOL_CALL") {
+              s.markCurrentAsThinking();
+              s.appendMessage({
+                id: event.message_id,
+                event_type: event.event,
+                role: "assistant",
+                payload: event.payload,
+              });
+            } else if (event.event !== "COMPLETE") {
+              s.appendMessage({
+                id: event.message_id,
+                event_type: event.event,
+                role: "assistant",
+                payload: event.payload,
+              });
+            }
+            result = await stream.next();
+          }
+        } catch (err) {
+          useConversationsStore.getState().appendMessage({
+            id: crypto.randomUUID(),
+            event_type: "ERROR",
+            role: "assistant",
+            payload: { error: String(err) },
+          });
+        } finally {
+          useConversationsStore.getState().setStreaming(false);
+          generateTitle(convId)
+            .then((r) => {
+              if (r.updated) {
+                useConversationsStore
+                  .getState()
+                  .updateConversationTitle(convId, r.title);
+              }
+            })
+            .catch(() => {});
+        }
+      })();
+    }
+
+    function handleMessage(event: MessageEvent): void {
+      // Only accept messages from our iframe
+      if (event.source !== iframeWindow) return;
+
+      const raw = event.data;
+      if (!isJsonRpc(raw)) return;
+
+      if (isRequest(raw)) {
+        switch (raw.method) {
+          case "ui/initialize": {
+            // Ack with host-prefixed fields the MCP Apps SDK's Zod schema
+            // requires. Advertise `tools` capability so the app knows it can
+            // send `tools/call` requests.
+            const result: UiInitializeResult = {
+              protocolVersion: PROTOCOL_VERSION,
+              hostInfo: {
+                name: "analytics-agent",
+                version: "0.1.0",
+              },
+              hostCapabilities: { tools: {}, message: {} },
+              hostContext: {},
+            };
+            reply(iframeWindow!, raw, result);
+            // NOTE: do NOT push ui/toolResult here — the app's toolResult
+            // listener isn't wired up yet. We push it when the app signals
+            // ui/notifications/initialized below (H6 fix).
+            break;
+          }
+
+          case "tools/call": {
+            // Phase 2: iframe requests a scoped MCP tool call.
+            const convId = conversationIdRef.current;
+            const aid = appIdRef.current;
+            const params = (raw.params ?? {}) as {
+              name?: string;
+              arguments?: Record<string, unknown>;
+            };
+            const toolName = params.name ?? "";
+            const args = params.arguments ?? {};
+
+            if (!convId || !aid) {
+              replyError(
+                iframeWindow!,
+                raw,
+                -32603,
+                "tools/call is not available: missing conversationId or appId"
+              );
+              break;
+            }
+            if (!toolName) {
+              replyError(iframeWindow!, raw, -32602, "tools/call: missing tool name");
+              break;
+            }
+
+            // Async: fire the REST call and relay the result back.
+            callMcpAppTool(convId, aid, toolName, args)
+              .then((result) => {
+                const callToolResult: CallToolResult = {
+                  content: result.content as McpContentBlock[],
+                  isError: result.isError ?? false,
+                };
+                reply(iframeWindow!, raw, callToolResult);
+              })
+              .catch((err: unknown) => {
+                replyError(
+                  iframeWindow!,
+                  raw,
+                  -32603,
+                  err instanceof Error ? err.message : String(err)
+                );
+              });
+            break;
+          }
+
+          case "ui/message": {
+            // Phase 2: iframe authors a user turn on behalf of the user.
+            // Per spec §"ui/message": params.content is a content block object
+            // { type: "text", text: string }, NOT a plain string.
+            const msgParams = (raw.params ?? {}) as {
+              role?: string;
+              content?: UiMessageContentBlock | string;
+            };
+            const rawContent = msgParams.content;
+            const content = (
+              typeof rawContent === "string"
+                ? rawContent
+                : (rawContent as UiMessageContentBlock | undefined)?.text ?? ""
+            ).trim();
+
+            if (!conversationIdRef.current || !content) {
+              replyError(
+                iframeWindow!,
+                raw,
+                -32602,
+                "ui/message: missing conversationId or content"
+              );
+              break;
+            }
+
+            // Acknowledge immediately so the iframe's "sending" state resolves.
+            reply(iframeWindow!, raw, {});
+            submitMcpAppTurn(content);
+            break;
+          }
+
+          case "ui/update-model-context": {
+            // Per MCP Apps spec §"ui/update-model-context":
+            //   params: { content?: ContentBlock[], structuredContent?: object }
+            // Spec allows the host to "MAY defer sending the context to the
+            // model until the next user message" OR process immediately.
+            // Apps that use this for selection flows (like the card selector)
+            // expect immediate processing — the iframe shows "Sending…" on
+            // click and waits for a new agent turn.
+            //
+            // We extract a human-readable label for the SelectionChip, prefer
+            // `structuredContent.selected_name`, then fall back to the content
+            // blocks' text, then a JSON blob.
+            const ctxParams = (raw.params ?? {}) as {
+              content?: Array<{ type: string; text?: string }>;
+              structuredContent?: Record<string, unknown>;
+            };
+
+            const structured = ctxParams.structuredContent;
+
+            // Display label: short, human-readable string for the SelectionChip.
+            let displayText = "";
+            if (structured) {
+              const named =
+                (structured as { selected_name?: unknown }).selected_name ??
+                (structured as { name?: unknown }).name ??
+                (structured as { label?: unknown }).label;
+              if (typeof named === "string" && named.trim()) {
+                displayText = named.trim();
+              }
+            }
+            if (!displayText && Array.isArray(ctxParams.content)) {
+              const texts = ctxParams.content
+                .filter((b) => b && b.type === "text" && typeof b.text === "string")
+                .map((b) => b.text as string);
+              if (texts.length > 0) displayText = texts.join(" ").trim();
+            }
+
+            // Agent-facing text: richer than the display label so the LLM
+            // doesn't re-disambiguate an already-resolved selection (e.g. by
+            // re-calling `get_context` when it already has the URN). Includes
+            // identifier(s) from structuredContent + an explicit instruction.
+            let agentText = displayText;
+            if (structured) {
+              const urn =
+                (structured as { selected_urn?: unknown }).selected_urn ??
+                (structured as { urn?: unknown }).urn ??
+                (structured as { id?: unknown }).id;
+              const custom =
+                (structured as { custom_response?: unknown }).custom_response;
+              const parts: string[] = [];
+              if (displayText) {
+                parts.push(
+                  `The user selected "${displayText}" from the previous interactive card.`
+                );
+              }
+              if (typeof urn === "string" && urn.trim()) {
+                parts.push(`Identifier: ${urn.trim()}.`);
+              }
+              if (typeof custom === "string" && custom.trim()) {
+                parts.push(`Additional input: ${custom.trim()}.`);
+              }
+              if (parts.length > 0) {
+                parts.push(
+                  "This selection is already disambiguated — do NOT call `get_context` or other disambiguation tools for this concept; use it directly and continue with the original request."
+                );
+                agentText = parts.join(" ");
+              }
+            }
+            if (!agentText && structured) {
+              try {
+                agentText = JSON.stringify(structured);
+                if (!displayText) displayText = agentText;
+              } catch {
+                agentText = "";
+              }
+            }
+
+            // Always ack — spec requires a response with empty result on success.
+            reply(iframeWindow!, raw, {});
+
+            if (agentText) {
+              submitMcpAppTurn(agentText, displayText || agentText);
+            }
+            break;
+          }
+
+          case "sendOpenLink":
+            // Phase 3 — not yet wired
+            console.warn(
+              `[MCPAppBridge] method "sendOpenLink" received but not yet handled.`
+            );
+            break;
+
+          default:
+            break;
+        }
+      } else if (isNotification(raw)) {
+        switch (raw.method) {
+          case "ui/notifications/initialized":
+          case "ui/ready": {
+            // Spec §"Notifications (Host → View)":
+            //   1. MUST send ui/notifications/tool-input with the tool arguments
+            //   2. MUST follow with ui/notifications/tool-result containing the
+            //      full CallToolResult (with structured content blocks).
+            // The View ignores tool-result if tool-input hasn't arrived yet.
+            const toolInputPush: UiToolInputNotification = {
+              jsonrpc: "2.0",
+              method: "ui/notifications/tool-input",
+              params: { arguments: toolInputRef.current },
+            };
+            const callToolResult = toCallToolResult(toolResultRef.current);
+            const toolResultPush: UiToolResultNotification = {
+              jsonrpc: "2.0",
+              method: "ui/notifications/tool-result",
+              params: callToolResult,
+            };
+            push(iframeWindow!, toolInputPush);
+            push(iframeWindow!, toolResultPush);
+            onReadyRef.current?.();
+            break;
+          }
+          case "ui/notifications/size-changed": {
+            // Spec: params { height?: number, width?: number }. We only
+            // act on height — width is fixed by the chat-column layout.
+            const params = (raw.params ?? {}) as {
+              height?: unknown;
+              width?: unknown;
+            };
+            const h =
+              typeof params.height === "number" && Number.isFinite(params.height)
+                ? params.height
+                : null;
+            if (h !== null && h > 0) {
+              onSizeChangedRef.current?.(h);
+            }
+            break;
+          }
+          case "ui/context/update":
+            // Phase 2 — not yet wired
+            console.warn("[MCPAppBridge] ui/context/update not yet handled.");
+            break;
+          default:
+            break;
+        }
+      }
+    }
+
+    window.addEventListener("message", handleMessage);
+    return () => window.removeEventListener("message", handleMessage);
+  }, [iframeWindow]);
+}
diff --git a/frontend/src/types/index.ts b/frontend/src/types/index.ts
index 4a0b6f5..50bfff6 100644
--- a/frontend/src/types/index.ts
+++ b/frontend/src/types/index.ts
@@ -5,6 +5,7 @@ export type SSEEventType =
   | "TOOL_RESULT"
   | "SQL"
   | "CHART"
+  | "MCP_APP"
   | "USAGE"
   | "COMPLETE"
   | "ERROR";
@@ -53,6 +54,23 @@ export interface UsagePayload {
   node: string;
 }
 
+export interface MCPAppPayload {
+  app_id: string;
+  connection_key: string;
+  server_name: string;
+  tool_name: string;
+  tool_input: Record<string, unknown>;
+  /**
+   * Structured CallToolResult content (list of MCP content blocks, typically
+   * `[{type: "text", text: "..."}]`). Forwarded verbatim to the iframe app via
+   * `ui/notifications/tool-result`.
+   */
+  tool_result: unknown;
+  resource_uri: string;
+  csp: string | null;
+  permissions: string[];
+}
+
 export interface Engine {
   name: string;
   type: string;
diff --git a/tests/unit/test_business_context_suppression.py b/tests/unit/test_business_context_suppression.py
new file mode 100644
index 0000000..7e2d472
--- /dev/null
+++ b/tests/unit/test_business_context_suppression.py
@@ -0,0 +1,131 @@
+"""
+Unit tests for the `search_business_context` skill suppression introduced when a
+`datahub-mcp` context platform advertises a `get_context` tool.
+
+Covers:
+- build_system_prompt(include_business_context=True/False)
+- build_graph(suppress_business_context_skill=True/False) — tool-list filtering
+  and system-prompt section injection.
+"""
+
+from __future__ import annotations
+
+from unittest.mock import MagicMock, patch
+
+import pytest
+from analytics_agent.prompts.system import build_system_prompt
+
+_SECTION_HEADING = "## Skill: search_business_context"
+
+
+# ─── build_system_prompt ─────────────────────────────────────────────────────
+
+
+def test_build_system_prompt_includes_business_context_by_default():
+    prompt = build_system_prompt("snowflake")
+    assert _SECTION_HEADING in prompt
+
+
+def test_build_system_prompt_excludes_business_context_when_disabled():
+    prompt = build_system_prompt("snowflake", include_business_context=False)
+    assert _SECTION_HEADING not in prompt
+    assert "## Meta-Skill: /improve-context" in prompt  # unrelated section still present
+
+
+# ─── build_graph tool-list + prompt injection ────────────────────────────────
+
+
+def _capture_build_graph(suppress: bool):
+    """Build a graph with a stubbed LLM and capture the args passed to create_agent.
+
+    Returns (tool_names, system_prompt_text).
+    """
+    from analytics_agent.agent import graph as graph_mod
+
+    fake_llm = MagicMock(name="fake_llm")
+    captured: dict = {}
+
+    def fake_create_agent(*, model, tools, state_schema, system_prompt):
+        captured["tools"] = tools
+        captured["system_prompt"] = system_prompt
+        compiled = MagicMock(name="react_agent")
+        return compiled
+
+    with (
+        patch.object(graph_mod, "get_llm", return_value=fake_llm),
+        patch.object(graph_mod, "create_agent", side_effect=fake_create_agent),
+    ):
+        graph_mod.build_graph(
+            engine_name="snowflake",
+            engine=MagicMock(get_tools=MagicMock(return_value=[])),
+            context_tools=[],
+            engine_tools=[],
+            suppress_business_context_skill=suppress,
+        )
+
+    tool_names = {t.name for t in captured["tools"]}
+    return tool_names, captured["system_prompt"]
+
+
+def test_build_graph_includes_search_business_context_by_default():
+    tool_names, system_prompt = _capture_build_graph(suppress=False)
+    assert "search_business_context" in tool_names
+    assert _SECTION_HEADING in system_prompt
+
+
+def test_build_graph_suppresses_search_business_context_when_flag_set():
+    tool_names, system_prompt = _capture_build_graph(suppress=True)
+    assert "search_business_context" not in tool_names
+    assert _SECTION_HEADING not in system_prompt
+
+
+def test_build_graph_suppression_also_applies_to_system_prompt_override():
+    """When a custom system_prompt_override is used, the section must still be gated."""
+    from analytics_agent.agent import graph as graph_mod
+
+    fake_llm = MagicMock(name="fake_llm")
+    captured: dict = {}
+
+    def fake_create_agent(*, model, tools, state_schema, system_prompt):
+        captured["system_prompt"] = system_prompt
+        return MagicMock()
+
+    with (
+        patch.object(graph_mod, "get_llm", return_value=fake_llm),
+        patch.object(graph_mod, "create_agent", side_effect=fake_create_agent),
+    ):
+        graph_mod.build_graph(
+            engine_name="snowflake",
+            engine=MagicMock(get_tools=MagicMock(return_value=[])),
+            context_tools=[],
+            engine_tools=[],
+            system_prompt_override="You are an analyst for {engine_name}.",
+            suppress_business_context_skill=True,
+        )
+
+    assert _SECTION_HEADING not in captured["system_prompt"]
+
+
+# ─── chat.py detection logic (row.type + tool name) ──────────────────────────
+
+
+@pytest.mark.parametrize(
+    "row_type, tool_names, expected",
+    [
+        ("datahub-mcp", ["get_context", "search"], True),
+        ("datahub-mcp", ["search", "get_entities"], False),
+        ("datahub", ["get_context"], False),  # native DataHub must not trigger
+        ("other-mcp", ["get_context"], False),  # unrelated MCP must not trigger
+    ],
+)
+def test_detection_matches_datahub_mcp_with_get_context(row_type, tool_names, expected):
+    """Mirror the inline check in chat.py to lock its contract."""
+    row = MagicMock(type=row_type)
+    tools = [MagicMock(name=n) for n in tool_names]
+    # MagicMock assigns `.name` differently than we expect when passed to constructor;
+    # set it explicitly.
+    for tool, n in zip(tools, tool_names):
+        tool.name = n
+
+    triggered = row.type == "datahub-mcp" and any(t.name == "get_context" for t in tools)
+    assert triggered is expected

From 7fc85887613f231d431d9d3e5c02dfc3640a2686 Mon Sep 17 00:00:00 2001
From: Anirudh Reddy Malgari <anirudh.malgari@datahub.com>
Date: Thu, 23 Apr 2026 18:43:07 -0700
Subject: [PATCH 2/3] added UI for improve context

---
 backend/src/analytics_agent/agent/graph.py    |   6 +-
 backend/src/analytics_agent/agent/history.py  |  15 +-
 .../analytics_agent/agent/proposals_tool.py   |  72 ++++++
 .../src/analytics_agent/agent/results_tool.py |  67 ++++++
 .../src/analytics_agent/agent/streaming.py    |  35 ++-
 backend/src/analytics_agent/api/chat.py       |   3 +
 .../skills/improve-context/SKILL.md           |  54 ++++-
 .../skills/save-correction/SKILL.md           |   4 +
 frontend/src/api/conversations.ts             |  31 ++-
 frontend/src/components/Chat/ChatView.tsx     |  56 +++--
 frontend/src/components/Chat/MessageList.tsx  |  67 +++++-
 .../Chat/messages/ProposalResultsMessage.tsx  | 157 ++++++++++++
 .../Chat/messages/ProposalsMessage.tsx        | 227 ++++++++++++++++++
 frontend/src/lib/buildUiMessages.ts           |   2 +
 frontend/src/lib/groupMessages.ts             |  17 +-
 frontend/src/types/index.ts                   |  28 +++
 16 files changed, 794 insertions(+), 47 deletions(-)
 create mode 100644 backend/src/analytics_agent/agent/proposals_tool.py
 create mode 100644 backend/src/analytics_agent/agent/results_tool.py
 create mode 100644 frontend/src/components/Chat/messages/ProposalResultsMessage.tsx
 create mode 100644 frontend/src/components/Chat/messages/ProposalsMessage.tsx

diff --git a/backend/src/analytics_agent/agent/graph.py b/backend/src/analytics_agent/agent/graph.py
index 55e40a1..5521cec 100644
--- a/backend/src/analytics_agent/agent/graph.py
+++ b/backend/src/analytics_agent/agent/graph.py
@@ -52,6 +52,8 @@ def build_graph(
     llm = get_llm(streaming=True)
 
     from analytics_agent.agent.chart_tool import create_chart
+    from analytics_agent.agent.proposals_tool import present_proposals
+    from analytics_agent.agent.results_tool import report_proposal_results
 
     # Context platform tools — built dynamically from DB at request time.
     # Falls back to env-var based build only when caller doesn't provide them.
@@ -81,7 +83,9 @@ def build_graph(
                 raise ValueError(f"Engine '{engine_name}' not found.")
         engine_tools = [t for t in engine.get_tools() if t.name not in disabled]
     chart_tools = [] if "create_chart" in disabled else [create_chart]
-    all_tools = datahub_tools + skill_tools + engine_tools + chart_tools
+    proposal_tools = [] if "present_proposals" in disabled else [present_proposals]
+    results_tools = [] if "report_proposal_results" in disabled else [report_proposal_results]
+    all_tools = datahub_tools + skill_tools + engine_tools + chart_tools + proposal_tools + results_tools
 
     if system_prompt_override:
         from analytics_agent.skills.loader import (
diff --git a/backend/src/analytics_agent/agent/history.py b/backend/src/analytics_agent/agent/history.py
index e708178..d7b580c 100644
--- a/backend/src/analytics_agent/agent/history.py
+++ b/backend/src/analytics_agent/agent/history.py
@@ -74,14 +74,23 @@ def build_history(
                         "input": payload.get("tool_input", {}),
                     }
                 )
-            elif evt in ("TOOL_RESULT", "SQL"):
+            elif evt in ("TOOL_RESULT", "SQL", "PROPOSALS", "PROPOSAL_RESULTS"):
                 idx = len(tool_results)
                 call_id = tool_calls[idx]["id"] if idx < len(tool_calls) else msg.id
+                if evt == "PROPOSALS":
+                    result_text = orjson.dumps(payload).decode()[:4000]
+                    tool_name = "present_proposals"
+                elif evt == "PROPOSAL_RESULTS":
+                    result_text = orjson.dumps(payload).decode()[:4000]
+                    tool_name = "report_proposal_results"
+                else:
+                    result_text = payload.get("result", payload.get("sql", ""))[:4000]
+                    tool_name = payload.get("tool_name", "")
                 tool_results.append(
                     {
                         "id": call_id,
-                        "name": payload.get("tool_name", ""),
-                        "result": payload.get("result", payload.get("sql", ""))[:4000],
+                        "name": tool_name,
+                        "result": result_text,
                     }
                 )
             elif evt == "TEXT":
diff --git a/backend/src/analytics_agent/agent/proposals_tool.py b/backend/src/analytics_agent/agent/proposals_tool.py
new file mode 100644
index 0000000..ad8212c
--- /dev/null
+++ b/backend/src/analytics_agent/agent/proposals_tool.py
@@ -0,0 +1,72 @@
+from __future__ import annotations
+
+import logging
+import uuid
+from typing import Literal
+
+from langchain_core.tools import tool
+from pydantic import BaseModel
+
+logger = logging.getLogger(__name__)
+
+# Side-channel: keyed by prop_id so streaming.py can fetch the payload
+# without the model ever seeing the full JSON.
+_pending_proposals: dict[str, dict] = {}
+
+
+class ProposalItem(BaseModel):
+    id: str
+    kind: Literal["new_doc", "update_doc", "fix_description"]
+    title: str
+    detail: str
+    target: dict | None = None  # e.g. {"urn": "...", "field_path": "..."}
+
+
+@tool
+async def present_proposals(
+    prompt: str,
+    proposals: list[dict],
+) -> str:
+    """
+    Present a list of improvement proposals to the user for review and selection.
+    Call this at the end of Step 3 of the /improve-context workflow, after drafting
+    proposals. The UI will render a card with checkboxes — do NOT print a markdown
+    list yourself.
+
+    Args:
+        prompt: Short framing sentence shown above the proposals
+                (e.g. "I found 3 improvements based on our conversation.")
+        proposals: List of proposal dicts, each with:
+            - id: unique string identifier (e.g. "1", "2", "3")
+            - kind: one of "new_doc", "update_doc", "fix_description"
+            - title: short title for the proposal
+            - detail: 1-2 sentence description of what to add/change
+            - target: optional dict with "urn" and/or "field_path" for existing entities
+
+    Example:
+        present_proposals(
+            prompt="Based on our conversation, here are 3 documentation improvements:",
+            proposals=[
+                {"id": "1", "kind": "new_doc", "title": "Revenue Metrics Guide",
+                 "detail": "Define net ARR vs gross ARR and specify the revenue table."},
+                {"id": "2", "kind": "fix_description", "title": "orders.status column",
+                 "detail": "Current description is empty. Values: pending, confirmed, shipped.",
+                 "target": {"urn": "urn:li:dataset:...", "field_path": "status"}},
+            ]
+        )
+    """
+    try:
+        validated = [ProposalItem(**p) for p in proposals]
+    except Exception as e:
+        return f"present_proposals: invalid proposals format — {e}"
+
+    prop_id = str(uuid.uuid4())
+    _pending_proposals[prop_id] = {
+        "prompt": prompt,
+        "proposals": [p.model_dump() for p in validated],
+    }
+
+    return (
+        f"PROPOSALS_READY:{prop_id} "
+        f"({len(validated)} proposals; awaiting user selection)"
+    )
diff --git a/backend/src/analytics_agent/agent/results_tool.py b/backend/src/analytics_agent/agent/results_tool.py
new file mode 100644
index 0000000..df97d0f
--- /dev/null
+++ b/backend/src/analytics_agent/agent/results_tool.py
@@ -0,0 +1,67 @@
+from __future__ import annotations
+
+import logging
+import uuid
+from typing import Literal
+
+from langchain_core.tools import tool
+from pydantic import BaseModel
+
+logger = logging.getLogger(__name__)
+
+# Side-channel: keyed by result_id so streaming.py can fetch the payload
+# without the model ever seeing the full JSON.
+_pending_results: dict[str, dict] = {}
+
+
+class ProposalResultItem(BaseModel):
+    id: str
+    kind: Literal["new_doc", "update_doc", "fix_description"]
+    title: str
+    status: Literal["success", "error"]
+    urn: str | None = None
+    error: str | None = None
+
+
+@tool
+async def report_proposal_results(
+    results: list[dict],
+) -> str:
+    """
+    Report the outcomes of writing approved proposals back to DataHub.
+    Call this ONCE after all save_correction calls have completed in Step 5
+    of the /improve-context workflow. The UI will render a results card —
+    do NOT write any additional summary text after calling this tool.
+
+    Args:
+        results: List of result dicts, each with:
+            - id: proposal id (matches the id from present_proposals)
+            - kind: one of "new_doc", "update_doc", "fix_description"
+            - title: proposal title
+            - status: "success" or "error"
+            - urn: the URN of the created/updated entity (set on success)
+            - error: error message (set on error)
+
+    Example:
+        report_proposal_results(results=[
+            {"id": "1", "kind": "new_doc", "title": "Revenue Metrics Guide",
+             "status": "success", "urn": "urn:li:corpUser:..."},
+            {"id": "3", "kind": "fix_description", "title": "orders.status column",
+             "status": "error", "error": "Permission denied"},
+        ])
+    """
+    try:
+        validated = [ProposalResultItem(**r) for r in results]
+    except Exception as e:
+        return f"report_proposal_results: invalid results format — {e}"
+
+    result_id = str(uuid.uuid4())
+    _pending_results[result_id] = {
+        "results": [r.model_dump() for r in validated],
+    }
+
+    successes = sum(1 for r in validated if r.status == "success")
+    return (
+        f"RESULTS_READY:{result_id} "
+        f"({successes}/{len(validated)} succeeded)"
+    )
diff --git a/backend/src/analytics_agent/agent/streaming.py b/backend/src/analytics_agent/agent/streaming.py
index d2ff6c6..ba94a37 100644
--- a/backend/src/analytics_agent/agent/streaming.py
+++ b/backend/src/analytics_agent/agent/streaming.py
@@ -67,6 +67,10 @@ async def stream_graph_events(
     final_text_parts: list[str] = []
     final_state: dict[str, Any] = {}
     chart_emitted = False  # guard against double-emitting CHART
+    # Once report_proposal_results emits, the PROPOSAL_RESULTS card IS the summary
+    # for the remainder of the turn — suppress any trailing model text so the user
+    # doesn't see the card AND a redundant narrative explanation underneath.
+    suppress_trailing_text = False
 
     # Track active tool runs by run_id -> tool_name so we can detect when a
     # wrapped tool (e.g. MCP UI wrapper) invokes an inner tool of the same name.
@@ -91,6 +95,8 @@ async def stream_graph_events(
 
             # ── TEXT ──
             if event_type == "on_chat_model_stream" and node not in ("chart", ""):
+                if suppress_trailing_text:
+                    continue
                 chunk = data.get("chunk")
                 if chunk is None:
                     continue
@@ -133,8 +139,8 @@ async def stream_graph_events(
                 active_tool_runs[run_id] = name
                 if name == "execute_sql":
                     pending_sql[run_id] = tool_input.get("sql", "")
-                # create_chart renders as a CHART event — don't show a tool call bubble
-                if name == "create_chart":
+                # create_chart / present_proposals / report_proposal_results render as dedicated events — no tool call bubble
+                if name in ("create_chart", "present_proposals", "report_proposal_results"):
                     continue
                 yield {
                     "event": "TOOL_CALL",
@@ -241,6 +247,31 @@ async def stream_graph_events(
                                 "allowed_tools": pending_app.allowed_tools,
                             },
                         }
+                elif output_str.startswith("PROPOSALS_READY:"):
+                    prop_id = output_str.split(":", 1)[1].split()[0].strip()
+                    from analytics_agent.agent.proposals_tool import _pending_proposals
+
+                    pending = _pending_proposals.pop(prop_id, None)
+                    if pending:
+                        yield {
+                            "event": "PROPOSALS",
+                            "conversation_id": conversation_id,
+                            "message_id": str(uuid.uuid4()),
+                            "payload": pending,
+                        }
+                elif output_str.startswith("RESULTS_READY:"):
+                    result_id = output_str.split(":", 1)[1].split()[0].strip()
+                    from analytics_agent.agent.results_tool import _pending_results
+
+                    pending_result = _pending_results.pop(result_id, None)
+                    if pending_result:
+                        yield {
+                            "event": "PROPOSAL_RESULTS",
+                            "conversation_id": conversation_id,
+                            "message_id": str(uuid.uuid4()),
+                            "payload": pending_result,
+                        }
+                        suppress_trailing_text = True
                 elif name == "create_chart":
                     # Fetch chart spec from side-channel (tool returns only a short marker)
                     if output_str.startswith("CHART_READY:"):
diff --git a/backend/src/analytics_agent/api/chat.py b/backend/src/analytics_agent/api/chat.py
index ace4c1f..5b9bff1 100644
--- a/backend/src/analytics_agent/api/chat.py
+++ b/backend/src/analytics_agent/api/chat.py
@@ -84,6 +84,9 @@ class ChatMessageRequest(BaseModel):
     # richer agent-facing message (e.g. includes URN + instruction to prevent
     # redundant disambiguation tool calls).
     display_text: str | None = None
+    # Audit field for proposal_select turns: the raw proposal IDs the user checked
+    # before submitting. Stored in the user message payload for traceability.
+    selected_ids: list[str] | None = None
 
 
 async def _persist_message(
diff --git a/backend/src/analytics_agent/skills/improve-context/SKILL.md b/backend/src/analytics_agent/skills/improve-context/SKILL.md
index 98f9a69..1b5a23b 100644
--- a/backend/src/analytics_agent/skills/improve-context/SKILL.md
+++ b/backend/src/analytics_agent/skills/improve-context/SKILL.md
@@ -44,25 +44,53 @@ Format each proposal clearly, like this:
 
 Keep each proposal to 1–2 sentences. Be specific about what to add or change.
 
-### Step 4 — Ask for approval
+### Step 4 — Present proposals via tool
 
-Present the numbered list and ask: **"Which of these would you like me to publish? Reply with the numbers, 'all', or 'none'."**
+Call `present_proposals` with a short framing `prompt` and the `proposals` list you drafted in Step 3. The UI will render a review card with checkboxes — do **not** print a markdown numbered list yourself.
 
-Do NOT call any write-back tools until the user explicitly approves.
+Each proposal must include:
+- `id`: a string like `"1"`, `"2"`, `"3"` matching the Step 3 draft order
+- `kind`: one of `"new_doc"`, `"update_doc"`, `"fix_description"`
+- `title`: short label (e.g. `"Revenue Metrics Guide"`)
+- `detail`: 1–2 sentence description of what to add or change
+- `target` (optional): `{"urn": "...", "field_path": "..."}` for fix_description proposals that target a known entity
 
-### Step 5 — Execute approved changes
+Example call:
+```
+present_proposals(
+    prompt="I found 3 documentation improvements based on our conversation:",
+    proposals=[
+        {"id": "1", "kind": "new_doc", "title": "Revenue Metrics Guide",
+         "detail": "Define net ARR vs gross ARR and specify the revenue table as source of truth."},
+        {"id": "2", "kind": "update_doc", "title": "Orders FAQ",
+         "detail": "Add: deleted_at IS NULL means the order is active; non-null means soft-deleted."},
+        {"id": "3", "kind": "fix_description", "title": "orders.status column",
+         "detail": "Current description is empty. Values: pending, confirmed, shipped, cancelled, refunded.",
+         "target": {"urn": "urn:li:dataset:(urn:li:dataPlatform:snowflake,orders,PROD)", "field_path": "status"}},
+    ]
+)
+```
 
-For each approved proposal, follow the `save_correction` skill instructions to
-confirm the change with the user before writing:
+Do **not** call any write-back tools until the user explicitly selects proposals and submits.
 
-- **New doc** → Use `save_correction` Mode 3: find the right parent folder first
-  via `search_documents`, then call with `doc_title`, `doc_body`, `parent_doc_urn`
-- **Update existing doc** → Use `save_correction` Mode 2: call with `doc_urn`,
-  `doc_title`, `doc_body` (full updated body)
-- **Fix description** → Use `save_correction` Mode 1: call with `entity_urn`,
-  `corrected_description`, and `field_path` if field-level
+### Step 5 — Execute approved changes directly
 
-After each write, report the URN and location so the user can find it in DataHub.
+> **Note: the user has already approved these changes via the proposals card; do NOT ask for another confirmation.**
+
+The user's submission of the proposals card is the final confirmation. Do **NOT** ask for any further confirmation. Do **NOT** print the doc body for review before writing.
+
+For each approved proposal (and only the approved ones, in order):
+
+1. **Draft the full content now:**
+   - `new_doc` → write the full markdown body using the template from `save_correction` Mode 3 Step 2. Find the parent folder via `search_documents`.
+   - `update_doc` → fetch the existing doc with `search_documents` or `get_entities`, produce the full updated body.
+   - `fix_description` → compose the corrected description text.
+
+2. **Call `save_correction` immediately** with the drafted content. **Skip the in-skill confirmation sub-steps** (Mode 1 Step 3, Mode 2 Step 2, Mode 3 Step 3). Collect the result (success + URN, or error message).
+
+3. Do not write any interim "I'm working on it" text between `save_correction` calls. Proceed silently through all selected proposals.
+
+After all writes complete, call `report_proposal_results` **once** with the full list of outcomes. This is the **final action of the turn**. Do **NOT** output any text after calling `report_proposal_results` — no narrative summary, no restating of what succeeded/failed, no "Here's what happened", no bullet list of results. The card rendered from the tool call IS the complete summary; any additional text is redundant noise that will be stripped.
 
 ### Step 6 — Graceful degradation (write-back not available)
 
diff --git a/backend/src/analytics_agent/skills/save-correction/SKILL.md b/backend/src/analytics_agent/skills/save-correction/SKILL.md
index 4991d0f..366ffbc 100644
--- a/backend/src/analytics_agent/skills/save-correction/SKILL.md
+++ b/backend/src/analytics_agent/skills/save-correction/SKILL.md
@@ -17,6 +17,10 @@ metadata:
 
 # save_correction
 
+## When called from /improve-context
+
+When this skill is invoked during `/improve-context` execution (after the user has submitted the proposals card), skip the confirmation sub-steps in each Mode (Mode 1 Step 3, Mode 2 Step 2, Mode 3 Step 3). The user has already approved the change via the proposals card; proceed directly to the save call without showing diffs or asking "Shall I apply this?".
+
 ## Overview
 
 This skill writes correct knowledge back to DataHub. It handles three cases:
diff --git a/frontend/src/api/conversations.ts b/frontend/src/api/conversations.ts
index 6c60251..f858047 100644
--- a/frontend/src/api/conversations.ts
+++ b/frontend/src/api/conversations.ts
@@ -1,4 +1,5 @@
-import type { ConversationDetail, ConversationSummary, Engine } from "@/types";
+import type { ConversationDetail, ConversationSummary, Engine, ProposalItem } from "@/types";
+import { streamMessage } from "@/api/stream";
 
 const BASE = "/api";
 
@@ -59,3 +60,31 @@ export async function getContextQuality(conversationId: string): Promise<Context
   if (!res.ok) throw new Error("Failed to fetch context quality");
   return res.json();
 }
+
+/**
+ * Submit a proposal selection back to the agent as a user turn.
+ * Returns the underlying SSE stream so callers can consume events.
+ */
+export function sendProposalSelection(
+  conversationId: string,
+  originMessageId: string,
+  selectedIds: string[],
+  proposals: ProposalItem[]
+) {
+  const selectedItems = proposals.filter((p) => selectedIds.includes(p.id));
+  const agentText =
+    selectedItems.length === 0
+      ? "Skip all proposals — make no changes."
+      : `Publish the following proposals: ${selectedItems.map((p) => `"${p.title}"`).join(", ")}.`;
+  const displayText =
+    selectedItems.length === 0
+      ? "Skipped proposals"
+      : `Selected ${selectedItems.length} proposal${selectedItems.length === 1 ? "" : "s"}`;
+
+  return streamMessage(conversationId, agentText, undefined, {
+    source: "proposal_select",
+    origin_message_id: originMessageId,
+    display_text: displayText,
+    selected_ids: selectedIds,
+  });
+}
diff --git a/frontend/src/components/Chat/ChatView.tsx b/frontend/src/components/Chat/ChatView.tsx
index f58f11a..56dceac 100644
--- a/frontend/src/components/Chat/ChatView.tsx
+++ b/frontend/src/components/Chat/ChatView.tsx
@@ -198,26 +198,12 @@ export function ChatView() {
     setExportModalOpen(false);
   }, [activeConv?.title]);
 
-  const handleSend = async (text: string) => {
-    if (!activeId || isStreaming) return;
-
-    // Append user message immediately
-    appendMessage({
-      id: crypto.randomUUID(),
-      event_type: "TEXT",
-      role: "user",
-      payload: { text },
-    });
-
+  const consumeStream = async (stream: AsyncIterator<import("@/types").SSEEvent>, convId: string) => {
     setStreaming(true);
     resetStreamingText(); // new turn — reset so TEXT goes to a fresh message
 
-    const conversationId = activeId;
     let aborted = false;
     try {
-      const controller = new AbortController();
-      streamAbortRef.current = controller;
-      const stream = streamMessage(conversationId, text, controller.signal);
       let result = await stream.next();
       const sendTurnUsage: TurnUsage = { input_tokens: 0, output_tokens: 0, total_tokens: 0, cache_read_tokens: 0, cache_creation_tokens: 0, calls: 0 };
       while (!result.done) {
@@ -225,7 +211,6 @@ export function ChatView() {
         if (event.event === "TEXT") {
           appendStreamingText((event.payload as { text: string }).text);
         } else if (event.event === "TOOL_CALL") {
-          // Text before this tool call was reasoning — mark it as a thinking block
           markCurrentAsThinking();
           appendMessage({
             id: event.message_id,
@@ -279,13 +264,30 @@ export function ChatView() {
       setStreaming(false);
       if (!aborted) {
         // Fire-and-forget title generation after the turn completes
-        generateTitle(conversationId).then((r) => {
-          if (r.updated) updateConversationTitle(conversationId, r.title);
+        generateTitle(convId).then((r) => {
+          if (r.updated) updateConversationTitle(convId, r.title);
         }).catch(() => {});
       }
     }
   };
 
+  const handleSend = async (text: string) => {
+    if (!activeId || isStreaming) return;
+
+    // Append user message immediately
+    appendMessage({
+      id: crypto.randomUUID(),
+      event_type: "TEXT",
+      role: "user",
+      payload: { text },
+    });
+
+    const controller = new AbortController();
+    streamAbortRef.current = controller;
+    const stream = streamMessage(activeId, text, controller.signal);
+    await consumeStream(stream, activeId);
+  };
+
   const handleWelcomeSend = async (text: string, engineName: string) => {
     pendingFirstMessage.current = text;
     const conv = await createConversation(engineName);
@@ -353,6 +355,24 @@ export function ChatView() {
         isStreaming={isStreaming}
         conversationId={activeId}
         showReasoning={showReasoning}
+        onProposalStream={async (stream, userPayload) => {
+          if (!activeId || isStreaming) return;
+          // Append the selection chip as a user message immediately so it
+          // appears anchored under the proposals card without waiting for reload.
+          appendMessage({
+            id: crypto.randomUUID(),
+            event_type: "TEXT",
+            role: "user",
+            payload: {
+              text: userPayload.text,
+              display_text: userPayload.display_text,
+              source: "proposal_select",
+              origin_message_id: userPayload.origin_message_id,
+              selected_ids: userPayload.selected_ids,
+            },
+          });
+          await consumeStream(stream, activeId);
+        }}
         onChartError={(error) => {
           if (chartErrorRetried.current || isStreaming) return;
           chartErrorRetried.current = true;
diff --git a/frontend/src/components/Chat/MessageList.tsx b/frontend/src/components/Chat/MessageList.tsx
index 175a6e5..781504d 100644
--- a/frontend/src/components/Chat/MessageList.tsx
+++ b/frontend/src/components/Chat/MessageList.tsx
@@ -1,8 +1,15 @@
 import { Fragment, useEffect, useRef } from "react";
-import type { UIMessage } from "@/types";
+import type {
+  UIMessage,
+  ProposalsPayload,
+  ProposalResultsPayload,
+  SSEEvent,
+} from "@/types";
 import { TextMessage } from "./messages/TextMessage";
 import { AgentWorkBlock } from "./messages/AgentWorkBlock";
 import { SelectionChip, type SelectionChipPayload } from "./messages/SelectionChip";
+import { ProposalsMessage } from "./messages/ProposalsMessage";
+import { ProposalResultsMessage } from "./messages/ProposalResultsMessage";
 import { groupIntoTurns } from "@/lib/groupMessages";
 
 interface Props {
@@ -11,9 +18,25 @@ interface Props {
   conversationId?: string;
   showReasoning?: boolean;
   onChartError?: (error: string) => void;
+  onProposalStream?: (
+    stream: AsyncIterator<SSEEvent>,
+    userPayload: {
+      text: string;
+      display_text: string;
+      origin_message_id: string;
+      selected_ids: string[];
+    }
+  ) => void;
 }
 
-export function MessageList({ messages, isStreaming = false, conversationId, showReasoning = true, onChartError }: Props) {
+export function MessageList({
+  messages,
+  isStreaming = false,
+  conversationId,
+  showReasoning = true,
+  onChartError,
+  onProposalStream,
+}: Props) {
   const bottomRef = useRef<HTMLDivElement>(null);
 
   useEffect(() => {
@@ -33,11 +56,12 @@ export function MessageList({ messages, isStreaming = false, conversationId, sho
   return (
     <div id="chat-messages" className="flex-1 overflow-y-auto px-4 py-4 space-y-3">
       {groups.map((group) => {
-        // MCP App iframe-originated user turns render as a compact selection
+        // MCP App / proposal-select user turns render as a compact selection
         // chip (flavor C) — not a full user bubble.
+        const userSource = (group.userMsg?.payload as Record<string, unknown> | undefined)?.source;
         const isMcpAppSelection =
           group.userMsg?.event_type === "TEXT" &&
-          (group.userMsg.payload as Record<string, unknown>).source === "mcp_app";
+          (userSource === "mcp_app" || userSource === "proposal_select");
         return (
           <Fragment key={group.key}>
             {/* User message */}
@@ -68,6 +92,41 @@ export function MessageList({ messages, isStreaming = false, conversationId, sho
               />
             )}
 
+            {/* Interactive cards (proposals / results) — sibling to work block */}
+            {group.interactiveMsgs.map((msg) => {
+              if (msg.event_type === "PROPOSALS" && conversationId) {
+                const submitted = messages.some(
+                  (m) =>
+                    m.role === "user" &&
+                    (m.payload as Record<string, unknown>).source === "proposal_select" &&
+                    (m.payload as Record<string, unknown>).origin_message_id === msg.id
+                );
+                return (
+                  <div key={msg.id} className="flex flex-col items-start">
+                    <ProposalsMessage
+                      messageId={msg.id}
+                      conversationId={conversationId}
+                      payload={msg.payload as unknown as ProposalsPayload}
+                      submitted={submitted}
+                      onStream={(stream, userPayload) =>
+                        onProposalStream?.(stream, userPayload)
+                      }
+                    />
+                  </div>
+                );
+              }
+              if (msg.event_type === "PROPOSAL_RESULTS") {
+                return (
+                  <div key={msg.id} className="flex flex-col items-start">
+                    <ProposalResultsMessage
+                      payload={msg.payload as unknown as ProposalResultsPayload}
+                    />
+                  </div>
+                );
+              }
+              return null;
+            })}
+
             {/* Final visible response */}
             {group.finalMsg && (group.finalMsg.payload as { text?: string }).text?.trim() && (
               <div className="flex flex-col items-start" data-print-role="assistant">
diff --git a/frontend/src/components/Chat/messages/ProposalResultsMessage.tsx b/frontend/src/components/Chat/messages/ProposalResultsMessage.tsx
new file mode 100644
index 0000000..f1ece83
--- /dev/null
+++ b/frontend/src/components/Chat/messages/ProposalResultsMessage.tsx
@@ -0,0 +1,157 @@
+/**
+ * ProposalResultsMessage — renders the outcomes of a /improve-context write
+ * run as a compact status card. Each row shows a green check (success) or
+ * red X (error), the kind badge, the title, the written URN, and an
+ * "Open in DataHub" link for successes.
+ */
+
+import { useEffect, useState } from "react";
+import { CheckCircle2, XCircle, FilePlus, FileText, Tag, ExternalLink, ClipboardList } from "lucide-react";
+import type { ProposalResultItem, ProposalResultsPayload } from "@/types";
+import { listConnections } from "@/api/settings";
+
+interface Props {
+  payload: ProposalResultsPayload;
+}
+
+const KIND_META: Record<
+  ProposalResultItem["kind"],
+  { label: string; className: string; icon: React.ReactNode }
+> = {
+  new_doc: {
+    label: "New doc",
+    className: "bg-emerald-100 text-emerald-700 dark:bg-emerald-900/40 dark:text-emerald-400",
+    icon: <FilePlus className="w-3 h-3" />,
+  },
+  update_doc: {
+    label: "Update doc",
+    className: "bg-blue-100 text-blue-700 dark:bg-blue-900/40 dark:text-blue-400",
+    icon: <FileText className="w-3 h-3" />,
+  },
+  fix_description: {
+    label: "Fix description",
+    className: "bg-amber-100 text-amber-700 dark:bg-amber-900/40 dark:text-amber-400",
+    icon: <Tag className="w-3 h-3" />,
+  },
+};
+
+/** Derive the DataHub UI base URL from the GMS URL stored in the connection config.
+ *  e.g. "https://instance.acryl.io/gms" → "https://instance.acryl.io" */
+function useDataHubBaseUrl(): string | null {
+  const [baseUrl, setBaseUrl] = useState<string | null>(null);
+
+  useEffect(() => {
+    listConnections()
+      .then((connections) => {
+        const dhConn = connections.find(
+          (c) => c.type === "datahub" || c.type === "datahub_mcp"
+        );
+        if (!dhConn) return;
+        const urlField = dhConn.fields.find((f) => f.key === "url");
+        if (!urlField?.value) return;
+        // Strip trailing /gms to get the UI base
+        const raw = urlField.value.replace(/\/gms\/?$/, "").replace(/\/$/, "");
+        setBaseUrl(raw);
+      })
+      .catch(() => {});
+  }, []);
+
+  return baseUrl;
+}
+
+function buildEntityUrl(baseUrl: string, urn: string): string {
+  return `${baseUrl}/entity/${encodeURIComponent(urn)}`;
+}
+
+export function ProposalResultsMessage({ payload }: Props) {
+  const { results } = payload;
+  const baseUrl = useDataHubBaseUrl();
+
+  const successCount = results.filter((r) => r.status === "success").length;
+  const total = results.length;
+
+  return (
+    <div className="w-full rounded-lg border border-border overflow-hidden bg-background">
+      {/* Header strip */}
+      <div className="flex items-center gap-2 px-3 py-2 bg-muted/40 border-b border-border text-xs text-muted-foreground">
+        <ClipboardList className="w-3.5 h-3.5 shrink-0" />
+        <span className="font-medium">Write results</span>
+        <span className="ml-auto shrink-0 opacity-60">
+          {successCount} of {total} succeeded
+        </span>
+      </div>
+
+      {/* Results list */}
+      <ul className="divide-y divide-border">
+        {results.map((item) => {
+          const meta = KIND_META[item.kind];
+          const isSuccess = item.status === "success";
+
+          return (
+            <li key={item.id} className="flex gap-3 px-4 py-3">
+              {/* Status icon */}
+              <div className="mt-0.5 shrink-0">
+                {isSuccess ? (
+                  <CheckCircle2 className="w-4 h-4 text-emerald-500" />
+                ) : (
+                  <XCircle className="w-4 h-4 text-red-500" />
+                )}
+              </div>
+
+              {/* Content */}
+              <div className="flex-1 min-w-0">
+                <div className="flex flex-wrap items-center gap-2 mb-1">
+                  {/* Kind badge */}
+                  <span
+                    className={`inline-flex items-center gap-1 px-1.5 py-0.5 rounded text-[10px] font-semibold uppercase tracking-wide ${meta.className}`}
+                  >
+                    {meta.icon}
+                    {meta.label}
+                  </span>
+                  <span className="text-sm font-medium text-foreground truncate">
+                    {item.title}
+                  </span>
+                </div>
+
+                {isSuccess && item.urn && (
+                  <div className="flex items-center gap-2 mt-1">
+                    <code className="text-[10px] font-mono text-muted-foreground/70 truncate">
+                      {item.urn}
+                    </code>
+                    {baseUrl && (
+                      <a
+                        href={buildEntityUrl(baseUrl, item.urn)}
+                        target="_blank"
+                        rel="noopener noreferrer"
+                        className="inline-flex items-center gap-0.5 text-[10px] text-primary hover:underline shrink-0"
+                        onClick={(e) => e.stopPropagation()}
+                      >
+                        <ExternalLink className="w-2.5 h-2.5" />
+                        Open
+                      </a>
+                    )}
+                  </div>
+                )}
+
+                {!isSuccess && item.error && (
+                  <p className="mt-1 text-[10px] font-mono text-red-500/90 break-words">
+                    {item.error}
+                  </p>
+                )}
+              </div>
+            </li>
+          );
+        })}
+      </ul>
+
+      {/* Footer summary */}
+      <div className="px-4 py-2.5 border-t border-border bg-muted/20 text-xs text-muted-foreground">
+        {successCount === total
+          ? `All ${total} change${total !== 1 ? "s" : ""} applied successfully.`
+          : successCount === 0
+          ? `All ${total} change${total !== 1 ? "s" : ""} failed.`
+          : `${successCount} of ${total} changes applied; ${total - successCount} failed.`}
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/Chat/messages/ProposalsMessage.tsx b/frontend/src/components/Chat/messages/ProposalsMessage.tsx
new file mode 100644
index 0000000..2c5c7e6
--- /dev/null
+++ b/frontend/src/components/Chat/messages/ProposalsMessage.tsx
@@ -0,0 +1,227 @@
+/**
+ * ProposalsMessage — renders a set of agent-proposed documentation changes
+ * as an interactive card. The user selects which proposals to apply and
+ * clicks Submit (or Skip to bypass all). Once submitted, the card
+ * transitions to a disabled read-only state.
+ */
+
+import { useState, useEffect } from "react";
+import { FileText, FilePlus, Tag, CheckSquare, Square, Loader2 } from "lucide-react";
+import ReactMarkdown from "react-markdown";
+import remarkGfm from "remark-gfm";
+import type { ProposalItem, ProposalsPayload } from "@/types";
+import { sendProposalSelection } from "@/api/conversations";
+
+interface Props {
+  messageId: string;
+  conversationId: string;
+  payload: ProposalsPayload;
+  submitted: boolean;
+  onStream: (
+    stream: AsyncIterator<import("@/types").SSEEvent>,
+    userPayload: {
+      text: string;
+      display_text: string;
+      origin_message_id: string;
+      selected_ids: string[];
+    }
+  ) => void;
+}
+
+const KIND_META: Record<
+  ProposalItem["kind"],
+  { label: string; className: string; icon: React.ReactNode }
+> = {
+  new_doc: {
+    label: "New doc",
+    className: "bg-emerald-100 text-emerald-700 dark:bg-emerald-900/40 dark:text-emerald-400",
+    icon: <FilePlus className="w-3 h-3" />,
+  },
+  update_doc: {
+    label: "Update doc",
+    className: "bg-blue-100 text-blue-700 dark:bg-blue-900/40 dark:text-blue-400",
+    icon: <FileText className="w-3 h-3" />,
+  },
+  fix_description: {
+    label: "Fix description",
+    className: "bg-amber-100 text-amber-700 dark:bg-amber-900/40 dark:text-amber-400",
+    icon: <Tag className="w-3 h-3" />,
+  },
+};
+
+export function ProposalsMessage({ messageId, conversationId, payload, submitted, onStream }: Props) {
+  const { proposals } = payload;
+  const [selected, setSelected] = useState<Set<string>>(() => new Set());
+  const [isSubmitting, setIsSubmitting] = useState(false);
+
+  // Clear the spinner once the parent confirms submission (selection chip appended)
+  useEffect(() => {
+    if (submitted) setIsSubmitting(false);
+  }, [submitted]);
+
+  const toggle = (id: string) => {
+    if (submitted || isSubmitting) return;
+    setSelected((prev) => {
+      const next = new Set(prev);
+      if (next.has(id)) next.delete(id);
+      else next.add(id);
+      return next;
+    });
+  };
+
+  const selectAll = () => {
+    if (submitted || isSubmitting) return;
+    setSelected(new Set(proposals.map((p) => p.id)));
+  };
+
+  const selectNone = () => {
+    if (submitted || isSubmitting) return;
+    setSelected(new Set());
+  };
+
+  const handleSubmit = async (skipAll = false) => {
+    if (submitted || isSubmitting) return;
+    setIsSubmitting(true);
+    try {
+      const ids = skipAll ? [] : Array.from(selected);
+      const selectedItems = proposals.filter((p) => ids.includes(p.id));
+      const agentText =
+        selectedItems.length === 0
+          ? "Skip all proposals — make no changes."
+          : `Publish the following proposals: ${selectedItems.map((p) => `"${p.title}"`).join(", ")}.`;
+      const displayText =
+        selectedItems.length === 0
+          ? "Skipped proposals"
+          : `Selected ${selectedItems.length} proposal${selectedItems.length === 1 ? "" : "s"}`;
+
+      const stream = sendProposalSelection(conversationId, messageId, ids, proposals);
+      onStream(stream, {
+        text: agentText,
+        display_text: displayText,
+        origin_message_id: messageId,
+        selected_ids: ids,
+      });
+    } catch {
+      setIsSubmitting(false);
+    }
+  };
+
+  const disabled = submitted || isSubmitting;
+
+  return (
+    <div className="w-full rounded-lg border border-border overflow-hidden bg-background">
+      {/* Header strip */}
+      <div className="flex items-center gap-2 px-3 py-2 bg-muted/40 border-b border-border text-xs text-muted-foreground">
+        <FilePlus className="w-3.5 h-3.5 shrink-0" />
+        <span className="font-medium">Proposed changes</span>
+        <span className="ml-auto shrink-0 opacity-60">
+          {proposals.length} proposal{proposals.length !== 1 ? "s" : ""}
+        </span>
+      </div>
+
+      {/* Prompt / description */}
+      {payload.prompt && (
+        <div className="px-4 pt-3 pb-1 text-sm text-muted-foreground prose prose-sm max-w-none">
+          <ReactMarkdown remarkPlugins={[remarkGfm]}>{payload.prompt}</ReactMarkdown>
+        </div>
+      )}
+
+      {/* Proposal list */}
+      <ul className="divide-y divide-border">
+        {proposals.map((proposal) => {
+          const meta = KIND_META[proposal.kind];
+          const isChecked = selected.has(proposal.id);
+
+          return (
+            <li
+              key={proposal.id}
+              className={`flex gap-3 px-4 py-3 ${disabled ? "" : "cursor-pointer hover:bg-muted/30 transition-colors"}`}
+              onClick={() => toggle(proposal.id)}
+            >
+              {/* Checkbox */}
+              <div className="mt-0.5 shrink-0 text-primary">
+                {isChecked ? (
+                  <CheckSquare className={`w-4 h-4 ${disabled ? "opacity-50" : ""}`} />
+                ) : (
+                  <Square className={`w-4 h-4 text-muted-foreground ${disabled ? "opacity-50" : ""}`} />
+                )}
+              </div>
+
+              {/* Content */}
+              <div className="flex-1 min-w-0">
+                <div className="flex flex-wrap items-center gap-2 mb-1">
+                  {/* Kind badge */}
+                  <span
+                    className={`inline-flex items-center gap-1 px-1.5 py-0.5 rounded text-[10px] font-semibold uppercase tracking-wide ${meta.className}`}
+                  >
+                    {meta.icon}
+                    {meta.label}
+                  </span>
+                  <span className="text-sm font-medium text-foreground truncate">
+                    {proposal.title}
+                  </span>
+                </div>
+                {proposal.detail && (
+                  <div className="text-xs text-muted-foreground prose prose-sm max-w-none">
+                    <ReactMarkdown remarkPlugins={[remarkGfm]}>{proposal.detail}</ReactMarkdown>
+                  </div>
+                )}
+                {proposal.target?.field_path && (
+                  <p className="mt-1 text-[10px] font-mono text-muted-foreground/70 truncate">
+                    {proposal.target.field_path}
+                  </p>
+                )}
+              </div>
+            </li>
+          );
+        })}
+      </ul>
+
+      {/* Footer */}
+      <div className="flex items-center justify-between gap-3 px-4 py-3 border-t border-border bg-muted/20">
+        {/* Select all / none */}
+        {!disabled && (
+          <div className="flex items-center gap-3 text-xs text-muted-foreground">
+            <button
+              onClick={(e) => { e.stopPropagation(); selectAll(); }}
+              className="hover:text-foreground transition-colors underline-offset-2 hover:underline"
+            >
+              Select all
+            </button>
+            <button
+              onClick={(e) => { e.stopPropagation(); selectNone(); }}
+              className="hover:text-foreground transition-colors underline-offset-2 hover:underline"
+            >
+              Select none
+            </button>
+          </div>
+        )}
+        {disabled && <div />}
+
+        {/* Action buttons */}
+        <div className="flex items-center gap-2">
+          {!disabled && (
+            <button
+              onClick={(e) => { e.stopPropagation(); void handleSubmit(true); }}
+              className="text-xs px-3 py-1.5 rounded-md border border-border text-muted-foreground hover:text-foreground hover:bg-muted/60 transition-colors"
+            >
+              Skip
+            </button>
+          )}
+          <button
+            disabled={disabled}
+            onClick={(e) => { e.stopPropagation(); void handleSubmit(false); }}
+            className={`inline-flex items-center gap-1.5 text-xs px-3 py-1.5 rounded-md font-medium transition-colors
+              ${disabled
+                ? "bg-primary/40 text-primary-foreground cursor-not-allowed"
+                : "bg-primary text-primary-foreground hover:bg-primary/90"
+              }`}
+          >
+            {isSubmitting && <Loader2 className="w-3 h-3 animate-spin" />}
+            {submitted ? "Submitted" : isSubmitting ? "Submitting…" : `Submit selected (${selected.size})`}
+          </button>
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/lib/buildUiMessages.ts b/frontend/src/lib/buildUiMessages.ts
index 88be52c..0d4d7f3 100644
--- a/frontend/src/lib/buildUiMessages.ts
+++ b/frontend/src/lib/buildUiMessages.ts
@@ -92,6 +92,8 @@ export function buildUiMessages(records: MessageRecord[]): {
       case "SQL":
       case "CHART":
       case "MCP_APP":
+      case "PROPOSALS":
+      case "PROPOSAL_RESULTS":
       case "ERROR":
         result.push({ id: m.id, event_type: m.event_type, role: "assistant", payload: m.payload, created_at: m.created_at });
         break;
diff --git a/frontend/src/lib/groupMessages.ts b/frontend/src/lib/groupMessages.ts
index ef34836..d4f1142 100644
--- a/frontend/src/lib/groupMessages.ts
+++ b/frontend/src/lib/groupMessages.ts
@@ -6,24 +6,31 @@ export interface TurnGroup {
   key: string;
   userMsg?: UIMessage;
   workMsgs: UIMessage[];
+  // Interactive cards (proposals + proposal results) — rendered outside the
+  // collapsible work block since users need to see and act on them.
+  interactiveMsgs: UIMessage[];
   finalMsg?: UIMessage;
   isActivelyStreaming: boolean;
 }
 
+const INTERACTIVE_TYPES = new Set(["PROPOSALS", "PROPOSAL_RESULTS"]);
+
 export function groupIntoTurns(messages: UIMessage[], globalStreaming: boolean): TurnGroup[] {
   const groups: TurnGroup[] = [];
-  let current: TurnGroup = { key: "init", workMsgs: [], isActivelyStreaming: false };
+  let current: TurnGroup = { key: "init", workMsgs: [], interactiveMsgs: [], isActivelyStreaming: false };
 
   for (const msg of messages) {
     if (msg.role === "user") {
-      if (current.userMsg || current.workMsgs.length > 0 || current.finalMsg) {
+      if (current.userMsg || current.workMsgs.length > 0 || current.interactiveMsgs.length > 0 || current.finalMsg) {
         groups.push(current);
       }
-      current = { key: msg.id, userMsg: msg, workMsgs: [], isActivelyStreaming: false };
+      current = { key: msg.id, userMsg: msg, workMsgs: [], interactiveMsgs: [], isActivelyStreaming: false };
       continue;
     }
 
-    if (msg.event_type === "TEXT" && !msg.isThinking) {
+    if (INTERACTIVE_TYPES.has(msg.event_type)) {
+      current.interactiveMsgs.push(msg);
+    } else if (msg.event_type === "TEXT" && !msg.isThinking) {
       if (msg.isStreaming) current.isActivelyStreaming = true;
       current.finalMsg = msg;
     } else if (WORK_TYPES.has(msg.event_type) || (msg.event_type === "TEXT" && msg.isThinking)) {
@@ -31,7 +38,7 @@ export function groupIntoTurns(messages: UIMessage[], globalStreaming: boolean):
     }
   }
 
-  if (current.userMsg || current.workMsgs.length > 0 || current.finalMsg) {
+  if (current.userMsg || current.workMsgs.length > 0 || current.interactiveMsgs.length > 0 || current.finalMsg) {
     if (globalStreaming && !current.finalMsg?.isStreaming) {
       current.isActivelyStreaming = globalStreaming;
     }
diff --git a/frontend/src/types/index.ts b/frontend/src/types/index.ts
index 50bfff6..3fddcf1 100644
--- a/frontend/src/types/index.ts
+++ b/frontend/src/types/index.ts
@@ -6,6 +6,8 @@ export type SSEEventType =
   | "SQL"
   | "CHART"
   | "MCP_APP"
+  | "PROPOSALS"
+  | "PROPOSAL_RESULTS"
   | "USAGE"
   | "COMPLETE"
   | "ERROR";
@@ -71,6 +73,32 @@ export interface MCPAppPayload {
   permissions: string[];
 }
 
+export interface ProposalItem {
+  id: string;
+  kind: "new_doc" | "update_doc" | "fix_description";
+  title: string;
+  detail: string;
+  target?: { urn?: string; field_path?: string } | null;
+}
+
+export interface ProposalsPayload {
+  prompt: string;
+  proposals: ProposalItem[];
+}
+
+export interface ProposalResultItem {
+  id: string;
+  kind: "new_doc" | "update_doc" | "fix_description";
+  title: string;
+  status: "success" | "error";
+  urn?: string;
+  error?: string;
+}
+
+export interface ProposalResultsPayload {
+  results: ProposalResultItem[];
+}
+
 export interface Engine {
   name: string;
   type: string;

From 625a669f2c4298d6d0ae1d03cde77a1df906a678 Mon Sep 17 00:00:00 2001
From: Gabe Lyons <gabe.lyons@acryl.io>
Date: Mon, 4 May 2026 17:49:19 -0700
Subject: [PATCH 3/3] refactor: render MCP_APP messages outside the collapsible
 work block

Promotes MCP_APP from WORK_TYPES to INTERACTIVE_TYPES so app frames
render alongside proposal cards instead of collapsing with tool calls.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 frontend/src/components/Chat/MessageList.tsx     | 16 ++++++++++++++--
 .../components/Chat/messages/AgentWorkBlock.tsx  | 11 -----------
 frontend/src/lib/groupMessages.ts                |  4 ++--
 3 files changed, 16 insertions(+), 15 deletions(-)

diff --git a/frontend/src/components/Chat/MessageList.tsx b/frontend/src/components/Chat/MessageList.tsx
index 781504d..b7cee2b 100644
--- a/frontend/src/components/Chat/MessageList.tsx
+++ b/frontend/src/components/Chat/MessageList.tsx
@@ -1,6 +1,7 @@
 import { Fragment, useEffect, useRef } from "react";
 import type {
   UIMessage,
+  MCPAppPayload,
   ProposalsPayload,
   ProposalResultsPayload,
   SSEEvent,
@@ -8,6 +9,7 @@ import type {
 import { TextMessage } from "./messages/TextMessage";
 import { AgentWorkBlock } from "./messages/AgentWorkBlock";
 import { SelectionChip, type SelectionChipPayload } from "./messages/SelectionChip";
+import { MCPAppMessage } from "./messages/MCPAppMessage";
 import { ProposalsMessage } from "./messages/ProposalsMessage";
 import { ProposalResultsMessage } from "./messages/ProposalResultsMessage";
 import { groupIntoTurns } from "@/lib/groupMessages";
@@ -87,13 +89,23 @@ export function MessageList({
                 turnUsage={group.finalMsg?.turnUsage}
                 isStreaming={group.isActivelyStreaming}
                 showReasoning={showReasoning}
-                conversationId={conversationId}
                 onChartError={onChartError}
               />
             )}
 
-            {/* Interactive cards (proposals / results) — sibling to work block */}
+            {/* Interactive cards (MCP apps / proposals / results) — sibling to work block, never collapses */}
             {group.interactiveMsgs.map((msg) => {
+              if (msg.event_type === "MCP_APP" && conversationId) {
+                return (
+                  <div key={msg.id} className="flex flex-col items-start">
+                    <MCPAppMessage
+                      messageId={msg.id}
+                      conversationId={conversationId}
+                      payload={msg.payload as unknown as MCPAppPayload}
+                    />
+                  </div>
+                );
+              }
               if (msg.event_type === "PROPOSALS" && conversationId) {
                 const submitted = messages.some(
                   (m) =>
diff --git a/frontend/src/components/Chat/messages/AgentWorkBlock.tsx b/frontend/src/components/Chat/messages/AgentWorkBlock.tsx
index 20534cf..23f8c98 100644
--- a/frontend/src/components/Chat/messages/AgentWorkBlock.tsx
+++ b/frontend/src/components/Chat/messages/AgentWorkBlock.tsx
@@ -7,8 +7,6 @@ import { ToolCallMessage, ToolResultMessage } from "./ToolCallMessage";
 import { SqlMessage } from "./SqlMessage";
 import { ChartMessage } from "./ChartMessage";
 import { ErrorMessage } from "./ErrorMessage";
-import { MCPAppMessage } from "./MCPAppMessage";
-import type { MCPAppPayload } from "@/types";
 
 function fmt(n: number): string {
   if (n < 1000) return String(n);
@@ -21,7 +19,6 @@ interface Props {
   turnUsage?: TurnUsage;
   isStreaming?: boolean;
   showReasoning?: boolean;
-  conversationId?: string;
   onChartError?: (error: string) => void;
 }
 
@@ -30,7 +27,6 @@ export function AgentWorkBlock({
   turnUsage,
   isStreaming = false,
   showReasoning = true,
-  conversationId,
   onChartError,
 }: Props) {
   const [expanded, setExpanded] = useState(isStreaming);
@@ -201,13 +197,6 @@ export function AgentWorkBlock({
                 {msg.event_type === "CHART" && (
                   <ChartMessage payload={msg.payload as never} onRenderError={onChartError} />
                 )}
-                {msg.event_type === "MCP_APP" && conversationId && (
-                  <MCPAppMessage
-                    messageId={msg.id}
-                    conversationId={conversationId}
-                    payload={msg.payload as unknown as MCPAppPayload}
-                  />
-                )}
                 {msg.event_type === "ERROR" && (
                   <ErrorMessage payload={msg.payload as never} />
                 )}
diff --git a/frontend/src/lib/groupMessages.ts b/frontend/src/lib/groupMessages.ts
index d4f1142..7d5698b 100644
--- a/frontend/src/lib/groupMessages.ts
+++ b/frontend/src/lib/groupMessages.ts
@@ -1,6 +1,6 @@
 import type { UIMessage, TurnUsage } from "@/types";
 
-const WORK_TYPES = new Set(["TOOL_CALL", "TOOL_RESULT", "SQL", "CHART", "MCP_APP", "ERROR", "THINKING"]);
+const WORK_TYPES = new Set(["TOOL_CALL", "TOOL_RESULT", "SQL", "CHART", "ERROR", "THINKING"]);
 
 export interface TurnGroup {
   key: string;
@@ -13,7 +13,7 @@ export interface TurnGroup {
   isActivelyStreaming: boolean;
 }
 
-const INTERACTIVE_TYPES = new Set(["PROPOSALS", "PROPOSAL_RESULTS"]);
+const INTERACTIVE_TYPES = new Set(["PROPOSALS", "PROPOSAL_RESULTS", "MCP_APP"]);
 
 export function groupIntoTurns(messages: UIMessage[], globalStreaming: boolean): TurnGroup[] {
   const groups: TurnGroup[] = [];