diff --git a/Makefile b/Makefile
index 9d23d6f..28dd17e 100644
--- a/Makefile
+++ b/Makefile
@@ -27,7 +27,7 @@ DC := docker compose -f docker-compose.yml
 PYTEST_FOCUS ?= app
 PYTEST_APP_TESTS := archive/services/orchestrator_legacy_python/tests/test_orchestrator_retrieval.py archive/services/orchestrator_legacy_python/tests/test_migration_runtime.py
 
-.PHONY: help launch all up up-core down status ps logs build rebuild pull clean prune             mcp-proxy-up init qdrant-init mindsdb-seed letta-seed models-pull             proxy-status doctor mem-ping monitor-open monitor-check dmg-build msi-build linux-bundle-build            storage-audit qdrant-snapshot-prune qdrant-cutover cold-snapshot-pack cold-snapshot-tier cold-snapshot-restore telemetry-archive fanout-status fanout-deadletters fanout-rehydrate retention-install retention-uninstall retention-status retention-install-daily storage-ledger-capture storage-ledger-prune storage-ledger-install storage-ledger-uninstall storage-ledger-status memory-graph-quality memory-graph-quality-install memory-graph-quality-uninstall memory-graph-quality-status weekly-lineage-rollup weekly-lineage-install weekly-lineage-uninstall weekly-lineage-status            docker-fs-watchdog-run docker-fs-watchdog-install docker-fs-watchdog-uninstall docker-fs-watchdog-status            storage-migrate-hot-bindings disk-clean-safe            mem-mode-show mem-mode-core mem-mode-balanced mem-mode-full mem-up-core mem-up-balanced mem-up-full observability-up observability-down launch-readiness-gate launch-readiness-gate-schedule launch-readiness-gate-schedule-status launch-readiness-gate-schedule-cancel paid-launch-checklist backup-restore-drill mem-up-release mem-up-lite-release release-lock-verify qdrant-cloud-check quickstart submission-preflight launch-lock launch-lock-public test-py bench-shortlist bench-qdrant-tuning bench-backend-lanes env-lock-check env-lock-apply sentrux-check sentrux-gate sentrux-gate-save agent-context-gate
+.PHONY: help launch all up up-core down status ps logs build rebuild pull clean prune             mcp-proxy-up init qdrant-init mindsdb-seed letta-seed models-pull             proxy-status doctor mem-ping monitor-open monitor-check dmg-build msi-build linux-bundle-build            storage-audit qdrant-snapshot-prune qdrant-cutover cold-snapshot-pack cold-snapshot-tier cold-snapshot-restore telemetry-archive fanout-status fanout-deadletters fanout-rehydrate retention-install retention-uninstall retention-status retention-install-daily storage-ledger-capture storage-ledger-prune storage-ledger-install storage-ledger-uninstall storage-ledger-status memory-graph-quality memory-graph-quality-install memory-graph-quality-uninstall memory-graph-quality-status recall-quality recall-quality-refresh recall-quality-tuning open-core-boundary-audit weekly-lineage-rollup weekly-lineage-install weekly-lineage-uninstall weekly-lineage-status            docker-fs-watchdog-run docker-fs-watchdog-install docker-fs-watchdog-uninstall docker-fs-watchdog-status            storage-migrate-hot-bindings disk-clean-safe            mem-mode-show mem-mode-core mem-mode-balanced mem-mode-full mem-up-core mem-up-balanced mem-up-full observability-up observability-down launch-readiness-gate launch-readiness-gate-schedule launch-readiness-gate-schedule-status launch-readiness-gate-schedule-cancel paid-launch-checklist backup-restore-drill mem-up-release mem-up-lite-release release-lock-verify qdrant-cloud-check quickstart submission-preflight launch-lock launch-lock-public test-py bench-shortlist bench-qdrant-tuning bench-backend-lanes env-lock-check env-lock-apply sentrux-check sentrux-gate sentrux-gate-save agent-context-gate
 
 help:
 > echo "Targets:"
@@ -54,6 +54,8 @@ help:
 > echo "  storage-ledger-capture|storage-ledger-prune: append/prune metadata-only storage growth ledger"
 > echo "  storage-ledger-install|storage-ledger-status: install hourly ledger runner (launchd)"
 > echo "  memory-graph-quality*: score graph coverage and install bounded repair runner"
+> echo "  recall-quality*: run saved recall eval, terminal quality view, and tuning"
+> echo "  open-core-boundary-audit: verify lite/full/paid branch feature boundaries"
 > echo "  weekly-lineage-rollup: generate weekly per-project lineage + global synergy rollups"
 > echo "  weekly-lineage-install|weekly-lineage-status: install weekly lineage runner (launchd)"
 > echo "  qdrant-cutover: set QDRANT_COLLECTION and rehydrate vectors"
@@ -319,6 +321,21 @@ memory-graph-quality-uninstall:
 memory-graph-quality-status:
 > bash scripts/install_memory_graph_quality_runner.sh status
 
+recall-quality:
+> scripts/agent/recall-quality-eval --tuning --pretty
+
+recall-quality-refresh:
+> scripts/agent/recall-quality-eval --refresh-cases --tuning --pretty
+
+# .env is sourced on the same logical recipe line as curl; a separate recipe line may run in its own shell and lose the values.
+recall-quality-tuning:
+> if [ -f .env ]; then source .env >/dev/null 2>&1 || true; fi; \
+> base="$${CONTEXTLATTICE_ORCHESTRATOR_URL:-http://127.0.0.1:8075}"; key="$${CONTEXTLATTICE_ORCHESTRATOR_API_KEY:-}"; url="$${base%/}/telemetry/recall/tuning?min_samples=1"; \
+> if [ -n "$$key" ]; then curl -fsS -H "x-api-key: $$key" "$$url" | jq .; else curl -fsS "$$url" | jq .; fi
+
+open-core-boundary-audit:
+> scripts/agent/audit-open-core-boundary --pretty
+
 weekly-lineage-rollup:
 > scripts/context_storage_ops.sh weekly-lineage \
 >   --orchestrator-url "$${CONTEXTLATTICE_ORCHESTRATOR_URL:-http://127.0.0.1:8075}" \
diff --git a/contextlattice-dashboard/app/api/telemetry/recall/route.ts b/contextlattice-dashboard/app/api/telemetry/recall/route.ts
new file mode 100644
index 0000000..2e17ff8
--- /dev/null
+++ b/contextlattice-dashboard/app/api/telemetry/recall/route.ts
@@ -0,0 +1,16 @@
+import { NextResponse } from "next/server";
+import { callOrchestrator } from "@/lib/orchestrator";
+
+export async function GET(request: Request) {
+  // Forward only the allow-listed query parameters; empty or absent values are dropped.
+  const incoming = new URL(request.url).searchParams;
+  const forwarded = new URLSearchParams();
+  ["traffic_class"].forEach((name) => {
+    const raw = incoming.get(name);
+    if (raw) forwarded.set(name, raw);
+  });
+  const query = forwarded.toString();
+  const suffix = query ? `?${query}` : "";
+  const data = await callOrchestrator(`/telemetry/recall${suffix}`);
+  return NextResponse.json(data);
+}
diff --git a/contextlattice-dashboard/app/api/telemetry/recall/tuning/route.ts b/contextlattice-dashboard/app/api/telemetry/recall/tuning/route.ts
new file mode 100644
index 0000000..522c2d8
--- /dev/null
+++ b/contextlattice-dashboard/app/api/telemetry/recall/tuning/route.ts
@@ -0,0 +1,16 @@
+import { NextResponse } from "next/server";
+import { callOrchestrator } from "@/lib/orchestrator";
+
+export async function GET(request: Request) {
+  // Forward only the allow-listed query parameters; empty or absent values are dropped.
+  const incoming = new URL(request.url).searchParams;
+  const forwarded = new URLSearchParams();
+  ["lookback_hours", "min_samples", "max_samples"].forEach((name) => {
+    const raw = incoming.get(name);
+    if (raw) forwarded.set(name, raw);
+  });
+  const query = forwarded.toString();
+  const suffix = query ? `?${query}` : "";
+  const data = await callOrchestrator(`/telemetry/recall/tuning${suffix}`);
+  return NextResponse.json(data);
+}
diff --git a/contextlattice-dashboard/app/status/page.tsx b/contextlattice-dashboard/app/status/page.tsx
index f438f83..84cdca3 100644
--- a/contextlattice-dashboard/app/status/page.tsx
+++ b/contextlattice-dashboard/app/status/page.tsx
@@ -3,6 +3,7 @@
 import { useEffect, useState } from "react";
 import { RetrievalPanel } from "@/components/RetrievalPanel";
 import { MemoryGraphPanel, type MemoryGraphPayload } from "@/components/MemoryGraphPanel";
+import { RecallQualityPanel, type RecallQualityPayload, type RecallTuningPayload } from "@/components/RecallQualityPanel";
 
 type Service = {
   name: string;
@@ -63,18 +64,22 @@ export default function StatusPage() {
   const [topics, setTopics] = useState<TopicsPayload | null>(null);
   const [memoryTelemetry, setMemoryTelemetry] = useState<MemoryTelemetry | null>(null);
   const [memoryGraph, setMemoryGraph] = useState<MemoryGraphPayload | null>(null);
+  const [recallQuality, setRecallQuality] = useState<RecallQualityPayload | null>(null);
+  const [recallTuning, setRecallTuning] = useState<RecallTuningPayload | null>(null);
   const [error, setError] = useState<string | null>(null);
   const [updatedAt, setUpdatedAt] = useState<string | null>(null);
 
   async function loadStatus() {
     try {
       setError(null);
-      const [statusRes, prefRes, topicRes, memRes, graphRes] = await Promise.all([
+      const [statusRes, prefRes, topicRes, memRes, graphRes, recallRes, tuningRes] = await Promise.all([
         fetch("/api/memory/status", { cache: "no-store" }),
         fetch("/api/memory/preferences", { cache: "no-store" }),
         fetch("/api/memory/topics", { cache: "no-store" }),
         fetch("/api/telemetry/memory", { cache: "no-store" }),
         fetch("/api/telemetry/memory/graph", { cache: "no-store" }),
+        fetch("/api/telemetry/recall", { cache: "no-store" }),
+        fetch("/api/telemetry/recall/tuning", { cache: "no-store" }),
       ]);
       const statusData = await statusRes.json();
       if (!statusRes.ok) {
@@ -93,6 +98,12 @@ export default function StatusPage() {
       if (graphRes.ok) {
         setMemoryGraph(await graphRes.json());
       }
+      if (recallRes.ok) {
+        setRecallQuality(await recallRes.json());
+      }
+      if (tuningRes.ok) {
+        setRecallTuning(await tuningRes.json());
+      }
       setUpdatedAt(new Date().toLocaleTimeString());
     } catch (err: any) {
       setError(err?.message || "Status unavailable");
@@ -214,6 +225,8 @@ export default function StatusPage() {
 
       <MemoryGraphPanel graph={memoryGraph} />
 
+      <RecallQualityPanel recall={recallQuality} tuning={recallTuning} />
+
       <RetrievalPanel />
     </div>
   );
diff --git a/contextlattice-dashboard/components/RecallQualityPanel.tsx b/contextlattice-dashboard/components/RecallQualityPanel.tsx
new file mode 100644
index 0000000..ba6d33d
--- /dev/null
+++ b/contextlattice-dashboard/components/RecallQualityPanel.tsx
@@ -0,0 +1,195 @@
+"use client";
+
+type QualityTotals = { // Aggregate recall-quality numbers; every field is optional.
+  requests?: number;
+  timeouts?: number;
+  errors?: number;
+  sourceErrorRate?: number;
+  noHitRate?: number;
+  lowConfidenceRate?: number;
+  staleHitRate?: number;
+  recallAtK?: number | null; // rendered through percentText, i.e. multiplied by 100 for display
+  mrr?: number | null; // rendered with two decimals
+  numericExactness?: number | null;
+  citationCoverage?: number | null; // rendered through percentText
+  sourceDiversity?: number | null; // rendered with one decimal; a missing value displays as 0.0
+  graphLift?: number | null; // rendered through percentText; the bar scales it by 4 and caps at 1
+  evalP95Ms?: number | null; // rendered rounded with an "ms" suffix
+  lastEvalAt?: string | null; // passed to `new Date(...)` for the "Last eval" caption
+};
+
+export type RecallQualityPayload = { // Shape of the panel's `recall` prop; all fields optional.
+  updatedAt?: string;
+  trafficClass?: string;
+  quality?: {
+    status?: string; // shown as the badge text; the panel falls back to "unknown" when empty
+    totals?: QualityTotals;
+    sampleCount?: number;
+    recommendations?: string[]; // listed under "Recommended next action"
+  };
+  alerts?: {
+    count?: number;
+  };
+};
+
+export type RecallTuningPayload = { // Shape of the panel's optional `tuning` prop; all fields optional.
+  window?: {
+    samples?: number;
+    minSamples?: number;
+    sufficient?: boolean;
+  };
+  recommended?: {
+    quality?: {
+      graphExpansion?: {
+        enabled?: boolean; // when falsy the panel shows "off" instead of depth / neighborLimit
+        depth?: number;
+        neighborLimit?: number;
+      };
+      sourceOrder?: string[]; // the panel shows at most the first five entries
+      recommendations?: string[]; // appended after the recall payload's own recommendations
+    };
+  };
+};
+
+function numberValue(value: unknown): number {
+  return typeof value !== "number" || !Number.isFinite(value) ? 0 : value; // non-numeric or non-finite input becomes 0
+}
+
+function percentText(value: unknown): string {
+  // A fraction such as 0.91 renders as "91%"; non-numeric or non-finite input renders as "-".
+  return typeof value === "number" && Number.isFinite(value)
+    ? `${Math.round(value * 100)}%`
+    : "-";
+}
+
+function statusTone(status: string) { // maps a quality status string to the badge's colour classes
+  switch (status) {
+    case "repair_recommended": case "insufficient_cases":
+      return "bg-amber-500 text-amber-950";
+    case "watch": case "unknown":
+      return "bg-cyan-500 text-cyan-950";
+    default: return "bg-emerald-500 text-emerald-950";
+  }
+}
+
+function QualityBar({ value, tone = "good" }: { value: number; tone?: "good" | "warn" | "neutral" }) {
+  // `value` is treated as a fraction: scaled by 100 and clamped to 0-100 for the fill width.
+  const fillClass = { good: "bg-emerald-300", warn: "bg-amber-300", neutral: "bg-cyan-300" }[tone];
+  return (
+    <div className="h-2 w-full rounded bg-slate-800 overflow-hidden" aria-hidden="true">
+      <div className={`h-full ${fillClass}`} style={{ width: `${Math.max(0, Math.min(100, value * 100))}%` }} />
+    </div>
+  );
+}
+
+function Metric({ label, value, tone }: { label: string; value: string; tone?: "warn" | "good" }) {
+  // Tiles without a tone use the slate palette.
+  const toneClass = tone ? { warn: "text-amber-200 border-amber-500/70", good: "text-emerald-200 border-emerald-500/70" }[tone] : "text-slate-200 border-slate-600";
+  return (
+    <div className={`rounded border px-3 py-2 ${toneClass}`}>
+      <div className="text-xs uppercase tracking-wide text-slate-400">{label}</div>
+      <div className="text-lg font-semibold">{value}</div>
+    </div>
+  );
+}
+
+/** Status card for saved-eval recall metrics and tuning hints; shows a placeholder while `recall` is null. */
+export function RecallQualityPanel({
+  recall,
+  tuning,
+}: { recall: RecallQualityPayload | null; tuning?: RecallTuningPayload | null }) {
+  if (!recall) {
+    return (
+      <section className="card">
+        <h3 className="text-lg font-semibold">Recall quality</h3>
+        <p className="text-sm text-slate-400 mt-2">Recall telemetry unavailable.</p>
+      </section>
+    );
+  }
+
+  const totals = recall.quality?.totals ?? {};
+  const status = String(recall.quality?.status || "unknown");
+  const graphExpansion = tuning?.recommended?.quality?.graphExpansion;
+  // Sources and recommendations double as React keys below, so repeated entries are collapsed first.
+  const sourceOrder = Array.from(new Set(tuning?.recommended?.quality?.sourceOrder ?? []));
+  const recallAtK = typeof totals.recallAtK === "number" ? totals.recallAtK : 0;
+  const mrr = typeof totals.mrr === "number" ? totals.mrr : 0;
+  const mrrText = typeof totals.mrr === "number" ? mrr.toFixed(2) : "-"; // a reported 0 renders as "0.00", not "-"
+  const citationCoverage = typeof totals.citationCoverage === "number" ? totals.citationCoverage : 0;
+  const graphLift = typeof totals.graphLift === "number" ? totals.graphLift : 0;
+  const recommendations = Array.from(new Set([
+    ...(recall.quality?.recommendations ?? []),
+    ...(tuning?.recommended?.quality?.recommendations ?? []),
+  ])).slice(0, 4);
+
+  return (
+    <section className="card space-y-5">
+      <div className="flex flex-wrap items-start justify-between gap-3">
+        <div>
+          <h3 className="text-lg font-semibold">Recall quality</h3>
+          <p className="text-xs text-slate-500 mt-1">
+            {totals.lastEvalAt ? `Last eval ${new Date(totals.lastEvalAt).toLocaleTimeString()}` : "No saved eval sample yet"}
+          </p>
+        </div>
+        <span className={`text-xs px-2 py-1 rounded ${statusTone(status)}`}>{status}</span>
+      </div>
+
+      <div className="grid md:grid-cols-6 gap-3 text-sm">
+        <Metric label="Recall@K" value={percentText(totals.recallAtK)} tone={recallAtK >= 0.75 ? "good" : "warn"} />
+        <Metric label="MRR" value={mrrText} tone={mrr >= 0.55 ? "good" : "warn"} />
+        <Metric label="Citations" value={percentText(totals.citationCoverage)} tone={citationCoverage >= 0.9 ? "good" : "warn"} />
+        <Metric label="Graph lift" value={percentText(totals.graphLift)} tone={graphLift > 0 ? "good" : undefined} />
+        <Metric label="Diversity" value={numberValue(totals.sourceDiversity).toFixed(1)} />
+        <Metric label="Eval p95" value={totals.evalP95Ms ? `${Math.round(totals.evalP95Ms)} ms` : "-"} />
+      </div>
+
+      <div className="grid lg:grid-cols-[minmax(0,1fr)_18rem] gap-5">
+        <div className="space-y-3">
+          <div className="grid grid-cols-[5rem_minmax(0,1fr)_3.5rem] items-center gap-3 text-xs">
+            <span className="text-slate-400">recall</span>
+            <QualityBar value={recallAtK} tone={recallAtK >= 0.75 ? "good" : "warn"} />
+            <span className="text-right text-slate-300">{percentText(totals.recallAtK)}</span>
+          </div>
+          <div className="grid grid-cols-[5rem_minmax(0,1fr)_3.5rem] items-center gap-3 text-xs">
+            <span className="text-slate-400">mrr</span>
+            <QualityBar value={mrr} tone={mrr >= 0.55 ? "good" : "warn"} />
+            <span className="text-right text-slate-300">{mrrText}</span>
+          </div>
+          <div className="grid grid-cols-[5rem_minmax(0,1fr)_3.5rem] items-center gap-3 text-xs">
+            <span className="text-slate-400">graph</span>
+            <QualityBar value={Math.min(1, graphLift * 4)} tone={graphLift > 0 ? "neutral" : "good"} />
+            <span className="text-right text-slate-300">{percentText(totals.graphLift)}</span>
+          </div>
+        </div>
+
+        <div className="rounded border border-slate-700/70 p-3 text-xs text-slate-300">
+          <div className="font-semibold text-slate-100 mb-2">Tuning</div>
+          <div className="flex justify-between gap-3">
+            <span className="text-slate-500">Graph depth</span>
+            <span>{graphExpansion?.enabled ? `${graphExpansion.depth ?? 0} / ${graphExpansion.neighborLimit ?? 0}` : "off"}</span>
+          </div>
+          <div className="mt-2 text-slate-500">Sources</div>
+          <div className="mt-1 flex flex-wrap gap-1">
+            {sourceOrder.slice(0, 5).map((source) => (
+              <span key={source} className="rounded border border-slate-700 px-1.5 py-0.5 text-slate-300">
+                {source}
+              </span>
+            ))}
+            {!sourceOrder.length ? <span>-</span> : null}
+          </div>
+        </div>
+      </div>
+
+      {recommendations.length ? (
+        <div className="rounded border border-slate-700/70 p-3 text-xs text-slate-300">
+          <div className="font-semibold text-slate-100 mb-1">Recommended next action</div>
+          <ul className="space-y-1">
+            {recommendations.map((item) => (
+              <li key={item}>{item}</li>
+            ))}
+          </ul>
+        </div>
+      ) : null}
+    </section>
+  );
+}
diff --git a/contextlattice-dashboard/package.json b/contextlattice-dashboard/package.json
index 04465a2..9447a2d 100644
--- a/contextlattice-dashboard/package.json
+++ b/contextlattice-dashboard/package.json
@@ -14,7 +14,7 @@
     "billing:reconcile:coinbase": "TS_NODE_COMPILER_OPTIONS='{\"module\":\"commonjs\",\"jsx\":\"react-jsx\"}' node --require tsconfig-paths/register --require ts-node/register scripts/reconcile_coinbase.ts",
     "audit:export": "TS_NODE_COMPILER_OPTIONS='{\"module\":\"commonjs\",\"jsx\":\"react-jsx\"}' node --require tsconfig-paths/register --require ts-node/register scripts/export_audit_logs.ts",
     "audit:prune": "TS_NODE_COMPILER_OPTIONS='{\"module\":\"commonjs\",\"jsx\":\"react-jsx\"}' node --require tsconfig-paths/register --require ts-node/register scripts/prune_audit_logs.ts",
-    "test": "TS_NODE_COMPILER_OPTIONS='{\"module\":\"commonjs\",\"jsx\":\"react-jsx\"}' node --require tsconfig-paths/register --test --require ts-node/register tests/overrides-api.test.ts tests/overrides-panel.test.tsx tests/sidecar-health-api.test.ts tests/sidecar-health-panel.test.tsx tests/charts-panel.test.tsx tests/alerts-panel.test.tsx tests/strategy-panel.test.tsx"
+    "test": "TS_NODE_COMPILER_OPTIONS='{\"module\":\"commonjs\",\"jsx\":\"react-jsx\"}' node --require tsconfig-paths/register --test --require ts-node/register tests/overrides-api.test.ts tests/overrides-panel.test.tsx tests/sidecar-health-api.test.ts tests/sidecar-health-panel.test.tsx tests/charts-panel.test.tsx tests/alerts-panel.test.tsx tests/strategy-panel.test.tsx tests/recall-quality-panel.test.tsx"
   },
   "dependencies": {
     "@next-auth/prisma-adapter": "^1.0.7",
diff --git a/contextlattice-dashboard/tests/recall-quality-panel.test.tsx b/contextlattice-dashboard/tests/recall-quality-panel.test.tsx
new file mode 100644
index 0000000..6cd6a30
--- /dev/null
+++ b/contextlattice-dashboard/tests/recall-quality-panel.test.tsx
@@ -0,0 +1,41 @@
+import assert from "node:assert/strict";
+import test from "node:test";
+import React from "react";
+import { renderToStaticMarkup } from "react-dom/server";
+import { RecallQualityPanel } from "@/components/RecallQualityPanel";
+
+test("RecallQualityPanel renders quality metrics and tuning", () => { // renders to static markup and checks key fragments
+  const html = renderToStaticMarkup(
+    <RecallQualityPanel
+      recall={{
+        quality: {
+          status: "healthy",
+          totals: {
+            recallAtK: 0.91,
+            mrr: 0.78,
+            citationCoverage: 1,
+            sourceDiversity: 2.4,
+            graphLift: 0.12,
+            evalP95Ms: 184,
+            lastEvalAt: "2026-05-29T12:00:00Z",
+          },
+          recommendations: ["Recall quality telemetry is inside current production thresholds."],
+        },
+      }}
+      tuning={{
+        recommended: {
+          quality: {
+            graphExpansion: { enabled: true, depth: 1, neighborLimit: 12 },
+            sourceOrder: ["qdrant", "postgres_pgvector", "topic_rollups"],
+          },
+        },
+      }}
+    />,
+  );
+
+  assert.match(html, /Recall quality/); // panel heading
+  assert.match(html, /91%/); // recallAtK 0.91 shown as a percentage
+  assert.match(html, /Graph lift/); // metric tile label
+  assert.match(html, /qdrant/); // first entry of sourceOrder
+  assert.match(html, /1 \/ 12/); // graph expansion shown as "depth / neighborLimit"
+});
diff --git a/docs/runtime/recall-quality-loop.md b/docs/runtime/recall-quality-loop.md
new file mode 100644
index 0000000..95827a8
--- /dev/null
+++ b/docs/runtime/recall-quality-loop.md
@@ -0,0 +1,11 @@
+# Recall Quality Loop
+
+ContextLattice exposes a single recall quality contract across agent, terminal, and dashboard surfaces:
+
+- `POST /memory/recall/evaluate/saved` runs saved recall cases and emits recall@K, MRR, numeric exactness, citation coverage, source diversity, latency, and graph-neighbor contribution metrics.
+- `GET /telemetry/recall` reports the latest saved-eval sample beside source health.
+- `GET /telemetry/recall/tuning` recommends threshold tuning, source order, and first-hop graph expansion limits from recent monitor samples.
+- `scripts/agent/recall-quality-eval --tuning` gives a terminal quality view suitable for release gates and agent handoffs.
+- `scripts/agent/audit-open-core-boundary` checks that `origin/main`, `public/main`, and `public-paid/main` preserve the lite/full/paid feature boundary before sync.
+
+The graph contribution score is evidence-only at evaluation time: it measures whether first-hop memory edges would recover a missed expected file or term without changing retrieval ranking in the evaluator. Use a positive `graphLift` signal to justify enabling graph expansion in product-boundary context packaging.
diff --git a/scripts/agent/audit-open-core-boundary b/scripts/agent/audit-open-core-boundary
new file mode 100755
index 0000000..8dcb137
--- /dev/null
+++ b/scripts/agent/audit-open-core-boundary
@@ -0,0 +1,140 @@
+#!/usr/bin/env python3
+"""Audit lite/full/paid branch boundaries before public sync."""
+
+from __future__ import annotations
+
+import argparse
+import subprocess
+from dataclasses import dataclass
+from typing import Any
+
+from _common import emit
+
+
+DEFAULT_REFS = ["origin/main", "public/main", "public-paid/main"]
+
+CORE_RUST_PATHS = [
+    "crates/Cargo.toml",
+    "services/fastembed_sidecar_rs/Cargo.toml",
+    "services/fastembed_gate_rs/Cargo.toml",
+    "services/memory_bank_spike_rs/Cargo.toml",
+]
+
+PAID_RUST_PATHS = [
+    "services/spike_adapter_rs/Cargo.toml",
+]
+
+LITE_ENV_MARKERS = [
+    "ORCH_EMBED_PROVIDER",
+    "ORCH_RUST_RETRIEVAL_VECTOR_BACKEND",
+    "ORCH_RUST_RETRIEVAL_LEXICAL_BACKEND",
+    "ORCH_MEMORY_BANK_SPIKE_HTTP_URL",
+]
+
+
+@dataclass
+class Finding:
+    severity: str
+    ref: str
+    check: str
+    detail: str
+
+    def to_dict(self) -> dict[str, str]:
+        return {
+            "severity": self.severity,
+            "ref": self.ref,
+            "check": self.check,
+            "detail": self.detail,
+        }
+
+
+def git(*args: str, check: bool = False) -> subprocess.CompletedProcess[str]:
+    return subprocess.run(["git", *args], text=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE, check=check)
+
+
+def ref_exists(ref: str) -> bool:
+    return git("rev-parse", "--verify", "--quiet", ref).returncode == 0
+
+
+def path_exists(ref: str, path: str) -> bool:
+    return git("cat-file", "-e", f"{ref}:{path}").returncode == 0
+
+
+def read_path(ref: str, path: str) -> str:
+    proc = git("show", f"{ref}:{path}")
+    if proc.returncode != 0:
+        return ""
+    return proc.stdout
+
+
+def audit_ref(ref: str) -> list[Finding]:
+    findings: list[Finding] = []
+    if not ref_exists(ref):
+        return [Finding("error", ref, "ref_exists", "Git ref is missing or not fetched.")]
+
+    for path in CORE_RUST_PATHS:
+        if not path_exists(ref, path):
+            findings.append(Finding("error", ref, "core_rust_present", f"Missing public-safe Rust path: {path}"))
+
+    is_public = ref == "public/main"
+    is_paid_or_private = ref in {"origin/main", "public-paid/main"}
+    for path in PAID_RUST_PATHS:
+        exists = path_exists(ref, path)
+        if is_paid_or_private and not exists:
+            findings.append(Finding("error", ref, "paid_rust_present", f"Missing paid/private Rust path: {path}"))
+        if is_public and exists:
+            findings.append(Finding("warn", ref, "public_lite_boundary", f"Lite branch contains paid/private adapter path: {path}"))
+
+    for compose_path in ["docker-compose.yml", "docker-compose.lite.yml"]:
+        compose = read_path(ref, compose_path)
+        if not compose:
+            findings.append(Finding("error", ref, "compose_present", f"Missing {compose_path}"))
+            continue
+        if ref == "public/main":
+            for marker in LITE_ENV_MARKERS:
+                if marker not in compose:
+                    findings.append(Finding("error", ref, "lite_compose_markers", f"{compose_path} missing {marker}"))
+
+    package = read_path(ref, "README.md") + "\n" + read_path(ref, "docs/open-core-boundary.md")
+    if ref == "public/main" and "Spike" in package and "paid" not in package.lower():
+        findings.append(Finding("warn", ref, "lite_docs_boundary", "Lite docs mention Spike without a paid/full boundary note."))
+
+    return findings
+
+
+def summarize(refs: list[str], findings: list[Finding]) -> dict[str, Any]:
+    errors = [item for item in findings if item.severity == "error"]
+    warnings = [item for item in findings if item.severity == "warn"]
+    return {
+        "ok": not errors,
+        "refs": refs,
+        "summary": {
+            "errors": len(errors),
+            "warnings": len(warnings),
+            "findings": len(findings),
+        },
+        "findings": [item.to_dict() for item in findings],
+        "contract": {
+            "lite": "public/main keeps the public-safe Rust core, qdrant/pgvector-compatible compose markers, and excludes paid/private Spike adapter paths.",
+            "paid": "public-paid/main carries the full Rust adapter surface without private repository history.",
+            "private": "origin/main remains the development superset and source of release promotion.",
+        },
+    }
+
+
+def main() -> int:
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument("--refs", default=",".join(DEFAULT_REFS), help="Comma-separated refs to audit.")
+    parser.add_argument("--pretty", action="store_true")
+    args = parser.parse_args()
+    refs = [item.strip() for item in args.refs.split(",") if item.strip()]
+    findings: list[Finding] = []
+    for ref in refs:
+        findings.extend(audit_ref(ref))
+    payload = summarize(refs, findings)
+    emit(payload, pretty=args.pretty)
+    return 0 if payload["ok"] else 1
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/scripts/agent/recall-quality-eval b/scripts/agent/recall-quality-eval
new file mode 100755
index 0000000..5e7109f
--- /dev/null
+++ b/scripts/agent/recall-quality-eval
@@ -0,0 +1,147 @@
+#!/usr/bin/env python3
+"""Run saved recall evaluation and print a compact quality view."""
+
+from __future__ import annotations
+
+import argparse
+import urllib.parse
+from typing import Any
+
+from _common import emit, request_json
+
+
+def as_float(value: Any, default: float = 0.0) -> float:
+    try:
+        return float(value)
+    except (TypeError, ValueError):
+        return default
+
+
+def as_int(value: Any, default: int = 0) -> int:
+    try:
+        return int(value)
+    except (TypeError, ValueError):
+        return default
+
+
+def pct(value: Any) -> str:
+    return f"{round(as_float(value) * 100):3d}%"
+
+
+def bar(value: Any, width: int = 24) -> str:
+    ratio = max(0.0, min(1.0, as_float(value)))
+    filled = round(ratio * width)
+    return "[" + ("#" * filled) + ("-" * (width - filled)) + "]"
+
+
+def compact_eval(payload: dict[str, Any], tuning: dict[str, Any] | None) -> dict[str, Any]:
+    metrics = payload.get("metrics") if isinstance(payload.get("metrics"), dict) else {}
+    graph = metrics.get("graphContribution") if isinstance(metrics.get("graphContribution"), dict) else {}
+    quality = None
+    if tuning:
+        recommended = tuning.get("recommended") if isinstance(tuning.get("recommended"), dict) else {}
+        quality = recommended.get("quality") if isinstance(recommended.get("quality"), dict) else None
+    return {
+        "ok": bool(payload.get("ok", False)),
+        "passed": bool(payload.get("passed", False)),
+        "quality_status": payload.get("quality_status") or metrics.get("qualityStatus"),
+        "cases": {
+            "total": as_int(metrics.get("casesTotal")),
+            "evaluated": as_int(metrics.get("casesEvaluated")),
+        },
+        "recall": {
+            "k": as_int(metrics.get("k")),
+            "recallAtK": as_float(metrics.get("recallAtK")),
+            "mrr": as_float(metrics.get("mrr")),
+            "numericExactness": as_float(metrics.get("numericExactness")),
+            "citationCoverage": as_float(metrics.get("citationCoverage")),
+            "sourceDiversity": as_float(metrics.get("sourceDiversity")),
+        },
+        "graph": {
+            "lift": as_float(metrics.get("graphLift")),
+            "helpedCases": as_int(graph.get("helpedCases")),
+            "candidateCount": as_int(graph.get("candidateCount")),
+            "expectedHits": as_int(graph.get("expectedHitCount")),
+            "active": bool(graph.get("memoryGraphStoreActive", False)),
+        },
+        "latency": {
+            "avgMs": as_float(metrics.get("avgLatencyMs")),
+            "p95Ms": as_float(metrics.get("p95LatencyMs")),
+        },
+        "tuning": quality or {},
+        "recommendations": payload.get("recommendations") or [],
+    }
+
+
+def print_terminal(summary: dict[str, Any]) -> None:  # prints the human-readable view of a compact_eval summary
+    status = "PASS" if summary["passed"] else "FAIL"
+    print(f"recall-quality {status} status={summary.get('quality_status') or 'unknown'}")
+    recall = summary["recall"]
+    graph = summary["graph"]
+    latency = summary["latency"]
+    print(f"  recall@{recall['k']:<2} {bar(recall['recallAtK'])} {pct(recall['recallAtK'])}   mrr={as_float(recall['mrr']):.3f}")
+    print(f"  citations {bar(recall['citationCoverage'])} {pct(recall['citationCoverage'])}   diversity={as_float(recall['sourceDiversity']):.2f}")
+    print(
+        "  graph     "
+        f"{bar(min(1.0, as_float(graph['lift']) * 4.0))} {pct(graph['lift'])}   "  # bar shows lift x4, capped at 1.0
+        f"helped={graph['helpedCases']} candidates={graph['candidateCount']} expected={graph['expectedHits']}"
+    )
+    print(f"  latency   avg={as_float(latency['avgMs']):.1f}ms p95={as_float(latency['p95Ms']):.1f}ms")
+    tuning = summary.get("tuning") if isinstance(summary.get("tuning"), dict) else {}
+    graph_expansion = tuning.get("graphExpansion") if isinstance(tuning.get("graphExpansion"), dict) else {}
+    source_order = tuning.get("sourceOrder") if isinstance(tuning.get("sourceOrder"), list) else []
+    if graph_expansion or source_order:  # the tuning line is omitted when neither value is present
+        enabled = "on" if graph_expansion.get("enabled") else "off"
+        depth = as_int(graph_expansion.get("depth"))
+        limit = as_int(graph_expansion.get("neighborLimit"))
+        print(f"  tuning    graph={enabled} depth={depth} limit={limit} sources={','.join(map(str, source_order[:5])) or '-'}")
+    for item in (summary.get("recommendations") or [])[:3]:  # at most three recommendations are printed
+        print(f"  - {item}")
+
+
+def main() -> int:
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument("--k", type=int, default=None, help="Override saved eval K.")
+    parser.add_argument("--timeout", type=float, default=240.0)
+    parser.add_argument("--include-debug", action="store_true")
+    parser.add_argument("--include-preferences", action="store_true")
+    parser.add_argument("--refresh-cases", action="store_true")
+    parser.add_argument("--max-cases", type=int, default=12)
+    parser.add_argument("--min-hits", type=int, default=1)
+    parser.add_argument("--project", default="")
+    parser.add_argument("--topic-prefix", default="")
+    parser.add_argument("--tuning", action="store_true", help="Fetch recall tuning recommendations after eval.")
+    parser.add_argument("--pretty", action="store_true")
+    parser.add_argument("--json", action="store_true", help="Emit compact JSON instead of terminal view.")
+    args = parser.parse_args()
+
+    refresh_payload = {
+        "max_cases": args.max_cases,
+        "min_hits": args.min_hits,
+        "project": args.project,
+        "topic_prefix": args.topic_prefix,
+    }
+    if args.refresh_cases:
+        request_json("POST", "/memory/recall/eval-cases/refresh", refresh_payload, args.timeout)
+
+    payload: dict[str, Any] = {
+        "include_retrieval_debug": args.include_debug,
+        "include_preferences": args.include_preferences,
+    }
+    if args.k is not None:
+        payload["k"] = args.k
+    evaluation = request_json("POST", "/memory/recall/evaluate/saved", payload, args.timeout)
+    tuning = None
+    if args.tuning:
+        query = urllib.parse.urlencode({"max_samples": "96", "min_samples": "1"})
+        tuning = request_json("GET", f"/telemetry/recall/tuning?{query}", None, args.timeout)
+    summary = compact_eval(evaluation, tuning)
+    if args.json or args.pretty:
+        emit(summary, pretty=args.pretty)
+    else:
+        print_terminal(summary)
+    return 0 if summary["passed"] else 1
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/services/gateway-go/main_test.go b/services/gateway-go/main_test.go
index 1e19b56..9de936b 100644
--- a/services/gateway-go/main_test.go
+++ b/services/gateway-go/main_test.go
@@ -2,6 +2,7 @@ package main
 
 import (
 	"bufio"
+	"context"
 	"encoding/json"
 	"io"
 	"net/http"
@@ -603,6 +604,7 @@ func TestProxyForwardsMemorySearchRequest(t *testing.T) {
 
 func TestMemorySearchUsesGoStagedRetrieval(t *testing.T) {
 	t.Setenv("GO_RETRIEVAL_STAGED_ENABLED", "true")
+	t.Setenv("GO_RETRIEVAL_NATIVE_QDRANT_ENABLED", "false")
 	t.Setenv("ORCH_RETRIEVAL_SOURCES", "qdrant")
 	t.Setenv("ORCH_RETRIEVAL_FAST_SOURCES", "qdrant")
 	t.Setenv("ORCH_RETRIEVAL_SLOW_SOURCES", "")
@@ -998,11 +1000,13 @@ func TestMemorySearchInjectsConfiguredAPIKeyWhenMissing(t *testing.T) {
 
 func TestMemoryRecallEvaluateSavedIsGoNative(t *testing.T) {
 	t.Setenv("GO_RETRIEVAL_STAGED_ENABLED", "true")
+	t.Setenv("GO_RETRIEVAL_NATIVE_QDRANT_ENABLED", "false")
 	t.Setenv("ORCH_RETRIEVAL_SOURCES", "qdrant")
 	t.Setenv("ORCH_RETRIEVAL_FAST_SOURCES", "qdrant")
 	t.Setenv("ORCH_RETRIEVAL_SLOW_SOURCES", "")
 
 	recallCasesPath := filepath.Join(t.TempDir(), "recall_eval_cases.json")
+	recallMonitorPath := filepath.Join(t.TempDir(), "recall_monitor.ndjson")
 	if err := os.WriteFile(
 		recallCasesPath,
 		[]byte(`{
@@ -1025,6 +1029,7 @@ func TestMemoryRecallEvaluateSavedIsGoNative(t *testing.T) {
 		t.Fatalf("write saved recall eval config: %v", err)
 	}
 	t.Setenv("ORCH_RECALL_EVAL_CASES_PATH", recallCasesPath)
+	t.Setenv("RECALL_MONITOR_PATH", recallMonitorPath)
 
 	var capturedPath string
 	backend := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
@@ -1071,11 +1076,156 @@ func TestMemoryRecallEvaluateSavedIsGoNative(t *testing.T) {
 	if anyToInt(metrics["casesEvaluated"], 0) != 1 {
 		t.Fatalf("expected one evaluated case, got %#v", metrics)
 	}
+	if anyToFloat64(metrics["citationCoverage"], 0) != 1 {
+		t.Fatalf("expected citation coverage default 1.0, got %#v", metrics)
+	}
+	if anyToFloat64(metrics["sourceDiversity"], 0) != 1 {
+		t.Fatalf("expected one source in diversity metric, got %#v", metrics)
+	}
+	if anyToFloat64(metrics["p95LatencyMs"], -1) < 0 {
+		t.Fatalf("expected p95 latency metric, got %#v", metrics)
+	}
+	graphContribution, _ := metrics["graphContribution"].(map[string]any)
+	if anyToBool(graphContribution["memoryGraphStoreActive"]) {
+		t.Fatalf("expected disabled graph store in native route smoke, got %#v", graphContribution)
+	}
+	cases, _ := payload["cases"].([]any)
+	if len(cases) != 1 {
+		t.Fatalf("expected one case report, got %#v", payload["cases"])
+	}
+	caseReport, _ := cases[0].(map[string]any)
+	if _, ok := caseReport["graph_contribution"].(map[string]any); !ok {
+		t.Fatalf("expected case graph contribution, got %#v", caseReport)
+	}
+	monitorRaw, err := os.ReadFile(recallMonitorPath)
+	if err != nil {
+		t.Fatalf("expected recall monitor sample: %v", err)
+	}
+	if !strings.Contains(string(monitorRaw), `"recallAtK"`) {
+		t.Fatalf("expected recall monitor sample to include eval metrics, got %s", string(monitorRaw))
+	}
 	if capturedPath != "/v1/retrieval/query" {
 		t.Fatalf("expected go-native route to call retrieval query path, got %s", capturedPath)
 	}
 }
 
+// TestMemoryRecallEvaluateSavedScoresGraphContribution verifies that a saved case missed by top-k retrieval is credited to a seeded memory edge.
+func TestMemoryRecallEvaluateSavedScoresGraphContribution(t *testing.T) {
+	t.Setenv("BACKEND_URL", "http://127.0.0.1:1") // placeholder; overwritten with the stub backend URL before newServer()
+	t.Setenv("GATEWAY_PROXY_TIMEOUT_SECS", "2")
+	t.Setenv("GO_TELEMETRY_SINK_ENABLED", "false")
+	t.Setenv("GO_RUNTIME_STRICT_NO_PYTHON", "false")
+	t.Setenv("GO_RETRIEVAL_CONTINUATION_DURABLE_ENABLED", "false")
+	t.Setenv("GO_RETRIEVAL_STAGED_ENABLED", "true")
+	t.Setenv("GO_RETRIEVAL_NATIVE_QDRANT_ENABLED", "false")
+	t.Setenv("ORCH_RETRIEVAL_SOURCES", "qdrant")
+	t.Setenv("ORCH_RETRIEVAL_FAST_SOURCES", "qdrant")
+	t.Setenv("ORCH_RETRIEVAL_SLOW_SOURCES", "")
+	t.Setenv("GO_MEMORY_STORE_ENABLED", "true")
+	root := t.TempDir()
+	t.Setenv("GO_MEMORY_STORE_ROOT", root)
+	t.Setenv("GO_MEMORY_STORE_HISTORY_PATH", filepath.Join(root, "_contextlattice", "memory_write_history.ndjson"))
+	t.Setenv("GO_MEMORY_STORE_ACCESS_LOG_PATH", filepath.Join(root, "_contextlattice", "memory_access_log.ndjson"))
+	t.Setenv("GO_MEMORY_STORE_CONTENT_BLOBS_PATH", filepath.Join(root, "_contextlattice", "objects"))
+	t.Setenv("GO_MEMORY_GRAPH_EDGE_PATH", filepath.Join(root, "_contextlattice", "memory_edges.ndjson"))
+	t.Setenv("RECALL_MONITOR_PATH", filepath.Join(root, "_contextlattice", "recall_monitor.ndjson"))
+	t.Setenv("CONTEXTLATTICE_ORCHESTRATOR_API_KEY", "")
+
+	recallCasesPath := filepath.Join(t.TempDir(), "recall_eval_cases.json")
+	if err := os.WriteFile(recallCasesPath, []byte(`{
+  "version": 1,
+  "updatedAt": "2026-04-28T00:00:00Z",
+  "k": 3,
+  "gate": {"minRecallAtK": 0.0, "minMrr": 0.0, "minNumericExactness": 0.0},
+  "cases": [
+    {
+      "id": "graph-lift",
+      "query": "target by neighbor",
+      "limit": 3,
+      "project": "alpha",
+      "sources": ["qdrant"],
+      "expected_files": ["notes/target.md"]
+    }
+  ]
+}`), 0o644); err != nil {
+		t.Fatalf("write saved recall eval config: %v", err)
+	}
+	t.Setenv("ORCH_RECALL_EVAL_CASES_PATH", recallCasesPath)
+
+	backend := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		w.Header().Set("Content-Type", "application/json")
+		if r.URL.Path != "/v1/retrieval/query" {
+			_, _ = w.Write([]byte(`{"ok":true}`))
+			return
+		}
+		_, _ = w.Write([]byte(`{"results":[{"project":"alpha","file":"notes/seed.md","memory_id":"alpha::notes/seed.md","summary":"seed only","source":"qdrant","score":0.91}],"warnings":[]}`))
+	}))
+	defer backend.Close()
+	t.Setenv("BACKEND_URL", backend.URL)
+
+	s := newServer()
+	if s.memoryStore == nil || !s.memoryStore.policy.enabled {
+		t.Fatalf("expected enabled memory store")
+	}
+	for _, item := range []normalizedWrite{
+		{project: "alpha", fileName: "notes/seed.md", content: "seed memory", topicPath: "recall/graph"},
+		{project: "alpha", fileName: "notes/target.md", content: "target memory", topicPath: "recall/graph"},
+	} {
+		if _, _, err := s.memoryStore.put(item); err != nil {
+			t.Fatalf("seed memory store: %v", err)
+		}
+	}
+	if _, err := s.memoryStore.upsertMemoryEdge(context.Background(), memoryEdgeEntry{
+		SourceID:   "alpha::notes/seed.md",
+		TargetID:   "alpha::notes/target.md",
+		Relation:   "inferred_related",
+		Project:    "alpha",
+		TopicPath:  "recall/graph",
+		Confidence: 0.92,
+		CreatedAt:  nowUTCISO(),
+		Source:     memoryEdgeSource,
+	}); err != nil {
+		t.Fatalf("seed memory edge: %v", err)
+	}
+
+	gateway := httptest.NewServer(buildMux(s))
+	defer gateway.Close()
+
+	resp, err := http.Post(gateway.URL+"/memory/recall/evaluate/saved", "application/json", strings.NewReader(`{"include_retrieval_debug":true}`))
+	if err != nil {
+		t.Fatalf("request failed: %v", err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusOK {
+		body, _ := io.ReadAll(resp.Body)
+		t.Fatalf("expected 200, got %d body=%s", resp.StatusCode, string(body))
+	}
+	var payload map[string]any
+	if err := json.NewDecoder(resp.Body).Decode(&payload); err != nil {
+		t.Fatalf("decode response payload: %v", err)
+	}
+	metrics, _ := payload["metrics"].(map[string]any)
+	if anyToFloat64(metrics["recallAtK"], -1) != 0 {
+		t.Fatalf("expected top-k miss before graph expansion, got %#v", metrics)
+	}
+	if anyToFloat64(metrics["graphLift"], 0) != 1 {
+		t.Fatalf("expected graph lift to recover the case, got metrics=%#v cases=%#v", metrics, payload["cases"])
+	}
+	graphContribution, _ := metrics["graphContribution"].(map[string]any)
+	if anyToInt(graphContribution["helpedCases"], 0) != 1 {
+		t.Fatalf("expected one helped graph case, got %#v", graphContribution)
+	}
+	cases, _ := payload["cases"].([]any)
+	if len(cases) != 1 { // guard the index below so a missing report fails the test instead of panicking
+		t.Fatalf("expected one case report, got %#v", payload["cases"])
+	}
+	caseReport, _ := cases[0].(map[string]any)
+	caseGraph, _ := caseReport["graph_contribution"].(map[string]any)
+	if !anyToBool(caseGraph["helped"]) || anyToInt(caseGraph["added_expected_hit_count"], 0) != 1 {
+		t.Fatalf("expected per-case graph contribution, got %#v", caseGraph)
+	}
+}
+
 func TestMemorySearchAcceptsQueryParamAPIKey(t *testing.T) {
 	t.Setenv("GO_RETRIEVAL_STAGED_ENABLED", "true")
 	t.Setenv("ORCH_RETRIEVAL_SOURCES", "qdrant")
diff --git a/services/gateway-go/memory_recall_eval_saved_native.go b/services/gateway-go/memory_recall_eval_saved_native.go
index 5eef661..3ce726b 100644
--- a/services/gateway-go/memory_recall_eval_saved_native.go
+++ b/services/gateway-go/memory_recall_eval_saved_native.go
@@ -7,8 +7,10 @@ import (
 	"net/http"
 	"os"
 	"path/filepath"
+	"sort"
 	"strconv"
 	"strings"
+	"time"
 )
 
 const (
@@ -88,11 +90,25 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 	includePreferences := anyToBool(payload["include_preferences"])
 	userID := strings.TrimSpace(anyToString(payload["user_id"]))
 
+	evaluationStartedAt := time.Now()
 	recallHits := 0
 	reciprocalRankSum := 0.0
 	evaluatedCases := 0
 	numericExpectedTotal := 0
 	numericMatchedTotal := 0
+	citationExpectedTotal := 0
+	citationMatchedTotal := 0
+	noHitCases := 0
+	lowConfidenceCases := 0
+	sourceDiversitySum := 0.0
+	latencyValues := make([]float64, 0, len(cfg.Cases))
+	graphEvaluatedCases := 0
+	graphSeedCount := 0
+	graphCandidateCount := 0
+	graphAddedCandidateCount := 0
+	graphExpectedHitCount := 0
+	graphAddedExpectedHitCount := 0
+	graphHelpedCases := 0
 	caseReports := make([]map[string]any, 0, len(cfg.Cases))
 
 	for idx, rawCase := range cfg.Cases {
@@ -116,6 +132,11 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 				"expected_substrings": []string{},
 				"expected_numeric":    []string{},
 				"matched_numeric":     []string{},
+				"matched_files":       []string{},
+				"citation_coverage":   0.0,
+				"source_diversity":    0,
+				"latency_ms":          0.0,
+				"graph_contribution":  recallGraphContributionUnavailable("case query missing"),
 				"warnings":            []string{"case query missing"},
 				"retrieval_mode":      normalizeRetrievalMode(anyToString(rawCase["retrieval_mode"])),
 				"agent_id":            strings.TrimSpace(anyToString(rawCase["agent_id"])),
@@ -148,12 +169,15 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 			reqPayload["retrieval_intent"] = "decision"
 		}
 
+		caseStartedAt := time.Now()
 		searchResp, status, execErr := s.executeRetrieval(
 			context.Background(),
 			incomingHeaders,
 			reqPayload,
 			true,
 		)
+		latencyMs := float64(time.Since(caseStartedAt).Microseconds()) / 1000.0
+		latencyValues = append(latencyValues, latencyMs)
 		if execErr != nil {
 			caseReports = append(caseReports, map[string]any{
 				"id":                  caseID,
@@ -169,6 +193,11 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 				"expected_substrings": []string{},
 				"expected_numeric":    []string{},
 				"matched_numeric":     []string{},
+				"matched_files":       []string{},
+				"citation_coverage":   0.0,
+				"source_diversity":    0,
+				"latency_ms":          roundFloat(latencyMs, 3),
+				"graph_contribution":  recallGraphContributionUnavailable("retrieval failed"),
 				"warnings":            []string{"retrieval failed: " + execErr.Error()},
 				"retrieval_mode":      reqPayload["retrieval_mode"],
 				"agent_id":            reqPayload["agent_id"],
@@ -182,6 +211,20 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 		expectedFiles := normalizeExpectedFileTokens(rawCase["expected_files"])
 		expectedTerms := normalizeExpectedTerms(rawCase["expected_substrings"])
 		expectedNumeric := normalizeExpectedNumeric(rawCase["expected_numeric"])
+		matchedFiles := matchedExpectedFilesWithinK(results, expectedFiles, k)
+		caseCitationCoverage := 1.0
+		if len(expectedFiles) > 0 {
+			caseCitationCoverage = float64(len(matchedFiles)) / float64(len(expectedFiles))
+		}
+		caseSources := uniqueSourcesWithinK(results, k)
+		graphContribution := s.evaluateRecallGraphContribution(
+			context.Background(),
+			results,
+			expectedFiles,
+			expectedTerms,
+			k,
+			strings.TrimSpace(anyToString(reqPayload["project"])),
+		)
 
 		matchedRank := matchRankWithinK(results, expectedFiles, expectedTerms, k)
 		hit := matchedRank != nil
@@ -195,11 +238,28 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 			evaluatedCases += 1
 			if hit {
 				recallHits += 1
+			} else {
+				noHitCases += 1
 			}
 			reciprocalRankSum += reciprocalRank
+			if topResultScore(results) > 0 && topResultScore(results) < 0.45 {
+				lowConfidenceCases += 1
+			}
+			sourceDiversitySum += float64(len(caseSources))
+			graphEvaluatedCases += 1
+			graphSeedCount += anyToInt(graphContribution["seed_count"], 0)
+			graphCandidateCount += anyToInt(graphContribution["candidate_count"], 0)
+			graphAddedCandidateCount += anyToInt(graphContribution["added_candidate_count"], 0)
+			graphExpectedHitCount += anyToInt(graphContribution["expected_hit_count"], 0)
+			graphAddedExpectedHitCount += anyToInt(graphContribution["added_expected_hit_count"], 0)
+			if !hit && anyToBool(graphContribution["helped"]) {
+				graphHelpedCases += 1
+			}
 		}
 		numericExpectedTotal += len(expectedNumeric)
 		numericMatchedTotal += len(numericMatches)
+		citationExpectedTotal += len(expectedFiles)
+		citationMatchedTotal += len(matchedFiles)
 
 		report := map[string]any{
 			"id":                        caseID,
@@ -215,6 +275,12 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 			"expected_substrings":       expectedTerms,
 			"expected_numeric":          expectedNumeric,
 			"matched_numeric":           numericMatches,
+			"matched_files":             matchedFiles,
+			"citation_coverage":         roundFloat(caseCitationCoverage, 6),
+			"source_diversity":          len(caseSources),
+			"sources":                   caseSources,
+			"latency_ms":                roundFloat(latencyMs, 3),
+			"graph_contribution":        graphContribution,
 			"warnings":                  parseWarnings(searchResp["warnings"]),
 			"retrieval_mode":            searchResp["retrieval_mode"],
 			"agent_id":                  searchResp["agent_id"],
@@ -239,21 +305,95 @@ func (s *server) memoryRecallEvaluateSavedNative(w http.ResponseWriter, r *http.
 	if numericExpectedTotal > 0 {
 		numericExactness = float64(numericMatchedTotal) / float64(numericExpectedTotal)
 	}
+	citationCoverage := 1.0
+	if citationExpectedTotal > 0 {
+		citationCoverage = float64(citationMatchedTotal) / float64(citationExpectedTotal)
+	}
+	avgSourceDiversity := 0.0
+	noHitRate := 0.0
+	lowConfidenceRate := 0.0
+	graphLift := 0.0
+	if evaluatedCases > 0 {
+		avgSourceDiversity = sourceDiversitySum / float64(evaluatedCases)
+		noHitRate = float64(noHitCases) / float64(evaluatedCases)
+		lowConfidenceRate = float64(lowConfidenceCases) / float64(evaluatedCases)
+		graphLift = float64(graphHelpedCases) / float64(evaluatedCases)
+	}
+	avgLatencyMs, p95LatencyMs := recallLatencyStats(latencyValues)
 	passed := evaluatedCases > 0 && recallAtK >= gate.MinRecallAtK && mrr >= gate.MinMRR && numericExactness >= gate.MinNumericExactly
+	qualityStatus := recallEvalQualityStatus(passed, evaluatedCases, recallAtK, mrr, numericExactness)
+	metrics := map[string]any{
+		"k":                      k,
+		"casesTotal":             len(cfg.Cases),
+		"casesEvaluated":         evaluatedCases,
+		"recallAtK":              roundFloat(recallAtK, 6),
+		"mrr":                    roundFloat(mrr, 6),
+		"numericExactness":       roundFloat(numericExactness, 6),
+		"numericExpected":        numericExpectedTotal,
+		"numericMatched":         numericMatchedTotal,
+		"citationCoverage":       roundFloat(citationCoverage, 6),
+		"citationExpected":       citationExpectedTotal,
+		"citationMatched":        citationMatchedTotal,
+		"noHitRate":              roundFloat(noHitRate, 6),
+		"lowConfidenceRate":      roundFloat(lowConfidenceRate, 6),
+		"sourceDiversity":        roundFloat(avgSourceDiversity, 3),
+		"avgLatencyMs":           roundFloat(avgLatencyMs, 3),
+		"p95LatencyMs":           roundFloat(p95LatencyMs, 3),
+		"durationMs":             roundFloat(float64(time.Since(evaluationStartedAt).Microseconds())/1000.0, 3),
+		"qualityStatus":          qualityStatus,
+		"graphEvaluatedCases":    graphEvaluatedCases,
+		"graphSeedCount":         graphSeedCount,
+		"graphCandidateCount":    graphCandidateCount,
+		"graphAddedCandidates":   graphAddedCandidateCount,
+		"graphExpectedHits":      graphExpectedHitCount,
+		"graphAddedExpectedHits": graphAddedExpectedHitCount,
+		"graphHelpedCases":       graphHelpedCases,
+		"graphLift":              roundFloat(graphLift, 6),
+		"graphContribution": map[string]any{
+			"evaluatedCases":         graphEvaluatedCases,
+			"seedCount":              graphSeedCount,
+			"candidateCount":         graphCandidateCount,
+			"addedCandidateCount":    graphAddedCandidateCount,
+			"expectedHitCount":       graphExpectedHitCount,
+			"addedExpectedHitCount":  graphAddedExpectedHitCount,
+			"helpedCases":            graphHelpedCases,
+			"lift":                   roundFloat(graphLift, 6),
+			"neighborLimitPerSeed":   recallEvalGraphNeighborLimit(),
+			"memoryGraphStoreActive": s.memoryGraphBackend() != nil,
+		},
+	}
+	recommendations := recallEvalRecommendations(metrics, gate, passed)
+	_ = s.appendRecallMonitorSample(map[string]any{
+		"timestamp":             nowUTCISO(),
+		"source":                "saved_recall_eval",
+		"passed":                passed,
+		"qualityStatus":         qualityStatus,
+		"caseCount":             len(cfg.Cases),
+		"evaluatedCases":        evaluatedCases,
+		"k":                     k,
+		"recallAtK":             roundFloat(recallAtK, 6),
+		"mrr":                   roundFloat(mrr, 6),
+		"numericExactness":      roundFloat(numericExactness, 6),
+		"citationCoverage":      roundFloat(citationCoverage, 6),
+		"noHitRate":             roundFloat(noHitRate, 6),
+		"lowConfidenceRate":     roundFloat(lowConfidenceRate, 6),
+		"staleHitRate":          0.0,
+		"maxSourceErrorRate":    0.0,
+		"sourceDiversity":       roundFloat(avgSourceDiversity, 3),
+		"graphLift":             roundFloat(graphLift, 6),
+		"graphExpectedHitCount": graphExpectedHitCount,
+		"graphHelpedCases":      graphHelpedCases,
+		"avgLatencyMs":          roundFloat(avgLatencyMs, 3),
+		"evalP95Ms":             roundFloat(p95LatencyMs, 3),
+		"retrievalAlertCount":   0,
+	})
 
 	writeJSON(w, http.StatusOK, map[string]any{
-		"ok":     true,
-		"passed": passed,
-		"metrics": map[string]any{
-			"k":                k,
-			"casesTotal":       len(cfg.Cases),
-			"casesEvaluated":   evaluatedCases,
-			"recallAtK":        roundFloat(recallAtK, 6),
-			"mrr":              roundFloat(mrr, 6),
-			"numericExactness": roundFloat(numericExactness, 6),
-			"numericExpected":  numericExpectedTotal,
-			"numericMatched":   numericMatchedTotal,
-		},
+		"ok":              true,
+		"passed":          passed,
+		"quality_status":  qualityStatus,
+		"metrics":         metrics,
+		"recommendations": recommendations,
 		"gate": map[string]any{
 			"minRecallAtK":        gate.MinRecallAtK,
 			"minMrr":              gate.MinMRR,
@@ -360,6 +500,32 @@ func resolveRecallEvalCasesPath() string {
 	return candidates[0]
 }
 
+// appendRecallMonitorSample appends sample as one NDJSON line to the recall monitor file; it returns the first marshal, mkdir, open, write, or close error.
+func (s *server) appendRecallMonitorSample(sample map[string]any) (err error) {
+	path := resolveStoragePath("RECALL_MONITOR_PATH", filepath.Join("services", "orchestrator", "data", "recall_monitor.ndjson"))
+	if strings.TrimSpace(path) == "" {
+		return nil // a blank resolved path means there is nowhere to write; treated as success
+	}
+	raw, err := json.Marshal(sample) // encode first so an unencodable sample never creates directories or files
+	if err != nil {
+		return err
+	}
+	if err = os.MkdirAll(filepath.Dir(path), 0o755); err != nil {
+		return err
+	}
+	file, err := os.OpenFile(path, os.O_APPEND|os.O_CREATE|os.O_WRONLY, 0o644)
+	if err != nil {
+		return err
+	}
+	defer func() {
+		if closeErr := file.Close(); err == nil {
+			err = closeErr // a failed close can mean the sample never reached disk
+		}
+	}()
+	_, err = file.Write(append(raw, '\n'))
+	return err
+}
+
 func normalizeExpectedFileTokens(raw any) map[string]struct{} {
 	out := map[string]struct{}{}
 	for _, item := range anyToStringSlice(raw) {
@@ -455,6 +621,296 @@ func resultHitsExpectations(row map[string]any, expectedFiles map[string]struct{
 	return false
 }
 
+// matchedExpectedFilesWithinK returns, via sortedKeys, the expected file tokens matched by
+// the leading results. Only the first clampInt(k, 1, 100) rows are inspected; a row matches
+// a token when its lower-cased, slash-trimmed "file" value ends with that token.
+func matchedExpectedFilesWithinK(results []map[string]any, expectedFiles map[string]struct{}, k int) []string {
+	if len(expectedFiles) == 0 {
+		return []string{}
+	}
+	found := make(map[string]struct{}, len(expectedFiles))
+	cutoff := clampInt(k, 1, 100)
+	for rank := 0; rank < len(results) && rank < cutoff; rank++ {
+		name := strings.Trim(strings.TrimSpace(strings.ToLower(anyToString(results[rank]["file"]))), "/")
+		if name == "" {
+			continue
+		}
+		for token := range expectedFiles {
+			if strings.HasSuffix(name, token) { // a suffix test also accepts an exact match
+				found[token] = struct{}{}
+			}
+		}
+	}
+	return sortedKeys(found)
+}
+
+// uniqueSourcesWithinK returns, via sortedKeys, the distinct source labels that
+// sourcesForRecallResult reports for the first clampInt(k, 1, 100) results.
+func uniqueSourcesWithinK(results []map[string]any, k int) []string {
+	labels := map[string]struct{}{}
+	cutoff := clampInt(k, 1, 100)
+	// Stop at whichever comes first: the end of results or the rank cutoff.
+	for rank := 0; rank < len(results) && rank < cutoff; rank++ {
+		for _, label := range sourcesForRecallResult(results[rank]) {
+			labels[label] = struct{}{}
+		}
+	}
+	return sortedKeys(labels)
+}
+
+// sourcesForRecallResult collects the source labels attached to one result row: every
+// entry of row["sources"] plus the row["source"] and row["retrieval_source"] values.
+// Labels are lower-cased and trimmed, blanks are dropped, and the distinct set is
+// returned via sortedKeys.
+func sourcesForRecallResult(row map[string]any) []string {
+	// Copy before appending so the slice handed back by anyToStringSlice is left untouched.
+	raw := append([]string{}, anyToStringSlice(row["sources"])...)
+	raw = append(raw, anyToString(row["source"]), anyToString(row["retrieval_source"]))
+	labels := make(map[string]struct{}, len(raw))
+	for _, value := range raw {
+		if label := strings.TrimSpace(strings.ToLower(value)); label != "" {
+			labels[label] = struct{}{}
+		}
+	}
+	return sortedKeys(labels)
+}
+
+// recallResultMemoryID derives a memory id for a result row. It prefers row["memory_id"], then
+// "<project>::<file>", each in canonicalMemoryID form when that succeeds; otherwise row["id"].
+func recallResultMemoryID(row map[string]any) string {
+	candidate := strings.TrimSpace(anyToString(row["memory_id"]))
+	if candidate == "" {
+		project := strings.TrimSpace(anyToString(row["project"]))
+		fileName := strings.TrimSpace(anyToString(row["file"]))
+		if project == "" || fileName == "" {
+			return strings.TrimSpace(anyToString(row["id"]))
+		}
+		candidate = project + "::" + fileName
+	}
+	if _, _, canonical, _, err := canonicalMemoryID(candidate); err == nil {
+		return canonical
+	}
+	return candidate // canonicalization failed: fall back to the raw id
+}
+
+// recallEvalGraphNeighborLimit reads ORCH_RECALL_EVAL_GRAPH_NEIGHBOR_LIMIT through envInt
+// (fallback argument 40) and passes the value through clampInt with bounds 1 and 200.
+func recallEvalGraphNeighborLimit() int { return clampInt(envInt("ORCH_RECALL_EVAL_GRAPH_NEIGHBOR_LIMIT", 40), 1, 200) }
+
+// recallGraphContributionUnavailable builds the graph-contribution report used when no graph
+// evaluation ran: "enabled" and "helped" are false, every counter is 0, "relations" is empty,
+// and "reason" records why.
+func recallGraphContributionUnavailable(reason string) map[string]any {
+	report := map[string]any{"enabled": false, "reason": reason, "helped": false, "relations": []string{}}
+	for _, counter := range []string{
+		"seed_count", "candidate_count", "added_candidate_count",
+		"expected_hit_count", "added_expected_hit_count",
+	} {
+		report[counter] = 0
+	}
+	return report
+}
+
+func (s *server) evaluateRecallGraphContribution( // reports which expected hits are reachable through memory edges of the top-k results
+	ctx context.Context, // forwarded to backend.listMemoryEdges
+	results []map[string]any, // retrieval rows; only the first clampInt(k, 1, 100) become seeds
+	expectedFiles map[string]struct{},
+	expectedTerms []string,
+	k int,
+	project string, // passed as the Project filter of every edge query
+) map[string]any {
+	if len(expectedFiles) == 0 && len(expectedTerms) == 0 { // nothing to match neighbors against
+		return recallGraphContributionUnavailable("no expectations")
+	}
+	backend := s.memoryGraphBackend()
+	if backend == nil {
+		return recallGraphContributionUnavailable("memory graph store unavailable")
+	}
+	maxRank := clampInt(k, 1, 100)
+	seedIDs := make([]string, 0, maxRank)
+	topIDs := map[string]struct{}{} // ids already present in the top-k window; used to tell "added" neighbors apart
+	for idx, row := range results {
+		if idx >= maxRank {
+			break
+		}
+		memoryID := recallResultMemoryID(row)
+		if memoryID == "" {
+			continue
+		}
+		if _, _, canonical, _, err := canonicalMemoryID(memoryID); err == nil {
+			memoryID = canonical
+		}
+		if _, exists := topIDs[memoryID]; exists { // each seed is queried once
+			continue
+		}
+		topIDs[memoryID] = struct{}{}
+		seedIDs = append(seedIDs, memoryID)
+	}
+	if len(seedIDs) == 0 {
+		return recallGraphContributionUnavailable("top results have no memory ids")
+	}
+
+	limit := recallEvalGraphNeighborLimit()
+	relationCounts := map[string]int{}
+	candidateRows := map[string]map[string]any{} // one synthesized result row per distinct neighbor id
+	candidateSeen := map[string]struct{}{}
+	addedCandidateCount := 0
+	expectedHitCount := 0
+	addedExpectedHitCount := 0
+
+	for _, seedID := range seedIDs {
+		_, _, canonicalSeed, _, err := canonicalMemoryID(seedID)
+		if err != nil { // such a seed is skipped here but still counted in "seed_count" below
+			continue
+		}
+		edges, err := backend.listMemoryEdges(ctx, memoryEdgeQuery{
+			MemoryID: canonicalSeed,
+			Project:  project,
+			Limit:    limit,
+		})
+		if err != nil { // lookup failures are skipped without being reported
+			continue
+		}
+		for _, edge := range edges {
+			relation := strings.TrimSpace(edge.Relation)
+			if relation == "" {
+				relation = "related"
+			}
+			relationCounts[relation] += 1 // counted per edge, before neighbor de-duplication
+			candidateID := edge.TargetID
+			if edge.TargetID == canonicalSeed { // the seed is the edge target, so the neighbor is the source
+				candidateID = edge.SourceID
+			}
+			projectName, fileName, canonicalCandidate, _, err := canonicalMemoryID(candidateID)
+			if err != nil {
+				continue
+			}
+			if _, exists := candidateSeen[canonicalCandidate]; exists { // first edge reaching a neighbor wins
+				continue
+			}
+			candidateSeen[canonicalCandidate] = struct{}{}
+			row := map[string]any{
+				"memory_id":  canonicalCandidate,
+				"project":    projectName,
+				"file":       fileName,
+				"source":     memoryEdgeSource,
+				"summary":    "memory edge " + edge.SourceID + " -[" + edge.Relation + "]-> " + edge.TargetID, // uses the raw edge.Relation, not the defaulted relation
+				"score":      edge.Confidence,
+				"relation":   relation,
+				"edge_id":    edge.EdgeID,
+				"created_at": edge.CreatedAt,
+			}
+			candidateRows[canonicalCandidate] = row
+			if _, exists := topIDs[canonicalCandidate]; !exists { // neighbor not already in the top-k window
+				addedCandidateCount += 1
+			}
+		}
+	}
+
+	matchedCandidateIDs := make([]string, 0)
+	addedMatchedCandidateIDs := make([]string, 0)
+	for candidateID, row := range candidateRows { // map order is unspecified; the id lists are sorted below
+		if !resultHitsExpectations(row, expectedFiles, expectedTerms) {
+			continue
+		}
+		expectedHitCount += 1
+		matchedCandidateIDs = append(matchedCandidateIDs, candidateID)
+		if _, exists := topIDs[candidateID]; !exists {
+			addedExpectedHitCount += 1
+			addedMatchedCandidateIDs = append(addedMatchedCandidateIDs, candidateID)
+		}
+	}
+	sortStrings(matchedCandidateIDs)
+	sortStrings(addedMatchedCandidateIDs)
+	relations := make([]string, 0, len(relationCounts))
+	for relation := range relationCounts {
+		relations = append(relations, relation)
+	}
+	sortStrings(relations)
+	return map[string]any{
+		"enabled":                  true,
+		"seed_count":               len(seedIDs),
+		"candidate_count":          len(candidateRows),
+		"added_candidate_count":    addedCandidateCount,
+		"expected_hit_count":       expectedHitCount,
+		"added_expected_hit_count": addedExpectedHitCount,
+		"helped":                   addedExpectedHitCount > 0, // true when a matching neighbor lies outside the top-k window
+		"relations":                relations,
+		"relation_counts":          relationCounts,
+		"matched_memory_ids":       matchedCandidateIDs,
+		"added_matched_memory_ids": addedMatchedCandidateIDs,
+	}
+}
+
+// recallLatencyStats returns the mean and the percentileFloat(..., 0.95) value of the
+// latency samples, ignoring negative entries; it returns (0, 0) when nothing remains.
+func recallLatencyStats(values []float64) (float64, float64) {
+	kept := make([]float64, 0, len(values))
+	total := 0.0
+	for _, ms := range values {
+		if !(ms < 0) { // negated form keeps NaN, exactly like skipping only ms < 0
+			kept, total = append(kept, ms), total+ms
+		}
+	}
+	if len(kept) == 0 {
+		return 0, 0
+	}
+	sort.Float64s(kept)
+	return total / float64(len(kept)), percentileFloat(kept, 0.95)
+}
+
+// recallEvalQualityStatus labels a run: "insufficient_cases" when nothing was evaluated, "healthy" when it passed and meets the default gate constants, "repair_recommended" below the hard floors, else "watch".
+func recallEvalQualityStatus(passed bool, evaluatedCases int, recallAtK float64, mrr float64, numericExactness float64) string {
+	meetsDefaults := recallAtK >= defaultRecallEvalGateMinRecallAtK &&
+		mrr >= defaultRecallEvalGateMinMRR &&
+		numericExactness >= defaultRecallEvalGateMinNumeric
+	switch {
+	case evaluatedCases == 0:
+		return "insufficient_cases"
+	case passed && meetsDefaults:
+		return "healthy"
+	case recallAtK < 0.5 || mrr < 0.35 || numericExactness < 0.8:
+		return "repair_recommended"
+	}
+	return "watch"
+}
+
+// recallEvalRecommendations turns aggregate eval metrics into operator guidance.
+// Each triggered rule contributes one message, in a fixed order; when no rule
+// fires, a single message is returned that depends on whether the gate passed.
+// Metrics are read with anyToFloat64/anyToInt, so missing keys use the fallbacks
+// written next to each rule.
+func recallEvalRecommendations(metrics map[string]any, gate recallEvalGate, passed bool) []string {
+	// num reads one float metric by key with an explicit fallback.
+	num := func(key string, fallback float64) float64 { return anyToFloat64(metrics[key], fallback) }
+	// Rules are listed in the order their messages appear in the result.
+	rules := []struct {
+		triggered bool
+		advice    string
+	}{
+		{num("recallAtK", 0) < gate.MinRecallAtK, "Refresh saved eval cases, then inspect source coverage for queries below recall gate."},
+		{num("mrr", 0) < gate.MinMRR, "Tune ranking weights or source ordering; hits are present but not surfacing early enough."},
+		{num("citationCoverage", 1) < 0.9, "Increase citation-backed retrieval coverage for cases with expected files."},
+		{num("graphLift", 0) > 0, "Graph neighbors add recall coverage; keep first-hop memory-edge expansion available for agent context packs."},
+		{num("sourceDiversity", 0) < 1.5 && anyToInt(metrics["casesEvaluated"], 0) > 0, "Source diversity is low; verify qdrant, pgvector, and topic rollup lanes are available for this profile."},
+		{num("p95LatencyMs", 0) > 5000, "Recall eval p95 latency is elevated; inspect /telemetry/retrieval/source-quality before widening fanout."},
+	}
+	recommendations := make([]string, 0, 5)
+	for _, rule := range rules {
+		if rule.triggered {
+			recommendations = append(recommendations, rule.advice)
+		}
+	}
+	if len(recommendations) > 0 {
+		return recommendations
+	}
+	// No rule fired: report the overall gate outcome instead.
+	if passed {
+		return append(recommendations, "Recall quality is inside the saved gate; keep scheduled evaluation and graph quality repair enabled.")
+	}
+	return append(recommendations, "Recall gate failed without a dominant signal; inspect per-case failures and retrieval debug.")
+}
+
 func matchedNumericFacts(grounding map[string]any, expected []string) []string {
 	if len(expected) == 0 {
 		return []string{}
diff --git a/services/gateway-go/telemetry_native_routes.go b/services/gateway-go/telemetry_native_routes.go
index 0a78d5a..06d0e62 100644
--- a/services/gateway-go/telemetry_native_routes.go
+++ b/services/gateway-go/telemetry_native_routes.go
@@ -879,22 +879,59 @@ func (s *server) telemetryRecallRoute(w http.ResponseWriter, r *http.Request) {
 		sourceErrorRate = float64(totalErrors) / float64(totalRequests)
 	}
 	alerts := buildRetrievalAlerts(order, statsBySource)
+	monitorRows := s.readRecallMonitorHistory(envInt("ORCH_RECALL_MONITOR_HISTORY_LIMIT", 96))
+	latestQuality := latestRecallEvalMonitorSample(monitorRows)
+	qualityTotals := map[string]any{
+		"requests":          totalRequests,
+		"timeouts":          totalTimeouts,
+		"errors":            totalErrors,
+		"sourceErrorRate":   roundFloat(sourceErrorRate, 6),
+		"noHitRate":         0.0,
+		"lowConfidenceRate": 0.0,
+		"staleHitRate":      0.0,
+		"recallAtK":         nil,
+		"mrr":               nil,
+		"numericExactness":  nil,
+		"citationCoverage":  nil,
+		"sourceDiversity":   nil,
+		"graphLift":         nil,
+		"evalP95Ms":         nil,
+		"lastEvalAt":        nil,
+	}
+	qualityStatus := "unknown"
+	if latestQuality != nil {
+		qualityStatus = strings.TrimSpace(anyToString(latestQuality["qualityStatus"]))
+		if qualityStatus == "" {
+			qualityStatus = recallQualityStatusFromSample(latestQuality)
+		}
+		qualityTotals["noHitRate"] = anyToFloat64(latestQuality["noHitRate"], 0.0)
+		qualityTotals["lowConfidenceRate"] = anyToFloat64(latestQuality["lowConfidenceRate"], 0.0)
+		qualityTotals["staleHitRate"] = anyToFloat64(latestQuality["staleHitRate"], 0.0)
+		qualityTotals["recallAtK"] = anyToFloat64(latestQuality["recallAtK"], 0.0)
+		qualityTotals["mrr"] = anyToFloat64(latestQuality["mrr"], 0.0)
+		qualityTotals["numericExactness"] = anyToFloat64(latestQuality["numericExactness"], 0.0)
+		qualityTotals["citationCoverage"] = anyToFloat64(latestQuality["citationCoverage"], 0.0)
+		qualityTotals["sourceDiversity"] = anyToFloat64(latestQuality["sourceDiversity"], 0.0)
+		qualityTotals["graphLift"] = anyToFloat64(latestQuality["graphLift"], 0.0)
+		qualityTotals["evalP95Ms"] = anyToFloat64(latestQuality["evalP95Ms"], 0.0)
+		qualityTotals["lastEvalAt"] = latestQuality["timestamp"]
+	}
+	recentQuality := recentRecallEvalMonitorSamples(monitorRows, 10)
 	writeJSON(w, http.StatusOK, map[string]any{
 		"updatedAt":    updatedAt,
 		"trafficClass": trafficClass,
 		"quality": map[string]any{
-			"updatedAt": updatedAt,
-			"totals": map[string]any{
-				"requests":          totalRequests,
-				"timeouts":          totalTimeouts,
-				"errors":            totalErrors,
-				"sourceErrorRate":   roundFloat(sourceErrorRate, 6),
-				"noHitRate":         0.0,
-				"lowConfidenceRate": 0.0,
-				"staleHitRate":      0.0,
-			},
-			"bySource": bySource,
-			"recent":   []any{},
+			"updatedAt":   updatedAt,
+			"status":      qualityStatus,
+			"totals":      qualityTotals,
+			"bySource":    bySource,
+			"recent":      recentQuality,
+			"sampleCount": len(recentQuality),
+			"recommendations": recallTelemetryQualityRecommendations(
+				latestQuality,
+				totalRequests,
+				sourceErrorRate,
+			),
 		},
 		"alerts": map[string]any{
 			"thresholds": map[string]any{
@@ -959,6 +996,95 @@ func (s *server) syntheticRecallMonitorSample() map[string]any {
 	}
 }
 
+// latestRecallEvalMonitorSample walks rows from the last element back to the
+// first and returns the first row that has a "recallAtK" or an "mrr" key.
+// Nil rows never match, since a key lookup on a nil map reports absence.
+// The result is nil when no row carries either key.
+func latestRecallEvalMonitorSample(rows []map[string]any) map[string]any {
+	for pos := len(rows) - 1; pos >= 0; pos-- {
+		candidate := rows[pos]
+		_, hasRecallAtK := candidate["recallAtK"]
+		_, hasMRR := candidate["mrr"]
+		if hasRecallAtK || hasMRR {
+			return candidate
+		}
+	}
+	return nil
+}
+
+// recentRecallEvalMonitorSamples collects at most limit rows (a limit below 1
+// is treated as 1) that carry a "recallAtK" or "mrr" key, preferring rows
+// nearest the end of rows. The selected rows are returned in their original
+// relative order; the result is an empty, non-nil slice when nothing matches.
+func recentRecallEvalMonitorSamples(rows []map[string]any, limit int) []map[string]any {
+	if limit < 1 {
+		limit = 1
+	}
+	picked := make([]map[string]any, 0, limit)
+	for pos := len(rows) - 1; pos >= 0 && len(picked) < limit; pos-- {
+		_, hasRecallAtK := rows[pos]["recallAtK"]
+		_, hasMRR := rows[pos]["mrr"]
+		if hasRecallAtK || hasMRR {
+			picked = append(picked, rows[pos])
+		}
+	}
+	// picked was filled back-to-front; flip it so it reads front-to-back.
+	for lo, hi := 0, len(picked)-1; lo < hi; lo, hi = lo+1, hi-1 {
+		picked[lo], picked[hi] = picked[hi], picked[lo]
+	}
+	return picked
+}
+
+// recallQualityStatusFromSample labels one eval sample: "unknown" when sample
+// is nil, "healthy" when anyToBool accepts its "passed" value, and otherwise
+// "repair_recommended" if recallAtK < 0.5 or mrr < 0.35 (0 fallback), else "watch".
+func recallQualityStatusFromSample(sample map[string]any) string {
+	switch {
+	case sample == nil:
+		return "unknown"
+	case anyToBool(sample["passed"]):
+		return "healthy"
+	case anyToFloat64(sample["recallAtK"], 0) < 0.5, anyToFloat64(sample["mrr"], 0) < 0.35:
+		return "repair_recommended"
+	}
+	return "watch"
+}
+
+// recallTelemetryQualityRecommendations builds the advice strings reported with
+// the recall quality telemetry. A nil sample contributes a prompt to run the
+// recall eval script; otherwise each metric read from sample is compared with
+// a fixed threshold and contributes a message when its check fires. A source
+// error message is added when totalRequests > 0 and sourceErrorRate >= 0.25.
+// If nothing fired, a single all-clear message is returned, so the result is
+// never empty.
+func recallTelemetryQualityRecommendations(sample map[string]any, totalRequests int, sourceErrorRate float64) []string {
+	advice := make([]string, 0, 5)
+	// note records message only when its check fired.
+	note := func(fired bool, message string) {
+		if fired {
+			advice = append(advice, message)
+		}
+	}
+	if sample == nil {
+		note(true, "Run scripts/agent/recall-quality-eval to seed recall quality telemetry.")
+	} else {
+		// NOTE(review): citationCoverage is the only metric given a fallback of 1 instead of 0.
+		recallAtK := anyToFloat64(sample["recallAtK"], 0)
+		mrr := anyToFloat64(sample["mrr"], 0)
+		citationCoverage := anyToFloat64(sample["citationCoverage"], 1)
+		graphLift := anyToFloat64(sample["graphLift"], 0)
+		sourceDiversity := anyToFloat64(sample["sourceDiversity"], 0)
+		note(recallAtK < 0.75, "Recall@K is below the production floor; refresh saved cases and inspect failing queries.")
+		note(mrr < 0.55, "MRR is below target; tune ranking and staged source ordering before increasing context size.")
+		note(citationCoverage < 0.9, "Citation coverage is weak; prioritize file-backed hits in context packs.")
+		note(graphLift > 0, "Graph neighbors improve recall; keep first-hop edge expansion enabled in agent-boundary context packaging.")
+		note(sourceDiversity < 1.5, "Recall is leaning on too few sources; verify qdrant, pgvector, and topic rollups are healthy.")
+	}
+	note(totalRequests > 0 && sourceErrorRate >= 0.25, "Retrieval source error rate is elevated; inspect /telemetry/retrieval/source-quality.")
+	note(len(advice) == 0, "Recall quality telemetry is inside current production thresholds.")
+	return advice
+}
+
 func (s *server) telemetryRecallMonitorRoute(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodGet {
 		writeJSON(w, http.StatusMethodNotAllowed, map[string]any{"error": "method not allowed"})
@@ -984,6 +1110,393 @@ func (s *server) telemetryRecallMonitorRoute(w http.ResponseWriter, r *http.Requ
 	})
 }
 
+// recallMonitorSamplesForWindow selects the rows whose "timestamp" parses and
+// is at or after now minus lookbackHours, keeping at most the last maxSamples
+// of them (maxSamples below 1 is treated as 1). When no row qualifies it falls
+// back to the last maxSamples entries of rows as given, unfiltered. The result
+// is always a freshly allocated slice; empty rows yield an empty one.
+func recallMonitorSamplesForWindow(rows []map[string]any, lookbackHours float64, maxSamples int) []map[string]any {
+	if maxSamples < 1 {
+		maxSamples = 1
+	}
+	if len(rows) == 0 {
+		return []map[string]any{}
+	}
+	// tail returns a fresh copy of the last maxSamples entries of list.
+	tail := func(list []map[string]any) []map[string]any {
+		if excess := len(list) - maxSamples; excess > 0 {
+			list = list[excess:]
+		}
+		return append([]map[string]any(nil), list...)
+	}
+	cutoff := time.Now().UTC().Add(-time.Duration(lookbackHours * float64(time.Hour)))
+	inWindow := make([]map[string]any, 0, len(rows))
+	for _, row := range rows {
+		if row == nil {
+			continue
+		}
+		if stamp, ok := parseRecallMonitorSampleTimestamp(row["timestamp"]); ok && !stamp.Before(cutoff) {
+			inWindow = append(inWindow, row)
+		}
+	}
+	if len(inWindow) == 0 {
+		return tail(rows)
+	}
+	return tail(inWindow)
+}
+
+// parseRecallMonitorSampleTimestamp trims the string form of value and parses
+// it with time.RFC3339Nano, then time.RFC3339. The first layout that succeeds
+// wins and the instant is returned in UTC with true. Empty or unparseable
+// input (an empty string matches neither layout) yields the zero time, false.
+func parseRecallMonitorSampleTimestamp(value any) (time.Time, bool) {
+	text := strings.TrimSpace(anyToString(value))
+	for _, layout := range []string{time.RFC3339Nano, time.RFC3339} {
+		if stamp, err := time.Parse(layout, text); err == nil {
+			return stamp.UTC(), true
+		}
+	}
+	return time.Time{}, false
+}
+
+// recommendRecallRateThreshold suggests a rate threshold: the largest of
+// 0.8*current, 1.2*p95 and 1.05*p99 of values (negatives counted as 0), or just
+// current when values is empty; then clampFloat(floor, ceiling), roundFloat(.., 6).
+func recommendRecallRateThreshold(values []float64, current float64, floor float64, ceiling float64) float64 {
+	suggested := current
+	if len(values) > 0 {
+		ordered := append([]float64(nil), values...)
+		for i := range ordered {
+			if ordered[i] < 0 {
+				ordered[i] = 0
+			}
+		}
+		sort.Float64s(ordered)
+		suggested = maxFloat(current*0.8, maxFloat(percentileFloat(ordered, 0.95)*1.2, percentileFloat(ordered, 0.99)*1.05))
+	}
+	return roundFloat(clampFloat(suggested, floor, ceiling), 6)
+}
+
+func recommendRecallLatencyThreshold(values []float64, current float64, floor float64) float64 {
+	clean := make([]float64, 0, len(values))
+	for _, value := range values {
+		if value <= 0 {
+			continue
+		}
+		clean = append(clean, value)
+	}
+	if len(clean) == 0 {
+		return roundFloat(maxFloat(current, floor), 3)
+	}
+	sort.Float64s(clean)
+	p95 := percentileFloat(clean, 0.95)
+	p99 := percentileFloat(clean, 0.99)
+	suggested := maxFloat(current*0.85, maxFloat(p95*1.15, maxFloat(p99*1.05, floor)))
+	return roundFloat(suggested, 3)
+}
+
+// maxFloat returns left when left >= right holds, and right in every other case.
+func maxFloat(left float64, right float64) float64 {
+	if left >= right {
+		right = left
+	}
+	return right
+}
+
+func recallPercentile(values []float64, pct float64) float64 {
+	clean := make([]float64, 0, len(values))
+	for _, value := range values {
+		if value < 0 {
+			continue
+		}
+		clean = append(clean, value)
+	}
+	if len(clean) == 0 {
+		return 0
+	}
+	sort.Float64s(clean)
+	return roundFloat(percentileFloat(clean, pct), 6)
+}
+
+// buildRecallQualityTuningRecommendation assembles the quality portion of the
+// recall tuning recommendation. latest supplies the headline metrics (each read
+// with anyToFloat64 and a fallback of 0) and the value series feed the
+// recallPercentile baselines. Graph expansion is recommended at depth 1 only
+// when latest is non-nil and graph lift is positive or recall/MRR are under
+// 0.75/0.55; the neighbor limit is 12, or 20 once lift reaches 0.15. The
+// result always holds at least one recommendation string.
+func buildRecallQualityTuningRecommendation(
+	latest map[string]any,
+	recallAtKValues, mrrValues, citationCoverageValues []float64,
+	sourceDiversityValues, graphLiftValues, evalP95Values []float64,
+	defaultSources []string,
+) map[string]any {
+	haveSample := latest != nil
+	recall := anyToFloat64(latest["recallAtK"], 0)
+	mrr := anyToFloat64(latest["mrr"], 0)
+	lift := anyToFloat64(latest["graphLift"], 0)
+	diversity := anyToFloat64(latest["sourceDiversity"], 0)
+	citation := anyToFloat64(latest["citationCoverage"], 0)
+	underFloor := recall < 0.75 || mrr < 0.55
+	depth, neighborLimit := 0, 0
+	if haveSample && (lift > 0 || underFloor) {
+		depth, neighborLimit = 1, 12
+		if lift >= 0.15 {
+			neighborLimit = 20
+		}
+	}
+	// Every sample-based check is gated on haveSample: the metrics above are
+	// still read from a nil sample, and the floor checks must not fire for it.
+	checks := []struct {
+		fired   bool
+		message string
+	}{
+		{!haveSample, "Run saved recall evaluation before applying quality tuning."},
+		{haveSample && underFloor, "Keep source fanout broad for boundary context packs until recall and MRR are back above floor."},
+		{haveSample && lift > 0, "Use first-hop graph expansion for agent context packages; graph neighbors are contributing measurable recall."},
+		{haveSample && citation > 0 && citation < 0.9, "Prefer file-backed citations in ranking when context packs need auditable memory evidence."},
+		{haveSample && diversity > 0 && diversity < 1.5, "Do not narrow retrieval source order yet; current quality samples show low source diversity."},
+	}
+	recommendations := make([]string, 0, 5)
+	for _, check := range checks {
+		if check.fired {
+			recommendations = append(recommendations, check.message)
+		}
+	}
+	if len(recommendations) == 0 {
+		recommendations = append(recommendations, "Quality samples support current source order and graph expansion defaults.")
+	}
+	return map[string]any{
+		"latest": map[string]any{
+			"recallAtK":        roundFloat(recall, 6),
+			"mrr":              roundFloat(mrr, 6),
+			"citationCoverage": roundFloat(citation, 6),
+			"sourceDiversity":  roundFloat(diversity, 3),
+			"graphLift":        roundFloat(lift, 6),
+		},
+		"baselines": map[string]any{
+			"recallAtKP50":        recallPercentile(recallAtKValues, 0.50),
+			"recallAtKP95":        recallPercentile(recallAtKValues, 0.95),
+			"mrrP50":              recallPercentile(mrrValues, 0.50),
+			"citationCoverageP50": recallPercentile(citationCoverageValues, 0.50),
+			"sourceDiversityP50":  recallPercentile(sourceDiversityValues, 0.50),
+			"graphLiftP95":        recallPercentile(graphLiftValues, 0.95),
+			"evalP95MsP95":        recallPercentile(evalP95Values, 0.95),
+		},
+		"graphExpansion": map[string]any{
+			"enabled":       depth > 0,
+			"depth":         depth,
+			"neighborLimit": neighborLimit,
+			"policy":        "first_hop_only",
+		},
+		"sourceOrder": orderedSourceUnion(defaultSources, []string{sourceTopicRollup, sourceQdrant, sourcePgvector, sourceMemoryBank}),
+		"cadence": map[string]any{
+			"savedEval":     "hourly_or_before_release",
+			"caseRefresh":   "daily_or_after_memory_schema_change",
+			"openCoreAudit": "before_public_or_paid_sync",
+		},
+		"recommendations": recommendations,
+	}
+}
+
+func (s *server) telemetryRecallTuningRoute(w http.ResponseWriter, r *http.Request) { // GET-only: current vs recommended recall/retrieval alert thresholds
+	if r.Method != http.MethodGet {
+		writeJSON(w, http.StatusMethodNotAllowed, map[string]any{"error": "method not allowed"})
+		return
+	}
+	if _, ok := s.prepareAuthorizedHeaders(w, r); !ok {
+		return
+	}
+	// Window and sample bounds come from query parameters, with env-derived values passed as the second argument (presumably the default; confirm against parseOptional*Query).
+	query := r.URL.Query()
+	lookbackHours := parseOptionalFloatQuery(
+		query.Get("lookback_hours"),
+		maxFloat(1.0, envFloat("ORCH_RECALL_MONITOR_LOOKBACK_HOURS", 24.0)),
+		1.0,
+		24.0*365.0,
+	)
+	minSamples := parseOptionalIntQuery(
+		query.Get("min_samples"),
+		maxInt(4, envInt("ORCH_RECALL_TUNING_MIN_SAMPLES", 16)),
+		1,
+		100000,
+	)
+	maxSamples := parseOptionalIntQuery(
+		query.Get("max_samples"),
+		maxInt(24, envInt("ORCH_RECALL_MONITOR_HISTORY_LIMIT", 288)),
+		1,
+		100000,
+	)
+	// Read monitor history and narrow it to the lookback window.
+	rows := s.readRecallMonitorHistory(maxSamples)
+	windowSamples := recallMonitorSamplesForWindow(rows, lookbackHours, maxSamples)
+	// Collect one value series per metric across the window samples.
+	noHitValues := make([]float64, 0, len(windowSamples))
+	lowConfidenceValues := make([]float64, 0, len(windowSamples))
+	staleValues := make([]float64, 0, len(windowSamples))
+	sourceErrorValues := make([]float64, 0, len(windowSamples))
+	lettaP95Values := make([]float64, 0, len(windowSamples))
+	lettaP99Values := make([]float64, 0, len(windowSamples))
+	lettaTimeoutValues := make([]float64, 0, len(windowSamples))
+	recallAtKValues := make([]float64, 0, len(windowSamples))
+	mrrValues := make([]float64, 0, len(windowSamples))
+	citationCoverageValues := make([]float64, 0, len(windowSamples))
+	sourceDiversityValues := make([]float64, 0, len(windowSamples))
+	graphLiftValues := make([]float64, 0, len(windowSamples))
+	evalP95Values := make([]float64, 0, len(windowSamples))
+	for _, sample := range windowSamples {
+		noHitValues = append(noHitValues, anyToFloat64(sample["noHitRate"], 0.0))
+		lowConfidenceValues = append(lowConfidenceValues, anyToFloat64(sample["lowConfidenceRate"], 0.0))
+		staleValues = append(staleValues, anyToFloat64(sample["staleHitRate"], 0.0))
+		sourceErrorValues = append(sourceErrorValues, anyToFloat64(sample["maxSourceErrorRate"], 0.0))
+
+		lettaP95 := anyToFloat64(sample["lettaP95Ms"], 0.0)
+		if lettaP95 > 0 {
+			lettaP95Values = append(lettaP95Values, lettaP95)
+		}
+		lettaP99 := anyToFloat64(sample["lettaP99Ms"], 0.0)
+		if lettaP99 > 0 {
+			lettaP99Values = append(lettaP99Values, lettaP99)
+		}
+		lettaTimeoutValues = append(lettaTimeoutValues, anyToFloat64(sample["lettaTimeoutRate"], 0.0))
+		if _, exists := sample["recallAtK"]; exists { // NOTE(review): only "recallAtK" gates the eval series; latestRecallEvalMonitorSample also accepts "mrr"-only rows
+			recallAtKValues = append(recallAtKValues, anyToFloat64(sample["recallAtK"], 0.0))
+			mrrValues = append(mrrValues, anyToFloat64(sample["mrr"], 0.0))
+			citationCoverageValues = append(citationCoverageValues, anyToFloat64(sample["citationCoverage"], 0.0))
+			sourceDiversityValues = append(sourceDiversityValues, anyToFloat64(sample["sourceDiversity"], 0.0))
+			graphLiftValues = append(graphLiftValues, anyToFloat64(sample["graphLift"], 0.0))
+			evalP95Values = append(evalP95Values, anyToFloat64(sample["evalP95Ms"], 0.0))
+		}
+	}
+	// Currently configured recall alert thresholds, read from the environment.
+	currentRecallNoHit := clampFloat(envFloat("ORCH_RECALL_ALERT_NO_HIT_RATE", 0.35), 0.0, 1.0)
+	currentRecallLowConfidence := clampFloat(envFloat("ORCH_RECALL_ALERT_LOW_CONFIDENCE_RATE", 0.4), 0.0, 1.0)
+	currentRecallStale := clampFloat(envFloat("ORCH_RECALL_ALERT_STALE_HIT_RATE", 0.45), 0.0, 1.0)
+	currentRecallSourceError := clampFloat(envFloat("ORCH_RECALL_ALERT_SOURCE_ERROR_RATE", 0.25), 0.0, 1.0)
+	currentRecallMinRequests := maxInt(5, envInt("ORCH_RECALL_ALERT_MIN_REQUESTS", 50))
+	// Currently configured Letta retrieval alert thresholds; the p99 value is kept at or above the p95 value.
+	currentRetrievalLettaP95 := maxFloat(1000.0, envFloat("ORCH_RETRIEVAL_ALERT_LETTA_P95_MS", 30000.0))
+	currentRetrievalLettaP99 := maxFloat(currentRetrievalLettaP95, envFloat("ORCH_RETRIEVAL_ALERT_LETTA_P99_MS", 45000.0))
+	currentRetrievalLettaTimeout := clampFloat(envFloat("ORCH_RETRIEVAL_ALERT_LETTA_TIMEOUT_RATE", 0.05), 0.0, 1.0)
+	currentRetrievalMinRequests := maxInt(1, envInt("ORCH_RETRIEVAL_ALERT_MIN_REQUESTS", 20))
+	// Recommended thresholds computed from the series; the minRequests values are echoed unchanged.
+	recommended := map[string]any{
+		"recall": map[string]any{
+			"noHitRate": recommendRecallRateThreshold(noHitValues, currentRecallNoHit, 0.001, 1.0),
+			"lowConfidenceRate": recommendRecallRateThreshold(
+				lowConfidenceValues,
+				currentRecallLowConfidence,
+				0.001,
+				1.0,
+			),
+			"staleHitRate": recommendRecallRateThreshold(staleValues, currentRecallStale, 0.001, 1.0),
+			"sourceErrorRate": recommendRecallRateThreshold(
+				sourceErrorValues,
+				currentRecallSourceError,
+				0.001,
+				1.0,
+			),
+			"minRequests": currentRecallMinRequests,
+		},
+		"retrieval": map[string]any{
+			"lettaP95Ms": recommendRecallLatencyThreshold(
+				lettaP95Values,
+				currentRetrievalLettaP95,
+				1000.0,
+			),
+			"lettaP99Ms": recommendRecallLatencyThreshold(
+				lettaP99Values,
+				currentRetrievalLettaP99,
+				currentRetrievalLettaP95,
+			),
+			"lettaTimeoutRate": recommendRecallRateThreshold(
+				lettaTimeoutValues,
+				currentRetrievalLettaTimeout,
+				0.001,
+				1.0,
+			),
+			"minRequests": currentRetrievalMinRequests,
+		},
+	}
+	latestQualitySample := latestRecallEvalMonitorSample(windowSamples)
+	qualityRecommendation := buildRecallQualityTuningRecommendation(
+		latestQualitySample,
+		recallAtKValues,
+		mrrValues,
+		citationCoverageValues,
+		sourceDiversityValues,
+		graphLiftValues,
+		evalP95Values,
+		s.retrieval.defaultSources,
+	)
+	recommended["quality"] = qualityRecommendation
+	// Warn when the window holds fewer samples than minSamples.
+	warnings := make([]string, 0, 1)
+	if len(windowSamples) < minSamples {
+		warnings = append(
+			warnings,
+			"Only "+strconv.Itoa(len(windowSamples))+" recall monitor samples available; collect at least "+
+				strconv.Itoa(minSamples)+" for stable tuning.",
+		)
+	}
+	// History is read a second time for the "monitor" section, with the limit capped at 20.
+	monitorLimit := maxSamples
+	if monitorLimit > 20 {
+		monitorLimit = 20
+	}
+	monitorRows := s.readRecallMonitorHistory(monitorLimit)
+	latestSample := any(nil)
+	if len(windowSamples) > 0 {
+		latestSample = windowSamples[len(windowSamples)-1]
+	}
+	// Response: window stats, current and recommended thresholds, env-keyed copies of the recommendations, warnings, and monitor history.
+	writeJSON(w, http.StatusOK, map[string]any{
+		"window": map[string]any{
+			"lookbackHours": lookbackHours,
+			"samples":       len(windowSamples),
+			"minSamples":    minSamples,
+			"sufficient":    len(windowSamples) >= minSamples,
+		},
+		"current": map[string]any{
+			"recall": map[string]any{
+				"noHitRate":         currentRecallNoHit,
+				"lowConfidenceRate": currentRecallLowConfidence,
+				"staleHitRate":      currentRecallStale,
+				"sourceErrorRate":   currentRecallSourceError,
+				"minRequests":       currentRecallMinRequests,
+			},
+			"retrieval": map[string]any{
+				"lettaP95Ms":       currentRetrievalLettaP95,
+				"lettaP99Ms":       currentRetrievalLettaP99,
+				"lettaTimeoutRate": currentRetrievalLettaTimeout,
+				"minRequests":      currentRetrievalMinRequests,
+			},
+		},
+		"recommended": recommended,
+		"env": map[string]any{
+			"ORCH_RECALL_ALERT_NO_HIT_RATE":               recommended["recall"].(map[string]any)["noHitRate"],
+			"ORCH_RECALL_ALERT_LOW_CONFIDENCE_RATE":       recommended["recall"].(map[string]any)["lowConfidenceRate"],
+			"ORCH_RECALL_ALERT_STALE_HIT_RATE":            recommended["recall"].(map[string]any)["staleHitRate"],
+			"ORCH_RECALL_ALERT_SOURCE_ERROR_RATE":         recommended["recall"].(map[string]any)["sourceErrorRate"],
+			"ORCH_RETRIEVAL_ALERT_LETTA_P95_MS":           recommended["retrieval"].(map[string]any)["lettaP95Ms"],
+			"ORCH_RETRIEVAL_ALERT_LETTA_P99_MS":           recommended["retrieval"].(map[string]any)["lettaP99Ms"],
+			"ORCH_RETRIEVAL_ALERT_LETTA_TIMEOUT_RATE":     recommended["retrieval"].(map[string]any)["lettaTimeoutRate"],
+			"CONTEXTLATTICE_RECALL_GRAPH_EXPANSION_DEPTH": qualityRecommendation["graphExpansion"].(map[string]any)["depth"],
+			"CONTEXTLATTICE_RECALL_GRAPH_EXPANSION_LIMIT": qualityRecommendation["graphExpansion"].(map[string]any)["neighborLimit"],
+		},
+		"warnings":     warnings,
+		"latestSample": latestSample,
+		"monitor": map[string]any{
+			"updatedAt": nowUTCISO(),
+			"history":   monitorRows,
+			"count":     len(monitorRows),
+			"config": map[string]any{
+				"historyLimit":  monitorLimit,
+				"lookbackHours": maxFloat(1.0, envFloat("ORCH_RECALL_MONITOR_LOOKBACK_HOURS", 24.0)),
+			},
+		},
+	})
+}
+
 func (s *server) telemetryToolsInvocationsRoute(w http.ResponseWriter, r *http.Request) {
 	if r.Method != http.MethodGet {
 		writeJSON(w, http.StatusMethodNotAllowed, map[string]any{"error": "method not allowed"})