From a2afe67c018593c56a46329ebba0171f787c212c Mon Sep 17 00:00:00 2001
From: Neo <neo@Neos-iMac-Pro.local>
Date: Thu, 11 Jun 2026 16:03:58 +0900
Subject: [PATCH 1/3] feat(reviewer): run the reviewer on Vertex AI Agent
 Engine (hybrid runtime)

Track 3 'deploy on Agent Engine' consideration. The reviewer is pure
reasoning + grounding, so it moves to Vertex AI Agent Engine; the coder
stays on Cloud Run where it needs a git/shell sandbox.

- deploy_agent_engine.py: deploys the reviewer root_agent to Agent Engine
  (reasoning_engines.AdkApp), idempotent create/update, bundles the
  CONVENTIONS.md grounding corpus. Runs as the project's default Reasoning
  Engine Service Agent (needs discoveryengine.viewer for live Vertex AI
  Search; bundled corpus is the graceful fallback). Public repo => the
  reviewer reads PRs unauthenticated, so no GitHub token / SecretRef.
- github-issue-resolver.yaml: review_pr step is now a python step that mints
  an aiplatform.user access token from the orchestrator metadata server and
  calls the engine ':streamQuery' endpoint, parsing the JSON verdict from the
  streamed events. New 'reviewer_agent_engine' input holds the resource name;
  legacy reviewer_agent_url kept for fallback.

Verified: querying engine 3625053003137941504 returns a grounded verdict
citing 'Rule 1: Money is integer cents, never floats'.

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
---
 cloud-agents/reviewer/deploy_agent_engine.py  | 107 ++++++++++++++++++
 .../builtins/github-issue-resolver.yaml       |  81 +++++++++++--
 2 files changed, 177 insertions(+), 11 deletions(-)
 create mode 100644 cloud-agents/reviewer/deploy_agent_engine.py

diff --git a/cloud-agents/reviewer/deploy_agent_engine.py b/cloud-agents/reviewer/deploy_agent_engine.py
new file mode 100644
index 0000000..d3cffce
--- /dev/null
+++ b/cloud-agents/reviewer/deploy_agent_engine.py
@@ -0,0 +1,107 @@
+"""Deploy the ADK reviewer agent to Vertex AI Agent Engine.
+
+The reviewer is a pure reasoning + grounding agent (Gemini via Vertex AI +
+Vertex AI Search), which is exactly what Agent Engine is built to host — so it
+runs there, while the coder agent (which needs a real git/shell sandbox) stays
+on Cloud Run. This is the "right runtime per agent" half of Revka's hybrid
+deployment.
+
+Idempotent: updates the existing Agent Engine with the same display name if one
+exists, otherwise creates it. Prints the reasoning-engine resource name, which
+Revka's workflow uses to call the agent over Agent Engine's query API.
+
+Run locally (gcloud ADC) or from CI (Workload Identity Federation):
+
+    cd cloud-agents/reviewer && python deploy_agent_engine.py
+
+Config via env (sensible defaults for project construct-498201):
+    PROJECT, LOCATION, STAGING_BUCKET, RUNTIME_SERVICE_ACCOUNT,
+    REVIEWER_DATASTORE_ID, GITHUB_TOKEN_SECRET, DISPLAY_NAME
+"""
+from __future__ import annotations
+
+import os
+import sys
+
+import vertexai
+from vertexai import agent_engines
+from vertexai.preview import reasoning_engines
+
+from agent import root_agent, REVIEWER_DATASTORE_ID  # local module
+
+PROJECT = os.getenv("PROJECT", "construct-498201")
+LOCATION = os.getenv("LOCATION", "us-central1")
+STAGING_BUCKET = os.getenv("STAGING_BUCKET", f"gs://{PROJECT}-agent-engine")
+# Reuse the reviewer Cloud Run SA: it already holds aiplatform.user,
+# discoveryengine.viewer, and secretAccessor on revka-GITHUB_TOKEN.
+RUNTIME_SA = os.getenv(
+    "RUNTIME_SERVICE_ACCOUNT",
+    f"reviewer-agent@{PROJECT}.iam.gserviceaccount.com",
+)
+GITHUB_TOKEN_SECRET = os.getenv("GITHUB_TOKEN_SECRET", "revka-GITHUB_TOKEN")
+DISPLAY_NAME = os.getenv("DISPLAY_NAME", "revka-reviewer")
+
+REQUIREMENTS = [
+    "google-adk==1.15.0",
+    "httpx>=0.27.0,<1.0.0",
+    "google-auth>=2.28",
+    "google-cloud-aiplatform[agent_engines]>=1.95.1",
+]
+
+# Both files travel with the agent so the bundled-conventions corpus fallback
+# (retrieve_conventions) keeps working even if the search index is still settling.
+EXTRA_PACKAGES = ["agent.py", "grounding/CONVENTIONS.md"]
+
+ENV_VARS = {
+    # GOOGLE_CLOUD_PROJECT / GOOGLE_CLOUD_LOCATION are reserved on Agent Engine
+    # (provided automatically); GOOGLE_GENAI_USE_VERTEXAI is set in agent.py.
+    "REVIEWER_DATASTORE_ID": REVIEWER_DATASTORE_ID,
+}
+
+# The reviewer only *reads* PRs, so against a public repo it needs no GitHub
+# token (unauthenticated REST is fine). Only attach the Secret Manager token for
+# a private repo — and then the Agent Engine runtime service agent must have
+# secretAccessor on it, or instances fail readiness ("no running instances").
+if os.getenv("ATTACH_GITHUB_SECRET", "").lower() in ("1", "true", "yes"):
+    # A dict is converted to a SecretRef proto by the SDK (version-agnostic).
+    ENV_VARS["GITHUB_TOKEN"] = {"secret": GITHUB_TOKEN_SECRET, "version": "latest"}
+
+
+def main() -> None:
+    vertexai.init(project=PROJECT, location=LOCATION, staging_bucket=STAGING_BUCKET)
+
+    app = reasoning_engines.AdkApp(agent=root_agent, enable_tracing=True)
+
+    # Note: the v1 Agent Engine API runs the engine as the project's default
+    # Reasoning Engine Service Agent (custom service_account is not honored in v1),
+    # which must hold roles/discoveryengine.viewer for live Vertex AI Search
+    # grounding (the bundled CONVENTIONS.md corpus is the graceful fallback).
+    common = dict(
+        requirements=REQUIREMENTS,
+        extra_packages=EXTRA_PACKAGES,
+        env_vars=ENV_VARS,
+        display_name=DISPLAY_NAME,
+        description=(
+            "Revka reviewer agent (ADK/Gemini via Vertex AI) — reviews GitHub "
+            "PRs grounded in repo coding conventions via Vertex AI Search."
+        ),
+    )
+
+    existing = [
+        a for a in agent_engines.list()
+        if getattr(a, "display_name", None) == DISPLAY_NAME
+    ]
+    if existing:
+        target = existing[0]
+        print(f"==> Updating existing Agent Engine: {target.resource_name}", file=sys.stderr)
+        remote = target.update(agent_engine=app, **common)
+    else:
+        print("==> Creating new Agent Engine", file=sys.stderr)
+        remote = agent_engines.create(agent_engine=app, **common)
+
+    # stdout = just the resource name, so CI / callers can capture it cleanly.
+    print(remote.resource_name)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml b/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml
index 9c5c94a..bb84af4 100644
--- a/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml
+++ b/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml
@@ -24,7 +24,11 @@ inputs:
   - name: reviewer_agent_url
     required: false
     default: "https://reviewer-agent-n22ujw2j2a-uc.a.run.app"
-    description: Cloud Run A2A reviewer executor (ADK/Gemini via Vertex).
+    description: Legacy Cloud Run A2A reviewer executor (kept for fallback; the reviewer now runs on Vertex AI Agent Engine).
+  - name: reviewer_agent_engine
+    required: false
+    default: "projects/1091585228963/locations/us-central1/reasoningEngines/3625053003137941504"
+    description: Vertex AI Agent Engine resource for the ADK/Gemini reviewer (reasoning + Vertex AI Search grounding).
   - name: fix_strategy
     required: false
     default: "Analyze the issue and implement the smallest correct fix. Add or adjust tests to cover the change. Run pytest. Keep the change minimal and well-scoped."
@@ -303,23 +307,78 @@ steps:
         issue_number: "${assess_issue.output_data.issue_number}"
 
   # -------------------------------------------------------------------------
-  # 6. Review the PR — A2A call to the Cloud Run ADK/Gemini reviewer. Threaded
-  #    pr_number comes from the extract step above.
+  # 6. Review the PR — query the ADK/Gemini reviewer running on Vertex AI Agent
+  #    Engine (reasoning + Vertex AI Search grounding). The orchestrator mints an
+  #    OAuth access token from its metadata server (its SA holds aiplatform.user)
+  #    and calls the engine's :streamQuery endpoint, then parses the reviewer's
+  #    JSON verdict out of the streamed events. Threaded pr_number comes from the
+  #    extract step above.
   # -------------------------------------------------------------------------
   - id: review_pr
-    name: "Review Pull Request (A2A / Cloud Run)"
-    type: a2a
+    name: "Review Pull Request (Vertex AI Agent Engine)"
+    type: python
     position:
       x: 513.52
       y: 600.0
     depends_on: [extract_pr_number]
-    a2a:
-      url: "${inputs.reviewer_agent_url}"
-      cloud_run_auth: gcloud
-      cloud_run_audience: "${inputs.reviewer_agent_url}"
+    python:
       timeout: 900
-      message: |
-        {"repo_name": "${inputs.repo_name}", "pr_number": ${extract_pr_number.output_data.pr_number}}
+      code: |
+        import json, sys, re, urllib.request, urllib.parse
+        ctx = json.load(sys.stdin)
+        engine = (ctx["args"].get("reviewer_agent_engine") or "").strip()
+        repo = ctx["args"].get("repo_name") or ""
+        pr = ctx["args"].get("pr_number")
+        out = {"review_status": "needs_changes", "findings": [],
+               "standards_checked": [], "summary": ""}
+        def metadata_access_token():
+            url = ("http://metadata.google.internal/computeMetadata/v1/instance/"
+                   "service-accounts/default/token")
+            req = urllib.request.Request(url, headers={"Metadata-Flavor": "Google"})
+            with urllib.request.urlopen(req, timeout=5) as r:
+                return json.loads(r.read().decode("utf-8"))["access_token"]
+        try:
+            loc = engine.split("/locations/")[1].split("/")[0]
+            token = metadata_access_token()
+            api = ("https://" + loc + "-aiplatform.googleapis.com/v1/" + engine +
+                   ":streamQuery?alt=sse")
+            message = json.dumps({"repo_name": repo, "pr_number": pr})
+            body = json.dumps({"class_method": "stream_query",
+                               "input": {"user_id": "revka", "message": message}})
+            req = urllib.request.Request(
+                api, data=body.encode("utf-8"),
+                headers={"Authorization": "Bearer " + token,
+                         "Content-Type": "application/json"})
+            with urllib.request.urlopen(req, timeout=870) as r:
+                raw = r.read().decode("utf-8", "replace")
+            final = ""
+            for line in raw.splitlines():
+                line = line.strip()
+                if not line:
+                    continue
+                if line.startswith("data:"):
+                    line = line[5:].strip()
+                try:
+                    ev = json.loads(line)
+                except Exception:
+                    continue
+                for p in (ev.get("content", {}) or {}).get("parts", []) or []:
+                    if p.get("text"):
+                        final = p["text"]
+            m = re.search(r"\{.*\}", final, re.S)
+            if m:
+                out = json.loads(m.group(0))
+            else:
+                out["summary"] = ("Reviewer returned no parseable verdict: " +
+                                  final[:500])
+        except Exception as exc:
+            out["summary"] = ("Agent Engine review call failed: " +
+                              type(exc).__name__ + ": " + str(exc)[:300])
+        json.dump(out, sys.stdout)
+      args:
+        reviewer_agent_engine: "${inputs.reviewer_agent_engine}"
+        repo_name: "${inputs.repo_name}"
+        pr_number: "${extract_pr_number.output_data.pr_number}"
 
   # -------------------------------------------------------------------------
   # 7. Human gate — approve the merge.

From 287d51dc4f3f4b7f87b13f9d5584b8f64c3aca63 Mon Sep 17 00:00:00 2001
From: Neo <neo@Neos-iMac-Pro.local>
Date: Thu, 11 Jun 2026 16:47:58 +0900
Subject: [PATCH 2/3] fix(reviewer): retry the Agent Engine review on transient
 ADK/Gemini failure

A single ADK/Gemini hiccup (empty stream) was dropping the verdict to
'no parseable verdict'. Retry the :streamQuery call 3x with backoff inside
the step budget; only fall back to a needs_changes summary if all attempts
fail. Mirrors the live registered workflow.

Verified live E2E: issue #12 -> PR #13 (MERGED) -> issue CLOSED, with the
Agent Engine reviewer citing Rules 1/5/6/7/9/10.

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
---
 .../builtins/github-issue-resolver.yaml       | 35 ++++++++++++-------
 1 file changed, 23 insertions(+), 12 deletions(-)

diff --git a/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml b/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml
index bb84af4..e0938e7 100644
--- a/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml
+++ b/operator-mcp/operator_mcp/workflow/builtins/github-issue-resolver.yaml
@@ -324,7 +324,7 @@ steps:
     python:
       timeout: 900
       code: |
-        import json, sys, re, urllib.request, urllib.parse
+        import json, sys, re, time, urllib.request, urllib.parse
         ctx = json.load(sys.stdin)
         engine = (ctx["args"].get("reviewer_agent_engine") or "").strip()
         repo = ctx["args"].get("repo_name") or ""
@@ -337,7 +337,7 @@ steps:
             req = urllib.request.Request(url, headers={"Metadata-Flavor": "Google"})
             with urllib.request.urlopen(req, timeout=5) as r:
                 return json.loads(r.read().decode("utf-8"))["access_token"]
-        try:
+        def query_reviewer():
             loc = engine.split("/locations/")[1].split("/")[0]
             token = metadata_access_token()
             api = ("https://" + loc + "-aiplatform.googleapis.com/v1/" + engine +
@@ -349,7 +349,7 @@ steps:
                 api, data=body.encode("utf-8"),
                 headers={"Authorization": "Bearer " + token,
                          "Content-Type": "application/json"})
-            with urllib.request.urlopen(req, timeout=870) as r:
+            with urllib.request.urlopen(req, timeout=280) as r:
                 raw = r.read().decode("utf-8", "replace")
             final = ""
             for line in raw.splitlines():
@@ -365,15 +365,26 @@ steps:
                 for p in (ev.get("content", {}) or {}).get("parts", []) or []:
                     if p.get("text"):
                         final = p["text"]
-            m = re.search(r"\{.*\}", final, re.S)
-            if m:
-                out = json.loads(m.group(0))
-            else:
-                out["summary"] = ("Reviewer returned no parseable verdict: " +
-                                  final[:500])
-        except Exception as exc:
-            out["summary"] = ("Agent Engine review call failed: " +
-                              type(exc).__name__ + ": " + str(exc)[:300])
+            return final
+        # The ADK/Gemini agent can transiently fail (empty stream); retry so a
+        # single hiccup doesn't drop the verdict. Grounding stays additive.
+        final, last_err = "", ""
+        for attempt in range(3):
+            try:
+                final = query_reviewer()
+                if final.strip():
+                    break
+            except Exception as exc:
+                last_err = type(exc).__name__ + ": " + str(exc)[:200]
+            time.sleep(8 * (attempt + 1))
+        m = re.search(r"\{.*\}", final, re.S)
+        if m:
+            out = json.loads(m.group(0))
+        elif last_err:
+            out["summary"] = "Agent Engine review call failed: " + last_err
+        else:
+            out["summary"] = ("Reviewer returned no parseable verdict: " +
+                              final[:500])
         json.dump(out, sys.stdout)
       args:
         reviewer_agent_engine: "${inputs.reviewer_agent_engine}"

From dd9c0ea28440f619e4965b4f6fc3605a67430611 Mon Sep 17 00:00:00 2001
From: Neo <neo@Neos-iMac-Pro.local>
Date: Thu, 11 Jun 2026 17:26:46 +0900
Subject: [PATCH 3/3] feat(reviewer): run Agent Engine as reviewer-agent SA for
 live Vertex AI Search
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Set spec.service_account=reviewer-agent (which holds discoveryengine.viewer +
aiplatform.user) via the SDK's service_account arg — honored on create and
update, so it applies in place without a new resource ID. The Agent Engine
service agent needs serviceAccountTokenCreator on reviewer-agent (granted).

Verified: the reviewer's Discovery Engine :search call now returns HTTP 200
(was 403 as the default service agent) — grounding is live Vertex AI Search,
not the bundled-corpus fallback.

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
---
 cloud-agents/reviewer/deploy_agent_engine.py | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/cloud-agents/reviewer/deploy_agent_engine.py b/cloud-agents/reviewer/deploy_agent_engine.py
index d3cffce..3e5f1b2 100644
--- a/cloud-agents/reviewer/deploy_agent_engine.py
+++ b/cloud-agents/reviewer/deploy_agent_engine.py
@@ -72,14 +72,16 @@ def main() -> None:
 
     app = reasoning_engines.AdkApp(agent=root_agent, enable_tracing=True)
 
-    # Note: the v1 Agent Engine API runs the engine as the project's default
-    # Reasoning Engine Service Agent (custom service_account is not honored in v1),
-    # which must hold roles/discoveryengine.viewer for live Vertex AI Search
-    # grounding (the bundled CONVENTIONS.md corpus is the graceful fallback).
+    # Run the engine as the reviewer SA (it already holds aiplatform.user +
+    # discoveryengine.viewer), so Vertex AI Search grounding is live rather than
+    # falling back to the bundled CONVENTIONS.md corpus. Requires the Agent
+    # Engine service agent to have roles/iam.serviceAccountTokenCreator on this
+    # SA. Set via the SDK's spec.service_account (honored on create and update).
     common = dict(
         requirements=REQUIREMENTS,
         extra_packages=EXTRA_PACKAGES,
         env_vars=ENV_VARS,
+        service_account=RUNTIME_SA,
         display_name=DISPLAY_NAME,
         description=(
             "Revka reviewer agent (ADK/Gemini via Vertex AI) — reviews GitHub "