From 3e404d2650421242d7638cf3d0464302ae46f0ee Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 12:37:48 +0800
Subject: [PATCH 01/11] refactor: unify dialogue session runtime state

---
 docs/session-state-v1.md            | 110 +++++
 src/core/session_store.py           |   8 +-
 src/web/chat/helpers.py             |  86 +++-
 src/web/chat/service.py             | 687 +++++++++++++++++++++++++---
 src/web/service_facades/dialogue.py |  36 +-
 tests/test_session_store.py         |  10 +-
 tests/test_web_app.py               | 138 ++++--
 7 files changed, 961 insertions(+), 114 deletions(-)
 create mode 100644 docs/session-state-v1.md

diff --git a/docs/session-state-v1.md b/docs/session-state-v1.md
new file mode 100644
index 0000000..a4a20cf
--- /dev/null
+++ b/docs/session-state-v1.md
@@ -0,0 +1,110 @@
+# Session State V1
+
+## Goal
+
+This branch treats dialogue session state as a first-class runtime model instead of a loose bag of side effects.
+
+We intentionally optimize for a clean canonical schema rather than backward compatibility.
+
+## Canonical State
+
+Each dialogue session owns one canonical `state` object:
+
+```json
+{
+  "version": 1,
+  "scene": {
+    "location": "",
+    "time_hint": "",
+    "atmosphere_summary": "",
+    "progression_note": "",
+    "updated_at": ""
+  },
+  "presence": {
+    "present_participants": [],
+    "offstage_participants": [],
+    "updated_at": ""
+  },
+  "progression": {
+    "should_offer_scene_shift": false,
+    "scene_shift_reason": "",
+    "turns_in_current_scene": 0,
+    "beat_maturity": 0,
+    "world_tension_summary": "",
+    "updated_at": ""
+  },
+  "relations": {
+    "matrix": {},
+    "delta": {}
+  },
+  "characters": {
+    "snapshots": {}
+  },
+  "signals": {
+    "recent": [],
+    "by_type": {},
+    "updated_at": ""
+  },
+  "memory": {
+    "summary": {}
+  }
+}
+```
+
+## Rules
+
+1. `state` is the only source of truth for session runtime evolution.
+2. API payloads may still project convenience views like `scene_progress` or `relation_delta`, but those are derived views, not primary storage.
+3. Session payloads may expose derived helpers like `runtime_state_overview` for UI rendering, but these are read-only projections from canonical `state`.
+4. `runtime_state_overview` should stay presentation-friendly: short labels, trimmed text, and stable ordering for characters / relations / events.
+5. Scene flow is split into three concerns:
+   - `scene`: where and when the current beat takes place, and what tone it has
+   - `presence`: who is currently onstage or offstage
+   - `progression`: whether the beat is mature enough to shift scenes
+6. Relationship updates are split into:
+   - `relations.matrix`: baseline merged relation graph for session participants
+   - `relations.delta`: session-local drift caused by this conversation
+7. Character-local runtime drift belongs in `characters.snapshots`.
+8. Small event cues, transitions, exits, and atmosphere shifts belong in `signals`.
+9. Compression summaries belong in `memory.summary`.
+
+## Implementation Checklist
+
+### Slice 1: Canonical State Foundation
+
+- [x] Define the canonical session-state schema
+- [x] Centralize session-state creation and normalization
+- [x] Project derived `scene_progress` from canonical state
+- [x] Project derived `relation_delta`, `character_snapshots`, and `event_signals`
+- [x] Move session-store readers to canonical state paths
+
+### Slice 2: Progression Engine
+
+- [x] Split time, location, atmosphere, and onstage/offstage decisions into dedicated state updaters
+- [x] Track scene maturity explicitly in `progression.beat_maturity`
+- [x] Let narration, exits, and returns update canonical presence state directly
+
+### Slice 3: Session Snapshots
+
+- [x] Expand character snapshots into stable per-character runtime cards
+- [x] Expand relation deltas into stable per-pair interaction drift
+- [x] Add explicit session-level world tension / atmosphere summary
+
+### Slice 4: Prompt Integration
+
+- [x] Feed canonical state into turn payloads
+- [x] Feed canonical state into suggestion payloads
+- [x] Feed canonical state into scene-progress generation prompts
+- [x] Trim prompt payloads using canonical active-state priority
+
+### Slice 5: UI Integration
+
+- [x] Surface canonical presence/time/progression hints in the chat UI
+- [x] Surface natural next-scene hints from `progression`
+- [x] Surface per-character session drift from `characters.snapshots`
+
+## Non-Goals
+
+- Preserving every old session-state shape on disk
+- Layering more compatibility shims for low-value legacy paths
+- Keeping duplicated state across multiple top-level session fields
diff --git a/src/core/session_store.py b/src/core/session_store.py
index 4491bc7..834b893 100644
--- a/src/core/session_store.py
+++ b/src/core/session_store.py
@@ -91,12 +91,12 @@ def compress_context(
         to_archive = history[:-recent_turns]
         keep = history[-recent_turns:]
         state = session.setdefault("state", {})
-        memory_summary = dict(state.get("memory_summary", {}) or {})
+        memory_summary = dict(dict(state.get("memory", {}) or {}).get("summary", {}) or {})
         previous_summary = _normalize_text(memory_summary.get("summary", ""))
         compressed = self._build_memory_summary(previous_summary, to_archive, summary_limit)
         key_points = self._extract_key_points(to_archive, limit=8)
 
-        state["memory_summary"] = {
+        state.setdefault("memory", {})["summary"] = {
             "summary": compressed,
             "key_points": key_points,
             "compressed_turns": len(to_archive),
@@ -199,8 +199,8 @@ def save_relation_snapshot(self, session: Dict[str, Any]) -> None:
             "session_id": session_id,
             "novel_id": session.get("novel_id"),
             "updated_at": session.get("updated_at"),
-            "relation_matrix": session.get("state", {}).get("relation_matrix", {}),
-            "relation_delta": session.get("state", {}).get("relation_delta", {}),
+            "relation_matrix": dict(dict(session.get("state", {}).get("relations", {}) or {}).get("matrix", {}) or {}),
+            "relation_delta": dict(dict(session.get("state", {}).get("relations", {}) or {}).get("delta", {}) or {}),
         }
         save_markdown_data(
             self._relation_snapshot_path(session_id),
diff --git a/src/web/chat/helpers.py b/src/web/chat/helpers.py
index 198c98e..c47b3ca 100644
--- a/src/web/chat/helpers.py
+++ b/src/web/chat/helpers.py
@@ -7,6 +7,55 @@
 from src.core.exceptions import LLMRequestError
 
 
+def _session_state(session: dict[str, Any]) -> dict[str, Any]:
+    return dict(session.get("state") or {})  # shallow copy; missing or falsy state becomes {}
+
+
+def _canonical_scene_progress(session: dict[str, Any]) -> dict[str, Any]:
+    """Project a flat ``scene_progress`` view from canonical session state.
+
+    Session-level ``scene_progress`` entries override derived ones; empty-string, empty-list, False, 0 and None values are dropped.
+    """
+    state = _session_state(session)
+    scene = dict(state.get("scene") or {})
+    presence = dict(state.get("presence") or {})
+    progression = dict(state.get("progression") or {})
+
+    def text(section: dict[str, Any], key: str) -> str:
+        return str(section.get(key, "")).strip()
+
+    view: dict[str, Any] = {
+        "present_participants": list(presence.get("present_participants") or []),
+        "offstage_participants": list(presence.get("offstage_participants") or []),
+        **{key: text(scene, key) for key in ("time_hint", "location", "atmosphere_summary", "progression_note")},
+        "should_offer_scene_shift": bool(progression.get("should_offer_scene_shift", False)),
+        "scene_shift_reason": text(progression, "scene_shift_reason"),
+        "turns_in_current_scene": int(progression.get("turns_in_current_scene") or 0),
+        "beat_maturity": int(progression.get("beat_maturity") or 0),
+        "world_tension_summary": text(progression, "world_tension_summary"),
+        "updated_at": text(progression, "updated_at") or text(presence, "updated_at") or text(scene, "updated_at"),
+        **dict(session.get("scene_progress") or {}),
+    }
+    return {key: value for key, value in view.items() if value not in ("", [], False, 0, None)}
+
+
+def _canonical_relation_delta(session: dict[str, Any]) -> dict[str, Any]:
+    """Return session-level ``relation_delta`` when non-empty, else canonical ``state.relations.delta``."""
+    relations = dict(_session_state(session).get("relations") or {})
+    return dict(session.get("relation_delta") or relations.get("delta") or {})
+
+
+def _canonical_character_snapshots(session: dict[str, Any]) -> dict[str, Any]:
+    """Return session-level ``character_snapshots`` when non-empty, else ``state.characters.snapshots``."""
+    characters = dict(_session_state(session).get("characters") or {})
+    return dict(session.get("character_snapshots") or characters.get("snapshots") or {})
+
+
+def _canonical_event_signals(session: dict[str, Any]) -> dict[str, Any]:
+    canonical_signals = _session_state(session).get("signals")  # fallback from canonical state
+    return dict(session.get("event_signals") or canonical_signals or {})  # session-level view wins when non-empty
+
+
 def build_dialogue_opening_message(session: dict[str, Any]) -> str:
     mode = str(session.get("mode", "observe")).strip() or "observe"
     participants = [str(item).strip() for item in session.get("participants", []) if str(item).strip()]
@@ -239,7 +288,11 @@ def _compact_memory_context(memory_context: dict[str, Any]) -> dict[str, Any]:
             "archived_summary": compact_archived,
             "retrieved_memories": compact_hits,
             "scene_progress": {
-                inner_key: _trim_text(str(inner_value).strip(), 100)
+                inner_key: (
+                    list(inner_value)[:6]
+                    if isinstance(inner_value, list)
+                    else inner_value
+                )
                 for inner_key, inner_value in scene_progress.items()
                 if _has_meaningful_value(inner_value)
             },
@@ -457,8 +510,8 @@ def build_dialogue_scene_progress_messages(session: dict[str, Any]) -> list[dict
         "scene_card": dict(session.get("session_card", {}).get("scene_card", {}) or session.get("scene_card", {}) or {}),
         "session_memory_summary": dict(session.get("session_memory_summary", {}) or {}),
         "recent_transcript": recent,
-        "current_scene_progress": dict(session.get("scene_progress", {}) or {}),
-        "event_signals": dict(session.get("event_signals", {}) or session.get("state", {}).get("event_signals", {}) or {}),
+        "current_scene_progress": _canonical_scene_progress(session),
+        "event_signals": _canonical_event_signals(session),
     }
     system_prompt = "\n".join(
         [
@@ -467,10 +520,13 @@ def build_dialogue_scene_progress_messages(session: dict[str, Any]) -> list[dict
             "offstage_participants 里的人默认不应继续直接开口，除非最近文本明确写到他们回来、进门、现身、重新加入。",
             "如果最近内容已经从白天聊到傍晚、夜里、深夜等，time_hint 要跟着更新，而不是一直停在原时间。",
             "如果几个人已经离开原场所进入更私密的新地点，其他未同去角色不要继续被视作同场。",
+            "atmosphere_summary 用一句很短的话概括当前氛围，比如“安静下来”“暧昧发僵”“雨夜压下来”。",
+            "beat_maturity 用 0-100 的整数表示这一拍推进到什么程度：刚起势偏低，已经聊出完整一拍则更高。",
+            "world_tension_summary 用一句话概括当前这局最该继续带着走的张力、冲突或悬念。",
             "event_signals 里如果出现 scene_transition / cast_enter / cast_exit / atmosphere_shift / time_change / environment_change / beat_complete，要把它们纳入判断。",
             "should_offer_scene_shift 只在这一幕已经聊出明显一拍、适合自然转场时返回 true。",
             "只返回 JSON 对象，不要解释。",
-            "格式：{\"present_participants\":[],\"offstage_participants\":[],\"time_hint\":\"\",\"location\":\"\",\"progression_note\":\"\",\"should_offer_scene_shift\":false,\"scene_shift_reason\":\"\"}",
+            "格式：{\"present_participants\":[],\"offstage_participants\":[],\"time_hint\":\"\",\"location\":\"\",\"atmosphere_summary\":\"\",\"progression_note\":\"\",\"beat_maturity\":0,\"world_tension_summary\":\"\",\"should_offer_scene_shift\":false,\"scene_shift_reason\":\"\"}",
         ]
     )
     return [
@@ -500,9 +556,9 @@ def build_dialogue_relation_state_messages(
             }
         )
     current_state = {
-        "relation_delta": dict(session.get("state", {}).get("relation_delta", {}) or {}),
-        "character_snapshots": dict(session.get("state", {}).get("character_snapshots", {}) or {}),
-        "event_signals": dict(session.get("state", {}).get("event_signals", {}) or {}),
+        "relation_delta": _canonical_relation_delta(session),
+        "character_snapshots": _canonical_character_snapshots(session),
+        "event_signals": _canonical_event_signals(session),
     }
     payload = {
         "participants": [str(item).strip() for item in list(session.get("participants", []) or []) if str(item).strip()],
@@ -578,12 +634,20 @@ def clean_names(value: Any) -> list[str]:
 
     present = clean_names(parsed.get("present_participants", []))
     offstage = [name for name in clean_names(parsed.get("offstage_participants", [])) if name not in present]
+    try:
+        beat_maturity = max(0, min(100, int(parsed.get("beat_maturity", 0) or 0)))
+    except Exception:
+        beat_maturity = 0
+
     return {
         "present_participants": present,
         "offstage_participants": offstage,
         "time_hint": _trim_text(str(parsed.get("time_hint", "")).strip(), 40),
         "location": _trim_text(str(parsed.get("location", "")).strip(), 40),
+        "atmosphere_summary": _trim_text(str(parsed.get("atmosphere_summary", "")).strip(), 80),
         "progression_note": _trim_text(str(parsed.get("progression_note", "")).strip(), 120),
+        "beat_maturity": beat_maturity,
+        "world_tension_summary": _trim_text(str(parsed.get("world_tension_summary", "")).strip(), 120),
         "should_offer_scene_shift": bool(parsed.get("should_offer_scene_shift", False)),
         "scene_shift_reason": _trim_text(str(parsed.get("scene_shift_reason", "")).strip(), 120),
     }
@@ -636,10 +700,16 @@ def pair_key(left: str, right: str) -> str:
                 amount = 0
             if amount:
                 normalized[field] = max(-3, min(3, amount))
-        for field in ("last_event", "relation_change", "typical_interaction"):
+        for field in ("last_event", "relation_change", "typical_interaction", "last_actor", "last_target", "updated_at"):
             value = _trim_text(str(item.get(field, "")).strip(), 120)
             if value:
                 normalized[field] = value
+        try:
+            momentum = int(item.get("momentum", 0) or 0)
+        except Exception:
+            momentum = 0
+        if momentum:
+            normalized["momentum"] = max(0, min(10, momentum))
         evidence_lines = [
             _trim_text(str(line).strip(), 180)
             for line in list(item.get("evidence_lines", []) or [])
diff --git a/src/web/chat/service.py b/src/web/chat/service.py
index 561a9bc..3f7e1c2 100644
--- a/src/web/chat/service.py
+++ b/src/web/chat/service.py
@@ -22,6 +22,7 @@ def _utc_now() -> str:
 
 
 class DialogueService:
+    SESSION_STATE_VERSION = 1
     _SCENE_ENTER_TOKENS = ("进门", "入内", "走进", "转入", "移步", "到了", "回到", "落座", "入座", "上楼", "进屋", "推门而入")
     _SCENE_EXIT_TOKENS = ("出去", "离开", "退场", "回房", "回家", "出门", "走远", "散去", "下楼", "离席")
     _ACTION_TOKENS = ("抬头", "低头", "笑", "沉默", "转身", "皱眉", "顿住", "垂眼", "抿唇", "抬眼", "偏头", "停住", "看向")
@@ -65,6 +66,229 @@ def __init__(
         self._memory_store_resolver = memory_store_resolver
         self._memory_stores: dict[str, MarkdownSessionStore] = {}
 
+    @classmethod
+    def _empty_session_state(cls) -> dict[str, Any]:
+        """Return a fresh canonical session state with empty defaults.
+
+        Every call builds new containers, so callers may mutate the result.
+        """
+        scene = {
+            "location": "",
+            "time_hint": "",
+            "atmosphere_summary": "",
+            "progression_note": "",
+            "updated_at": "",
+        }
+        presence = {
+            "present_participants": [],
+            "offstage_participants": [],
+            "updated_at": "",
+        }
+        progression = {
+            "should_offer_scene_shift": False,
+            "scene_shift_reason": "",
+            "turns_in_current_scene": 0,
+            "beat_maturity": 0,
+            "world_tension_summary": "",
+            "updated_at": "",
+        }
+        return {
+            "version": cls.SESSION_STATE_VERSION,
+            "scene": scene,
+            "presence": presence,
+            "progression": progression,
+            "relations": {"matrix": {}, "delta": {}},
+            "characters": {"snapshots": {}},
+            "signals": cls._empty_event_signals_state(),
+            "memory": {"summary": {}},
+        }
+
+    def _ensure_session_state(self, session: dict[str, Any]) -> dict[str, Any]:
+        """Rebuild ``session["state"]`` in the canonical schema and return it.
+
+        Canonical sections take precedence; flat legacy keys such as
+        ``scene_progress`` or ``relation_matrix`` are only read as fallbacks.
+        The rebuilt dict replaces ``session["state"]``; other top-level keys are dropped.
+        """
+        state = dict(session.get("state", {}) or {})
+        canonical = self._empty_session_state()
+        canonical["version"] = int(state.get("version", self.SESSION_STATE_VERSION) or self.SESSION_STATE_VERSION)
+
+        scene_keys = ("location", "time_hint", "atmosphere_summary", "progression_note", "updated_at")
+        scene = dict(state.get("scene", {}) or {})
+        scene_legacy = dict(state.get("scene_progress", {}) or {})
+        # Layering: schema defaults < legacy values < non-empty canonical values,
+        # so a stale legacy scene_progress can no longer clobber canonical scene data.
+        canonical["scene"] = {
+            **canonical["scene"],
+            **{key: scene_legacy[key] for key in scene_keys if key in scene_legacy},
+            **{key: scene[key] for key in scene_keys if scene.get(key)},
+        }
+
+        presence = dict(state.get("presence", {}) or {})
+        canonical["presence"] = {
+            "present_participants": list(presence.get("present_participants", []) or scene_legacy.get("present_participants", []) or []),
+            "offstage_participants": list(presence.get("offstage_participants", []) or scene_legacy.get("offstage_participants", []) or []),
+            "updated_at": str(presence.get("updated_at", "")).strip() or str(scene_legacy.get("updated_at", "")).strip(),
+        }
+
+        progression = dict(state.get("progression", {}) or {})
+        canonical["progression"] = {
+            "should_offer_scene_shift": bool(
+                progression.get("should_offer_scene_shift", scene_legacy.get("should_offer_scene_shift", False))
+            ),
+            "scene_shift_reason": str(
+                progression.get("scene_shift_reason", scene_legacy.get("scene_shift_reason", ""))
+            ).strip(),
+            "turns_in_current_scene": int(
+                progression.get("turns_in_current_scene", scene_legacy.get("turns_in_current_scene", 0)) or 0
+            ),
+            "beat_maturity": int(
+                progression.get("beat_maturity", scene_legacy.get("beat_maturity", 0)) or 0
+            ),
+            "world_tension_summary": str(
+                progression.get("world_tension_summary", scene_legacy.get("world_tension_summary", ""))
+            ).strip(),
+            "updated_at": str(progression.get("updated_at", "")).strip() or str(scene_legacy.get("updated_at", "")).strip(),
+        }
+
+        # Remaining sections: non-empty canonical container first, flat legacy key as fallback.
+        relations = dict(state.get("relations", {}) or {})
+        canonical["relations"] = {
+            "matrix": dict(relations.get("matrix", {}) or state.get("relation_matrix", {}) or {}),
+            "delta": dict(relations.get("delta", {}) or state.get("relation_delta", {}) or {}),
+        }
+        characters = dict(state.get("characters", {}) or {})
+        canonical["characters"] = {
+            "snapshots": dict(characters.get("snapshots", {}) or state.get("character_snapshots", {}) or {}),
+        }
+        canonical["signals"] = dict(state.get("signals", {}) or state.get("event_signals", {}) or self._empty_event_signals_state())
+        memory = dict(state.get("memory", {}) or {})
+        canonical["memory"] = {
+            "summary": dict(memory.get("summary", {}) or state.get("memory_summary", {}) or {}),
+        }
+        session["state"] = canonical
+        return canonical
+
+    def _session_scene_progress(self, session: dict[str, Any]) -> dict[str, Any]:
+        """Flatten canonical scene, presence and progression into the ``scene_progress`` view."""
+        state = self._ensure_session_state(session)
+        scene = dict(state.get("scene") or {})
+        presence = dict(state.get("presence") or {})
+        progression = dict(state.get("progression") or {})
+        def text(section: dict[str, Any], key: str) -> str:
+            return str(section.get(key, "")).strip()
+
+        return {
+            "present_participants": list(presence.get("present_participants") or []),
+            "offstage_participants": list(presence.get("offstage_participants") or []),
+            "time_hint": text(scene, "time_hint"),
+            "location": text(scene, "location"),
+            "atmosphere_summary": text(scene, "atmosphere_summary"),
+            "progression_note": text(scene, "progression_note"),
+            "should_offer_scene_shift": bool(progression.get("should_offer_scene_shift", False)),
+            "scene_shift_reason": text(progression, "scene_shift_reason"),
+            "turns_in_current_scene": int(progression.get("turns_in_current_scene") or 0),
+            "beat_maturity": int(progression.get("beat_maturity") or 0),
+            "world_tension_summary": text(progression, "world_tension_summary"),
+            "updated_at": text(progression, "updated_at") or text(presence, "updated_at") or text(scene, "updated_at"),
+        }
+
+    def _set_session_scene_progress(self, session: dict[str, Any], scene_progress: dict[str, Any] | None) -> None:
+        """Split a flat ``scene_progress`` payload into canonical scene, presence and progression."""
+        state = self._ensure_session_state(session)
+        payload = dict(scene_progress or {})
+        updated_at = str(payload.get("updated_at", "")).strip() or _utc_now()
+        def text(key: str) -> str:
+            return str(payload.get(key, "")).strip()
+        state["scene"] = {
+            **{key: text(key) for key in ("location", "time_hint", "atmosphere_summary", "progression_note")},
+            "updated_at": updated_at,
+        }
+        state["presence"] = {
+            "present_participants": [str(item).strip() for item in list(payload.get("present_participants", []) or []) if str(item).strip()],
+            "offstage_participants": [str(item).strip() for item in list(payload.get("offstage_participants", []) or []) if str(item).strip()],
+            "updated_at": updated_at,
+        }
+        state["progression"] = {
+            "should_offer_scene_shift": bool(payload.get("should_offer_scene_shift", False)),
+            "scene_shift_reason": text("scene_shift_reason"),
+            "turns_in_current_scene": int(payload.get("turns_in_current_scene") or 0),
+            "beat_maturity": int(payload.get("beat_maturity") or 0),
+            "world_tension_summary": text("world_tension_summary"),
+            "updated_at": updated_at,
+        }
+        self._sync_character_runtime_cards(session, payload, updated_at=updated_at)
+
+    def _session_relation_matrix(self, session: dict[str, Any]) -> dict[str, Any]:
+        """Return a shallow copy of the canonical ``relations.matrix`` mapping."""
+        return dict(self._ensure_session_state(session).get("relations", {}).get("matrix") or {})
+
+    def _set_session_relation_matrix(self, session: dict[str, Any], payload: dict[str, Any] | None) -> None:
+        relations = self._ensure_session_state(session).setdefault("relations", {})
+        relations["matrix"] = dict(payload or {})  # stores a shallow copy; a falsy payload clears the matrix
+
+    def _session_relation_delta(self, session: dict[str, Any]) -> dict[str, Any]:
+        """Return a shallow copy of the canonical ``relations.delta`` mapping."""
+        return dict(self._ensure_session_state(session).get("relations", {}).get("delta") or {})
+
+    def _set_session_relation_delta(self, session: dict[str, Any], payload: dict[str, Any] | None) -> None:
+        relations = self._ensure_session_state(session).setdefault("relations", {})
+        relations["delta"] = dict(payload or {})  # stores a shallow copy; a falsy payload clears the delta
+
+    def _session_character_snapshots(self, session: dict[str, Any]) -> dict[str, Any]:
+        """Return a shallow copy of the canonical ``characters.snapshots`` mapping."""
+        return dict(self._ensure_session_state(session).get("characters", {}).get("snapshots") or {})
+
+    def _set_session_character_snapshots(self, session: dict[str, Any], payload: dict[str, Any] | None) -> None:
+        characters = self._ensure_session_state(session).setdefault("characters", {})
+        characters["snapshots"] = dict(payload or {})  # stores a shallow copy; a falsy payload clears all cards
+
+    def _sync_character_runtime_cards(
+        self,
+        session: dict[str, Any],
+        scene_progress: dict[str, Any] | None,
+        *,
+        updated_at: str,
+    ) -> None:
+        """Stamp presence, location and time onto every participant's snapshot card."""
+        state = self._ensure_session_state(session)
+        cards = dict(state.get("characters", {}).get("snapshots", {}) or {})
+        progress = dict(scene_progress or {})
+        cleaned_present = (str(item).strip() for item in list(progress.get("present_participants", []) or []))
+        onstage = {name for name in cleaned_present if name}
+        location = str(progress.get("location", "")).strip()
+        time_hint = str(progress.get("time_hint", "")).strip()
+        # Only non-empty location/time values overwrite what a card already holds.
+        overlay = {key: value for key, value in (("scene_location", location), ("time_hint", time_hint)) if value}
+        # Participants missing from present_participants are marked offstage.
+        for raw_name in list(session.get("participants", []) or []):
+            name = str(raw_name).strip()
+            if not name:
+                continue
+            card = dict(cards.get(name, {}) or {})
+            card["present_state"] = "onstage" if name in onstage else "offstage"
+            card.update(overlay)
+            card["updated_at"] = updated_at
+            cards[name] = card
+        state.setdefault("characters", {})["snapshots"] = cards
+
+    def _session_event_signals(self, session: dict[str, Any]) -> dict[str, Any]:
+        """Return a shallow copy of the canonical ``signals`` section."""
+        return dict(self._ensure_session_state(session).get("signals") or {})
+
+    def _set_session_event_signals(self, session: dict[str, Any], payload: dict[str, Any] | None) -> None:
+        state = self._ensure_session_state(session)
+        state.update(signals=dict(payload or self._empty_event_signals_state()))  # falsy payload resets to the empty shape
+
+    def _session_memory_summary_state(self, session: dict[str, Any]) -> dict[str, Any]:
+        """Return a shallow copy of the canonical ``memory.summary`` mapping."""
+        return dict(self._ensure_session_state(session).get("memory", {}).get("summary") or {})
+
+    def _set_session_memory_summary_state(self, session: dict[str, Any], payload: dict[str, Any] | None) -> None:
+        memory = self._ensure_session_state(session).setdefault("memory", {})
+        memory["summary"] = dict(payload or {})  # stores a shallow copy; a falsy payload clears the summary
+
     def list_sessions(self, run_id: str) -> list[dict[str, Any]]:
         root = self._sessions_root(run_id)
         items: list[dict[str, Any]] = []
@@ -122,17 +346,12 @@ def create_session(
             "branch_origin": dict(branch_origin or {}),
             "history": [],
             "pending_turn": {},
-            "state": {
-                "scene_progress": {},
-                "relation_matrix": self._seed_relation_matrix(run_manifest, selected),
-                "relation_delta": {},
-                "character_snapshots": {},
-                "event_signals": self._empty_event_signals_state(),
-            },
+            "state": self._empty_session_state(),
             "created_at": _utc_now(),
             "updated_at": _utc_now(),
             "status": "ready",
         }
+        self._set_session_relation_matrix(payload, self._seed_relation_matrix(run_manifest, selected))
         if dict(scene_profile or {}):
             initial_summary = self._build_session_memory_summary(run_id, payload, [])
             payload["scene_history"] = [
@@ -142,7 +361,7 @@ def create_session(
                     memory_summary=initial_summary,
                 )
             ]
-        payload["state"]["scene_progress"] = self._derive_scene_progress_state(payload, [])
+        self._set_session_scene_progress(payload, self._derive_scene_progress_state(payload, []))
         self._write_json(root / "session.json", payload)
         if carried_memory_summary:
             session_store = self._resolve_memory_store(run_id)
@@ -194,7 +413,7 @@ def update_scene_card(
                     "ts": _utc_now(),
                 }
             )
-        session.setdefault("state", {})["scene_progress"] = self._derive_scene_progress_state(session, self._serialize_transcript(session))
+        self._set_session_scene_progress(session, self._derive_scene_progress_state(session, self._serialize_transcript(session)))
         transcript = self._serialize_transcript(session)
         memory_summary = self._build_session_memory_summary(run_id, session, transcript)
         scene_history = list(session.get("scene_history", []) or [])
@@ -218,9 +437,12 @@ def update_scene_progress_state(
         scene_progress: dict[str, Any] | None = None,
     ) -> dict[str, Any]:
         session = self._read_json(self._session_file(run_id, session_id))
-        session.setdefault("state", {})["scene_progress"] = self._merge_scene_progress_state(
+        self._set_session_scene_progress(
             session,
-            dict(scene_progress or {}),
+            self._merge_scene_progress_state(
+                session,
+                dict(scene_progress or {}),
+            ),
         )
         session["updated_at"] = _utc_now()
         self._write_json(self._session_file(run_id, session_id), session)
@@ -458,8 +680,8 @@ def _build_turn_payload(
         persona_map = {item["name"]: item for item in character_index}
         relation_graph = dict(run_manifest.get("artifact_index", {}).get("relation_graph", {}) or {})
         full_history = list(session.get("history", []))
-        scene_progress = dict(session.get("state", {}).get("scene_progress", {}) or {})
-        character_snapshots = dict(session.get("state", {}).get("character_snapshots", {}) or {})
+        scene_progress = self._session_scene_progress(session)
+        character_snapshots = self._session_character_snapshots(session)
         active_participants = self._resolve_active_participants(participants, full_history, mode, speaker, scene_progress)
         scene_card = dict(session.get("scene_card", {}) or {})
         transcript = self._serialize_transcript(session)
@@ -638,9 +860,11 @@ def _scene_progress_rule(scene_progress: dict[str, Any]) -> str:
         offstage = [str(item).strip() for item in list(state.get("offstage_participants", []) or []) if str(item).strip()]
         time_hint = str(state.get("time_hint", "")).strip()
         location = str(state.get("location", "")).strip()
+        atmosphere = str(state.get("atmosphere_summary", "")).strip()
         note = str(state.get("progression_note", "")).strip()
         shift = bool(state.get("should_offer_scene_shift", False))
         reason = str(state.get("scene_shift_reason", "")).strip()
+        beat_maturity = int(state.get("beat_maturity", 0) or 0)
 
         bits = [
             "Respect scene continuity: keep who is present, who already left, and what time/location the scene has drifted to internally consistent.",
@@ -651,6 +875,8 @@ def _scene_progress_rule(scene_progress: dict[str, Any]) -> str:
                 details.append(f"time={time_hint}")
             if location:
                 details.append(f"location={location}")
+            if atmosphere:
+                details.append(f"atmosphere={atmosphere}")
             bits.append(f"Current scene state: {', '.join(details)}.")
         if present:
             bits.append(f"Characters currently in-scene: {', '.join(present)}.")
@@ -666,6 +892,11 @@ def _scene_progress_rule(scene_progress: dict[str, Any]) -> str:
         )
         if note:
             bits.append(f"Latest progression note: {note}.")
+        if beat_maturity:
+            bits.append(f"Current beat maturity is {beat_maturity}/100; let replies feel appropriately early, settled, or ready to turn.")
+        tension = str(state.get("world_tension_summary", "")).strip()
+        if tension:
+            bits.append(f"Current world tension to carry forward: {tension}.")
         if shift:
             bits.append(
                 f"This beat is mature enough to hint a next scene or transition if it helps momentum. Reason: {reason or 'the current beat already feels complete'}."
@@ -844,27 +1075,91 @@ def clean_names(values: Any) -> list[str]:
             "offstage_participants": offstage or [name for name in list(base.get("offstage_participants", []) or []) if name not in present],
             "time_hint": str(incoming.get("time_hint", "")).strip() or str(base.get("time_hint", "")).strip(),
             "location": str(incoming.get("location", "")).strip() or str(base.get("location", "")).strip(),
+            "atmosphere_summary": str(incoming.get("atmosphere_summary", "")).strip() or str(base.get("atmosphere_summary", "")).strip(),
             "progression_note": str(incoming.get("progression_note", "")).strip() or str(base.get("progression_note", "")).strip(),
             "should_offer_scene_shift": bool(incoming.get("should_offer_scene_shift", base.get("should_offer_scene_shift", False))),
             "scene_shift_reason": str(incoming.get("scene_shift_reason", "")).strip() or str(base.get("scene_shift_reason", "")).strip(),
             "turns_in_current_scene": int(base.get("turns_in_current_scene", 0) or 0),
+            "beat_maturity": int(incoming.get("beat_maturity", base.get("beat_maturity", 0)) or 0),
+            "world_tension_summary": str(incoming.get("world_tension_summary", "")).strip() or str(base.get("world_tension_summary", "")).strip(),
             "updated_at": _utc_now(),
         }
+        if merged["should_offer_scene_shift"]:
+            merged["beat_maturity"] = max(75, int(merged.get("beat_maturity", 0) or 0))
         return merged
 
     def _derive_scene_progress_state(self, session: dict[str, Any], transcript: list[dict[str, Any]]) -> dict[str, Any]:
         participants = [str(item).strip() for item in list(session.get("participants", []) or []) if str(item).strip()]
         scene_card = dict(session.get("scene_card", {}) or {})
-        prior = dict(session.get("state", {}).get("scene_progress", {}) or {})
+        prior = self._session_scene_progress(session)  # previous scene progress, handed to the helpers below
         history = list(session.get("history", []) or [])
-        latest_time_event = self._latest_event_signal(session, "time_change")
-        latest_scene_event = self._latest_event_signal(session, "scene_transition")
-        latest_beat_event = self._latest_event_signal(session, "beat_complete")
+        presence_state = self._derive_presence_state(session, participants=participants, history=history)  # present / offstage lists
+        scene_frame = self._derive_scene_frame_state(session, transcript=transcript, scene_card=scene_card, prior=prior)  # time_hint / location / atmosphere_summary
+        progression_state = self._derive_progression_state(  # shift offer, turn count, beat maturity, world tension
+            session,
+            transcript=transcript,
+            scene_card=scene_card,
+            prior=prior,
+            presence_state=presence_state,
+            scene_frame=scene_frame,
+        )
+        progression_bits = []  # short recap fragments, joined into progression_note below
+        if scene_frame.get("location"):
+            progression_bits.append(f"地点：{scene_frame['location']}")
+        if scene_frame.get("time_hint"):
+            progression_bits.append(f"时间：{scene_frame['time_hint']}")
+        if scene_frame.get("atmosphere_summary"):
+            progression_bits.append(f"氛围：{scene_frame['atmosphere_summary']}")
+        if presence_state.get("present_participants"):
+            progression_bits.append(f"在场：{'、'.join(list(presence_state.get('present_participants', []))[:4])}")  # at most four names
+        if presence_state.get("offstage_participants"):
+            progression_bits.append(f"离场：{'、'.join(list(presence_state.get('offstage_participants', []))[:3])}")  # at most three names
+        progression_bits.append(f"成熟度：{int(progression_state.get('beat_maturity', 0) or 0)}")  # always appended, even when the score is 0
+        progression_note = "；".join(bit for bit in progression_bits if bit)
+        return {  # flat merge of the three sub-states; later keys override earlier ones on collision
+            **presence_state,
+            **scene_frame,
+            **progression_state,
+            "progression_note": progression_note,
+            "updated_at": _utc_now(),
+        }
+
+    def _derive_presence_state(  # Split participants into present vs. offstage using history plus cast signals.
+        self,
+        session: dict[str, Any],
+        *,
+        participants: list[str],
+        history: list[dict[str, Any]],
+    ) -> dict[str, Any]:
         departed = self._infer_departed_participants(participants, history)
+        latest_exit = self._latest_event_signal(session, "cast_exit")
+        latest_enter = self._latest_event_signal(session, "cast_enter")
+        newest_kind = str(self._latest_event_signal(session, "cast_exit", "cast_enter").get("kind", "")).strip()  # which cast signal is most recent
+        ordered = [latest_enter, latest_exit] if newest_kind == "cast_exit" else [latest_exit, latest_enter]  # older first, so the newest signal wins for the same actor
+        for event in ordered:
+            actor = str(event.get("actor", "")).strip()
+            if actor in participants and event is latest_exit:
+                departed.add(actor)
+            elif actor in participants:
+                departed.discard(actor)
         present = [name for name in participants if name not in departed]
         if not present and participants:
             present = participants[:1]
-        offstage = [name for name in participants if name not in present]
+        return {
+            "present_participants": present,
+            "offstage_participants": [name for name in participants if name not in present],
+        }
+
+    def _derive_scene_frame_state(
+        self,
+        session: dict[str, Any],
+        *,
+        transcript: list[dict[str, Any]],
+        scene_card: dict[str, Any],
+        prior: dict[str, Any],
+    ) -> dict[str, Any]:
+        latest_time_event = self._latest_event_signal(session, "time_change")
+        latest_scene_event = self._latest_event_signal(session, "scene_transition")
         time_hint = (
             str(latest_time_event.get("time_hint", "")).strip()
             or self._infer_time_hint(transcript)
@@ -876,41 +1171,142 @@ def _derive_scene_progress_state(self, session: dict[str, Any], transcript: list
             or str(prior.get("location", "")).strip()
             or str(scene_card.get("location", "")).strip()
         )
+        latest_atmosphere_event = self._latest_event_signal(session, "atmosphere_shift")
+        atmosphere_summary = (
+            self._trim_summary_text(str(latest_atmosphere_event.get("cue", "")).strip(), 80)
+            or self._infer_atmosphere_summary(transcript)
+            or self._trim_summary_text(str(prior.get("atmosphere_summary", "")).strip(), 80)
+            or self._trim_summary_text(str(scene_card.get("atmosphere", "")).strip(), 80)
+        )
+        return {
+            "time_hint": time_hint,
+            "location": location,
+            "atmosphere_summary": atmosphere_summary,
+        }
+
+    def _derive_progression_state(  # Decide whether to offer a scene shift, and report maturity and tension.
+        self,
+        session: dict[str, Any],
+        *,
+        transcript: list[dict[str, Any]],
+        scene_card: dict[str, Any],
+        prior: dict[str, Any],
+        presence_state: dict[str, Any],
+        scene_frame: dict[str, Any],
+    ) -> dict[str, Any]:
+        latest_beat_event = self._latest_event_signal(session, "beat_complete")
         turns_in_current_scene = self._count_current_scene_turns(session)
+        beat_maturity = self._estimate_scene_maturity(  # 0-100 score that gates the shift offers below
+            turns_in_current_scene=turns_in_current_scene,
+            transcript=transcript,
+            scene_card=scene_card,
+            presence_state=presence_state,
+            scene_frame=scene_frame,
+            latest_beat_event=latest_beat_event,
+            prior=prior,
+        )
         scene_shift_reason = ""
         should_offer_scene_shift = False
-        if scene_card and turns_in_current_scene >= 8:
+        if scene_card and beat_maturity >= 72:  # with a scene card, maturity alone is enough to offer a shift
             should_offer_scene_shift = True
             scene_shift_reason = "这一幕已经接了好几拍，可以顺势换到下一幕。"
         if latest_beat_event:
             should_offer_scene_shift = True
             scene_shift_reason = str(latest_beat_event.get("cue", "")).strip() or scene_shift_reason
         initial_time = str(scene_card.get("time_hint", "")).strip()
-        if time_hint and initial_time and time_hint != initial_time and turns_in_current_scene >= 5:
+        time_hint = str(scene_frame.get("time_hint", "")).strip()  # current time comes from the derived scene frame
+        if time_hint and initial_time and time_hint != initial_time and beat_maturity >= 55:  # lower bar once time has moved off the scene card's hint
             should_offer_scene_shift = True
             scene_shift_reason = scene_shift_reason or f"时间已经自然推到{time_hint}，适合顺势转下一拍。"
-        progression_bits = []
-        if location:
-            progression_bits.append(f"地点：{location}")
-        if time_hint:
-            progression_bits.append(f"时间：{time_hint}")
-        if present:
-            progression_bits.append(f"在场：{'、'.join(present[:4])}")
-        if offstage:
-            progression_bits.append(f"离场：{'、'.join(offstage[:3])}")
-        progression_note = "；".join(progression_bits)
         return {
-            "present_participants": present,
-            "offstage_participants": offstage,
-            "time_hint": time_hint,
-            "location": location,
-            "progression_note": progression_note,
             "should_offer_scene_shift": should_offer_scene_shift,
             "scene_shift_reason": scene_shift_reason,
             "turns_in_current_scene": turns_in_current_scene,
-            "updated_at": _utc_now(),
+            "beat_maturity": beat_maturity,  # already clamped to 0..100 by _estimate_scene_maturity
+            "world_tension_summary": self._derive_world_tension_summary(session, transcript=transcript, scene_frame=scene_frame),
         }
 
+    def _estimate_scene_maturity(  # Additive heuristic: returns an int in 0..100 for how far the current beat has progressed.
+        self,
+        *,
+        turns_in_current_scene: int,
+        transcript: list[dict[str, Any]],
+        scene_card: dict[str, Any],
+        presence_state: dict[str, Any],
+        scene_frame: dict[str, Any],
+        latest_beat_event: dict[str, Any],
+        prior: dict[str, Any],
+    ) -> int:
+        score = min(60, max(0, turns_in_current_scene * 10))  # 10 points per turn, capped at 60
+        if latest_beat_event:
+            score += 25  # any non-empty beat event passed by the caller adds 25
+        if str(scene_frame.get("time_hint", "")).strip() and str(scene_frame.get("time_hint", "")).strip() != str(scene_card.get("time_hint", "")).strip():
+            score += 10  # current time differs from the scene card's time_hint
+        if str(scene_frame.get("location", "")).strip() and str(scene_frame.get("location", "")).strip() != str(scene_card.get("location", "")).strip():
+            score += 10  # current location differs from the scene card's location
+        if list(presence_state.get("offstage_participants", []) or []):
+            score += 6  # at least one participant is offstage
+        if str(scene_frame.get("atmosphere_summary", "")).strip():
+            score += 4  # an atmosphere summary exists
+        previous_maturity = int(prior.get("beat_maturity", 0) or 0)
+        if previous_maturity:
+            score = max(score, min(100, previous_maturity - 8))  # floor: at most 8 below the prior score. NOTE(review): with the forced 75 minimum on shift offers this may never decay; confirm prior is reset on scene change
+        if len(transcript) >= 6:
+            score += 6  # applied after the floor, so it also lifts a floored score
+        return max(0, min(100, score))  # clamp to 0..100
+
+    def _infer_atmosphere_summary(self, transcript: list[dict[str, Any]]) -> str:  # Guess a short atmosphere label from recent messages; "" when there are none.
+        recent_messages = [
+            str(item.get("message", "")).strip()
+            for item in list(transcript or [])[-8:]  # only the last eight transcript entries are inspected
+            if str(item.get("message", "")).strip()
+        ]
+        if not recent_messages:
+            return ""
+        joined = " ".join(recent_messages)
+        for token in self._ATMOSPHERE_TOKENS:  # first token (in _ATMOSPHERE_TOKENS order) found anywhere in the joined text wins
+            if token in joined:
+                return self._trim_summary_text(token, 40)
+        for message in reversed(recent_messages):  # fallback: newest message whose trimmed form is non-empty
+            trimmed = self._trim_summary_text(message, 40)
+            if trimmed:
+                return trimmed
+        return ""
+
+    def _derive_world_tension_summary(  # Pick one short line describing the current tension; "" if nothing qualifies.
+        self,
+        session: dict[str, Any],
+        *,
+        transcript: list[dict[str, Any]],
+        scene_frame: dict[str, Any],
+    ) -> str:
+        latest_atmosphere_event = self._latest_event_signal(session, "atmosphere_shift")
+        latest_relation_event = self._latest_event_signal(session, "relationship_shift")
+        latest_scene_event = self._latest_event_signal(session, "scene_transition", "environment_change", "time_change")  # newest of any of these three kinds
+        for candidate in (latest_atmosphere_event, latest_relation_event, latest_scene_event):  # priority order; first non-empty cue wins
+            cue = self._trim_summary_text(str((candidate or {}).get("cue", "")).strip(), 88)
+            if cue:
+                return cue
+        relation_delta = self._session_relation_delta(session)
+        if relation_delta:
+            pair_key, delta = next(iter(relation_delta.items()))  # only the first pair in the mapping is considered
+            metrics: list[str] = []
+            for field, label in (("trust", "信任"), ("affection", "好感"), ("hostility", "敌意"), ("ambiguity", "摇摆")):
+                amount = int(dict(delta or {}).get(field, 0) or 0)
+                if amount:
+                    metrics.append(f"{label}{amount:+d}")  # signed, e.g. +2 / -1
+            if metrics:
+                return self._trim_summary_text(f"{pair_key} 当前仍在变化：{'、'.join(metrics)}", 88)
+        atmosphere = str(scene_frame.get("atmosphere_summary", "")).strip()
+        if atmosphere:
+            return self._trim_summary_text(f"这一拍的气氛是：{atmosphere}", 88)
+        for item in reversed(list(transcript or [])[-8:]):  # last resort: newest scene/director line among the last eight entries
+            role = str(item.get("role", "")).strip()
+            message = self._trim_summary_text(str(item.get("message", "")).strip(), 88)
+            if role in {"scene", "director"} and message:
+                return message
+        return ""
+
     @staticmethod
     def _infer_time_hint(transcript: list[dict[str, Any]]) -> str:
         tokens = (
@@ -1075,13 +1471,12 @@ def _seed_relation_matrix(self, run_manifest: dict[str, Any], participants: list
         return keys
 
     def _merged_relation_matrix(self, session: dict[str, Any], participants: list[str]) -> dict[str, Any]:
-        state = dict(session.get("state", {}) or {})
         base = {
             str(key).strip(): self._normalize_relation_entry(dict(value or {}))
-            for key, value in dict(state.get("relation_matrix", {}) or {}).items()
+            for key, value in self._session_relation_matrix(session).items()
             if str(key).strip()
         }
-        deltas = dict(state.get("relation_delta", {}) or {})
+        deltas = self._session_relation_delta(session)
         selected = [str(item).strip() for item in list(participants or []) if str(item).strip()]
         for index, left in enumerate(selected):
             for right in selected[index + 1 :]:
@@ -1101,10 +1496,15 @@ def _merged_relation_matrix(self, session: dict[str, Any], participants: list[st
                     step = 0
                 baseline = int(merged.get(field, self._default_relation_entry()[field]) or self._default_relation_entry()[field])
                 merged[field] = max(0, min(10, baseline + step))
-            for field in ("last_event", "relation_change", "typical_interaction"):
+            for field in ("last_event", "relation_change", "typical_interaction", "last_actor", "last_target", "updated_at"):
                 value = str(delta_payload.get(field, "")).strip()
                 if value:
                     merged[field] = value
+            if "momentum" in delta_payload:
+                try:
+                    merged["momentum"] = int(delta_payload.get("momentum", 0) or 0)
+                except Exception:
+                    pass
             evidence_lines = list(merged.get("evidence_lines", []) or [])
             for item in list(delta_payload.get("evidence_lines", []) or []):
                 text = str(item).strip()
@@ -1124,7 +1524,7 @@ def _empty_event_signals_state() -> dict[str, Any]:
         }
 
     def _merge_event_signals_state(self, session: dict[str, Any], incoming: list[dict[str, Any]]) -> dict[str, Any]:
-        current = dict(session.get("state", {}).get("event_signals", {}) or {})
+        current = self._session_event_signals(session)
         recent = [
             dict(item or {})
             for item in list(current.get("recent", []) or [])
@@ -1214,12 +1614,11 @@ def normalize_event(item: dict[str, Any]) -> dict[str, Any]:
             "updated_at": _utc_now(),
         }
 
-    @staticmethod
-    def _latest_event_signal(session: dict[str, Any], *kinds: str) -> dict[str, Any]:
+    def _latest_event_signal(self, session: dict[str, Any], *kinds: str) -> dict[str, Any]:
         wanted = {str(item).strip() for item in kinds if str(item).strip()}
         if not wanted:
             return {}
-        recent = list(dict(session.get("state", {}).get("event_signals", {}) or session.get("event_signals", {}) or {}).get("recent", []) or [])
+        recent = list(self._session_event_signals(session).get("recent", []) or [])
         for item in reversed(recent):
             event = dict(item or {})
             if str(event.get("kind", "")).strip() in wanted:
@@ -1233,7 +1632,7 @@ def _build_session_relation_excerpt(
         participants: list[str],
         active_participants: list[str],
     ) -> str:
-        deltas = dict(session.get("state", {}).get("relation_delta", {}) or {})
+        deltas = self._session_relation_delta(session)
         if not deltas:
             return ""
         merged = self._merged_relation_matrix(session, participants)
@@ -1267,13 +1666,17 @@ def _build_session_relation_excerpt(
             last_event = str(delta.get("last_event", "")).strip()
             if last_event:
                 line = f"{line}\n- last_event: {self._trim_summary_text(last_event, 120)}"
+            last_actor = str(delta.get("last_actor", "")).strip()
+            last_target = str(delta.get("last_target", "")).strip()
+            if last_actor or last_target:
+                line = f"{line}\n- drift: {self._trim_summary_text(' -> '.join([item for item in (last_actor, last_target) if item]), 80)}"
             lines.append(line)
             if len("\n".join(lines)) >= 1200:
                 break
         return "\n".join(lines).strip()
 
     def _build_session_event_excerpt(self, session: dict[str, Any]) -> list[dict[str, Any]]:
-        event_signals = dict(session.get("state", {}).get("event_signals", {}) or {})
+        event_signals = self._session_event_signals(session)
         recent = list(event_signals.get("recent", []) or [])
         normalized: list[dict[str, Any]] = []
         for item in recent[-8:]:
@@ -1408,9 +1811,13 @@ def _persona_snapshot_payload(snapshot: dict[str, Any], *, detailed: bool) -> di
             "focus": str(snapshot.get("focus", "")).strip(),
             "last_target": str(snapshot.get("last_target", "")).strip(),
             "last_message": str(snapshot.get("last_message", "")).strip(),
+            "present_state": str(snapshot.get("present_state", "")).strip(),
+            "scene_location": str(snapshot.get("scene_location", "")).strip(),
+            "time_hint": str(snapshot.get("time_hint", "")).strip(),
         }
         if detailed:
             fields["last_event"] = str(snapshot.get("last_event", "")).strip()
+            fields["updated_at"] = str(snapshot.get("updated_at", "")).strip()
         return {key: value for key, value in fields.items() if value}
 
     def _build_relation_excerpt(
@@ -1502,7 +1909,7 @@ def _build_turn_memory_context(
         scene_card: dict[str, Any],
         scene_progress: dict[str, Any] | None = None,
     ) -> dict[str, Any]:
-        state_summary = dict(session.get("state", {}).get("memory_summary", {}) or {})
+        state_summary = self._session_memory_summary_state(session)
         archived_summary = {
             "summary": self._trim_summary_text(str(state_summary.get("summary", "")).strip(), 360),
             "key_points": [
@@ -1535,6 +1942,7 @@ def _build_turn_memory_context(
             ],
             "should_offer_scene_shift": bool(normalized_progress.get("should_offer_scene_shift", False)),
             "scene_shift_reason": self._trim_summary_text(str(normalized_progress.get("scene_shift_reason", "")).strip(), 120),
+            "world_tension_summary": self._trim_summary_text(str(normalized_progress.get("world_tension_summary", "")).strip(), 120),
         }
         progress_snapshot = {
             key: value
@@ -1543,7 +1951,7 @@ def _build_turn_memory_context(
         }
         character_snapshots = {
             str(name).strip(): self._persona_snapshot_payload(dict(snapshot or {}), detailed=True)
-            for name, snapshot in dict(session.get("state", {}).get("character_snapshots", {}) or {}).items()
+            for name, snapshot in self._session_character_snapshots(session).items()
             if str(name).strip() and self._persona_snapshot_payload(dict(snapshot or {}), detailed=True)
         }
         relation_delta = {
@@ -1552,7 +1960,7 @@ def _build_turn_memory_context(
                 for key, value in dict(delta or {}).items()
                 if value not in ("", [], 0, None)
             }
-            for pair_key, delta in dict(session.get("state", {}).get("relation_delta", {}) or {}).items()
+            for pair_key, delta in self._session_relation_delta(session).items()
             if str(pair_key).strip()
         }
         relation_delta = {key: value for key, value in relation_delta.items() if value}
@@ -1644,10 +2052,10 @@ def _serialize_session(self, run_id: str, payload: dict[str, Any]) -> dict[str,
         session["mode_display"] = self._mode_display(str(session.get("mode", "")).strip())
         transcript = self._serialize_transcript(session)
         session["transcript"] = transcript
-        session["scene_progress"] = dict(session.get("state", {}).get("scene_progress", {}) or {})
-        session["relation_delta"] = dict(session.get("state", {}).get("relation_delta", {}) or {})
-        session["character_snapshots"] = dict(session.get("state", {}).get("character_snapshots", {}) or {})
-        session["event_signals"] = dict(session.get("state", {}).get("event_signals", {}) or {})
+        session["scene_progress"] = self._session_scene_progress(session)
+        session["relation_delta"] = self._session_relation_delta(session)
+        session["character_snapshots"] = self._session_character_snapshots(session)
+        session["event_signals"] = self._session_event_signals(session)
         session["relation_matrix"] = self._merged_relation_matrix(session, list(session.get("participants", []) or []))
         session["last_entry_preview"] = self._build_last_entry_preview(session)
         session["session_card"] = self._build_session_card(session)
@@ -1655,6 +2063,7 @@ def _serialize_session(self, run_id: str, payload: dict[str, Any]) -> dict[str,
         session["branch_origin"] = dict(session.get("branch_origin", {}) or {})
         session["pending_turn_summary"] = self._build_pending_turn_summary(session)
         session["session_memory_summary"] = self._build_session_memory_summary(run_id, session, transcript)
+        session["runtime_state_overview"] = self._build_runtime_state_overview(session)
         return session
 
     def _serialize_transcript(self, session: dict[str, Any]) -> list[dict[str, Any]]:
@@ -1763,12 +2172,175 @@ def _build_pending_turn_summary(self, session: dict[str, Any]) -> dict[str, Any]
             "response_limit_hint": int(pending.get("response_limit_hint", 0) or 0),
         }
 
+    def _build_runtime_state_overview(self, session: dict[str, Any]) -> dict[str, Any]:  # Project the session's runtime state into a display-oriented summary dict.
+        scene_progress = self._session_scene_progress(session)
+        present = [
+            str(item).strip()
+            for item in list(scene_progress.get("present_participants", []) or [])
+            if str(item).strip()
+        ]
+        offstage = [
+            str(item).strip()
+            for item in list(scene_progress.get("offstage_participants", []) or [])
+            if str(item).strip()
+        ]
+        location = str(scene_progress.get("location", "")).strip()
+        time_hint = str(scene_progress.get("time_hint", "")).strip()
+        atmosphere = self._trim_summary_text(str(scene_progress.get("atmosphere_summary", "")).strip(), 80)
+        beat_maturity = max(0, min(100, int(scene_progress.get("beat_maturity", 0) or 0)))  # clamp to 0..100
+        should_offer_scene_shift = bool(scene_progress.get("should_offer_scene_shift", False))
+        shift_reason = self._trim_summary_text(str(scene_progress.get("scene_shift_reason", "")).strip(), 120)
+        tension = self._trim_summary_text(str(scene_progress.get("world_tension_summary", "")).strip(), 120)
+
+        pills: list[dict[str, Any]] = []  # short labels; only non-empty facts produce a pill
+        if location:
+            pills.append({"text": f"地点 · {location}"})
+        if time_hint:
+            pills.append({"text": f"时间 · {time_hint}"})
+        if atmosphere:
+            pills.append({"text": f"氛围 · {atmosphere}"})
+        if beat_maturity > 0:
+            pills.append({"text": f"推进 {beat_maturity}/100"})
+        if should_offer_scene_shift:
+            pills.append({"text": f"可转场 · {shift_reason or '这一拍已经可以顺势转场'}"})
+
+        character_rows: list[dict[str, Any]] = []
+        for name, snapshot in self._session_character_snapshots(session).items():
+            normalized_name = str(name).strip()
+            if not normalized_name:
+                continue
+            current = dict(snapshot or {})
+            parts: list[str] = []
+            present_state = str(current.get("present_state", "")).strip()
+            if present_state == "onstage":
+                parts.append("在场")
+            elif present_state == "offstage":
+                parts.append("离场")
+            for key in ("mood", "interaction_state"):
+                value = str(current.get(key, "")).strip()
+                if value:
+                    parts.append(value)
+            focus = str(current.get("focus", "")).strip()
+            if focus:
+                parts.append(f"看向 {focus}")
+            character_rows.append(
+                {
+                    "title": normalized_name,
+                    "copy": self._trim_summary_text(" · ".join(parts) or "这一拍还没有额外漂移。", 120),
+                    "rank": 0 if present_state == "onstage" else 1,  # onstage characters must sort first
+                }
+            )
+        character_rows.sort(key=lambda item: (int(item.get("rank", 9)), str(item.get("title", ""))))  # no "or 9" here: rank 0 is valid and falsy
+        character_rows = [{"title": item["title"], "copy": item["copy"]} for item in character_rows[:4]]  # keep four rows, drop the internal rank
+
+        relation_rows: list[dict[str, Any]] = []
+        for pair_key, delta in self._session_relation_delta(session).items():
+            normalized_key = str(pair_key).strip()
+            if not normalized_key:
+                continue
+            payload = dict(delta or {})
+            metrics: list[str] = []
+            momentum = int(payload.get("momentum", 0) or 0)
+            for field, label in (("trust", "信任"), ("affection", "好感"), ("hostility", "敌意"), ("ambiguity", "摇摆")):
+                amount = int(payload.get(field, 0) or 0)
+                if amount:
+                    metrics.append(f"{label}{amount:+d}")
+            last_event = self._trim_summary_text(str(payload.get("last_event", "")).strip(), 72)
+            relation_rows.append(
+                {
+                    "title": normalized_key.replace("_", " · "),
+                    "copy": self._trim_summary_text(
+                        f"{' / '.join(metrics)}{' · ' if metrics and last_event else ''}{last_event}".strip() or "这组关系本局有变化。",
+                        120,
+                    ),
+                    "rank": max(momentum, len(metrics)),  # higher rank sorts first below
+                }
+            )
+        relation_rows.sort(key=lambda item: (-int(item.get("rank", 0) or 0), str(item.get("title", ""))))
+        relation_rows = [{"title": item["title"], "copy": item["copy"]} for item in relation_rows[:3]]  # keep three rows, drop the internal rank
+
+        event_rows: list[dict[str, str]] = []
+        for event in list(self._session_event_signals(session).get("recent", []) or [])[-4:]:  # only the last four recent events
+            payload = dict(event or {})
+            kind = str(payload.get("kind", "")).strip()
+            cue = self._trim_summary_text(str(payload.get("cue", "")).strip(), 88)
+            if not kind or not cue:
+                continue
+            actor = str(payload.get("actor", "")).strip()
+            target = str(payload.get("target", "")).strip()
+            scope = str(payload.get("scope", "")).strip()
+            title_bits = [self._event_kind_label(kind)]
+            if actor:
+                title_bits.append(actor)
+            if target:
+                title_bits.append(target)
+            event_rows.append(
+                {
+                    "title": " · ".join(title_bits) if title_bits else (scope or "event"),
+                    "copy": cue,
+                }
+            )
+
+        status_bits: list[str] = []
+        pill_texts = [str(item.get("text", "")).strip() for item in pills if str(item.get("text", "")).strip()]
+        if pill_texts:
+            status_bits.append(" · ".join(pill_texts[:3]))
+        if present:
+            status_bits.append(f"在场：{'、'.join(present[:3])}")
+        if offstage:
+            status_bits.append(f"离场：{'、'.join(offstage[:2])}")
+        if tension:
+            status_bits.append(f"张力：{self._trim_summary_text(tension, 56)}")
+        status_line = " ｜ ".join(status_bits)
+
+        next_hint = ""  # priority: shift reason, then tension, then the newest event cue
+        if should_offer_scene_shift:
+            next_hint = shift_reason or "这一拍已经可以顺势转场。"
+        elif tension:
+            next_hint = self._trim_summary_text(tension, 72)
+        elif event_rows:
+            next_hint = self._trim_summary_text(str(event_rows[-1].get("copy", "")).strip(), 72)
+
+        return {
+            "present": present,
+            "offstage": offstage,
+            "location": location,
+            "time_hint": time_hint,
+            "atmosphere": atmosphere,
+            "beat_maturity": beat_maturity,
+            "should_offer_scene_shift": should_offer_scene_shift,
+            "scene_shift_reason": shift_reason,
+            "tension": tension,
+            "pills": pills,
+            "character_rows": character_rows,
+            "relation_rows": relation_rows,
+            "event_rows": event_rows,
+            "status_line": status_line,
+            "next_hint": next_hint,
+        }
+
+    @staticmethod
+    def _event_kind_label(kind: str) -> str:  # Map an event kind to its display label.
+        mapping = {
+            "scene_transition": "转场",
+            "cast_enter": "入场",
+            "cast_exit": "离场",
+            "atmosphere_shift": "气氛变化",
+            "time_change": "时间推进",
+            "environment_change": "环境变化",
+            "beat_complete": "一拍收束",
+            "relationship_shift": "关系变化",
+            "micro_action": "细微动作",
+        }
+        normalized = str(kind or "").strip()
+        return mapping.get(normalized, normalized or "事件")  # unknown kinds pass through unchanged; empty input yields the generic label
+
     def _build_session_memory_summary(self, run_id: str, session: dict[str, Any], transcript: list[dict[str, Any]]) -> dict[str, str]:
         mode = str(session.get("mode", "observe")).strip() or "observe"
         mode_display = self._mode_display(mode)
         participants = [str(item).strip() for item in session.get("participants", []) if str(item).strip()]
         history = list(session.get("history", []) or [])
-        scene_progress = dict(session.get("state", {}).get("scene_progress", {}) or session.get("scene_progress", {}) or {})
+        scene_progress = self._session_scene_progress(session)
         present_participants = [
             str(item).strip()
             for item in list(scene_progress.get("present_participants", []) or [])
@@ -1840,7 +2412,10 @@ def _build_session_memory_summary(self, run_id: str, session: dict[str, Any], tr
             perspective = f"{perspective} 当前时间已经推进到「{time_hint}」。"
 
         world = "当前局势里的动作与情绪线会在这里提醒你。"
-        if progression_note:
+        world_tension_summary = str(scene_progress.get("world_tension_summary", "")).strip()
+        if world_tension_summary:
+            world = self._trim_summary_text(world_tension_summary, 88)
+        elif progression_note:
             world = self._trim_summary_text(progression_note, 88)
         for item in reversed(transcript):
             role = str(item.get("role", "")).strip()
@@ -1883,7 +2458,7 @@ def _build_session_memory_summary(self, run_id: str, session: dict[str, Any], tr
                 semantic_hint = str((hits[0] or {}).get("text", "")).strip()
         if semantic_hint:
             relation = f"{relation} · 长期记忆：{self._trim_summary_text(semantic_hint, 68)}"
-        relation_delta = dict(session.get("state", {}).get("relation_delta", {}) or {})
+        relation_delta = self._session_relation_delta(session)
         if relation_delta:
             delta_bits: list[str] = []
             for pair_key, delta in list(relation_delta.items())[:3]:
diff --git a/src/web/service_facades/dialogue.py b/src/web/service_facades/dialogue.py
index 20e232f..9c3b1b9 100644
--- a/src/web/service_facades/dialogue.py
+++ b/src/web/service_facades/dialogue.py
@@ -297,7 +297,7 @@ def _generate_dialogue_scene_progress(self, run_id: str, session: dict[str, Any]
             return {}
 
         payload = dict(session or {})
-        payload["scene_progress"] = dict(payload.get("scene_progress", {}) or payload.get("state", {}).get("scene_progress", {}) or {})
+        payload["scene_progress"] = self.dialogue._session_scene_progress(payload)
         attempts = (
             build_dialogue_scene_progress_messages(payload),
             [
@@ -356,10 +356,9 @@ def _evolve_relations_from_turn(
                 return
             session_path = self.dialogue._session_file(run_id, session_id)
             session = self.dialogue._read_json(session_path)
-            state = dict(session.get("state", {}) or {})
-            relation_delta = dict(state.get("relation_delta", {}) or {})
-            character_snapshots = dict(state.get("character_snapshots", {}) or {})
-            event_signals = dict(state.get("event_signals", {}) or self.dialogue._empty_event_signals_state())
+            relation_delta = self.dialogue._session_relation_delta(session)
+            character_snapshots = self.dialogue._session_character_snapshots(session)
+            event_signals = self.dialogue._session_event_signals(session)
             input_block = dict(pending_payload.get("input", {}) or {})
             speaker = str(input_block.get("speaker", "")).strip()
             participants = [str(item).strip() for item in input_block.get("participants", []) if str(item).strip()]
@@ -397,10 +396,18 @@ def _evolve_relations_from_turn(
                             continue
                         current[field] = int(current.get(field, 0) or 0) + int(amount)
                     current["last_event"] = message[:220]
+                    current["last_actor"] = responder
+                    current["last_target"] = target
                     evidence_lines = list(current.get("evidence_lines", []) or [])
                     evidence_lines.append(f"{responder}->{target}: {message}"[:220])
                     current["evidence_lines"] = evidence_lines[-10:]
                     current["updated_at"] = session.get("updated_at", "")
+                    current["momentum"] = max(
+                        abs(int(current.get("trust", 0) or 0)),
+                        abs(int(current.get("affection", 0) or 0)),
+                        abs(int(current.get("hostility", 0) or 0)),
+                        abs(int(current.get("ambiguity", 0) or 0)),
+                    )
                     relation_delta[key] = current
                     if any(int(current.get(field, 0) or 0) for field in ("trust", "affection", "hostility", "ambiguity")):
                         detected_events.append(
@@ -459,9 +466,9 @@ def _evolve_relations_from_turn(
                 detected_events,
             )
 
-            session.setdefault("state", {})["relation_delta"] = relation_delta
-            session.setdefault("state", {})["character_snapshots"] = character_snapshots
-            session.setdefault("state", {})["event_signals"] = event_signals
+            self.dialogue._set_session_relation_delta(session, relation_delta)
+            self.dialogue._set_session_character_snapshots(session, character_snapshots)
+            self.dialogue._set_session_event_signals(session, event_signals)
             session["updated_at"] = session.get("updated_at") or ""
             self.dialogue._write_json(session_path, session)
             store = self.dialogue._resolve_memory_store(run_id)
@@ -494,10 +501,8 @@ def _generate_dialogue_relation_state(
             return {}
 
         payload = dict(session or {})
-        payload.setdefault("state", {})
-        payload["state"] = dict(payload.get("state", {}) or {})
-        payload["state"]["relation_delta"] = dict(relation_delta or {})
-        payload["state"]["character_snapshots"] = dict(character_snapshots or {})
+        self.dialogue._set_session_relation_delta(payload, relation_delta)
+        self.dialogue._set_session_character_snapshots(payload, character_snapshots)
         attempts = (
             build_dialogue_relation_state_messages(payload, pending_payload, responses),
             [
@@ -538,10 +543,15 @@ def _merge_relation_delta(base: dict[str, Any], incoming: dict[str, Any]) -> dic
                         current[field] = int(next_value.get(field, 0) or 0)
                     except Exception:
                         pass
-            for field in ("last_event", "relation_change", "typical_interaction"):
+            for field in ("last_event", "relation_change", "typical_interaction", "last_actor", "last_target", "updated_at"):
                 text = str(next_value.get(field, "")).strip()
                 if text:
                     current[field] = text
+            if "momentum" in next_value:
+                try:
+                    current["momentum"] = int(next_value.get("momentum", 0) or 0)
+                except Exception:
+                    pass
             evidence_lines = [
                 str(item).strip()
                 for item in list(next_value.get("evidence_lines", []) or [])
diff --git a/tests/test_session_store.py b/tests/test_session_store.py
index 4ab7846..3a3ea75 100644
--- a/tests/test_session_store.py
+++ b/tests/test_session_store.py
@@ -24,8 +24,10 @@ def test_markdown_session_store_persists_session_and_relation_snapshot(self):
                 "updated_at": 1234567890,
                 "characters": ["刘备", "关羽"],
                 "state": {
-                    "relation_matrix": {"关羽_刘备": {"trust": 9}},
-                    "relation_delta": {"关羽_刘备": {"trust": 10}},
+                    "relations": {
+                        "matrix": {"关羽_刘备": {"trust": 9}},
+                        "delta": {"关羽_刘备": {"trust": 10}},
+                    }
                 },
             }
 
@@ -55,12 +57,12 @@ def test_session_store_compresses_context_and_supports_long_term_search(self):
                     {"speaker": "林黛玉", "message": f"第{i}句提到了宝玉和心事。", "ts": i}
                     for i in range(32)
                 ],
-                "state": {},
+                "state": {"memory": {"summary": {}}},
             }
 
             updated = store.compress_context(session)
             self.assertLess(len(updated["history"]), 32)
-            memory_summary = updated.get("state", {}).get("memory_summary", {})
+            memory_summary = updated.get("state", {}).get("memory", {}).get("summary", {})
             self.assertTrue(memory_summary.get("summary"))
             self.assertGreater(memory_summary.get("compressed_turns", 0), 0)
 
diff --git a/tests/test_web_app.py b/tests/test_web_app.py
index db3974e..ec4c313 100644
--- a/tests/test_web_app.py
+++ b/tests/test_web_app.py
@@ -2964,11 +2964,13 @@ def test_build_turn_payload_includes_memory_context_and_trims_relation_excerpt(s
                 {"speaker": "贾宝玉", "message": "我不是有意惹你心烦。", "ts": "2026-05-12T00:00:01Z"},
             ]
             raw_session["state"] = {
-                "memory_summary": {
-                    "summary": "两人前面已经因一句话生过闷气，但都还惦记对方。",
-                    "key_points": ["林黛玉嘴上轻冷，心里还在意。", "贾宝玉想解释，却总把话说得更乱。"],
-                    "compressed_turns": 18,
-                    "recent_turns_kept": 24,
+                "memory": {
+                    "summary": {
+                        "summary": "两人前面已经因一句话生过闷气，但都还惦记对方。",
+                        "key_points": ["林黛玉嘴上轻冷，心里还在意。", "贾宝玉想解释，却总把话说得更乱。"],
+                        "compressed_turns": 18,
+                        "recent_turns_kept": 24,
+                    }
                 }
             }
             service.dialogue._write_json(service.dialogue._session_file(run_id, session["session_id"]), raw_session)
@@ -3063,16 +3065,23 @@ def test_dialogue_relation_delta_and_character_snapshot_are_session_isolated(sel
             raw_one = service.dialogue._read_json(service.dialogue._session_file(run_id, session_one["session_id"]))
             raw_two = service.dialogue._read_json(service.dialogue._session_file(run_id, session_two["session_id"]))
 
-            delta = raw_one.get("state", {}).get("relation_delta", {}).get("林黛玉_贾宝玉", {})
+            delta = raw_one.get("state", {}).get("relations", {}).get("delta", {}).get("林黛玉_贾宝玉", {})
             self.assertEqual(delta.get("trust"), 1)
             self.assertEqual(delta.get("affection"), 1)
             self.assertEqual(delta.get("hostility"), -1)
-            snapshot = raw_one.get("state", {}).get("character_snapshots", {}).get("贾宝玉", {})
+            self.assertEqual(delta.get("last_actor"), "贾宝玉")
+            self.assertEqual(delta.get("last_target"), "林黛玉")
+            self.assertGreaterEqual(int(delta.get("momentum", 0) or 0), 1)
+            snapshot = raw_one.get("state", {}).get("characters", {}).get("snapshots", {}).get("贾宝玉", {})
             self.assertEqual(snapshot.get("interaction_state"), "softening")
             self.assertEqual(snapshot.get("last_target"), "林黛玉")
+            self.assertEqual(snapshot.get("present_state"), "onstage")
+            self.assertTrue(bool(snapshot.get("updated_at", "")))
 
-            self.assertEqual(raw_two.get("state", {}).get("relation_delta", {}), {})
-            self.assertEqual(raw_two.get("state", {}).get("character_snapshots", {}), {})
+            self.assertEqual(raw_two.get("state", {}).get("relations", {}).get("delta", {}), {})
+            untouched_snapshot = raw_two.get("state", {}).get("characters", {}).get("snapshots", {}).get("贾宝玉", {})
+            self.assertEqual(untouched_snapshot.get("present_state"), "onstage")
+            self.assertFalse(bool(untouched_snapshot.get("interaction_state", "")))
             self.assertEqual(relation_path.read_text(encoding="utf-8"), original_relation_text)
 
     def test_build_turn_payload_includes_session_relation_delta_and_snapshots(self):
@@ -3111,24 +3120,28 @@ def test_build_turn_payload_includes_session_relation_delta_and_snapshots(self):
             raw_session = service.dialogue._read_json(service.dialogue._session_file(run_id, session["session_id"]))
             raw_session["state"] = {
                 **dict(raw_session.get("state", {}) or {}),
-                "relation_matrix": {
-                    "林黛玉_贾宝玉": {"trust": 8, "affection": 8, "hostility": 1, "ambiguity": 3}
-                },
-                "relation_delta": {
-                    "林黛玉_贾宝玉": {
-                        "trust": 1,
-                        "affection": 1,
-                        "last_event": "刚刚把话说软了下来。",
-                        "evidence_lines": ["贾宝玉->林黛玉: 谢谢你愿意陪我一起。"],
-                    }
+                "relations": {
+                    "matrix": {
+                        "林黛玉_贾宝玉": {"trust": 8, "affection": 8, "hostility": 1, "ambiguity": 3}
+                    },
+                    "delta": {
+                        "林黛玉_贾宝玉": {
+                            "trust": 1,
+                            "affection": 1,
+                            "last_event": "刚刚把话说软了下来。",
+                            "evidence_lines": ["贾宝玉->林黛玉: 谢谢你愿意陪我一起。"],
+                        }
+                    },
                 },
-                "character_snapshots": {
-                    "贾宝玉": {
-                        "mood": "放松",
-                        "interaction_state": "softening",
-                        "focus": "林黛玉",
-                        "last_target": "林黛玉",
-                        "last_message": "谢谢你愿意陪我一起。",
+                "characters": {
+                    "snapshots": {
+                        "贾宝玉": {
+                            "mood": "放松",
+                            "interaction_state": "softening",
+                            "focus": "林黛玉",
+                            "last_target": "林黛玉",
+                            "last_message": "谢谢你愿意陪我一起。",
+                        }
                     }
                 },
             }
@@ -3148,6 +3161,65 @@ def test_build_turn_payload_includes_session_relation_delta_and_snapshots(self):
             self.assertIn("session_delta", relation_excerpt)
             detail_map = {item["name"]: item for item in payload.get("persona_contexts", [])}
             self.assertEqual(detail_map["贾宝玉"]["session_snapshot"]["interaction_state"], "softening")
+            serialized = service.dialogue._serialize_session(run_id, raw_session)
+            overview = dict(serialized.get("runtime_state_overview", {}) or {})
+            self.assertTrue(bool(overview.get("relation_rows", [])))
+
+    def test_dialogue_session_state_uses_canonical_grouped_schema(self):
+        # A freshly created session must persist the grouped v1 state and return a runtime overview.
+        cast = ("林黛玉", "贾宝玉")
+        novel_b64 = base64.b64encode("林黛玉见了贾宝玉。".encode("utf-8")).decode("ascii")
+        with tempfile.TemporaryDirectory() as tmp:
+            service = WebRunService(tmp)
+            service.save_model_settings(
+                provider="openai-compatible",
+                model="deepseek-chat",
+                base_url="https://example.com/v1",
+                api_key="sk-test",
+            )
+            run_id = service.create_run(
+                novel_name="hongloumeng.txt",
+                novel_content_base64=novel_b64,
+                characters=list(cast),
+            )["run_id"]
+            for name in cast:
+                profile = f"- name: {name}\n- novel_id: hongloumeng\n- core_identity: 人物\n"
+                service.ingest_character_result(
+                    run_id,
+                    character=name,
+                    content_base64=base64.b64encode(profile.encode("utf-8")).decode("ascii"),
+                )
+
+            session = service.dialogue.create_session(
+                service._require_manifest(run_id),
+                mode="observe",
+                participants=list(cast),
+            )
+            session_path = service.dialogue._session_file(run_id, session["session_id"])
+            state = dict(service.dialogue._read_json(session_path).get("state", {}) or {})
+
+            # Top-level shape of the persisted state object.
+            self.assertEqual(state.get("version"), 1)
+            for group in ("scene", "presence", "progression", "relations", "characters", "signals", "memory"):
+                self.assertIn(group, state)
+            # Selected fields that must exist inside individual groups.
+            expected_fields = (
+                ("scene", "atmosphere_summary"),
+                ("relations", "matrix"),
+                ("relations", "delta"),
+                ("characters", "snapshots"),
+                ("progression", "beat_maturity"),
+                ("progression", "world_tension_summary"),
+            )
+            for group, field in expected_fields:
+                self.assertIn(field, dict(state.get(group, {}) or {}))
+            # Overview carried on the payload returned by create_session.
+            overview = dict(session.get("runtime_state_overview", {}) or {})
+            for key in (
+                "present", "offstage", "pills", "character_rows",
+                "relation_rows", "event_rows", "status_line", "next_hint",
+            ):
+                self.assertIn(key, overview)
 
     def test_dialogue_relation_state_llm_can_lightly_refine_session_delta(self):
         with tempfile.TemporaryDirectory() as tmp:
@@ -3214,11 +3286,11 @@ def test_dialogue_relation_state_llm_can_lightly_refine_session_delta(self):
                 )
 
             raw_session = service.dialogue._read_json(service.dialogue._session_file(run_id, session["session_id"]))
-            delta = raw_session.get("state", {}).get("relation_delta", {}).get("林黛玉_贾宝玉", {})
+            delta = raw_session.get("state", {}).get("relations", {}).get("delta", {}).get("林黛玉_贾宝玉", {})
             self.assertEqual(delta.get("trust"), 2)
             self.assertEqual(delta.get("affection"), 1)
             self.assertIn("明显更松", str(delta.get("last_event", "")))
-            snapshot = raw_session.get("state", {}).get("character_snapshots", {}).get("贾宝玉", {})
+            snapshot = raw_session.get("state", {}).get("characters", {}).get("snapshots", {}).get("贾宝玉", {})
             self.assertEqual(snapshot.get("interaction_state"), "softening")
 
     def test_dialogue_event_signals_capture_scene_and_inline_action_categories(self):
@@ -3271,9 +3343,11 @@ def test_dialogue_event_signals_capture_scene_and_inline_action_categories(self)
                 )
 
             raw_session = service.dialogue._read_json(service.dialogue._session_file(run_id, session["session_id"]))
-            event_signals = dict(raw_session.get("state", {}).get("event_signals", {}) or {})
+            event_signals = dict(raw_session.get("state", {}).get("signals", {}) or {})
             recent = list(event_signals.get("recent", []) or [])
             kinds = {str(item.get("kind", "")).strip() for item in recent}
+            overview = dict(service.dialogue._serialize_session(run_id, raw_session).get("runtime_state_overview", {}) or {})
+            event_rows = list(overview.get("event_rows", []) or [])
 
             self.assertIn("time_change", kinds)
             self.assertIn("environment_change", kinds)
@@ -3281,6 +3355,7 @@ def test_dialogue_event_signals_capture_scene_and_inline_action_categories(self)
             self.assertIn("cast_exit", kinds)
             self.assertIn("micro_action", kinds)
             self.assertIn("atmosphere_shift", kinds)
+            self.assertTrue(event_rows)
 
             micro_action = next(item for item in recent if str(item.get("kind", "")).strip() == "micro_action")
             self.assertEqual(micro_action.get("actor"), "林黛玉")
@@ -5827,6 +5902,9 @@ def test_ingest_turn_updates_scene_progress_and_future_active_participants(self)
             self.assertEqual(updated["scene_progress"]["time_hint"], "夜里")
             self.assertEqual(updated["scene_progress"]["present_participants"], ["林黛玉", "贾宝玉"])
             self.assertEqual(updated["scene_progress"]["offstage_participants"], ["薛宝钗"])
+            self.assertTrue(updated["scene_progress"]["atmosphere_summary"])
+            self.assertGreater(updated["scene_progress"]["beat_maturity"], 0)
+            self.assertTrue(updated["scene_progress"]["world_tension_summary"])
             self.assertIn("夜里", updated["session_memory_summary"]["scene_frame"])
             self.assertIn("薛宝钗", updated["session_memory_summary"]["cast"])
 
@@ -5901,6 +5979,8 @@ def test_scene_progress_can_flag_natural_scene_shift_after_longer_turn(self):
 
             self.assertTrue(updated["scene_progress"]["should_offer_scene_shift"])
             self.assertIn("下一幕", updated["scene_progress"]["scene_shift_reason"])
+            self.assertGreaterEqual(updated["scene_progress"]["beat_maturity"], 70)
+            self.assertTrue(updated["scene_progress"]["world_tension_summary"])
             self.assertIn("转场提示", updated["session_memory_summary"]["scene_frame"])
 
 

From 0f049a867477ea5cb1cfe7594415c4789c64638a Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 12:38:30 +0800
Subject: [PATCH 02/11] feat: surface dialogue runtime state in chat ui

---
 src/web/static/fragments/main-shell.html |  33 ++++
 src/web/static/js/dialogue.js            | 226 +++++++++++++++++++++++
 src/web/static/styles/dialogue.css       | 119 ++++++++++++
 src/web/static/styles/responsive.css     |   8 +
 4 files changed, 386 insertions(+)

diff --git a/src/web/static/fragments/main-shell.html b/src/web/static/fragments/main-shell.html
index f526a4a..ea78147 100644
--- a/src/web/static/fragments/main-shell.html
+++ b/src/web/static/fragments/main-shell.html
@@ -36,6 +36,39 @@
               <div id="dialogue-scene-chain-suggestions" class="dialogue-scene-chain-suggestions hidden"></div>
             </div>
             <div id="dialogue-scene-timeline" class="dialogue-scene-timeline hidden"></div>
+            <section id="dialogue-state-overview" class="dialogue-state-overview hidden">
+              <div class="dialogue-state-overview-head">
+                <strong>本局状态</strong>
+                <small>这一拍推进到哪、谁在场、气氛往哪边偏，都收在这里。</small>
+              </div>
+              <div id="dialogue-state-pills" class="dialogue-state-pills"></div>
+              <div class="dialogue-state-grid">
+                <article class="dialogue-state-card">
+                  <span>当前在场</span>
+                  <div id="dialogue-state-present" class="dialogue-state-chip-list"></div>
+                </article>
+                <article class="dialogue-state-card">
+                  <span>暂时离场</span>
+                  <div id="dialogue-state-offstage" class="dialogue-state-chip-list is-muted"></div>
+                </article>
+                <article class="dialogue-state-card">
+                  <span>局势张力</span>
+                  <p id="dialogue-state-tension">这一拍的情绪和冲突会收在这里。</p>
+                </article>
+                <article class="dialogue-state-card">
+                  <span>角色快照</span>
+                  <div id="dialogue-state-characters" class="dialogue-state-mini-list"></div>
+                </article>
+                <article class="dialogue-state-card">
+                  <span>关系漂移</span>
+                  <div id="dialogue-state-relations" class="dialogue-state-mini-list"></div>
+                </article>
+                <article class="dialogue-state-card">
+                  <span>最近波动</span>
+                  <div id="dialogue-state-events" class="dialogue-state-mini-list"></div>
+                </article>
+              </div>
+            </section>
             <div class="dialogue-memory-grid">
               <article class="dialogue-memory-card">
                 <span>场景回顾</span>
diff --git a/src/web/static/js/dialogue.js b/src/web/static/js/dialogue.js
index ec0785c..467f3c5 100644
--- a/src/web/static/js/dialogue.js
+++ b/src/web/static/js/dialogue.js
@@ -209,6 +209,226 @@ function buildDialogueMemorySnapshot(session) {
   };
 }
 
+function renderDialogueStatePills(root, items) { // Rebuild the pill row: one <span> per item whose text is non-blank.
+  if (!root) return;
+  root.innerHTML = "";
+  for (const pill of Array.isArray(items) ? items : []) {
+    const label = String(pill?.text || "").trim();
+    if (!label) continue; // blank entries produce no pill
+    const node = document.createElement("span");
+    node.className = pill?.faint ? "dialogue-state-pill is-faint" : "dialogue-state-pill";
+    node.textContent = label;
+    root.appendChild(node);
+  }
+}
+
+function renderDialogueStateChipList(root, items, emptyText = "暂时还没有明显变化。") { // Rebuild a chip list; shows one faint chip with emptyText when no truthy items remain.
+  if (!root) return;
+  root.innerHTML = "";
+  const addChip = (label, className) => {
+    const node = document.createElement("span");
+    node.className = className;
+    node.textContent = label;
+    root.appendChild(node);
+  };
+  const names = Array.isArray(items) ? items.filter(Boolean) : [];
+  if (names.length === 0) {
+    addChip(emptyText, "dialogue-state-chip is-faint");
+    return;
+  }
+  for (const name of names) {
+    addChip(String(name || "").trim(), "dialogue-state-chip");
+  }
+}
+
+function renderDialogueStateMiniList(root, items, emptyText = "这一栏还没有收出明显变化。") { // Rebuild a title/copy list; an empty list renders a single copy-only entry with emptyText.
+  if (!root) return;
+  root.innerHTML = "";
+  const appendEntry = (heading, body) => {
+    const entry = document.createElement("div");
+    entry.className = "dialogue-state-mini-item";
+    if (heading !== null) { // the empty-state entry has no <strong> heading
+      const headingNode = document.createElement("strong");
+      headingNode.textContent = heading;
+      entry.appendChild(headingNode);
+    }
+    const bodyNode = document.createElement("p");
+    bodyNode.textContent = body;
+    entry.appendChild(bodyNode);
+    root.appendChild(entry);
+  };
+  const entries = Array.isArray(items) ? items.filter(Boolean) : [];
+  if (entries.length === 0) {
+    appendEntry(null, emptyText);
+    return;
+  }
+  for (const row of entries) {
+    appendEntry(String(row?.title || "").trim() || "未命名", String(row?.copy || "").trim() || emptyText);
+  }
+}
+
+function buildDialogueStateSnapshot(session) { // Normalize a session payload into the view model read by the state panel and the status line.
+  const overview = session?.runtime_state_overview || null;
+  if (overview && typeof overview === "object") { // a payload-supplied overview is used directly; the client-side derivation below is skipped
+    return {
+      present: Array.isArray(overview.present) ? overview.present.filter(Boolean) : [],
+      offstage: Array.isArray(overview.offstage) ? overview.offstage.filter(Boolean) : [],
+      pills: Array.isArray(overview.pills) ? overview.pills.filter((item) => String(item?.text || "").trim()) : [],
+      tension: trimInlineMessage(String(overview.tension || "").trim()) || "这一拍的情绪和冲突会收在这里。",
+      characterRows: Array.isArray(overview.character_rows) ? overview.character_rows : [],
+      relationRows: Array.isArray(overview.relation_rows) ? overview.relation_rows : [],
+      eventRows: Array.isArray(overview.event_rows) ? overview.event_rows : [],
+      statusLine: trimInlineMessage(String(overview.status_line || "").trim()),
+      nextHint: trimInlineMessage(String(overview.next_hint || "").trim()),
+    };
+  }
+  const state = session?.state || {};
+  const scene = state?.scene || {};
+  const presence = state?.presence || {};
+  const progression = state?.progression || {};
+  const progress = session?.scene_progress || {}; // projected view is read first; the state groups above are the fallback
+  const present = Array.isArray(progress?.present_participants) ? progress.present_participants : (presence?.present_participants || []);
+  const offstage = Array.isArray(progress?.offstage_participants) ? progress.offstage_participants : (presence?.offstage_participants || []);
+  const location = String(progress?.location || scene?.location || "").trim();
+  const timeHint = String(progress?.time_hint || scene?.time_hint || "").trim();
+  const atmosphere = trimInlineMessage(String(progress?.atmosphere_summary || scene?.atmosphere_summary || "").trim());
+  const beatMaturity = Number(progress?.beat_maturity || progression?.beat_maturity || 0) || 0;
+  const canShift = Boolean(progress?.should_offer_scene_shift ?? progression?.should_offer_scene_shift);
+  const shiftReason = trimInlineMessage(String(progress?.scene_shift_reason || progression?.scene_shift_reason || "").trim());
+  const tension = trimInlineMessage(
+    String(progress?.world_tension_summary || progression?.world_tension_summary || session?.session_memory_summary?.world || "").trim()
+  ) || "这一拍的情绪和冲突会收在这里。";
+  const characterSnapshots = session?.character_snapshots || state?.characters?.snapshots || {};
+  const relationDelta = session?.relation_delta || state?.relations?.delta || {};
+
+  const pills = [];
+  if (location) pills.push({ text: `地点 · ${location}` });
+  if (timeHint) pills.push({ text: `时间 · ${timeHint}` });
+  if (atmosphere) pills.push({ text: `氛围 · ${atmosphere}` });
+  if (beatMaturity > 0) pills.push({ text: `推进 ${Math.max(0, Math.min(100, Math.round(beatMaturity)))}/100` });
+  if (canShift) pills.push({ text: shiftReason ? `可转场 · ${shiftReason}` : "这一拍可以顺势转场" });
+
+  const characterRows = Object.entries(characterSnapshots)
+    .map(([name, snapshot]) => {
+      const item = snapshot || {};
+      const parts = [];
+      const presentState = String(item?.present_state || "").trim();
+      if (presentState === "onstage") parts.push("在场");
+      if (presentState === "offstage") parts.push("离场");
+      if (item?.mood) parts.push(String(item.mood).trim());
+      if (item?.interaction_state) parts.push(String(item.interaction_state).trim());
+      if (item?.focus) parts.push(`看向 ${String(item.focus).trim()}`);
+      if (item?.scene_location && String(item.scene_location).trim() !== location) {
+        parts.push(String(item.scene_location).trim());
+      }
+      return {
+        title: String(name || "").trim(),
+        copy: parts.filter(Boolean).join(" · "),
+        weight: presentState === "onstage" ? 0 : 1,
+      };
+    })
+    .filter((item) => item.title)
+    .sort((left, right) => {
+      if (left.weight !== right.weight) return left.weight - right.weight;
+      return left.title.localeCompare(right.title, "zh-Hans-CN");
+    })
+    .slice(0, 4) // at most four rows, on-stage characters sorted first
+    .map(({ title, copy }) => ({ title, copy: copy || "这一拍还没有额外漂移。" }));
+
+  const relationRows = Object.entries(relationDelta)
+    .map(([pairKey, delta]) => {
+      const item = delta || {};
+      const metrics = [];
+      [["trust", "信任"], ["affection", "好感"], ["hostility", "敌意"], ["ambiguity", "摇摆"]].forEach(([field, label]) => {
+        const value = Number(item?.[field] || 0) || 0;
+        if (!value) return;
+        metrics.push(`${label}${value > 0 ? "+" : ""}${value}`);
+      });
+      const lastEvent = trimInlineMessage(String(item?.last_event || "").trim());
+      return {
+        title: String(pairKey || "").trim().replace(/_/g, " · "),
+        copy: metrics.length ? `${metrics.join(" / ")}${lastEvent ? ` · ${lastEvent}` : ""}` : (lastEvent || "这组关系本局有变化。"),
+      };
+    })
+    .filter((item) => item.title)
+    .slice(0, 3); // at most three relation rows
+
+  const eventKindLabel = {
+    scene_transition: "转场",
+    cast_enter: "入场",
+    cast_exit: "离场",
+    atmosphere_shift: "气氛变化",
+    time_change: "时间推进",
+    environment_change: "环境变化",
+    beat_complete: "一拍收束",
+    relationship_shift: "关系变化",
+    micro_action: "细微动作",
+  };
+  return {
+    present: Array.isArray(present) ? present.filter(Boolean) : [],
+    offstage: Array.isArray(offstage) ? offstage.filter(Boolean) : [],
+    pills,
+    tension,
+    characterRows,
+    relationRows,
+    eventRows: [session?.event_signals?.recent, state?.signals?.recent] // projected view first, then the state group, like snapshots and deltas above
+      .find((rows) => Array.isArray(rows))?.slice(-4).map((item) => ({
+          title: [
+            eventKindLabel[String(item?.kind || "").trim()] || String(item?.kind || "").trim(),
+            String(item?.actor || "").trim(),
+            String(item?.target || "").trim(),
+          ].filter(Boolean).join(" · ") || "事件",
+          copy: trimInlineMessage(String(item?.cue || "").trim()) || "这一拍有了新波动。",
+        }))
+      || [],
+    statusLine: "",
+    nextHint: "",
+  };
+}
+
+function renderDialogueStateOverview(session) { // Show or hide the #dialogue-state-overview panel and fill its sub-lists from the session snapshot.
+  const root = el("dialogue-state-overview");
+  if (!root || !session) return;
+  const snapshot = buildDialogueStateSnapshot(session);
+  const tensionPlaceholder = "这一拍的情绪和冲突会收在这里。"; // the text buildDialogueStateSnapshot substitutes when no tension summary exists
+  const hasTension = Boolean(snapshot.tension) && snapshot.tension !== tensionPlaceholder; // the placeholder alone must not count as content, or the panel could never hide
+  const hasContent = Boolean(snapshot.pills.length || snapshot.present.length || snapshot.offstage.length || snapshot.characterRows.length || snapshot.relationRows.length || snapshot.eventRows?.length || hasTension);
+  root.classList.toggle("hidden", !hasContent);
+  if (!hasContent) return;
+  renderDialogueStatePills(el("dialogue-state-pills"), snapshot.pills);
+  renderDialogueStateChipList(el("dialogue-state-present"), snapshot.present, "这会儿还没有明确在场名单。");
+  renderDialogueStateChipList(el("dialogue-state-offstage"), snapshot.offstage, "暂时没人明确离场。");
+  setText("dialogue-state-tension", snapshot.tension, "这一拍的情绪和冲突会收在这里。");
+  renderDialogueStateMiniList(el("dialogue-state-characters"), snapshot.characterRows, "角色快照会在聊出状态差后收进来。");
+  renderDialogueStateMiniList(el("dialogue-state-relations"), snapshot.relationRows, "关系要聊出明显变化，才会在这里留下痕迹。");
+  renderDialogueStateMiniList(el("dialogue-state-events"), snapshot.eventRows || [], "最近还没有收出更明确的事件波动。");
+}
+
+function buildDialogueSessionStatusLine(session) { // One-line status: the snapshot's own statusLine if set, else pills / present / offstage / tension joined by " ｜ ".
+  const { statusLine, pills, present, offstage, tension } = buildDialogueStateSnapshot(session);
+  if (statusLine) return statusLine;
+  const listOf = (value) => (Array.isArray(value) ? value : []);
+  const pillLabels = listOf(pills)
+    .map((pill) => String(pill?.text || "").trim()).filter(Boolean);
+  const onstage = listOf(present);
+  const away = listOf(offstage);
+  const tensionText = trimInlineMessage(tension || "");
+  const segments = [];
+  if (pillLabels.length > 0) {
+    segments.push(pillLabels.slice(0, 3).join(" · "));
+  }
+  if (onstage.length > 0) {
+    segments.push(`在场：${onstage.slice(0, 3).join("、")}`);
+  }
+  if (away.length > 0) {
+    segments.push(`离场：${away.slice(0, 2).join("、")}`);
+  }
+  if (tensionText) {
+    segments.push(`张力：${tensionText}`);
+  }
+  return segments.filter(Boolean).join(" ｜ ");
+}
+
 function renderDialogueMemory(session) {
   const root = el("dialogue-memory");
   if (!root) return;
@@ -245,6 +465,7 @@ function renderDialogueMemory(session) {
   if (body) {
     body.classList.toggle("hidden", body.parentElement === root);
   }
+  renderDialogueStateOverview(session);
   renderDialogueSceneTimeline(session);
   if (typeof window.renderDialogueSceneSwitcher === "function") {
     window.renderDialogueSceneSwitcher(session);
@@ -339,6 +560,7 @@ function buildDialogueMemoryClipboardText(session) {
     `【本局记忆】`,
     `模式：${snapshot.modeLabel}`,
     `同席：${participantText}`,
+    `本局状态：${buildDialogueStateSnapshot(session).pills.map((item) => item.text).join(" / ") || "暂无"}`,
     `场景回顾：${snapshot.recap}`,
     `人物动向：${snapshot.cast}`,
     `关系变化：${snapshot.relation}`,
@@ -646,7 +868,11 @@ async function renderDialogueSession(session) {
   if (typeof renderObserveQuickReplies === "function") {
     renderObserveQuickReplies(session);
   }
+  const statusLine = buildDialogueSessionStatusLine(session);
   setSessionBadge("对话中");
+  if (typeof setStatus === "function") {
+    setStatus("dialogue-session-status", statusLine || "这一幕已经铺好，你可以继续说下去。");
+  }
   renderDialogueMemory(session);
   renderDialogueTranscript(session);
   await loadRecentSessions();
diff --git a/src/web/static/styles/dialogue.css b/src/web/static/styles/dialogue.css
index eca6503..5fcb210 100644
--- a/src/web/static/styles/dialogue.css
+++ b/src/web/static/styles/dialogue.css
@@ -225,6 +225,125 @@
   line-height: 1.5;
 }
 
+.dialogue-state-overview { /* outer card of the dialogue state overview */
+  display: grid;
+  gap: 0.5rem;
+  padding: 0.76rem 0.82rem;
+  border-radius: 14px;
+  border: 1px solid rgba(170, 146, 127, 0.12);
+  background:
+    linear-gradient(180deg, rgba(255, 252, 248, 0.82), rgba(255, 248, 242, 0.7));
+}
+
+.dialogue-state-overview-head {
+  display: grid;
+  gap: 0.14rem;
+}
+
+.dialogue-state-overview-head strong {
+  color: var(--ink);
+  font-size: 0.75rem;
+  line-height: 1.4;
+}
+
+.dialogue-state-overview-head small {
+  color: var(--ink-faint);
+  font-size: 0.67rem;
+  line-height: 1.5;
+}
+
+.dialogue-state-pills {
+  display: flex;
+  flex-wrap: wrap;
+  gap: 0.34rem;
+}
+
+.dialogue-state-pill, /* pills and chips share one capsule style */
+.dialogue-state-chip {
+  display: inline-flex;
+  align-items: center;
+  min-height: 1.45rem;
+  padding: 0 0.56rem;
+  border-radius: 999px;
+  background: rgba(184, 132, 113, 0.1);
+  color: var(--accent-strong);
+  font-size: 0.64rem;
+  line-height: 1.35;
+}
+
+.dialogue-state-pill.is-faint, /* muted variant: greyer background and faint ink */
+.dialogue-state-chip.is-faint {
+  background: rgba(122, 104, 90, 0.08);
+  color: var(--ink-faint);
+}
+
+.dialogue-state-grid { /* two equal columns; minmax(0, 1fr) lets columns shrink below content width */
+  display: grid;
+  grid-template-columns: repeat(2, minmax(0, 1fr));
+  gap: 0.46rem;
+}
+
+.dialogue-state-card {
+  display: grid;
+  gap: 0.3rem;
+  padding: 0.62rem 0.7rem;
+  border-radius: 12px;
+  border: 1px solid rgba(170, 146, 127, 0.1);
+  background: rgba(255, 255, 255, 0.62);
+  min-height: 0;
+}
+
+.dialogue-state-card span {
+  color: var(--ink-soft);
+  font-size: 0.67rem;
+  line-height: 1.35;
+}
+
+.dialogue-state-card p {
+  margin: 0;
+  color: var(--ink);
+  font-size: 0.72rem;
+  line-height: 1.58;
+}
+
+.dialogue-state-chip-list {
+  display: flex;
+  flex-wrap: wrap;
+  gap: 0.32rem;
+}
+
+.dialogue-state-chip-list.is-muted .dialogue-state-chip { /* same colours as .is-faint, applied to every chip in a muted list */
+  background: rgba(122, 104, 90, 0.08);
+  color: var(--ink-faint);
+}
+
+.dialogue-state-mini-list {
+  display: grid;
+  gap: 0.34rem;
+}
+
+.dialogue-state-mini-item {
+  display: grid;
+  gap: 0.08rem;
+  padding: 0.46rem 0.52rem;
+  border-radius: 10px;
+  background: rgba(255, 250, 246, 0.86);
+  border: 1px solid rgba(170, 146, 127, 0.08);
+}
+
+.dialogue-state-mini-item strong {
+  color: var(--ink);
+  font-size: 0.68rem;
+  line-height: 1.42;
+}
+
+.dialogue-state-mini-item p {
+  margin: 0;
+  color: var(--ink-faint);
+  font-size: 0.65rem;
+  line-height: 1.5;
+}
+
 .dialogue-scene-timeline-list {
   display: grid;
   gap: 0.38rem;
diff --git a/src/web/static/styles/responsive.css b/src/web/static/styles/responsive.css
index 7197dbd..97b9df0 100644
--- a/src/web/static/styles/responsive.css
+++ b/src/web/static/styles/responsive.css
@@ -136,10 +136,18 @@
     grid-template-columns: 1fr;
   }
 
+  .dialogue-memory-modal-scroll .dialogue-state-grid {
+    grid-template-columns: 1fr;
+  }
+
   .dialogue-memory-grid {
     grid-template-columns: 1fr;
   }
 
+  .dialogue-state-grid {
+    grid-template-columns: 1fr;
+  }
+
   .chat-detail {
     min-height: 20rem;
   }

From 38786083163841d29a354ae7cc062d65985dc74b Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 13:01:03 +0800
Subject: [PATCH 03/11] feat: drive observe quick actions from runtime state

---
 src/web/static/fragments/main-shell.html |   4 +
 src/web/static/js/composer-vue-island.js |  14 ++++
 src/web/static/js/main.js                | 102 ++++++++++++++++++++++-
 src/web/static/styles/dialogue.css       |  24 ++++++
 4 files changed, 142 insertions(+), 2 deletions(-)

diff --git a/src/web/static/fragments/main-shell.html b/src/web/static/fragments/main-shell.html
index ea78147..b8003df 100644
--- a/src/web/static/fragments/main-shell.html
+++ b/src/web/static/fragments/main-shell.html
@@ -110,6 +110,10 @@
     <div class="composer-card">
       <div id="composer-vue-root" class="composer-vue-root hidden"></div>
       <div id="observe-quick-replies" class="quick-reply-row hidden"></div>
+      <div id="observe-quick-hint-row" class="observe-quick-hint-row hidden">
+        <p id="observe-quick-hint" class="observe-quick-hint hidden"></p>
+        <button id="observe-quick-hint-send" type="button" class="soft-button hidden">按提示推进</button>
+      </div>
       <div class="composer-main">
         <div id="dialogue-message-kind" class="composer-kind-toggle" role="group" aria-label="输入类型">
           <button type="button" class="kind-chip active" data-kind="dialogue">台词</button>
diff --git a/src/web/static/js/composer-vue-island.js b/src/web/static/js/composer-vue-island.js
index be1ea41..791016e 100644
--- a/src/web/static/js/composer-vue-island.js
+++ b/src/web/static/js/composer-vue-island.js
@@ -58,6 +58,7 @@
       );
       const placeholder = computed(() => String(composer.value.placeholder || ""));
       const quickReplies = computed(() => (Array.isArray(composer.value.quickReplies) ? composer.value.quickReplies : []));
+      const quickHint = computed(() => String(composer.value.quickHint || "").trim());
       const disabled = computed(() => Boolean(composer.value.disabled));
       const suggestHidden = computed(() => Boolean(composer.value.suggestHidden) || mode.value === "observe");
       const suggestDisabled = computed(() => Boolean(composer.value.suggestDisabled));
@@ -114,6 +115,7 @@
         draftKind,
         handleEnter,
         placeholder,
+        quickHint,
         quickReplies,
         quickReply,
         send,
@@ -140,6 +142,18 @@
           </button>
         </div>
 
+        <div v-if="quickHint" class="observe-quick-hint-row">
+          <p class="observe-quick-hint">顺手往下推：{{ quickHint }}</p>
+          <button
+            type="button"
+            class="soft-button"
+            :disabled="disabled"
+            @click="quickReply(quickHint)"
+          >
+            按提示推进
+          </button>
+        </div>
+
         <div class="composer-main composer-main-vue">
           <div class="composer-kind-toggle" role="group" aria-label="输入类型">
             <button
diff --git a/src/web/static/js/main.js b/src/web/static/js/main.js
index d79b9c9..f3092d4 100644
--- a/src/web/static/js/main.js
+++ b/src/web/static/js/main.js
@@ -2289,11 +2289,68 @@ const OBSERVE_QUICK_REPLIES = [
 ];
 let currentDialogueMessageKind = "dialogue";
 
+function buildObserveQuickReplies(session = currentDialogueSession) { // Build up to six quick replies: state-driven ones first, then the static OBSERVE_QUICK_REPLIES.
+  const overview = session?.runtime_state_overview || {};
+  const present = Array.isArray(overview?.present) ? overview.present.filter(Boolean) : [];
+  const offstage = Array.isArray(overview?.offstage) ? overview.offstage.filter(Boolean) : [];
+  const shouldShift = Boolean(overview?.should_offer_scene_shift);
+  const nextHint = String(overview?.next_hint || "").trim();
+  const tension = String(overview?.tension || "").trim();
+  const eventRows = Array.isArray(overview?.event_rows) ? overview.event_rows : [];
+  const dynamic = []; // push order below decides which entries survive the final six-item cap
+
+  if (shouldShift) {
+    dynamic.push({
+      label: "转下一幕",
+      value: nextHint || "这一拍差不多收住了，场面顺势往下一幕转过去。", // fall back to a stock line when there is no next_hint
+    });
+  }
+  if (offstage.length) {
+    dynamic.push({
+      label: `切回${String(offstage[0]).slice(0, 4)}`, // label uses only the first four characters of the name
+      value: `${offstage[0]}那边也有了新的动静，镜头顺势切过去。`,
+    });
+  }
+  if (present.length >= 2) {
+    dynamic.push({
+      label: "只留他们",
+      value: `旁的人都暂时退开，只剩${present.slice(0, 2).join("和")}把这句话接下去。`,
+    });
+  }
+  if (tension) {
+    dynamic.push({
+      label: "顺着张力",
+      value: "这股气氛没有散，反而又往前逼近了一步。", // fixed text; the tension string only gates this entry
+    });
+  }
+  const lastEvent = eventRows.length ? eventRows[eventRows.length - 1] : null;
+  if (lastEvent?.copy) {
+    dynamic.push({
+      label: "顺着波动",
+      value: String(lastEvent.copy || "").trim(),
+    });
+  }
+
+  const merged = [];
+  const seen = new Set();
+  [...dynamic, ...OBSERVE_QUICK_REPLIES].forEach((item) => {
+    const label = String(item?.label || "").trim();
+    const value = String(item?.value || "").trim();
+    if (!label || !value) return; // drop entries missing either part
+    const key = `${label}::${value}`; // dedupe on the label+value pair, so equal labels with different values both stay
+    if (seen.has(key)) return;
+    seen.add(key);
+    merged.push({ label, value });
+  });
+  return merged.slice(0, 6);
+}
+
 function buildComposerUiState() {
   const area = el("dialogue-message");
   const sendButton = el("prepare-turn-button");
   const suggestButton = el("suggest-turn-button");
   const mode = currentDialogueSession?.mode || currentDialogueSession?.session_card?.mode || "";
+  const nextHint = mode === "observe" ? String(currentDialogueSession?.runtime_state_overview?.next_hint || "").trim() : "";
   return {
     mode,
     kind: normalizeDialogueMessageKind(currentDialogueMessageKind),
@@ -2303,7 +2360,8 @@ function buildComposerUiState() {
     suggestHidden: Boolean(suggestButton?.classList.contains("hidden")),
     suggestDisabled: Boolean(suggestButton?.disabled),
     sendDisabled: Boolean(sendButton?.disabled),
-    quickReplies: mode === "observe" ? OBSERVE_QUICK_REPLIES : [],
+    quickReplies: mode === "observe" ? buildObserveQuickReplies(currentDialogueSession) : [],
+    quickHint: nextHint,
   };
 }
 
@@ -2406,17 +2464,29 @@ function setSuggestingState(waiting) {
 
 function renderObserveQuickReplies(session = currentDialogueSession) {
   const root = el("observe-quick-replies");
+  const hint = el("observe-quick-hint");
+  const hintRow = el("observe-quick-hint-row");
+  const hintSend = el("observe-quick-hint-send");
   if (!root) return;
   const mode = session?.mode || session?.session_card?.mode || "";
   if (mode !== "observe") {
     root.innerHTML = "";
     root.classList.add("hidden");
+    if (hintRow) hintRow.classList.add("hidden");
+    if (hint) {
+      hint.textContent = "";
+      hint.classList.add("hidden");
+    }
+    if (hintSend) {
+      hintSend.classList.add("hidden");
+      hintSend.removeAttribute("data-value");
+    }
     publishComposerUiState("composer-quick-replies-hidden");
     return;
   }
 
   root.innerHTML = "";
-  OBSERVE_QUICK_REPLIES.forEach((item) => {
+  buildObserveQuickReplies(session).forEach((item) => {
     const button = document.createElement("button");
     button.type = "button";
     button.className = "quick-reply-chip";
@@ -2428,9 +2498,32 @@ function renderObserveQuickReplies(session = currentDialogueSession) {
     root.appendChild(button);
   });
   root.classList.remove("hidden");
+  const nextHint = String(session?.runtime_state_overview?.next_hint || "").trim();
+  if (hint) {
+    hint.textContent = nextHint ? `顺手往下推：${nextHint}` : "";
+    hint.classList.toggle("hidden", !nextHint);
+  }
+  if (hintSend) {
+    hintSend.classList.toggle("hidden", !nextHint);
+    if (nextHint) {
+      hintSend.setAttribute("data-value", nextHint);
+    } else {
+      hintSend.removeAttribute("data-value");
+    }
+  }
+  if (hintRow) {
+    hintRow.classList.toggle("hidden", !nextHint);
+  }
   publishComposerUiState("composer-quick-replies-rendered");
 }
 
+async function applyQuickHint() { // Send the hint stored on the hint button through applyQuickReply.
+  const button = el("observe-quick-hint-send");
+  const value = String(button?.getAttribute("data-value") || "").trim(); // data-value is set by renderObserveQuickReplies when a next_hint exists
+  if (!value) return; // nothing stored (or button missing): do nothing
+  await applyQuickReply(value);
+}
+
 async function applyQuickReply(value) {
   const message = String(value || "").trim();
   const area = el("dialogue-message");
@@ -2807,6 +2900,11 @@ function bindEvents() {
       window.toggleDialogueMemory();
     }
   });
+  bind("observe-quick-hint-send", "click", () => {
+    applyQuickHint().catch((error) => {
+      setStatus("dialogue-session-status", error.message || "这句推进提示暂时没有送出去。");
+    });
+  });
   bind("close-dialogue-memory-modal-button", "click", () => {
     if (typeof window.closeDialogueMemoryModal === "function") {
       window.closeDialogueMemoryModal();
diff --git a/src/web/static/styles/dialogue.css b/src/web/static/styles/dialogue.css
index 5fcb210..7093407 100644
--- a/src/web/static/styles/dialogue.css
+++ b/src/web/static/styles/dialogue.css
@@ -822,6 +822,30 @@
   display: none;
 }
 
+.observe-quick-hint-row { /* one row: hint text on the left, action button on the right */
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 0.6rem;
+  padding: 0 10px 8px;
+}
+
+.observe-quick-hint {
+  margin: 0;
+  color: var(--ink-faint);
+  font-size: 0.68rem;
+  line-height: 1.55;
+  flex: 1 1 auto;
+  min-width: 0; /* lets the flex item shrink below its content width instead of overflowing the row */
+}
+
+#observe-quick-hint-send { /* button keeps its own size: no grow, no shrink */
+  min-height: 1.6rem;
+  padding: 0 0.56rem;
+  font-size: 0.65rem;
+  flex: 0 0 auto;
+}
+
 .session-group {
   display: grid;
   gap: 0.55rem;

From 8235d781867fd3e975f4407f99d5f2b3b2f2295f Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 13:09:04 +0800
Subject: [PATCH 04/11] feat: make scene recommendations state-aware

---
 src/web/service_facades/scene_cards.py | 163 ++++++++++++++++++++-
 tests/test_web_app.py                  | 191 +++++++++++++++++++++++++
 2 files changed, 349 insertions(+), 5 deletions(-)

diff --git a/src/web/service_facades/scene_cards.py b/src/web/service_facades/scene_cards.py
index 7b625db..33bfea0 100644
--- a/src/web/service_facades/scene_cards.py
+++ b/src/web/service_facades/scene_cards.py
@@ -82,6 +82,8 @@ def recommend_dialogue_scene_card(self, run_id: str, *, session_id: str) -> dict
         mode = str(session.get("mode", "") or session.get("session_card", {}).get("mode", "observe")).strip() or "observe"
         participants = list(session.get("session_card", {}).get("participants", []) or [])
         current_scene = dict(session.get("session_card", {}).get("scene_card", {}) or {})
+        runtime_overview = dict(session.get("runtime_state_overview", {}) or {})
+        current_scene_snapshot = _merge_current_scene_snapshot(current_scene, runtime_overview)
         current_scene_id = str(session.get("session_card", {}).get("scene_card_id", "")).strip()
         recent_text = "\n".join(
             str(item.get("message", "")).strip()
@@ -101,7 +103,7 @@ def recommend_dialogue_scene_card(self, run_id: str, *, session_id: str) -> dict
                 score -= 5
                 reasons.insert(0, "当前已经在这幕里，优先换一拍")
             else:
-                current_location = str(current_scene.get("location", "")).strip()
+                current_location = str(current_scene_snapshot.get("location", "")).strip()
                 candidate_location = str(fields.get("location", "")).strip()
                 if current_location and candidate_location and candidate_location != current_location:
                     score += 1
@@ -112,6 +114,16 @@ def recommend_dialogue_scene_card(self, run_id: str, *, session_id: str) -> dict
                     score += overlap
                     reasons.append("和最近这几句的气口更接")
 
+                state_bonus, state_reasons = _score_scene_card_with_runtime_state(
+                    fields,
+                    runtime_overview=runtime_overview,
+                    current_scene=current_scene_snapshot,
+                    participants=participants,
+                    recent_text=recent_text,
+                )
+                score += state_bonus
+                reasons.extend(state_reasons)
+
             reranked_items.append(
                 {
                     **item,
@@ -133,10 +145,11 @@ def recommend_dialogue_scene_card(self, run_id: str, *, session_id: str) -> dict
         recommended_card_id = str(reranked_items[0].get("card_id", "")).strip() if reranked_items else ""
         top_fields = dict(reranked_items[0].get("fields", {}) or {}) if reranked_items else {}
         chain_suggestions = _build_scene_chain_suggestions(
-            current_scene=current_scene,
+            current_scene=current_scene_snapshot,
             current_scene_id=current_scene_id,
             reranked_items=reranked_items,
             recent_text=recent_text,
+            runtime_overview=runtime_overview,
         )
         return {
             "mode": mode,
@@ -144,15 +157,27 @@ def recommend_dialogue_scene_card(self, run_id: str, *, session_id: str) -> dict
             "current_scene_card_id": current_scene_id,
             "recommended_card_id": recommended_card_id,
             "recommended_transition_message": _build_transition_message_hint(
-                current_scene=current_scene,
+                current_scene=current_scene_snapshot,
                 next_scene=top_fields,
                 recent_text=recent_text,
+                runtime_overview=runtime_overview,
             ),
             "chain_suggestions": chain_suggestions,
             "items": reranked_items,
         }
 
 
+def _merge_current_scene_snapshot(current_scene: dict[str, Any], runtime_overview: dict[str, Any]) -> dict[str, Any]:
+    """Return a copy of the scene card with non-blank runtime location/time_hint/atmosphere laid over it."""
+    snapshot = dict(current_scene or {})
+    for field_name in ("location", "time_hint", "atmosphere"):
+        # A blank runtime value never erases what the scene card already holds.
+        live_value = str(runtime_overview.get(field_name, "")).strip()
+        if live_value:
+            snapshot[field_name] = live_value
+    return snapshot
+
+
 def _scene_text_overlap_score(fields: dict[str, Any], recent_text: str) -> int:
     compact_recent = str(recent_text or "").strip()
     if not compact_recent:
@@ -170,17 +195,117 @@ def _scene_text_overlap_score(fields: dict[str, Any], recent_text: str) -> int:
     return min(3, overlap)
 
 
+def _score_scene_card_with_runtime_state(  # Score one candidate scene card against the session's runtime overview; returns (bonus, reasons).
+    fields: dict[str, Any],
+    *,
+    runtime_overview: dict[str, Any],
+    current_scene: dict[str, Any],
+    participants: list[str],
+    recent_text: str,
+) -> tuple[int, list[str]]:
+    score = 0
+    reasons: list[str] = []
+    current_location = str(current_scene.get("location", "")).strip()
+    candidate_location = str(fields.get("location", "")).strip()
+    current_time = str(runtime_overview.get("time_hint", "") or current_scene.get("time_hint", "")).strip()  # runtime value wins, scene card is the fallback
+    candidate_time = str(fields.get("time_hint", "")).strip()
+    beat_maturity = max(0, min(100, int(runtime_overview.get("beat_maturity", 0) or 0)))  # clamped to 0..100
+    should_shift = bool(runtime_overview.get("should_offer_scene_shift", False))
+    shift_reason = str(runtime_overview.get("scene_shift_reason", "")).strip()
+    tension = str(runtime_overview.get("tension", "")).strip()
+    next_hint = str(runtime_overview.get("next_hint", "")).strip()
+    atmosphere = str(runtime_overview.get("atmosphere", "")).strip()
+    event_rows = list(runtime_overview.get("event_rows", []) or [])
+    recent_event = str((event_rows[-1] or {}).get("copy", "")).strip() if event_rows else ""  # assumes each row is a dict (or falsy) -- TODO confirm
+
+    if should_shift:  # shift offered: reward a new location, penalise staying put
+        if current_location and candidate_location and candidate_location != current_location:
+            score += 4
+            reasons.append("这一拍已接近收束，更适合换场推进")
+        elif current_location and candidate_location and candidate_location == current_location:
+            score -= 2
+            reasons.append("这一拍已经该收住了，不必继续原地打转")
+        elif candidate_location:  # reached only when the current location is blank
+            score += 1
+            reasons.append("当前已经适合往下一拍走")
+    elif beat_maturity and beat_maturity < 45 and current_location and candidate_location == current_location:  # a maturity of 0 never triggers this same-location bonus
+        score += 2
+        reasons.append("这一拍还没聊满，先在同场景续火更顺")
+
+    if current_time and candidate_time:
+        if candidate_time == current_time:
+            score += 1
+            reasons.append("时间承接自然")
+        elif should_shift or beat_maturity >= 55:  # a time jump only scores when a shift is offered or maturity is at least 55
+            score += 2
+            reasons.append("时间推进能带出下一拍")
+
+    state_overlap = _state_overlap_score(
+        fields,
+        state_texts=[atmosphere, tension, next_hint, recent_event, recent_text],
+    )
+    if state_overlap:
+        score += state_overlap
+        reasons.append("能接住本局气氛和悬念")
+
+    if len(participants) >= 3 and candidate_location and any(token in candidate_location for token in ("厅", "堂", "席", "园", "院")):  # three or more participants and a location name containing one of these characters
+        score += 1
+        reasons.append("多人局切到这个场面更容易铺开")
+
+    if shift_reason:
+        shift_tokens = [part for part in re.split(r"[，,。；;、：:\s]+", shift_reason) if 2 <= len(part.strip()) <= 8]  # clauses of 2-8 characters
+        if any(token and token in "\n".join(str(fields.get(key, "")).strip() for key in ("opening_situation", "scene_drive", "hidden_tension")) for token in shift_tokens[:4]):  # only the first four clauses are tried
+            score += 2
+            reasons.append("和当前这拍的收束理由接得上")
+
+    return score, reasons
+
+
+def _state_overlap_score(fields: dict[str, Any], *, state_texts: list[str]) -> int:  # Count scene-card phrases that reappear in the runtime state texts; the result is capped at 4.
+    compact_state = "\n".join(cleaned for cleaned in (str("" if text is None else text).strip() for text in state_texts) if cleaned)  # coerce once before stripping so a None/non-str entry can no longer pass the filter and then raise AttributeError
+    if not compact_state:
+        return 0
+    phrases: list[str] = []
+    for key in ("atmosphere", "opening_situation", "public_goal", "hidden_tension", "scene_drive"):
+        raw = str(fields.get(key, "")).strip()
+        if not raw:
+            continue
+        for part in re.split(r"[，,。；;、：:\s]+", raw):  # split the field into clauses on CJK/ASCII punctuation and whitespace
+            text = part.strip()
+            if 2 <= len(text) <= 8 and text not in phrases:  # keep distinct clauses of 2-8 characters
+                phrases.append(text)
+    overlap = sum(1 for phrase in phrases[:14] if phrase in compact_state)  # only the first 14 phrases are checked
+    return min(4, overlap)
+
+
 def _build_transition_message_hint(
     *,
     current_scene: dict[str, Any],
     next_scene: dict[str, Any],
     recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
 ) -> str:
+    runtime_overview = dict(runtime_overview or {})
     next_location = str(next_scene.get("location", "")).strip()
     next_title = str(next_scene.get("title", "")).strip()
     next_opening = str(next_scene.get("opening_situation", "")).strip()
     next_atmosphere = str(next_scene.get("atmosphere", "")).strip()
     current_location = str(current_scene.get("location", "")).strip()
+    next_time = str(next_scene.get("time_hint", "")).strip()
+    current_time = str(runtime_overview.get("time_hint", "") or current_scene.get("time_hint", "")).strip()
+    shift_reason = str(runtime_overview.get("scene_shift_reason", "")).strip()
+    tension = str(runtime_overview.get("tension", "")).strip()
+    should_shift = bool(runtime_overview.get("should_offer_scene_shift", False))
+
+    if shift_reason and should_shift and current_location and next_location and current_location != next_location:
+        anchor = next_title or next_location
+        return f"{shift_reason}，场面顺势从{current_location}转到{anchor}。"
+
+    if next_time and current_time and next_time != current_time:
+        destination = next_location or next_title or "下一幕"
+        if tension:
+            return f"带着这股{_trim_transition_text(tension, 18)}，时间已经推到{next_time}，场面也转进了{destination}。"
+        return f"这一拍不知不觉拖到了{next_time}，场面也顺势转进了{destination}。"
 
     if next_opening:
         first_sentence = re.split(r"[。！？!?]", next_opening, maxsplit=1)[0].strip()
@@ -194,6 +319,8 @@ def _build_transition_message_hint(
         return f"局面一转，众人从{current_location}挪到{anchor}，气氛也跟着变了。"
 
     compact_recent = str(recent_text or "").strip()
+    if tension and next_atmosphere:
+        return f"刚才那股{_trim_transition_text(tension, 18)}还吊着，场面已经慢慢转成了{next_atmosphere}。"
     if compact_recent and next_atmosphere:
         return f"刚才那股{compact_recent[-12:]}的余波还没散，场面已经转成了{next_atmosphere}。"
 
@@ -212,6 +339,7 @@ def _build_scene_chain_suggestions(
     current_scene_id: str,
     reranked_items: list[dict[str, Any]],
     recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
 ) -> list[dict[str, Any]]:
     candidates = [
         item
@@ -224,11 +352,25 @@ def _build_scene_chain_suggestions(
             if second_index == first_index:
                 continue
             chain_items = [first, second]
-            chains.append(_build_chain_payload(current_scene=current_scene, items=chain_items, recent_text=recent_text))
+            chains.append(
+                _build_chain_payload(
+                    current_scene=current_scene,
+                    items=chain_items,
+                    recent_text=recent_text,
+                    runtime_overview=runtime_overview,
+                )
+            )
             for third_index, third in enumerate(candidates):
                 if third_index in {first_index, second_index}:
                     continue
-                chains.append(_build_chain_payload(current_scene=current_scene, items=[first, second, third], recent_text=recent_text))
+                chains.append(
+                    _build_chain_payload(
+                        current_scene=current_scene,
+                        items=[first, second, third],
+                        recent_text=recent_text,
+                        runtime_overview=runtime_overview,
+                    )
+                )
     chains.sort(key=lambda item: (int(item.get("score", 0) or 0), len(item.get("scenes", []) or [])), reverse=True)
     deduped: list[dict[str, Any]] = []
     seen_keys: set[str] = set()
@@ -249,9 +391,11 @@ def _build_chain_payload(
     current_scene: dict[str, Any],
     items: list[dict[str, Any]],
     recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
 ) -> dict[str, Any]:
     scenes: list[dict[str, str]] = []
     previous_scene = dict(current_scene or {})
+    current_runtime = dict(runtime_overview or {})
     total_score = 0
     locations: list[str] = []
     for index, item in enumerate(items):
@@ -272,10 +416,12 @@ def _build_chain_payload(
                     current_scene=previous_scene,
                     next_scene=fields,
                     recent_text=recent_text if index == 0 else str(previous_scene.get("scene_drive", "")).strip(),
+                    runtime_overview=current_runtime if index == 0 else None,
                 ),
             }
         )
         previous_scene = fields
+        current_runtime = {}
     if len(set(locations)) >= 2:
         total_score += 4
     if _chain_has_progressive_drive(scenes):
@@ -309,3 +455,10 @@ def _build_chain_reason(scenes: list[dict[str, str]]) -> str:
         return "每一幕的推进方向都比较明确，适合顺着往下压。"
     first_title = str(scenes[0].get("title", "")).strip() or "这条线"
     return f"可以先接「{first_title}」，后面还有顺势承接的下一拍。"
+
+
+def _trim_transition_text(text: str, limit: int) -> str:
+    """Strip *text*; if it is longer than *limit*, keep max(1, limit - 1) characters and append "…"."""
+    cleaned = str(text or "").strip()
+    kept = max(1, limit - 1)  # at least one character always precedes the ellipsis
+    return cleaned if len(cleaned) <= limit else f"{cleaned[:kept]}…"
diff --git a/tests/test_web_app.py b/tests/test_web_app.py
index ec4c313..0ed3e3e 100644
--- a/tests/test_web_app.py
+++ b/tests/test_web_app.py
@@ -155,6 +155,197 @@ def test_dialogue_scene_card_recommendation_prefers_next_scene_not_current_one(s
             self.assertGreaterEqual(len(payload["chain_suggestions"][0]["scenes"]), 2)
             self.assertTrue(str(payload["chain_suggestions"][0]["reason"]).strip())
 
+    def test_dialogue_scene_card_recommendation_stays_in_same_location_when_beat_is_early(self):  # Early beat with no shift offer: expect the same-location card to be recommended.
+        with tempfile.TemporaryDirectory() as tmp:
+            service = WebRunService(tmp)
+            service.save_model_settings(
+                provider="openai-compatible",
+                model="deepseek-chat",
+                base_url="https://example.com/v1",
+                api_key="sk-test",
+            )
+            current_scene = service.save_scene_card(  # Card the session is created with below.
+                fields={
+                    "title": "雨夜回廊",
+                    "time_hint": "深夜",
+                    "location": "回廊",
+                    "atmosphere": "雨声压着话头",
+                    "opening_situation": "两个人还站在檐下，谁都没把话说透。",
+                    "public_goal": "先试出彼此来意。",
+                    "hidden_tension": "有些旧话一碰就要翻出来。",
+                    "scene_drive": "让试探再压低一层。",
+                    "expected_rhythm": "慢热",
+                    "forbidden_topics": "旧账",
+                }
+            )
+            same_location = service.save_scene_card(  # Candidate whose location value equals the current card's.
+                fields={
+                    "title": "回廊压低声气",
+                    "time_hint": "深夜",
+                    "location": "回廊",
+                    "atmosphere": "静得能听见雨线擦过栏杆",
+                    "opening_situation": "两个人谁也没走，反而把声音压得更低。",
+                    "public_goal": "顺着刚才的话再往里探一步。",
+                    "hidden_tension": "谁先心软谁就先露了底。",
+                    "scene_drive": "让场面继续收紧，不急着换幕。",
+                    "expected_rhythm": "缓慢加压",
+                    "forbidden_topics": "外人",
+                }
+            )
+            service.save_scene_card(  # Competing candidate with a different location value.
+                fields={
+                    "title": "转入花厅",
+                    "time_hint": "夜深",
+                    "location": "花厅",
+                    "atmosphere": "人多却更安静",
+                    "opening_situation": "雨势更大，众人被催着转到花厅落座。",
+                    "public_goal": "先把场面稳住。",
+                    "hidden_tension": "真正要问的话还压在心口。",
+                    "scene_drive": "从试探转向更公开的拉扯。",
+                    "expected_rhythm": "三句一推进",
+                    "forbidden_topics": "旧案",
+                }
+            )
+            run = service.create_run(
+                novel_name="hongloumeng.txt",
+                novel_content_base64=base64.b64encode("林黛玉见了贾宝玉。".encode("utf-8")).decode("ascii"),
+                characters=["林黛玉", "贾宝玉"],
+            )
+            for name in ("林黛玉", "贾宝玉"):  # Ingest a minimal character result for each participant of the run.
+                service.ingest_character_result(
+                    run["run_id"],
+                    character=name,
+                    content_base64=base64.b64encode(
+                        f"- name: {name}\n- novel_id: hongloumeng\n- core_identity: 人物\n".encode("utf-8")
+                    ).decode("ascii"),
+                )
+
+            with patch.object(  # Replace response generation with one canned scene prompt while the session is created.
+                WebRunService,
+                "_generate_dialogue_responses",
+                return_value=[{"speaker": "场景提示", "message": "回廊里只剩雨声和一句没说完的话。"}],
+            ):
+                session = service.create_dialogue_session(
+                    run["run_id"],
+                    mode="observe",
+                    participants=["林黛玉", "贾宝玉"],
+                    scene_card_id=current_scene["card_id"],
+                )
+
+            service.dialogue.update_scene_progress_state(  # Record runtime progress that does not offer a scene shift.
+                run["run_id"],
+                session["session_id"],
+                {
+                    "location": "回廊",
+                    "time_hint": "深夜",
+                    "atmosphere_summary": "雨声压着话头，谁都没有退开",
+                    "beat_maturity": 22,
+                    "should_offer_scene_shift": False,
+                    "scene_shift_reason": "",
+                    "world_tension_summary": "两个人都还在试探，还没到换场的时候",
+                },
+            )
+
+            payload = service.recommend_dialogue_scene_card(run["run_id"], session_id=session["session_id"])
+
+            self.assertEqual(payload["recommended_card_id"], same_location["card_id"])  # The same-location candidate must win.
+
+    def test_dialogue_scene_card_recommendation_uses_runtime_shift_reason_in_transition_hint(self):  # With a shift offered, expect the other-location card and the shift reason in the transition message.
+        with tempfile.TemporaryDirectory() as tmp:
+            service = WebRunService(tmp)
+            service.save_model_settings(
+                provider="openai-compatible",
+                model="deepseek-chat",
+                base_url="https://example.com/v1",
+                api_key="sk-test",
+            )
+            current_scene = service.save_scene_card(  # Card the session is created with below.
+                fields={
+                    "title": "雨夜回廊",
+                    "time_hint": "深夜",
+                    "location": "回廊",
+                    "atmosphere": "雨声压得人心发紧",
+                    "opening_situation": "两个人被雨隔在檐下，话已经逼到边上。",
+                    "public_goal": "先稳住表面客气。",
+                    "hidden_tension": "真正的问题已经快藏不住了。",
+                    "scene_drive": "让试探逼近摊牌。",
+                    "expected_rhythm": "慢热",
+                    "forbidden_topics": "前尘",
+                }
+            )
+            next_scene = service.save_scene_card(  # Candidate with a different location value; expected recommendation.
+                fields={
+                    "title": "灯下入席",
+                    "time_hint": "夜深",
+                    "location": "花厅",
+                    "atmosphere": "灯火亮着，谁都更难回避彼此",
+                    "opening_situation": "雨脚催着众人换到花厅，落座后谁也没先碰茶。",
+                    "public_goal": "把表面话撑到头。",
+                    "hidden_tension": "下一句就可能把真正心思挑明。",
+                    "scene_drive": "让局面顺势从回避转向正面相对。",
+                    "expected_rhythm": "越聊越紧",
+                    "forbidden_topics": "闲话",
+                }
+            )
+            service.save_scene_card(  # Competing candidate that keeps the current card's location value.
+                fields={
+                    "title": "回廊再压一拍",
+                    "time_hint": "深夜",
+                    "location": "回廊",
+                    "atmosphere": "雨线更急，但还是没人挪步",
+                    "opening_situation": "两个人还站在原地，只把语气压得更轻。",
+                    "public_goal": "把上一句试探再咬紧一点。",
+                    "hidden_tension": "谁先退让谁就输了这口气。",
+                    "scene_drive": "继续在原地消磨彼此的耐心。",
+                    "expected_rhythm": "慢压",
+                    "forbidden_topics": "旁人",
+                }
+            )
+            run = service.create_run(
+                novel_name="hongloumeng.txt",
+                novel_content_base64=base64.b64encode("林黛玉见了贾宝玉。".encode("utf-8")).decode("ascii"),
+                characters=["林黛玉", "贾宝玉"],
+            )
+            for name in ("林黛玉", "贾宝玉"):  # Ingest a minimal character result for each participant of the run.
+                service.ingest_character_result(
+                    run["run_id"],
+                    character=name,
+                    content_base64=base64.b64encode(
+                        f"- name: {name}\n- novel_id: hongloumeng\n- core_identity: 人物\n".encode("utf-8")
+                    ).decode("ascii"),
+                )
+
+            with patch.object(  # Replace response generation with one canned scene prompt while the session is created.
+                WebRunService,
+                "_generate_dialogue_responses",
+                return_value=[{"speaker": "场景提示", "message": "雨已经大到不得不换个地方把话说完。"}],
+            ):
+                session = service.create_dialogue_session(
+                    run["run_id"],
+                    mode="observe",
+                    participants=["林黛玉", "贾宝玉"],
+                    scene_card_id=current_scene["card_id"],
+                )
+
+            service.dialogue.update_scene_progress_state(  # Record runtime progress that offers a scene shift and gives a reason.
+                run["run_id"],
+                session["session_id"],
+                {
+                    "location": "回廊",
+                    "time_hint": "深夜",
+                    "atmosphere_summary": "雨势更重，回避已经压不住了",
+                    "beat_maturity": 82,
+                    "should_offer_scene_shift": True,
+                    "scene_shift_reason": "雨势压得两人都没法再站在回廊里装作无事",
+                    "world_tension_summary": "再拖一两句，局面就会逼到必须正面开口",
+                },
+            )
+
+            payload = service.recommend_dialogue_scene_card(run["run_id"], session_id=session["session_id"])
+
+            self.assertEqual(payload["recommended_card_id"], next_scene["card_id"])  # The different-location candidate must win.
+            self.assertIn("雨势压得两人都没法再站在回廊里装作无事", payload["recommended_transition_message"])  # The stored shift reason must appear verbatim.
+
     def test_dialogue_scene_history_tracks_initial_scene_and_switches(self):
         with tempfile.TemporaryDirectory() as tmp:
             service = WebRunService(tmp)

From 70bbe46e8ae7653a5089aa4ed591a48052ad4345 Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 13:12:59 +0800
Subject: [PATCH 05/11] feat: surface scene shift prompts in chat ui

---
 src/web/static/fragments/main-shell.html |  4 ++++
 src/web/static/js/main.js                | 26 +++++++++++++++++++++++-
 src/web/static/styles/dialogue.css       | 22 ++++++++++++++++++++
 3 files changed, 51 insertions(+), 1 deletion(-)

diff --git a/src/web/static/fragments/main-shell.html b/src/web/static/fragments/main-shell.html
index b8003df..d76ef0d 100644
--- a/src/web/static/fragments/main-shell.html
+++ b/src/web/static/fragments/main-shell.html
@@ -26,6 +26,10 @@
                 <strong>中途转场</strong>
                 <small>切一张场景卡，再补一句转场提示，就能把这一幕顺手推过去。</small>
               </div>
+              <div id="dialogue-live-scene-shift-hint" class="dialogue-live-scene-shift-hint hidden">
+                <p id="dialogue-live-scene-shift-copy" class="dialogue-live-scene-shift-copy"></p>
+                <button id="dialogue-live-scene-shift-recommend" type="button" class="soft-button">顺手挑下一幕</button>
+              </div>
               <div class="dialogue-scene-switcher-row">
                 <button id="dialogue-live-scene-recommend" type="button" class="soft-button">推荐下一幕</button>
                 <select id="dialogue-live-scene-card"></select>
diff --git a/src/web/static/js/main.js b/src/web/static/js/main.js
index f3092d4..4970cdd 100644
--- a/src/web/static/js/main.js
+++ b/src/web/static/js/main.js
@@ -930,6 +930,9 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
   const select = el("dialogue-live-scene-card");
   const status = el("dialogue-live-scene-status");
   const recommendButton = el("dialogue-live-scene-recommend");
+  const shiftHint = el("dialogue-live-scene-shift-hint");
+  const shiftCopy = el("dialogue-live-scene-shift-copy");
+  const shiftRecommendButton = el("dialogue-live-scene-shift-recommend");
   if (!shell || !select) return;
   const hasSession = Boolean(session?.session_id) && Boolean(currentRunId);
   shell.classList.toggle("hidden", !hasSession);
@@ -937,11 +940,19 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
     select.innerHTML = "";
     if (status) status.textContent = "";
     if (recommendButton) recommendButton.disabled = true;
+    if (shiftHint) shiftHint.classList.add("hidden");
+    if (shiftCopy) shiftCopy.textContent = "";
+    if (shiftRecommendButton) shiftRecommendButton.disabled = true;
     renderDialogueSceneChainSuggestions([], "");
     return;
   }
   if (recommendButton) recommendButton.disabled = sceneCards.length < 2;
+  if (shiftRecommendButton) shiftRecommendButton.disabled = sceneCards.length < 2;
   const currentSceneId = String(session?.session_card?.scene_card_id || "").trim();
+  const overview = session?.runtime_state_overview || {};
+  const shouldShift = Boolean(overview?.should_offer_scene_shift);
+  const shiftReason = String(overview?.scene_shift_reason || "").trim();
+  const nextHint = String(overview?.next_hint || "").trim();
   const previous = select.value || currentSceneId;
   select.innerHTML = "";
   const blank = document.createElement("option");
@@ -961,8 +972,20 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
   } else {
     select.value = currentSceneId;
   }
+  if (shiftHint) {
+    shiftHint.classList.toggle("hidden", !shouldShift);
+  }
+  if (shiftCopy) {
+    shiftCopy.textContent = shouldShift
+      ? (shiftReason || nextHint || "这一拍差不多收住了，可以顺势切到下一幕。")
+      : "";
+  }
   if (status && !String(status.textContent || "").trim()) {
-    status.textContent = currentSceneId ? "当前会话已经挂载场景卡，你可以随时切到另一幕。" : "当前会话还没挂场景卡，也可以直接在这里接入一张。";
+    if (shouldShift) {
+      status.textContent = "这一拍已经接近收束，可以顺势切一张场景卡。";
+    } else {
+      status.textContent = currentSceneId ? "当前会话已经挂载场景卡，你可以随时切到另一幕。" : "当前会话还没挂场景卡，也可以直接在这里接入一张。";
+    }
   }
   renderDialogueSceneChainSuggestions(currentDialogueSceneChainSuggestions, session?.session_id || "");
 }
@@ -2872,6 +2895,7 @@ function bindEvents() {
   bind("delete-opening-preset-button", "click", handleDeleteOpeningPreset);
   bind("recommend-scene-card-button", "click", handleRecommendSceneCard);
   bind("dialogue-live-scene-recommend", "click", handleRecommendDialogueSceneCard);
+  bind("dialogue-live-scene-shift-recommend", "click", handleRecommendDialogueSceneCard);
   bind("dialogue-live-scene-apply", "click", handleApplyDialogueSceneCard);
   bind("create-scene-card-button", "click", handleOpenNewSceneCard);
   bind("edit-scene-card-button", "click", handleEditCurrentSceneCard);
diff --git a/src/web/static/styles/dialogue.css b/src/web/static/styles/dialogue.css
index 7093407..23e7c4f 100644
--- a/src/web/static/styles/dialogue.css
+++ b/src/web/static/styles/dialogue.css
@@ -140,6 +140,28 @@
   background: rgba(255, 255, 255, 0.62);
 }
 
+.dialogue-live-scene-shift-hint {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 0.7rem;
+  padding: 0.62rem 0.7rem;
+  border-radius: 12px;
+  border: 1px solid rgba(194, 157, 138, 0.18);
+  background: linear-gradient(180deg, rgba(255, 249, 244, 0.96), rgba(249, 238, 229, 0.9));
+}
+
+.dialogue-live-scene-shift-copy {
+  margin: 0;
+  color: var(--ink-soft);
+  font-size: 0.7rem;
+  line-height: 1.55;
+}
+
+#dialogue-live-scene-shift-recommend {
+  flex: 0 0 auto;
+}
+
 .dialogue-scene-chain-suggestions {
   display: grid;
   gap: 0.42rem;

From 8c0610167254b336a8dc28017753fe0323dfa4fe Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 13:19:03 +0800
Subject: [PATCH 06/11] feat: steer observe suggestions with scene progress

---
 src/web/chat/helpers.py |   4 ++
 src/web/chat/service.py |  74 +++++++++++++++++++++++-----
 tests/test_web_app.py   | 105 ++++++++++++++++++++++++++++++++++++++++
 3 files changed, 172 insertions(+), 11 deletions(-)

diff --git a/src/web/chat/helpers.py b/src/web/chat/helpers.py
index c47b3ca..e13d905 100644
--- a/src/web/chat/helpers.py
+++ b/src/web/chat/helpers.py
@@ -420,6 +420,7 @@ def build_dialogue_suggestion_llm_messages(
     relation_excerpt = str(payload.get("relation_context", {}).get("relations_excerpt", "")).strip()
     history = payload.get("history", [])
     memory_context = dict(payload.get("memory_context", {}) or {})
+    scene_progress = dict(payload.get("scene_progress", {}) or memory_context.get("scene_progress", {}) or {})
     instructions = dict(payload.get("instructions", {}) or {})
     host_action = dict(payload.get("host_action", {}) or {})
     scene_card = dict(payload.get("scene_card", {}) or {})
@@ -439,6 +440,8 @@ def build_dialogue_suggestion_llm_messages(
         "如果上下文允许多种接法，优先选更符合 user_persona 的那一种，而不是只做一个泛用接话。",
         "如果 mode=act，就按 controlled character 的 persona profile、speech_style、temperament 和典型说话习惯来写。",
         "如果 mode=observe，就把这句话写成推动剧情的场景提示：让局势往前走，而不是复述、总结或劝说。",
+        "如果 scene_progress 显示这一拍已经成熟、适合转场，就优先写成自然的转场推进；如果还没到转场时机，就优先续当前这一拍的动作、情绪或张力。",
+        "offstage_participants 里的人不要被你无端写回来，除非这句提示本身就在明确推动他们重新入场。",
         "如果 scene_card 存在，优先服从它给出的地点、气氛、开场局面、明面目标、暗线张力与推进方向。",
         "只输出一句最终可发送的成品台词，不要解释上下文，不要总结历史，不要提供建议理由，不要写“作为/当前场景/我们可以/你可以/建议/回复：”这类分析话术。",
         "不要分段，不要项目符号，不要加引号，不要加说话人标签。",
@@ -454,6 +457,7 @@ def build_dialogue_suggestion_llm_messages(
         "speaker": str(input_block.get("speaker", "")).strip(),
         "seed_text": str(input_block.get("message", "")).strip(),
         "scene_card": scene_card,
+        "scene_progress": scene_progress,
         "memory_context": memory_context,
         "user_persona": user_persona,
         "participants": participants,
diff --git a/src/web/chat/service.py b/src/web/chat/service.py
index 3f7e1c2..0424fea 100644
--- a/src/web/chat/service.py
+++ b/src/web/chat/service.py
@@ -551,7 +551,13 @@ def build_suggestion_payload(
         speaker = str(payload.get("input", {}).get("speaker", "")).strip()
         participants = list(payload.get("input", {}).get("participants", []))
         payload["kind"] = "zaomeng_dialogue_suggestion"
-        payload["user_persona"] = self._build_user_suggestion_persona(mode, session, payload.get("persona_contexts", []))
+        scene_progress = dict(payload.get("scene_progress", {}) or {})
+        payload["user_persona"] = self._build_user_suggestion_persona(
+            mode,
+            session,
+            payload.get("persona_contexts", []),
+            scene_progress=scene_progress,
+        )
         payload["instructions"] = {
             "mode": mode,
             "generation_goal": "Draft one short, natural, directly sendable next user line that fits the current scene, relationships, and persona voices.",
@@ -563,7 +569,12 @@ def build_suggestion_payload(
             "expected_output": {"suggestion": "一句可直接发送的话"},
             "output_rule": "Keep it short, in-scene, directly sendable, and never explanatory.",
         }
-        payload["host_prompt_brief"] = self._host_suggestion_prompt_brief(mode, speaker, participants)
+        payload["host_prompt_brief"] = self._host_suggestion_prompt_brief(
+            mode,
+            speaker,
+            participants,
+            scene_progress=scene_progress,
+        )
         payload["updated_at"] = _utc_now()
         return payload
 
@@ -924,8 +935,11 @@ def _build_user_suggestion_persona(
         mode: str,
         session: dict[str, Any],
         persona_contexts: list[dict[str, Any]],
+        *,
+        scene_progress: dict[str, Any] | None = None,
     ) -> dict[str, Any]:
         scene_card = dict(session.get("scene_card", {}) or {})
+        state = dict(scene_progress or {})
         if mode == "act":
             controlled = str(session.get("controlled_character", "")).strip()
             matched = next(
@@ -951,20 +965,39 @@ def _build_user_suggestion_persona(
                 "profile": dict(card),
                 "scene_card": scene_card,
             }
+        preferred_moves = [
+            "introduce a new action",
+            "add a small interruption",
+            "surface a hidden tension",
+            "shift the emotional temperature",
+            "make someone notice something important",
+        ]
+        offstage = [str(item).strip() for item in list(state.get("offstage_participants", []) or []) if str(item).strip()]
+        if bool(state.get("should_offer_scene_shift", False)):
+            preferred_moves.extend(
+                [
+                    "turn the scene into its next beat naturally",
+                    "advance time or location without sounding abrupt",
+                ]
+            )
+        elif offstage:
+            preferred_moves.append("briefly cut to an offstage thread only if the text explicitly motivates it")
         return {
             "mode": "observe",
             "speaker": "User",
             "source": "observer_hint",
-            "must_follow": "Write as a scene observer giving a short in-world nudge that actively moves the scene, rather than speaking as a cast member.",
+            "must_follow": (
+                "Write as a scene observer giving a short in-world nudge that actively moves the scene, "
+                "rather than speaking as a cast member. Respect the current scene progress, presence state, "
+                "and whether this beat should continue or naturally turn into the next one."
+            ),
             "profile": {
                 "goal": "push_plot_forward",
-                "preferred_moves": [
-                    "introduce a new action",
-                    "add a small interruption",
-                    "surface a hidden tension",
-                    "shift the emotional temperature",
-                    "make someone notice something important",
-                ],
+                "preferred_moves": preferred_moves,
+                "scene_shift_reason": str(state.get("scene_shift_reason", "")).strip(),
+                "time_hint": str(state.get("time_hint", "")).strip(),
+                "location": str(state.get("location", "")).strip(),
+                "world_tension_summary": str(state.get("world_tension_summary", "")).strip(),
             },
             "scene_card": scene_card,
         }
@@ -993,11 +1026,30 @@ def _host_prompt_brief(mode: str, speaker: str, participants: list[str]) -> str:
         return f"The user is observing. Let {', '.join(participants)} continue the scene in character and keep the chosen scene moving."
 
     @staticmethod
-    def _host_suggestion_prompt_brief(mode: str, speaker: str, participants: list[str]) -> str:
+    def _host_suggestion_prompt_brief(  # Compose the one-sentence host brief stored as payload["host_prompt_brief"] for suggestions.
+        mode: str,
+        speaker: str,
+        participants: list[str],
+        *,
+        scene_progress: dict[str, Any] | None = None,  # Optional; its values only matter when neither the act nor the insert branch returns.
+    ) -> str:
+        state = dict(scene_progress or {})  # None or an empty mapping both become {}.
         if mode == "act":
             return f"Help the user speak as {speaker} with one believable next line."
         if mode == "insert":
             return f"Help the user speak as {speaker} inside the current scene with one natural next line."
+        shift_reason = str(state.get("scene_shift_reason", "")).strip()
+        if bool(state.get("should_offer_scene_shift", False)):  # A pending scene shift takes precedence over the tension summary.
+            return (
+                f"Help the user guide {', '.join(participants)} with one short prompt that naturally turns this scene into its next beat. "
+                f"Current transition pressure: {shift_reason or 'the current beat already feels complete'}."
+            )
+        tension = str(state.get("world_tension_summary", "")).strip()
+        if tension:  # Without a shift offer, carry the tension summary when one is present.
+            return (
+                f"Help the user guide {', '.join(participants)} with one short prompt that clearly pushes the scene forward. "
+                f"Carry this tension: {tension}."
+            )
         return f"Help the user guide {', '.join(participants)} with one short prompt that clearly pushes the scene into its next beat."
 
     @staticmethod
diff --git a/tests/test_web_app.py b/tests/test_web_app.py
index 0ed3e3e..4bcde21 100644
--- a/tests/test_web_app.py
+++ b/tests/test_web_app.py
@@ -3881,6 +3881,111 @@ def test_build_suggestion_payload_uses_plot_push_observer_hint_in_observe_mode(s
             self.assertIn("introduce a new action", payload["user_persona"]["profile"]["preferred_moves"])
             self.assertIn("pushes the plot forward", payload["instructions"]["response_style"])
 
+    def test_build_suggestion_payload_observe_mode_carries_scene_shift_pressure(self):  # An offered scene shift must reach both user_persona and host_prompt_brief.
+        with tempfile.TemporaryDirectory() as tmp:
+            service = WebRunService(tmp)
+            service.save_model_settings(
+                provider="openai-compatible",
+                model="deepseek-chat",
+                base_url="https://example.com/v1",
+                api_key="sk-test",
+            )
+            run = service.create_run(
+                novel_name="hongloumeng.txt",
+                novel_content_base64=base64.b64encode("林黛玉见了贾宝玉。".encode("utf-8")).decode("ascii"),
+                characters=["林黛玉", "贾宝玉"],
+            )
+            run_id = run["run_id"]
+            for name in ("林黛玉", "贾宝玉"):  # Ingest a minimal character result for each participant of the run.
+                service.ingest_character_result(
+                    run_id,
+                    character=name,
+                    content_base64=base64.b64encode(
+                        f"- name: {name}\n- novel_id: hongloumeng\n- core_identity: 人物\n".encode("utf-8")
+                    ).decode("ascii"),
+                )
+            manifest = service._require_manifest(run_id)
+            session = service.dialogue.create_session(  # Created through service.dialogue directly, with no scene card argument.
+                manifest,
+                mode="observe",
+                participants=["林黛玉", "贾宝玉"],
+                controlled_character="",
+                self_profile={},
+            )
+            service.dialogue.update_scene_progress_state(  # Record runtime progress that offers a scene shift and gives a reason.
+                run_id,
+                session["session_id"],
+                {
+                    "location": "回廊",
+                    "time_hint": "夜深",
+                    "beat_maturity": 85,
+                    "should_offer_scene_shift": True,
+                    "scene_shift_reason": "雨势更大，再站在回廊里已经接不下去了",
+                    "world_tension_summary": "两个人都知道下一句就该把局面带进新的地方",
+                },
+            )
+
+            payload = service.dialogue.build_suggestion_payload(
+                manifest,
+                session_id=session["session_id"],
+                seed_text="",
+            )
+
+            self.assertIn("turn the scene into its next beat naturally", payload["user_persona"]["profile"]["preferred_moves"])  # Shift-specific move was appended.
+            self.assertEqual(payload["user_persona"]["profile"]["scene_shift_reason"], "雨势更大，再站在回廊里已经接不下去了")  # Reason is copied into the profile.
+            self.assertIn("naturally turns this scene into its next beat", payload["host_prompt_brief"])  # Brief uses the shift wording.
+            self.assertIn("Current transition pressure", payload["host_prompt_brief"])
+
+    def test_build_dialogue_suggestion_messages_use_scene_progress_for_observe_mode(self):  # The built messages must expose scene_progress and the observe-mode transition/offstage rules.
+        payload = {  # Hand-built suggestion payload; no service instance or temp directory is used here.
+            "mode": "observe",
+            "input": {
+                "speaker": "User",
+                "message": "",
+                "participants": ["林黛玉", "贾宝玉"],
+            },
+            "persona_contexts": [],
+            "user_persona": {
+                "mode": "observe",
+                "speaker": "User",
+                "source": "observer_hint",
+                "must_follow": "Write as a scene observer giving a short in-world nudge.",
+                "profile": {
+                    "goal": "push_plot_forward",
+                    "preferred_moves": ["turn the scene into its next beat naturally"],
+                },
+            },
+            "relation_context": {"relations_excerpt": ""},
+            "history": [],
+            "memory_context": {"scene_progress": {"offstage_participants": ["薛宝钗"]}},
+            "scene_progress": {  # Top-level scene progress carrying an offered shift and its reason.
+                "time_hint": "夜深",
+                "location": "回廊",
+                "offstage_participants": ["薛宝钗"],
+                "should_offer_scene_shift": True,
+                "scene_shift_reason": "这幕已经够满，可以顺势切到花厅",
+            },
+            "instructions": {
+                "generation_goal": "Draft one short, natural, directly sendable next user line that fits the current scene, relationships, and persona voices.",
+                "mode_rule": "Draft the user's next line as a short scene-steering utterance.",
+                "speaker_rule": "Treat the user message as a scene steering hint.",
+                "response_style": "Prefer one short scene-driving prompt that pushes the plot forward immediately.",
+                "scene_rule": "Keep the scene anchored.",
+            },
+            "host_action": {
+                "expected_output": {"suggestion": "一句可直接发送的话"},
+                "output_rule": "Keep it short, in-scene, directly sendable, and never explanatory.",
+            },
+            "host_prompt_brief": "Help the user guide 林黛玉, 贾宝玉 with one short prompt that naturally turns this scene into its next beat.",
+            "scene_card": {},
+        }
+
+        messages = WebRunService._build_dialogue_suggestion_llm_messages(payload)
+
+        self.assertIn("scene_progress", messages[1]["content"])  # The second message must mention the scene_progress key.
+        self.assertIn("这一拍已经成熟、适合转场", messages[0]["content"])  # The first message must carry the transition-timing rule text.
+        self.assertIn("offstage_participants", messages[0]["content"])  # The first message must carry the offstage rule text.
+
 
 @unittest.skipIf(TestClient is None or create_app is None, "fastapi test dependencies unavailable")
 class WebAppRouteTests(unittest.TestCase):

From a282132fdd08386ab5d8cfab0ac2097c11a3b54a Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 13:21:38 +0800
Subject: [PATCH 07/11] feat: show scene context in scene switcher

---
 src/web/static/fragments/main-shell.html |  1 +
 src/web/static/js/main.js                | 18 ++++++++++++++++++
 src/web/static/styles/dialogue.css       |  7 +++++++
 3 files changed, 26 insertions(+)

diff --git a/src/web/static/fragments/main-shell.html b/src/web/static/fragments/main-shell.html
index d76ef0d..f260275 100644
--- a/src/web/static/fragments/main-shell.html
+++ b/src/web/static/fragments/main-shell.html
@@ -26,6 +26,7 @@
                 <strong>中途转场</strong>
                 <small>切一张场景卡，再补一句转场提示，就能把这一幕顺手推过去。</small>
               </div>
+              <p id="dialogue-live-scene-context" class="dialogue-live-scene-context hidden"></p>
               <div id="dialogue-live-scene-shift-hint" class="dialogue-live-scene-shift-hint hidden">
                 <p id="dialogue-live-scene-shift-copy" class="dialogue-live-scene-shift-copy"></p>
                 <button id="dialogue-live-scene-shift-recommend" type="button" class="soft-button">顺手挑下一幕</button>
diff --git a/src/web/static/js/main.js b/src/web/static/js/main.js
index 4970cdd..f517888 100644
--- a/src/web/static/js/main.js
+++ b/src/web/static/js/main.js
@@ -929,6 +929,7 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
   const shell = el("dialogue-scene-switcher");
   const select = el("dialogue-live-scene-card");
   const status = el("dialogue-live-scene-status");
+  const context = el("dialogue-live-scene-context");
   const recommendButton = el("dialogue-live-scene-recommend");
   const shiftHint = el("dialogue-live-scene-shift-hint");
   const shiftCopy = el("dialogue-live-scene-shift-copy");
@@ -939,6 +940,10 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
   if (!hasSession) {
     select.innerHTML = "";
     if (status) status.textContent = "";
+    if (context) {
+      context.textContent = "";
+      context.classList.add("hidden");
+    }
     if (recommendButton) recommendButton.disabled = true;
     if (shiftHint) shiftHint.classList.add("hidden");
     if (shiftCopy) shiftCopy.textContent = "";
@@ -953,6 +958,10 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
   const shouldShift = Boolean(overview?.should_offer_scene_shift);
   const shiftReason = String(overview?.scene_shift_reason || "").trim();
   const nextHint = String(overview?.next_hint || "").trim();
+  const timeHint = String(overview?.time_hint || "").trim();
+  const location = String(overview?.location || "").trim();
+  const present = Array.isArray(overview?.present) ? overview.present.filter(Boolean).slice(0, 3) : [];
+  const offstage = Array.isArray(overview?.offstage) ? overview.offstage.filter(Boolean).slice(0, 2) : [];
   const previous = select.value || currentSceneId;
   select.innerHTML = "";
   const blank = document.createElement("option");
@@ -980,6 +989,15 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
       ? (shiftReason || nextHint || "这一拍差不多收住了，可以顺势切到下一幕。")
       : "";
   }
+  if (context) {
+    const parts = [];
+    if (location) parts.push(`地点：${location}`);
+    if (timeHint) parts.push(`时间：${timeHint}`);
+    if (present.length) parts.push(`在场：${present.join("、")}`);
+    if (offstage.length) parts.push(`离场：${offstage.join("、")}`);
+    context.textContent = parts.join(" · ");
+    context.classList.toggle("hidden", parts.length === 0);
+  }
   if (status && !String(status.textContent || "").trim()) {
     if (shouldShift) {
       status.textContent = "这一拍已经接近收束，可以顺势切一张场景卡。";
diff --git a/src/web/static/styles/dialogue.css b/src/web/static/styles/dialogue.css
index 23e7c4f..391cd57 100644
--- a/src/web/static/styles/dialogue.css
+++ b/src/web/static/styles/dialogue.css
@@ -158,6 +158,13 @@
   line-height: 1.55;
 }
 
+#dialogue-live-scene-context {
+  margin: 0;
+  color: var(--ink-faint);
+  font-size: 0.67rem;
+  line-height: 1.55;
+}
+
 #dialogue-live-scene-shift-recommend {
   flex: 0 0 auto;
 }

From a2418cd9dca1fb6fd532b9578a31098e3e30357e Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 13:36:51 +0800
Subject: [PATCH 08/11] feat: streamline scene recommendation actions

---
 src/web/static/fragments/main-shell.html |  2 +-
 src/web/static/js/main.js                | 99 ++++++++++++++++++++----
 2 files changed, 87 insertions(+), 14 deletions(-)

diff --git a/src/web/static/fragments/main-shell.html b/src/web/static/fragments/main-shell.html
index f260275..04d744d 100644
--- a/src/web/static/fragments/main-shell.html
+++ b/src/web/static/fragments/main-shell.html
@@ -29,7 +29,7 @@
               <p id="dialogue-live-scene-context" class="dialogue-live-scene-context hidden"></p>
               <div id="dialogue-live-scene-shift-hint" class="dialogue-live-scene-shift-hint hidden">
                 <p id="dialogue-live-scene-shift-copy" class="dialogue-live-scene-shift-copy"></p>
-                <button id="dialogue-live-scene-shift-recommend" type="button" class="soft-button">顺手挑下一幕</button>
+                <button id="dialogue-live-scene-shift-recommend" type="button" class="soft-button">顺手切到下一幕</button>
               </div>
               <div class="dialogue-scene-switcher-row">
                 <button id="dialogue-live-scene-recommend" type="button" class="soft-button">推荐下一幕</button>
diff --git a/src/web/static/js/main.js b/src/web/static/js/main.js
index f517888..9fa52b2 100644
--- a/src/web/static/js/main.js
+++ b/src/web/static/js/main.js
@@ -1011,49 +1011,63 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
 async function handleApplyDialogueSceneCard(event) {
   if (event && typeof event.preventDefault === "function") event.preventDefault();
   if (!currentRunId || !currentDialogueSessionId) return;
+  await applySelectedDialogueSceneCard();
+}
+
+async function applySelectedDialogueSceneCard(options = {}) {
+  if (!currentRunId || !currentDialogueSessionId) return null;
   const select = el("dialogue-live-scene-card");
   const transition = trimmedValue("dialogue-live-scene-transition", "");
   const status = el("dialogue-live-scene-status");
   const button = el("dialogue-live-scene-apply");
   const sceneCardId = String(select?.value || "").trim();
+  const waitingText = String(options?.waitingText || "正在把这一幕转过去...").trim() || "正在把这一幕转过去...";
+  const successText = String(options?.successText || "新的场景已经接上了。").trim() || "新的场景已经接上了。";
   if (!sceneCardId) {
     if (status) status.textContent = "先挑一张要切进去的场景卡。";
-    return;
+    return null;
   }
   if (button) button.disabled = true;
-  if (status) status.textContent = "正在把这一幕转过去...";
+  if (status) status.textContent = waitingText;
   try {
     const payload = await window.__ZAOMENG_WEBUI_API__.switchDialogueSceneCard(currentRunId, currentDialogueSessionId, {
       scene_card_id: sceneCardId,
       scene_profile: currentSceneCard?.card_id === sceneCardId ? (currentSceneCard?.fields || {}) : {},
       transition_message: transition,
     });
+    clearDialogueSceneRecommendationCache();
     if (el("dialogue-live-scene-transition")) {
       setValue("dialogue-live-scene-transition", "");
     }
-    if (status) status.textContent = "新的场景已经接上了。";
+    if (status) status.textContent = successText;
     await renderDialogueSession(payload);
+    return payload;
   } catch (error) {
     if (status) status.textContent = error.message || "切换场景失败。";
+    throw error;
   } finally {
     if (button) button.disabled = false;
   }
 }
 
-async function handleRecommendDialogueSceneCard(event) {
+async function handleRecommendDialogueSceneCard(event, options = {}) {
   if (event && typeof event.preventDefault === "function") event.preventDefault();
   if (!currentRunId || !currentDialogueSessionId) return;
   const select = el("dialogue-live-scene-card");
   const status = el("dialogue-live-scene-status");
   const button = el("dialogue-live-scene-recommend");
+  const shiftButton = el("dialogue-live-scene-shift-recommend");
+  const autoApply = Boolean(options?.autoApply);
+  const force = Boolean(options?.force);
   if (!sceneCards.length) {
     if (status) status.textContent = "你还没有场景卡，先新建一张再来转场。";
     return;
   }
   if (button) button.disabled = true;
+  if (shiftButton) shiftButton.disabled = true;
   if (status) status.textContent = "正在按当前局势替你挑下一幕...";
   try {
-    const payload = await window.__ZAOMENG_WEBUI_API__.recommendDialogueSceneCard(currentRunId, currentDialogueSessionId);
+    const payload = await fetchDialogueSceneRecommendation({ force });
     const recommendedCardId = String(payload?.recommended_card_id || "").trim();
     const recommendedTransition = String(payload?.recommended_transition_message || "").trim();
     currentDialogueSceneChainSuggestions = Array.isArray(payload?.chain_suggestions) ? payload.chain_suggestions : [];
@@ -1074,10 +1088,17 @@ async function handleRecommendDialogueSceneCard(event) {
       status.textContent = reasons.length ? `已替你挑好下一幕：${reasons.join("，")}。` : "已替你挑好一张更接戏的场景卡。";
     }
     renderDialogueSceneChainSuggestions(currentDialogueSceneChainSuggestions, currentDialogueSessionId);
+    if (autoApply) {
+      await applySelectedDialogueSceneCard({
+        waitingText: "正在顺手把这一幕转到下一拍...",
+        successText: "已经顺手切到下一幕了。",
+      });
+    }
   } catch (error) {
     if (status) status.textContent = error.message || "下一幕推荐失败。";
   } finally {
     if (button) button.disabled = sceneCards.length < 2;
+    if (shiftButton) shiftButton.disabled = sceneCards.length < 2;
   }
 }
 
@@ -1118,9 +1139,11 @@ function renderDialogueSceneChainSuggestions(chains = [], sessionId = "") {
     const button = document.createElement("button");
     button.type = "button";
     button.className = "soft-button";
-    button.textContent = "接这条线";
+    button.textContent = "接这条线并切幕";
     button.addEventListener("click", () => {
-      applyDialogueSceneChain(chain);
+      applyDialogueSceneChain(chain).catch((error) => {
+        setStatus("dialogue-live-scene-status", error.message || "这条线暂时没有接上。");
+      });
     });
     actions.appendChild(button);
     card.appendChild(actions);
@@ -1128,7 +1151,7 @@ function renderDialogueSceneChainSuggestions(chains = [], sessionId = "") {
   });
 }
 
-function applyDialogueSceneChain(chain = {}) {
+async function applyDialogueSceneChain(chain = {}) {
   const scenes = Array.isArray(chain?.scenes) ? chain.scenes : [];
   const first = scenes[0] || {};
   const sceneCardId = String(first?.card_id || "").trim();
@@ -1143,9 +1166,16 @@ function applyDialogueSceneChain(chain = {}) {
   if (status) {
     const tailTitles = scenes.slice(1).map((item) => String(item?.title || "").trim()).filter(Boolean);
     status.textContent = tailTitles.length
-      ? `已替你接上这条线，后面还可以顺势转到：${tailTitles.join("、")}。`
-      : "已替你接上这条线。";
-  }
+      ? `正在替你接上这条线，后面还可以顺势转到：${tailTitles.join("、")}。`
+      : "正在替你接上这条线。";
+  }
+  const tailTitles = scenes.slice(1).map((item) => String(item?.title || "").trim()).filter(Boolean);
+  await applySelectedDialogueSceneCard({
+    waitingText: "正在按这条戏路切到下一幕...",
+    successText: tailTitles.length
+      ? `这条线已经接上了，后面还可以顺势转到：${tailTitles.join("、")}。`
+      : "这条线已经接上了。",
+  });
   return true;
 }
 
@@ -2321,6 +2351,8 @@ const DIALOGUE_SUGGESTION_BUSY_LABEL = "…";
 const DIALOGUE_RETRY_FEEDBACK_DELAY_MS = 2200;
 const DIALOGUE_SEND_RETRY_MESSAGE = "这次声源有点慢，正在自动重试...";
 const DIALOGUE_SUGGEST_RETRY_MESSAGE = "这次生成有点慢，正在自动重试...";
+let currentDialogueSceneRecommendationCacheKey = "";
+let currentDialogueSceneRecommendationCachePayload = null;
 const OBSERVE_QUICK_REPLIES = [
   { label: "……", value: "……" },
   { label: "继续聊", value: "继续聊。" },
@@ -2330,6 +2362,39 @@ const OBSERVE_QUICK_REPLIES = [
 ];
 let currentDialogueMessageKind = "dialogue";
 
+function buildDialogueSceneRecommendationCacheKey(session = currentDialogueSession) {
+  const target = session || {};
+  const overview = target?.runtime_state_overview || {};
+  return [
+    String(currentRunId || "").trim(),
+    String(target?.session_id || "").trim(),
+    String(target?.updated_at || "").trim(),
+    String(target?.session_card?.scene_card_id || "").trim(),
+    String(overview?.status_line || "").trim(),
+    String(overview?.next_hint || "").trim(),
+  ].join("::");
+}
+
+function clearDialogueSceneRecommendationCache() {
+  currentDialogueSceneRecommendationCacheKey = "";
+  currentDialogueSceneRecommendationCachePayload = null;
+}
+
+async function fetchDialogueSceneRecommendation(options = {}) {
+  const force = Boolean(options?.force);
+  if (!currentRunId || !currentDialogueSessionId) {
+    return null;
+  }
+  const cacheKey = buildDialogueSceneRecommendationCacheKey(currentDialogueSession);
+  if (!force && cacheKey && cacheKey === currentDialogueSceneRecommendationCacheKey && currentDialogueSceneRecommendationCachePayload) {
+    return currentDialogueSceneRecommendationCachePayload;
+  }
+  const payload = await window.__ZAOMENG_WEBUI_API__.recommendDialogueSceneCard(currentRunId, currentDialogueSessionId);
+  currentDialogueSceneRecommendationCacheKey = cacheKey;
+  currentDialogueSceneRecommendationCachePayload = payload;
+  return payload;
+}
+
 function buildObserveQuickReplies(session = currentDialogueSession) {
   const overview = session?.runtime_state_overview || {};
   const present = Array.isArray(overview?.present) ? overview.present.filter(Boolean) : [];
@@ -2912,8 +2977,16 @@ function bindEvents() {
   bind("start-opening-preset-button", "click", handleStartOpeningPreset);
   bind("delete-opening-preset-button", "click", handleDeleteOpeningPreset);
   bind("recommend-scene-card-button", "click", handleRecommendSceneCard);
-  bind("dialogue-live-scene-recommend", "click", handleRecommendDialogueSceneCard);
-  bind("dialogue-live-scene-shift-recommend", "click", handleRecommendDialogueSceneCard);
+  bind("dialogue-live-scene-recommend", "click", (event) => {
+    handleRecommendDialogueSceneCard(event).catch((error) => {
+      setStatus("dialogue-live-scene-status", error.message || "下一幕推荐失败。");
+    });
+  });
+  bind("dialogue-live-scene-shift-recommend", "click", (event) => {
+    handleRecommendDialogueSceneCard(event, { autoApply: true }).catch((error) => {
+      setStatus("dialogue-live-scene-status", error.message || "顺手切幕失败。");
+    });
+  });
   bind("dialogue-live-scene-apply", "click", handleApplyDialogueSceneCard);
   bind("create-scene-card-button", "click", handleOpenNewSceneCard);
   bind("edit-scene-card-button", "click", handleEditCurrentSceneCard);

From 17cdc29d98454df03a8a757bc742fb37c879d6b2 Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 13:47:08 +0800
Subject: [PATCH 09/11] feat: auto-continue dialogue after scene switch

---
 src/web/api/routes/dialogue.py      |  1 +
 src/web/api/schemas.py              |  1 +
 src/web/chat/__init__.py            |  2 +
 src/web/chat/entrypoints.py         | 41 +++++++++++++++
 src/web/service_facades/dialogue.py | 19 ++++++-
 src/web/static/js/main.js           |  6 ++-
 tests/test_web_app.py               | 80 +++++++++++++++++++++++++++++
 7 files changed, 148 insertions(+), 2 deletions(-)

diff --git a/src/web/api/routes/dialogue.py b/src/web/api/routes/dialogue.py
index f4144ad..ec35b3c 100644
--- a/src/web/api/routes/dialogue.py
+++ b/src/web/api/routes/dialogue.py
@@ -163,6 +163,7 @@ def switch_dialogue_scene_card(
             scene_card_id=payload.scene_card_id,
             scene_profile=payload.scene_profile,
             transition_message=payload.transition_message,
+            auto_continue=payload.auto_continue,
         )
     except FileNotFoundError as exc:
         raise HTTPException(status_code=404, detail="Session not found.") from exc
diff --git a/src/web/api/schemas.py b/src/web/api/schemas.py
index 38c9d8e..d130fe6 100644
--- a/src/web/api/schemas.py
+++ b/src/web/api/schemas.py
@@ -201,6 +201,7 @@ class SwitchDialogueSceneCardRequest(BaseModel):
     scene_card_id: str = Field(default="")
     scene_profile: dict[str, str] = Field(default_factory=dict)
     transition_message: str = Field(default="")
+    auto_continue: bool = Field(default=False)
 
 
 class BranchDialogueSessionRequest(BaseModel):
diff --git a/src/web/chat/__init__.py b/src/web/chat/__init__.py
index 24ac840..aedd985 100644
--- a/src/web/chat/__init__.py
+++ b/src/web/chat/__init__.py
@@ -1,5 +1,6 @@
 
 from .entrypoints import (
+    continue_dialogue_scene_opening_payload,
     create_dialogue_session_payload,
     reply_dialogue_turn_payload,
     suggest_dialogue_turn_payload,
@@ -31,6 +32,7 @@
     "build_dialogue_opening_message",
     "build_dialogue_scene_progress_messages",
     "compact_dialogue_suggestion_payload",
+    "continue_dialogue_scene_opening_payload",
     "create_dialogue_session_payload",
     "friendly_dialogue_llm_error",
     "generate_dialogue_suggestion",
diff --git a/src/web/chat/entrypoints.py b/src/web/chat/entrypoints.py
index e573ffc..d568b29 100644
--- a/src/web/chat/entrypoints.py
+++ b/src/web/chat/entrypoints.py
@@ -56,6 +56,47 @@ def create_dialogue_session_payload(
     return ingested
 
 
+def continue_dialogue_scene_opening_payload(
+    *,
+    run_id: str,
+    session: dict[str, Any],
+    manifest: dict[str, Any],
+    dialogue: Any,
+    build_dialogue_opening_message: Callable[[dict[str, Any]], str],
+    load_pending_turn_payload: Callable[[str, str], dict[str, Any]],
+    generate_dialogue_responses: Callable[[str, dict[str, Any]], list[dict[str, str]]],
+    friendly_dialogue_llm_error: Callable[[Exception], str],
+    evolve_relations_from_turn: Callable[[str, dict[str, Any], list[dict[str, str]]], None],
+    refresh_scene_progress: Callable[[str, dict[str, Any]], dict[str, Any]] | None = None,
+) -> dict[str, Any]:
+    session_id = str(session.get("session_id", "")).strip()
+    if not session_id:
+        raise ValueError("Session not found.")
+    opening_message = build_dialogue_opening_message(session)
+    dialogue.prepare_turn(
+        manifest,
+        session_id=session_id,
+        message=opening_message,
+        speaker_override="场景提示",
+        transcript_message="",
+    )
+    pending_payload = load_pending_turn_payload(run_id, session_id)
+    try:
+        responses = generate_dialogue_responses(run_id, pending_payload)
+    except LLMRequestError as exc:
+        raise ValueError(friendly_dialogue_llm_error(exc)) from exc
+    evolve_relations_from_turn(run_id, pending_payload, responses)
+    ingested = dialogue.ingest_turn_responses(
+        run_id,
+        session_id=session_id,
+        responses=responses,
+        remember_turn_memory=True,
+    )
+    if callable(refresh_scene_progress):
+        ingested = refresh_scene_progress(run_id, ingested)
+    return ingested
+
+
 def reply_dialogue_turn_payload(
     *,
     run_id: str,
diff --git a/src/web/service_facades/dialogue.py b/src/web/service_facades/dialogue.py
index 9c3b1b9..0add7d7 100644
--- a/src/web/service_facades/dialogue.py
+++ b/src/web/service_facades/dialogue.py
@@ -10,6 +10,7 @@
     build_dialogue_suggestion_llm_messages,
     build_dialogue_opening_message,
     compact_dialogue_suggestion_payload,
+    continue_dialogue_scene_opening_payload,
     create_dialogue_session_payload,
     friendly_dialogue_llm_error,
     generate_dialogue_suggestion,
@@ -109,6 +110,7 @@ def switch_dialogue_scene_card(
         scene_card_id: str = "",
         scene_profile: dict[str, str] | None = None,
         transition_message: str = "",
+        auto_continue: bool = False,
     ) -> dict[str, Any]:
         self._ensure_run_exists(run_id)
         resolved_scene_profile = dict(scene_profile or {})
@@ -122,12 +124,27 @@ def switch_dialogue_scene_card(
                 **resolved_scene_profile,
                 "scene_card_id": str(card.get("card_id", "")).strip(),
             }
-        return self.dialogue.update_scene_card(
+        switched = self.dialogue.update_scene_card(
             run_id,
             session_id,
             scene_profile=resolved_scene_profile,
             transition_message=transition_message,
         )
+        if not auto_continue:
+            return switched
+        manifest = self._require_manifest(run_id)
+        return continue_dialogue_scene_opening_payload(
+            run_id=run_id,
+            session=switched,
+            manifest=manifest,
+            dialogue=self.dialogue,
+            build_dialogue_opening_message=build_dialogue_opening_message,
+            load_pending_turn_payload=self._load_pending_turn_payload,
+            generate_dialogue_responses=self._generate_dialogue_responses,
+            friendly_dialogue_llm_error=friendly_dialogue_llm_error,
+            evolve_relations_from_turn=self._evolve_relations_from_turn,
+            refresh_scene_progress=self._refresh_dialogue_scene_progress,
+        )
 
     def recommend_dialogue_scene_card(self, run_id: str, *, session_id: str) -> dict[str, Any]:
         return SceneCardServiceMixin.recommend_dialogue_scene_card(self, run_id, session_id=session_id)
diff --git a/src/web/static/js/main.js b/src/web/static/js/main.js
index 9fa52b2..1f9f775 100644
--- a/src/web/static/js/main.js
+++ b/src/web/static/js/main.js
@@ -1023,6 +1023,7 @@ async function applySelectedDialogueSceneCard(options = {}) {
   const sceneCardId = String(select?.value || "").trim();
   const waitingText = String(options?.waitingText || "正在把这一幕转过去...").trim() || "正在把这一幕转过去...";
   const successText = String(options?.successText || "新的场景已经接上了。").trim() || "新的场景已经接上了。";
+  const autoContinue = Boolean(options?.autoContinue);
   if (!sceneCardId) {
     if (status) status.textContent = "先挑一张要切进去的场景卡。";
     return null;
@@ -1034,6 +1035,7 @@ async function applySelectedDialogueSceneCard(options = {}) {
       scene_card_id: sceneCardId,
       scene_profile: currentSceneCard?.card_id === sceneCardId ? (currentSceneCard?.fields || {}) : {},
       transition_message: transition,
+      auto_continue: autoContinue,
     });
     clearDialogueSceneRecommendationCache();
     if (el("dialogue-live-scene-transition")) {
@@ -1091,7 +1093,8 @@ async function handleRecommendDialogueSceneCard(event, options = {}) {
     if (autoApply) {
       await applySelectedDialogueSceneCard({
         waitingText: "正在顺手把这一幕转到下一拍...",
-        successText: "已经顺手切到下一幕了。",
+        successText: "已经顺手切到下一幕并接起新一拍了。",
+        autoContinue: true,
       });
     }
   } catch (error) {
@@ -1175,6 +1178,7 @@ async function applyDialogueSceneChain(chain = {}) {
     successText: tailTitles.length
       ? `这条线已经接上了，后面还可以顺势转到：${tailTitles.join("、")}。`
       : "这条线已经接上了。",
+    autoContinue: true,
   });
   return true;
 }
diff --git a/tests/test_web_app.py b/tests/test_web_app.py
index 4bcde21..efb098e 100644
--- a/tests/test_web_app.py
+++ b/tests/test_web_app.py
@@ -423,6 +423,86 @@ def test_dialogue_scene_history_tracks_initial_scene_and_switches(self):
             self.assertEqual(history[1]["transition_message"], "雨势更大，众人转入花厅。")
             self.assertEqual(history[1]["is_current"], "true")
 
+    def test_switch_dialogue_scene_card_can_auto_continue_new_scene(self):
+        with tempfile.TemporaryDirectory() as tmp:
+            service = WebRunService(tmp)
+            service.save_model_settings(
+                provider="openai-compatible",
+                model="deepseek-chat",
+                base_url="https://example.com/v1",
+                api_key="sk-test",
+            )
+            first_scene = service.save_scene_card(
+                fields={
+                    "title": "回廊夜谈",
+                    "time_hint": "深夜",
+                    "location": "回廊",
+                    "atmosphere": "安静发紧",
+                    "opening_situation": "两人隔着雨声说话。",
+                    "public_goal": "先探来意。",
+                    "hidden_tension": "旧事随时会被挑开。",
+                    "scene_drive": "把试探慢慢逼紧。",
+                    "expected_rhythm": "慢热",
+                    "forbidden_topics": "前尘",
+                }
+            )
+            second_scene = service.save_scene_card(
+                fields={
+                    "title": "转入花厅",
+                    "time_hint": "夜深",
+                    "location": "花厅",
+                    "atmosphere": "表面客套，暗地收紧",
+                    "opening_situation": "雨势更大，众人不得不转入花厅。",
+                    "public_goal": "先把场面稳住。",
+                    "hidden_tension": "真正要问的话终于躲不过去。",
+                    "scene_drive": "从试探推向摊牌。",
+                    "expected_rhythm": "三句一推进",
+                    "forbidden_topics": "旧账",
+                }
+            )
+            run = service.create_run(
+                novel_name="hongloumeng.txt",
+                novel_content_base64=base64.b64encode("林黛玉见了贾宝玉。".encode("utf-8")).decode("ascii"),
+                characters=["林黛玉", "贾宝玉"],
+            )
+            for name in ("林黛玉", "贾宝玉"):
+                service.ingest_character_result(
+                    run["run_id"],
+                    character=name,
+                    content_base64=base64.b64encode(
+                        f"- name: {name}\n- novel_id: hongloumeng\n- core_identity: 人物\n".encode("utf-8")
+                    ).decode("ascii"),
+                )
+
+            with patch.object(
+                WebRunService,
+                "_generate_dialogue_responses",
+                side_effect=[
+                    [{"speaker": "场景提示", "message": "开场。"}],
+                    [{"speaker": "林黛玉", "message": "（她抬眼看了看门外雨势）进了花厅，也未见得就好说。"}],
+                ],
+            ):
+                session = service.create_dialogue_session(
+                    run["run_id"],
+                    mode="observe",
+                    participants=["林黛玉", "贾宝玉"],
+                    scene_card_id=first_scene["card_id"],
+                )
+                switched = service.switch_dialogue_scene_card(
+                    run["run_id"],
+                    session_id=session["session_id"],
+                    scene_card_id=second_scene["card_id"],
+                    transition_message="雨势更大，众人转入花厅。",
+                    auto_continue=True,
+                )
+
+            transcript = list(switched.get("transcript", []) or [])
+            self.assertEqual(switched["session_card"]["scene_card"]["title"], "转入花厅")
+            self.assertTrue(any("众人转入花厅" in str(item.get("message", "")) for item in transcript))
+            self.assertTrue(any(str(item.get("speaker", "")) == "林黛玉" for item in transcript))
+            self.assertEqual(switched.get("status"), "ready")
+            self.assertFalse(bool(switched.get("pending_turn")))
+
     def test_branch_dialogue_session_from_scene_creates_new_session(self):
         with tempfile.TemporaryDirectory() as tmp:
             service = WebRunService(tmp)

From 639f2c0ced69a70c5923d338c2bc2ea1ac9aa6bc Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 14:09:38 +0800
Subject: [PATCH 10/11] feat: surface scene recommendation summaries

---
 src/web/static/fragments/main-shell.html |  1 +
 src/web/static/js/main.js                | 84 +++++++++++++++++++++++-
 src/web/static/styles/dialogue.css       | 53 +++++++++++++++
 3 files changed, 137 insertions(+), 1 deletion(-)

diff --git a/src/web/static/fragments/main-shell.html b/src/web/static/fragments/main-shell.html
index 04d744d..d1c90fb 100644
--- a/src/web/static/fragments/main-shell.html
+++ b/src/web/static/fragments/main-shell.html
@@ -36,6 +36,7 @@
                 <select id="dialogue-live-scene-card"></select>
                 <button id="dialogue-live-scene-apply" type="button" class="soft-button">切换场景</button>
               </div>
+              <div id="dialogue-live-scene-recommendation" class="dialogue-live-scene-recommendation hidden"></div>
               <textarea id="dialogue-live-scene-transition" rows="2" placeholder="例如：雨势更大，众人不得不转入花厅。"></textarea>
               <p id="dialogue-live-scene-status" class="card-note"></p>
               <div id="dialogue-scene-chain-suggestions" class="dialogue-scene-chain-suggestions hidden"></div>
diff --git a/src/web/static/js/main.js b/src/web/static/js/main.js
index 1f9f775..e57d467 100644
--- a/src/web/static/js/main.js
+++ b/src/web/static/js/main.js
@@ -948,6 +948,7 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
     if (shiftHint) shiftHint.classList.add("hidden");
     if (shiftCopy) shiftCopy.textContent = "";
     if (shiftRecommendButton) shiftRecommendButton.disabled = true;
+    renderDialogueSceneRecommendationSummary(null);
     renderDialogueSceneChainSuggestions([], "");
     return;
   }
@@ -1005,6 +1006,7 @@ function renderDialogueSceneSwitcher(session = currentDialogueSession) {
       status.textContent = currentSceneId ? "当前会话已经挂载场景卡，你可以随时切到另一幕。" : "当前会话还没挂场景卡，也可以直接在这里接入一张。";
     }
   }
+  renderDialogueSceneRecommendationSummary(session);
   renderDialogueSceneChainSuggestions(currentDialogueSceneChainSuggestions, session?.session_id || "");
 }
 
@@ -1087,8 +1089,10 @@ async function handleRecommendDialogueSceneCard(event, options = {}) {
       setValue("dialogue-live-scene-transition", recommendedTransition);
     }
     if (status) {
-      status.textContent = reasons.length ? `已替你挑好下一幕：${reasons.join("，")}。` : "已替你挑好一张更接戏的场景卡。";
+      const sourceLabel = currentDialogueSceneRecommendationMeta?.fromCache ? "（已从缓存取回）" : "（刚更新）";
+      status.textContent = reasons.length ? `已替你挑好下一幕${sourceLabel}：${reasons.join("，")}。` : `已替你挑好一张更接戏的场景卡${sourceLabel}。`;
     }
+    renderDialogueSceneRecommendationSummary(currentDialogueSession);
     renderDialogueSceneChainSuggestions(currentDialogueSceneChainSuggestions, currentDialogueSessionId);
     if (autoApply) {
       await applySelectedDialogueSceneCard({
@@ -2357,6 +2361,7 @@ const DIALOGUE_SEND_RETRY_MESSAGE = "这次声源有点慢，正在自动重试.
 const DIALOGUE_SUGGEST_RETRY_MESSAGE = "这次生成有点慢，正在自动重试...";
 let currentDialogueSceneRecommendationCacheKey = "";
 let currentDialogueSceneRecommendationCachePayload = null;
+let currentDialogueSceneRecommendationMeta = null;
 const OBSERVE_QUICK_REPLIES = [
   { label: "……", value: "……" },
   { label: "继续聊", value: "继续聊。" },
@@ -2382,6 +2387,7 @@ function buildDialogueSceneRecommendationCacheKey(session = currentDialogueSessi
 function clearDialogueSceneRecommendationCache() {
   currentDialogueSceneRecommendationCacheKey = "";
   currentDialogueSceneRecommendationCachePayload = null;
+  currentDialogueSceneRecommendationMeta = null;
 }
 
 async function fetchDialogueSceneRecommendation(options = {}) {
@@ -2391,14 +2397,90 @@ async function fetchDialogueSceneRecommendation(options = {}) {
   }
   const cacheKey = buildDialogueSceneRecommendationCacheKey(currentDialogueSession);
   if (!force && cacheKey && cacheKey === currentDialogueSceneRecommendationCacheKey && currentDialogueSceneRecommendationCachePayload) {
+    currentDialogueSceneRecommendationMeta = {
+      sessionId: String(currentDialogueSessionId || "").trim(),
+      fromCache: true,
+      payload: currentDialogueSceneRecommendationCachePayload,
+    };
     return currentDialogueSceneRecommendationCachePayload;
   }
   const payload = await window.__ZAOMENG_WEBUI_API__.recommendDialogueSceneCard(currentRunId, currentDialogueSessionId);
   currentDialogueSceneRecommendationCacheKey = cacheKey;
   currentDialogueSceneRecommendationCachePayload = payload;
+  currentDialogueSceneRecommendationMeta = {
+    sessionId: String(currentDialogueSessionId || "").trim(),
+    fromCache: false,
+    payload,
+  };
   return payload;
 }
 
+function renderDialogueSceneRecommendationSummary(session = currentDialogueSession) {
+  const root = el("dialogue-live-scene-recommendation");
+  if (!root) return;
+  const sessionId = String(session?.session_id || "").trim();
+  const meta = currentDialogueSceneRecommendationMeta || null;
+  const payload = meta?.payload || null;
+  if (!sessionId || !payload || String(meta?.sessionId || "").trim() !== sessionId) {
+    root.innerHTML = "";
+    root.classList.add("hidden");
+    return;
+  }
+  const recommendedCardId = String(payload?.recommended_card_id || "").trim();
+  const topItem = Array.isArray(payload?.items) ? payload.items.find((item) => String(item?.card_id || "").trim() === recommendedCardId) || payload.items[0] : null;
+  if (!recommendedCardId || !topItem) {
+    root.innerHTML = "";
+    root.classList.add("hidden");
+    return;
+  }
+  const title = String(topItem?.preview?.title || topItem?.fields?.title || recommendedCardId).trim();
+  const location = String(topItem?.preview?.location || topItem?.fields?.location || "").trim();
+  const transition = String(payload?.recommended_transition_message || "").trim();
+  const reasons = Array.isArray(topItem?.recommendation?.reasons) ? topItem.recommendation.reasons.filter(Boolean).slice(0, 4) : [];
+  const firstChain = Array.isArray(payload?.chain_suggestions) ? payload.chain_suggestions[0] : null;
+  const chainReason = String(firstChain?.reason || "").trim();
+  const sourceLabel = meta?.fromCache ? "已缓存" : "刚更新";
+
+  root.innerHTML = "";
+  const head = document.createElement("div");
+  head.className = "dialogue-live-scene-recommendation-head";
+  const strong = document.createElement("strong");
+  strong.textContent = location ? `推荐：${title} · ${location}` : `推荐：${title}`;
+  const badge = document.createElement("span");
+  badge.textContent = sourceLabel;
+  head.appendChild(strong);
+  head.appendChild(badge);
+  root.appendChild(head);
+
+  if (reasons.length) {
+    const tags = document.createElement("div");
+    tags.className = "dialogue-live-scene-recommendation-tags";
+    reasons.forEach((reason) => {
+      const chip = document.createElement("span");
+      chip.textContent = String(reason || "").trim();
+      tags.appendChild(chip);
+    });
+    root.appendChild(tags);
+  }
+
+  if (transition) {
+    const transitionCopy = document.createElement("p");
+    transitionCopy.textContent = `转场起句：${transition}`;
+    root.appendChild(transitionCopy);
+  }
+
+  if (chainReason) {
+    const chainCopy = document.createElement("p");
+    chainCopy.textContent = `后续走势：${chainReason}`;
+    root.appendChild(chainCopy);
+  }
+
+  const autoCopy = document.createElement("p");
+  autoCopy.textContent = "顺手切到下一幕会直接把新一拍接起来，不会停在空场。";
+  root.appendChild(autoCopy);
+  root.classList.remove("hidden");
+}
+
 function buildObserveQuickReplies(session = currentDialogueSession) {
   const overview = session?.runtime_state_overview || {};
   const present = Array.isArray(overview?.present) ? overview.present.filter(Boolean) : [];
diff --git a/src/web/static/styles/dialogue.css b/src/web/static/styles/dialogue.css
index 391cd57..a4e4ecf 100644
--- a/src/web/static/styles/dialogue.css
+++ b/src/web/static/styles/dialogue.css
@@ -169,6 +169,59 @@
   flex: 0 0 auto;
 }
 
+.dialogue-live-scene-recommendation { /* Recommendation card: stacked grid with a thin border and translucent background. */
+  display: grid;
+  gap: 0.34rem;
+  padding: 0.58rem 0.64rem;
+  border-radius: 12px;
+  border: 1px solid rgba(170, 146, 127, 0.12);
+  background: rgba(255, 251, 247, 0.84);
+}
+
+.dialogue-live-scene-recommendation-head { /* Header row: title and badge pushed to opposite ends. */
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 0.5rem;
+}
+
+.dialogue-live-scene-recommendation-head strong { /* Recommendation title text. */
+  color: var(--ink);
+  font-size: 0.7rem;
+  line-height: 1.4;
+}
+
+.dialogue-live-scene-recommendation-head span { /* Source badge, kept on a single line. */
+  color: var(--ink-faint);
+  font-size: 0.62rem;
+  white-space: nowrap;
+}
+
+.dialogue-live-scene-recommendation p { /* Body copy paragraphs inside the card. */
+  margin: 0;
+  color: var(--ink-faint);
+  font-size: 0.65rem;
+  line-height: 1.55;
+}
+
+.dialogue-live-scene-recommendation-tags { /* Wrapping row that holds the reason chips. */
+  display: flex;
+  flex-wrap: wrap;
+  gap: 0.32rem;
+}
+
+.dialogue-live-scene-recommendation-tags span { /* One pill-shaped reason chip. */
+  display: inline-flex;
+  align-items: center;
+  min-height: 1.25rem;
+  padding: 0 0.44rem;
+  border-radius: 999px;
+  background: rgba(184, 132, 113, 0.08);
+  color: var(--accent-strong);
+  font-size: 0.62rem;
+  line-height: 1.3;
+}
+
 .dialogue-scene-chain-suggestions {
   display: grid;
   gap: 0.42rem;

From 590d01063e77096ebbb6a49c9e9a20ba78c3a32b Mon Sep 17 00:00:00 2001
From: wkbin <wangkebin1997@gmail.com>
Date: Thu, 14 May 2026 16:15:09 +0800
Subject: [PATCH 11/11] feat: share scene recommendation pipeline across web
 and skill

---
 README.en.md                                  |   2 +
 README.md                                     |   2 +
 src/skill_support/__init__.py                 |  15 +
 src/skill_support/scene_recommendations.py    | 641 ++++++++++++++++++
 src/web/chat/helpers.py                       |  41 +-
 src/web/review/scene_cards.py                 | 110 +--
 src/web/service_facades/scene_cards.py        | 383 +----------
 src/web/static/js/dialogue.js                 |   6 +-
 src/web/static/js/main.js                     |   7 +
 tests/test_install_skill.py                   |  85 +++
 tests/test_packaging_docs.py                  |  12 +
 tests/test_prompt_payloads.py                 |  86 +++
 tests/test_web_app.py                         |   3 +
 zaomeng-skill/MANIFEST.md                     |   2 +
 zaomeng-skill/README.md                       |   9 +
 zaomeng-skill/README_EN.md                    |   9 +
 zaomeng-skill/SKILL.md                        |  10 +-
 .../examples/host_workflow_example.md         |  17 +
 .../scene_recommendation_context.example.json |  95 +++
 zaomeng-skill/examples/test-prompts.json      |  19 +
 zaomeng-skill/references/capability_index.md  |   4 +
 zaomeng-skill/references/chat_contract.md     |  15 +
 .../tools/_skill_support/__init__.py          |  12 +
 .../_skill_support/scene_recommendations.py   | 641 ++++++++++++++++++
 .../build_scene_recommendation_payload.py     |  40 ++
 25 files changed, 1749 insertions(+), 517 deletions(-)
 create mode 100644 src/skill_support/scene_recommendations.py
 create mode 100644 zaomeng-skill/examples/scene_recommendation_context.example.json
 create mode 100644 zaomeng-skill/tools/_skill_support/scene_recommendations.py
 create mode 100644 zaomeng-skill/tools/build_scene_recommendation_payload.py

diff --git a/README.en.md b/README.en.md
index 2cd571d..ade3b80 100644
--- a/README.en.md
+++ b/README.en.md
@@ -131,6 +131,7 @@ The current Web UI already supports:
 - persona review pages with key-field completion, evidence-gap checks, and secondary-field tuning
 - creating, editing, selecting, and reusing scene cards, self cards, and opening presets
 - automatic next-scene recommendation during chat, with in-session scene switching
+- automatic next-beat surfacing when a scene matures, including a transition line, follow-up chain, and auto-opening cue
 - session restore, recent-session resume, group chat continuation, and direct workbench entry into a scene
 - dialogue context compression that trims persona / relation context around active participants and injects session memory summaries
 - viewing transcripts, continuing group chat, and deleting recent sessions in the same interface
@@ -207,6 +208,7 @@ You can now layer these helpers before or during a session:
 - self cards: prepare your identity, tone, motive, and in-scene role for `insert`
 - opening presets: bundle mode, participants, scene card, and self card into a reusable starting setup
 - automatic scene recommendation: while a session is running, the system can suggest a more suitable next scene card
+- transition assist flow: besides recommending the next scene, it can also provide a transition line, a follow-up scene chain, and an auto-opening cue for the next beat
 
 ## Usage 🛠️
 
diff --git a/README.md b/README.md
index f42f63b..8ce4bc8 100644
--- a/README.md
+++ b/README.md
@@ -132,6 +132,7 @@ python scripts/run_webui.py --reload
 - 人物校对页，支持关键字段补全、证据不足检查与二级字段微调
 - 场景卡、角色卡、开局模板的创建、编辑、选择与复用
 - 聊天过程中自动推荐下一幕场景卡，并支持会话内切换场景
+- 拍点成熟时自动浮出下一幕建议，附带转场起句、后续戏路和自动起拍提示
 - 会话恢复、最近会话续聊、群聊继续与工作台直接入场
 - 对话上下文自动压缩，按活跃角色裁剪人物/关系上下文，并注入会话记忆摘要
 - 在同一页面查看 transcript、继续群聊、删除历史会话
@@ -217,6 +218,7 @@ python scripts/run_webui.py --reload
 - 角色卡：为 `insert` 模式准备你的身份、语气、动机与在场定位
 - 开局模板：把入场方式、参与角色、场景卡、角色卡打包成一套可复用开局
 - 自动场景推荐：会话进行中，系统会结合当前局势推荐更适合的下一幕
+- 转场辅助链路：除了推荐哪一幕，还会给出转场起句、后续戏路，以及切幕后可直接继续开聊的自动起拍提示
 
 ## 使用方式 🛠️
 
diff --git a/src/skill_support/__init__.py b/src/skill_support/__init__.py
index abff2b9..f5feaef 100644
--- a/src/skill_support/__init__.py
+++ b/src/skill_support/__init__.py
@@ -3,3 +3,18 @@
 
 """Shared helpers for prompt-first skill workflows."""
 
+from .scene_recommendations import (
+    build_scene_opening_message,
+    build_scene_recommendation_bundle,
+    normalize_scene_recommendation_context,
+    recommend_dialogue_scene_cards,
+    recommend_scene_cards_base,
+)
+
+__all__ = [
+    "build_scene_opening_message",
+    "build_scene_recommendation_bundle",
+    "normalize_scene_recommendation_context",
+    "recommend_dialogue_scene_cards",
+    "recommend_scene_cards_base",
+]
diff --git a/src/skill_support/scene_recommendations.py b/src/skill_support/scene_recommendations.py
new file mode 100644
index 0000000..f66b8af
--- /dev/null
+++ b/src/skill_support/scene_recommendations.py
@@ -0,0 +1,641 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+from __future__ import annotations
+
+import re
+from typing import Any
+
+_GROUP_SCENE_TOKENS = ("众人", "席间", "满座", "同席", "众目", "围坐", "宴", "厅", "堂", "多人")  # Keywords scored when there are three or more participants.
+_DUO_SCENE_TOKENS = ("二人", "对坐", "独处", "檐下", "私谈", "夜谈", "回廊", "亭中", "单独")  # Keywords scored for exactly two participants and for "act" mode.
+_INSERT_SCENE_TOKENS = ("来客", "访客", "外客", "误入", "新到", "初来", "借住", "入席", "登门")  # Keywords scored in "insert" mode.
+_PLOT_PUSH_TOKENS = ("试探", "摊牌", "转折", "打断", "逼问", "推", "揭", "撞破", "失手", "变局")  # Keywords scored in "observe" mode.
+_SCENE_FIELDS = (  # Scene-card field names kept by _normalize_scene_fields, in the order they are joined for keyword scoring.
+    "title",
+    "time_hint",
+    "location",
+    "atmosphere",
+    "opening_situation",
+    "public_goal",
+    "hidden_tension",
+    "scene_drive",
+    "expected_rhythm",
+    "forbidden_topics",
+)
+
+
+def build_scene_recommendation_bundle(context: dict[str, Any]) -> dict[str, Any]:
+    """Rank the context's scene cards and wrap the result for a skill host.
+
+    The payload also gets an auto-continue cue built from the recommended card.
+    """
+    ctx = normalize_scene_recommendation_context(context)
+    mode = str(ctx.get("mode", "observe")).strip() or "observe"
+    cast = list(ctx.get("participants", []) or [])
+    payload = recommend_dialogue_scene_cards(
+        cards=list(ctx.get("scene_cards", []) or []),
+        mode=mode,
+        participants=cast,
+        current_scene=dict(ctx.get("current_scene", {}) or {}),
+        current_scene_id=str(ctx.get("current_scene_card_id", "")).strip(),
+        runtime_overview=dict(ctx.get("runtime_state_overview", {}) or {}),
+        recent_text=str(ctx.get("recent_text", "")).strip(),
+    )
+    wanted_id = str(payload.get("recommended_card_id", "")).strip()
+    top_fields: dict[str, Any] = {}
+    for entry in list(payload.get("items", []) or []):
+        if str(entry.get("card_id", "")).strip() == wanted_id:
+            top_fields = dict(entry.get("fields", {}) or {})
+            break
+    payload["recommended_auto_continue_message"] = build_scene_opening_message(
+        mode=mode,
+        participants=list(cast),
+        scene_card=top_fields,
+        controlled_character=str(ctx.get("controlled_character", "")).strip(),
+        self_profile=dict(ctx.get("self_profile", {}) or {}),
+    )
+    host_hint = (
+        "The host may directly apply recommended_card_id + recommended_transition_message. "
+        "If it wants to auto-continue the new beat immediately, it can feed recommended_auto_continue_message "
+        "back into its dialogue engine as the next opening cue."
+    )
+    return {"kind": "dialogue_scene_recommendation_bundle", "payload": payload, "host_hint": host_hint}
+
+
+def normalize_scene_recommendation_context(context: dict[str, Any]) -> dict[str, Any]:
+    """Coerce a raw context dict into canonical shape; raise ValueError when it holds no scene card dicts."""
+    result: dict[str, Any] = {
+        "mode": str(context.get("mode", "observe")).strip() or "observe",
+        "participants": [str(item).strip() for item in list(context.get("participants", []) or []) if str(item).strip()],
+        "scene_cards": [_normalize_scene_card_entry(card) for card in list(context.get("scene_cards", []) or []) if isinstance(card, dict)],
+    }
+    if not result["scene_cards"]:
+        raise ValueError("Scene recommendation context requires non-empty scene_cards.")
+    result["current_scene_card_id"] = str(context.get("current_scene_card_id", "")).strip()
+    result["current_scene"] = _normalize_scene_fields(dict(context.get("current_scene", {}) or {}))
+    result["runtime_state_overview"] = dict(context.get("runtime_state_overview", {}) or {})
+    explicit_recent = str(context.get("recent_text", "")).strip()
+    result["recent_text"] = explicit_recent or _transcript_to_recent_text(context.get("transcript", []))
+    result["controlled_character"] = str(context.get("controlled_character", "")).strip()
+    result["self_profile"] = dict(context.get("self_profile", {}) or {})
+    return result
+
+
+def recommend_dialogue_scene_cards(
+    *,
+    cards: list[dict[str, Any]],
+    mode: str,
+    participants: list[str],
+    current_scene: dict[str, Any],
+    current_scene_id: str,
+    runtime_overview: dict[str, Any] | None = None,
+    recent_text: str = "",
+) -> dict[str, Any]:
+    """Re-rank the base scene-card scores against the live session.
+
+    The card matching ``current_scene_id`` is penalised; every other card can
+    gain points for a location change, overlap with ``recent_text`` and the
+    runtime-state heuristics. The result also carries a transition line for
+    the top card and the chain suggestions built from the ranking.
+    """
+    resolved_mode = str(mode or "observe").strip() or "observe"
+    cast = [str(name).strip() for name in participants if str(name).strip()]
+    runtime = dict(runtime_overview or {})
+    active_id = str(current_scene_id or "").strip()
+    snapshot = _merge_current_scene_snapshot(current_scene, runtime)
+    here = str(snapshot.get("location", "")).strip()
+    base = recommend_scene_cards_base(cards, mode=resolved_mode, participants=cast)
+    ranked: list[dict[str, Any]] = []
+    for card in list(base.get("items", []) or []):
+        prior = dict(card.get("recommendation", {}) or {})
+        points = int(prior.get("score", 0) or 0)
+        notes = [str(note).strip() for note in list(prior.get("reasons", []) or []) if str(note).strip()]
+        card_fields = dict(card.get("fields", {}) or {})
+        # The id is compared against current_scene_id exactly as the caller passed it.
+        is_current = bool(current_scene_id) and str(card.get("card_id", "")).strip() == current_scene_id
+        if is_current:
+            # Staying on the active card is discouraged rather than forbidden.
+            points -= 5
+            notes.insert(0, "当前已经在这幕里，优先换一拍")
+        else:
+            there = str(card_fields.get("location", "")).strip()
+            if here and there and there != here:
+                points += 1
+                notes.append("地点切换更明显，适合转场")
+            overlap = _scene_text_overlap_score(card_fields, recent_text)
+            if overlap:
+                points += overlap
+                notes.append("和最近这几句的气口更接")
+            bonus, bonus_notes = _score_scene_card_with_runtime_state(
+                card_fields,
+                runtime_overview=runtime,
+                current_scene=snapshot,
+                participants=cast,
+                recent_text=recent_text,
+            )
+            points += bonus
+            notes.extend(bonus_notes)
+        ranked.append({**card, "recommendation": {"score": points, "reasons": notes[:4] or ["适合承接当前会话"]}})
+
+    def _rank_key(entry: dict[str, Any]) -> tuple[int, str, str]:
+        # Highest score first; ties fall back to updated_at, then card_id.
+        return (
+            int(entry.get("recommendation", {}).get("score", 0) or 0),
+            str(entry.get("updated_at", "")),
+            str(entry.get("card_id", "")),
+        )
+
+    ranked.sort(key=_rank_key, reverse=True)
+    best = ranked[0] if ranked else {}
+    best_fields = dict(best.get("fields", {}) or {})
+    return {
+        "mode": resolved_mode,
+        "participants": cast,
+        "current_scene_card_id": active_id,
+        "recommended_card_id": str(best.get("card_id", "")).strip(),
+        "recommended_transition_message": _build_transition_message_hint(
+            current_scene=snapshot,
+            next_scene=best_fields,
+            recent_text=recent_text,
+            runtime_overview=runtime,
+        ),
+        "chain_suggestions": _build_scene_chain_suggestions(
+            current_scene=snapshot,
+            current_scene_id=active_id,
+            reranked_items=ranked,
+            recent_text=recent_text,
+            runtime_overview=runtime,
+        ),
+        "items": ranked,
+    }
+
+
+def recommend_scene_cards_base(
+    cards: list[dict[str, Any]],
+    *,
+    mode: str,
+    participants: list[str] | None = None,
+) -> dict[str, Any]:
+    """Score every scene card on its own content and return them best-first.
+
+    Each returned item is a copy of the input card with normalized ``fields``
+    and a ``recommendation`` dict holding ``score`` and ``reasons``. Ties on
+    score are broken by ``updated_at`` and then ``card_id``, both descending.
+    ``recommended_card_id`` is empty when ``cards`` is empty.
+    """
+    resolved_mode = str(mode or "observe").strip() or "observe"
+    cast = [str(name).strip() for name in (participants or []) if str(name).strip()]
+
+    def _with_score(card: dict[str, Any]) -> dict[str, Any]:
+        clean_fields = _normalize_scene_fields(dict(card.get("fields", {}) or {}))
+        points, notes = _score_scene_card(clean_fields, mode=resolved_mode, participants=cast)
+        return {**card, "fields": clean_fields, "recommendation": {"score": points, "reasons": notes}}
+
+    def _rank_key(entry: dict[str, Any]) -> tuple[int, str, str]:
+        return (
+            int(entry.get("recommendation", {}).get("score", 0) or 0),
+            str(entry.get("updated_at", "")),
+            str(entry.get("card_id", "")),
+        )
+
+    # Every card is scored before any sorting happens.
+    ordered = sorted([_with_score(card) for card in cards], key=_rank_key, reverse=True)
+    return {
+        "mode": resolved_mode,
+        "participants": cast,
+        "recommended_card_id": str(ordered[0].get("card_id", "")).strip() if ordered else "",
+        "items": ordered,
+    }
+
+
+def build_scene_opening_message(
+    *,
+    mode: str,
+    participants: list[str],
+    scene_card: dict[str, Any],
+    controlled_character: str = "",
+    self_profile: dict[str, Any] | None = None,
+) -> str:
+    """Compose the opening-cue prompt for ``scene_card`` in the given mode.
+
+    "act" names ``controlled_character``, "insert" names the ``self_profile``
+    persona, and any other mode falls back to the observe wording.
+    """
+    resolved_mode = str(mode or "observe").strip() or "observe"
+    cast = "、".join(str(name).strip() for name in participants if str(name).strip()) or "当前角色"
+    scene = _normalize_scene_fields(scene_card)
+    headline = " / ".join(bit for bit in (scene.get("title", ""), scene.get("location", ""), scene.get("atmosphere", "")) if bit)
+    scene_prefix = f"场景设定：{headline}。" if headline else ""
+    raw_opening = scene.get("opening_situation", "")
+    raw_drive = scene.get("scene_drive", "")
+    opening_suffix = f" 开场局面是：{raw_opening}。" if str(raw_opening).strip() else ""
+    drive_suffix = f" 推进方向优先朝这边走：{raw_drive}。" if str(raw_drive).strip() else ""
+    if resolved_mode == "act":
+        lead = str(controlled_character or "").strip() or "该角色"
+        who = f"{lead} 与 {cast}"
+        closing = "先给 1 条简短的场景提示或旁白，再让其他角色先接出第一轮对话，不要等待用户补充。"
+    elif resolved_mode == "insert":
+        profile = dict(self_profile or {})
+        display_name = str(profile.get("display_name", "")).strip() or "我"
+        identity = str(profile.get("scene_identity", "")).strip() or str(profile.get("core_identity", "")).strip()
+        who = f"{display_name}，身份是{identity} 与 {cast}" if identity else f"{display_name} 与 {cast}"
+        closing = "先给 1 条简短的场景提示或旁白，再让角色们先开口，对这个进入场景的人作出第一轮反应。"
+    else:
+        who = cast
+        closing = "先给 1 条简短的场景提示或旁白，再让角色们开始第一轮对话，让场景自己动起来。"
+    # Every mode shares one frame; only the subject and the closing instruction differ.
+    return f"{scene_prefix}请先为 {who} 生成一个自然开场。{opening_suffix}{drive_suffix}{closing}"
+
+
+def _normalize_scene_card_entry(item: dict[str, Any]) -> dict[str, Any]:
+    """Reduce a raw card to card_id, normalized fields, preview and updated_at.
+
+    A missing or empty preview is rebuilt from the normalized fields.
+    """
+    clean_fields = _normalize_scene_fields(dict(item.get("fields", {}) or {}))
+    preview_keys = (
+        "title", "time_hint", "location", "atmosphere", "opening_situation", "scene_drive", "expected_rhythm",
+    )
+    preview = dict(item.get("preview", {}) or {})
+    if not preview:
+        # Fall back to a preview derived from the card's own fields.
+        preview = {key: str(clean_fields.get(key, "")).strip() for key in preview_keys}
+    return {
+        "card_id": str(item.get("card_id", "")).strip(),
+        "fields": clean_fields,
+        "preview": preview,
+        "updated_at": str(item.get("updated_at", "")).strip(),
+    }
+
+
+def _normalize_scene_fields(fields: dict[str, Any]) -> dict[str, str]:  # Keep exactly the _SCENE_FIELDS keys; each value becomes a stripped str, falsy values become "".
+    return {field: str(fields.get(field, "") or "").strip() for field in _SCENE_FIELDS}
+
+
+def _score_scene_card(fields: dict[str, Any], *, mode: str, participants: list[str]) -> tuple[int, list[str]]:
+    """Score one card from its own text, cast size and mode.
+
+    Returns the integer score and at most three reason strings; a fallback
+    reason is supplied when no rule produced one.
+    """
+    card = _normalize_scene_fields(fields)
+    haystack = "\n".join(str(card.get(name, "")).strip() for name in _SCENE_FIELDS)
+    total = 0
+    notes: list[str] = []
+
+    def _reward(points: int, note: str) -> None:
+        nonlocal total
+        total += points
+        notes.append(note)
+
+    # Completeness of the fields that shape an opening.
+    for name, points, note in (
+        ("scene_drive", 3, "推进方向明确"),
+        ("opening_situation", 2, "开场局面具体"),
+        ("atmosphere", 1, "气氛落点清楚"),
+    ):
+        if card[name]:
+            _reward(points, note)
+
+    # Cast-size fit: group keywords for three or more, duo keywords for exactly two.
+    head_count = len(participants)
+    if head_count >= 3:
+        hits = _count_hits(haystack, _GROUP_SCENE_TOKENS)
+        if hits:
+            _reward(3 + min(2, hits - 1), "更像多人同席场")
+    elif head_count == 2:
+        hits = _count_hits(haystack, _DUO_SCENE_TOKENS)
+        if hits:
+            _reward(3 + min(1, hits - 1), "更适合双人拉扯")
+
+    # Mode fit.
+    if mode == "insert":
+        hits = _count_hits(haystack, _INSERT_SCENE_TOKENS)
+        if hits:
+            _reward(4 + min(1, hits - 1), "适合来客/自我入场")
+    elif mode == "observe":
+        hits = _count_hits(haystack, _PLOT_PUSH_TOKENS)
+        if hits:
+            _reward(3 + min(2, hits - 1), "更利于旁观推动剧情")
+    elif mode == "act" and _count_hits(haystack, _DUO_SCENE_TOKENS):
+        _reward(2, "留有角色正面接戏空间")
+
+    # Secondary fields add a point each without contributing a reason.
+    total += sum(1 for name in ("public_goal", "hidden_tension", "expected_rhythm") if card[name])
+
+    if not notes:
+        notes.append("信息比较完整，能直接开场")
+    return total, notes[:3]
+
+
+def _count_hits(text: str, tokens: tuple[str, ...]) -> int:
+    """Return how many of the non-empty tokens occur as substrings of the stripped text."""
+    haystack = str(text or "").strip()
+    matched = [token for token in tokens if token and token in haystack] if haystack else []
+    return len(matched)
+
+
+def _merge_current_scene_snapshot(current_scene: dict[str, Any], runtime_overview: dict[str, Any]) -> dict[str, Any]:
+    """Normalize current_scene, then let non-blank runtime values win for three live fields."""
+    snapshot = _normalize_scene_fields(current_scene)
+    for key in ("location", "time_hint", "atmosphere"):
+        live_value = str(runtime_overview.get(key, "")).strip()
+        if live_value:
+            # Runtime state takes precedence over the card's static value.
+            snapshot[key] = live_value
+    return snapshot
+
+
+def _scene_text_overlap_score(fields: dict[str, Any], recent_text: str) -> int:
+    """Count card phrases (2-8 chars) that reappear in recent_text, capped at 3.
+
+    Only the first 12 distinct phrases, in field order, are checked.
+    """
+    recent = str(recent_text or "").strip()
+    if not recent:
+        return 0
+    keys = ("location", "atmosphere", "opening_situation", "scene_drive", "public_goal", "hidden_tension")
+    seen: dict[str, None] = {}
+    for key in keys:
+        for piece in re.split(r"[，,。；;、：:\s]+", str(fields.get(key, "") or "").strip()):
+            if 2 <= len(piece.strip()) <= 8:
+                seen.setdefault(piece.strip(), None)
+    return min(3, sum(1 for phrase in list(seen)[:12] if phrase in recent))
+
+
+def _score_scene_card_with_runtime_state(
+    fields: dict[str, Any],
+    *,
+    runtime_overview: dict[str, Any],
+    current_scene: dict[str, Any],
+    participants: list[str],
+    recent_text: str,
+) -> tuple[int, list[str]]:
+    """Score a candidate card against the runtime overview, tolerating a non-numeric beat_maturity or a non-dict last event row."""
+    score = 0
+    reasons: list[str] = []
+    current_location = str(current_scene.get("location", "")).strip()
+    candidate_location = str(fields.get("location", "")).strip()
+    current_time = str(runtime_overview.get("time_hint", "") or current_scene.get("time_hint", "")).strip()
+    candidate_time = str(fields.get("time_hint", "")).strip()
+    try:
+        beat_maturity = max(0, min(100, int(runtime_overview.get("beat_maturity", 0) or 0)))
+    except (TypeError, ValueError, OverflowError):
+        beat_maturity = 0
+    should_shift = bool(runtime_overview.get("should_offer_scene_shift", False))
+    shift_reason = str(runtime_overview.get("scene_shift_reason", "")).strip()
+    event_rows = list(runtime_overview.get("event_rows", []) or [])
+    last_event = event_rows[-1] if event_rows and isinstance(event_rows[-1], dict) else {}
+    state_texts = [str(runtime_overview.get(key, "")).strip() for key in ("atmosphere", "tension", "next_hint")]
+    state_texts += [str(last_event.get("copy", "")).strip(), recent_text]
+
+    if should_shift:
+        if current_location and candidate_location and candidate_location != current_location:
+            score += 4
+            reasons.append("这一拍已接近收束，更适合换场推进")
+        elif current_location and candidate_location and candidate_location == current_location:
+            score -= 2
+            reasons.append("这一拍已经该收住了，不必继续原地打转")
+        elif candidate_location:
+            score += 1
+            reasons.append("当前已经适合往下一拍走")
+    elif beat_maturity and beat_maturity < 45 and current_location and candidate_location == current_location:
+        score += 2
+        reasons.append("这一拍还没聊满，先在同场景续火更顺")
+
+    if current_time and candidate_time:
+        if candidate_time == current_time:
+            score += 1
+            reasons.append("时间承接自然")
+        elif should_shift or beat_maturity >= 55:
+            score += 2
+            reasons.append("时间推进能带出下一拍")
+
+    state_overlap = _state_overlap_score(fields, state_texts=state_texts)
+    if state_overlap:
+        score += state_overlap
+        reasons.append("能接住本局气氛和悬念")
+
+    if len(participants) >= 3 and candidate_location and any(token in candidate_location for token in ("厅", "堂", "席", "园", "院")):
+        score += 1
+        reasons.append("多人局切到这个场面更容易铺开")
+
+    if shift_reason:
+        candidate_story = "\n".join(str(fields.get(key, "")).strip() for key in ("opening_situation", "scene_drive", "hidden_tension"))
+        shift_tokens = [part for part in re.split(r"[，,。；;、：:\s]+", shift_reason) if 2 <= len(part.strip()) <= 8]
+        if any(token in candidate_story for token in shift_tokens[:4]):
+            score += 2
+            reasons.append("和当前这拍的收束理由接得上")
+    return score, reasons
+
+
+def _state_overlap_score(fields: dict[str, Any], *, state_texts: list[str]) -> int:
+    """Count card phrases (2-8 chars) found in the joined state texts, capped at 4.
+
+    State entries and field values are coerced with str(); None counts as
+    empty, so stray non-string values neither raise nor match as "None".
+    """
+    state = "\n".join(s for s in (str(t).strip() for t in state_texts if t is not None) if s)
+    if not state:
+        return 0
+    phrases: list[str] = []
+    for key in ("atmosphere", "opening_situation", "public_goal", "hidden_tension", "scene_drive"):
+        for part in re.split(r"[，,。；;、：:\s]+", str(fields.get(key, "") or "").strip()):
+            if 2 <= len(part.strip()) <= 8 and part.strip() not in phrases:
+                phrases.append(part.strip())
+    return min(4, sum(1 for phrase in phrases[:14] if phrase in state))
+
+
+def _build_transition_message_hint(
+    *,
+    current_scene: dict[str, Any],
+    next_scene: dict[str, Any],
+    recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
+) -> str:
+    """Pick a one-line transition into next_scene, or "" when nothing fits.
+
+    Rules run in order: shift reason plus a location change, a time jump, the next
+    opening's first sentence (its own terminator is kept, "。" is the default), a
+    plain location change, then atmosphere, location and title fallbacks.
+    """
+    runtime = dict(runtime_overview or {})
+    next_location = str(next_scene.get("location", "")).strip()
+    next_title = str(next_scene.get("title", "")).strip()
+    next_atmosphere = str(next_scene.get("atmosphere", "")).strip()
+    current_location = str(current_scene.get("location", "")).strip()
+    next_time = str(next_scene.get("time_hint", "")).strip()
+    current_time = str(runtime.get("time_hint", "") or current_scene.get("time_hint", "")).strip()
+    shift_reason = str(runtime.get("scene_shift_reason", "")).strip()
+    tension = str(runtime.get("tension", "")).strip()
+    moved = bool(current_location and next_location and current_location != next_location)
+    if shift_reason and runtime.get("should_offer_scene_shift", False) and moved:
+        return f"{shift_reason}，场面顺势从{current_location}转到{next_title or next_location}。"
+
+    if next_time and current_time and next_time != current_time:
+        destination = next_location or next_title or "下一幕"
+        if tension:
+            return f"带着这股{_trim_transition_text(tension, 18)}，时间已经推到{next_time}，场面也转进了{destination}。"
+        return f"这一拍不知不觉拖到了{next_time}，场面也顺势转进了{destination}。"
+
+    # Capture the terminator with the sentence so a question or exclamation is not rewritten as "。".
+    opening_match = re.match(r"([^。！？!?]*)([。！？!?]?)", str(next_scene.get("opening_situation", "")).strip())
+    first_sentence = opening_match.group(1).strip() if opening_match else ""
+    if first_sentence:
+        return first_sentence + (opening_match.group(2) or "。")
+
+    if moved:
+        return f"局面一转，众人从{current_location}挪到{next_title or next_location}，气氛也跟着变了。"
+
+    compact_recent = str(recent_text or "").strip()
+    if tension and next_atmosphere:
+        return f"刚才那股{_trim_transition_text(tension, 18)}还吊着，场面已经慢慢转成了{next_atmosphere}。"
+    if compact_recent and next_atmosphere:
+        return f"刚才那股{compact_recent[-12:]}的余波还没散，场面已经转成了{next_atmosphere}。"
+    if next_location and next_atmosphere:
+        return f"这一拍顺势转到{next_location}，场面也慢慢收成了{next_atmosphere}。"
+    if next_location:
+        return f"这一拍顺势转到{next_location}。"
+    if next_title:
+        return f"这一拍顺势转入「{next_title}」。"
+    return ""
+
+
+def _build_scene_chain_suggestions(
+    *,
+    current_scene: dict[str, Any],
+    current_scene_id: str,
+    reranked_items: list[dict[str, Any]],
+    recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
+) -> list[dict[str, Any]]:
+    """Build up to three distinct two- or three-scene chains from the top five candidates.
+
+    Cards without an id, and the card whose id equals current_scene_id, are
+    never used. Chains are ranked by score, then by length.
+    """
+    pool = [
+        entry
+        for entry in reranked_items
+        if str(entry.get("card_id", "")).strip() not in ("", current_scene_id)
+    ][:5]
+
+    def _chain(*steps: dict[str, Any]) -> dict[str, Any]:
+        return _build_chain_payload(
+            current_scene=current_scene,
+            items=list(steps),
+            recent_text=recent_text,
+            runtime_overview=runtime_overview,
+        )
+
+    chains: list[dict[str, Any]] = []
+    indexed = list(enumerate(pool))
+    for a, first in indexed:
+        for b, second in indexed:
+            if b == a:
+                continue
+            # Each ordered pair is emitted first, then its three-scene extensions.
+            chains.append(_chain(first, second))
+            chains.extend(_chain(first, second, third) for c, third in indexed if c not in (a, b))
+    chains.sort(key=lambda chain: (int(chain.get("score", 0) or 0), len(chain.get("scenes", []) or [])), reverse=True)
+
+    # Keep the first three chains whose id sequence has not been seen yet.
+    picked: list[dict[str, Any]] = []
+    seen_keys: set[str] = set()
+    for chain in chains:
+        key = "->".join(str(scene.get("card_id", "")).strip() for scene in list(chain.get("scenes", []) or []))
+        if not key or key in seen_keys:
+            continue
+        seen_keys.add(key)
+        picked.append(chain)
+        if len(picked) >= 3:
+            break
+    return picked
+
+
+def _build_chain_payload(
+    *,
+    current_scene: dict[str, Any],
+    items: list[dict[str, Any]],
+    recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
+) -> dict[str, Any]:
+    """Assemble one chain: scene summaries with transition lines, a score and a reason.
+
+    Earlier scenes weigh more in the score; a missing or non-dict ``preview`` falls back to the card's own title.
+    """
+    scenes: list[dict[str, str]] = []
+    previous_scene = dict(current_scene or {})
+    total_score = 0
+    for index, item in enumerate(items):
+        fields = dict(item.get("fields", {}) or {})
+        preview = item.get("preview") if isinstance(item.get("preview"), dict) else {}
+        score = int(dict(item.get("recommendation", {}) or {}).get("score", 0) or 0)
+        total_score += max(0, score) * max(1, 4 - index)
+        scenes.append(
+            {
+                "card_id": str(item.get("card_id", "")).strip(),
+                "title": str(preview.get("title", "") or fields.get("title", "")).strip(),
+                "location": str(fields.get("location", "")).strip(),
+                "atmosphere": str(fields.get("atmosphere", "")).strip(),
+                "scene_drive": str(fields.get("scene_drive", "")).strip(),
+                # Only the first hop sees the live session state; later hops lean on the previous card's drive.
+                "transition_message": _build_transition_message_hint(
+                    current_scene=previous_scene,
+                    next_scene=fields,
+                    recent_text=recent_text if index == 0 else str(previous_scene.get("scene_drive", "")).strip(),
+                    runtime_overview=dict(runtime_overview or {}) if index == 0 else None,
+                ),
+            }
+        )
+        previous_scene = fields
+    if len({scene["location"] for scene in scenes if scene["location"]}) >= 2:
+        total_score += 4
+    if _chain_has_progressive_drive(scenes):
+        total_score += 3
+    return {
+        "chain_id": " -> ".join(scene.get("card_id", "") for scene in scenes),
+        "score": total_score,
+        "reason": _build_chain_reason(scenes),
+        "scenes": scenes,
+    }
+
+
+def _chain_has_progressive_drive(scenes: list[dict[str, str]]) -> bool:
+    """Return True when at least two scenes have a scene_drive containing a strong push keyword."""
+    strong_tokens = ("试探", "转折", "摊牌", "揭", "逼", "变局", "收紧")
+    drives = (str(scene.get("scene_drive", "")).strip() for scene in scenes)
+    strong_count = sum(1 for drive in drives if any(token in drive for token in strong_tokens))
+    return strong_count >= 2
+
+
+def _build_chain_reason(scenes: list[dict[str, str]]) -> str:
+    """Return the one-line rationale attached to a chain of scenes."""
+    if not scenes:
+        return "这条线能顺着往下接。"
+    distinct_locations = {scene.get("location", "") for scene in scenes if scene.get("location", "")}
+    if len(distinct_locations) >= 2:
+        # Two distinct places imply at least two scenes; three or more scenes get the longer-arc wording.
+        return "先换场再收紧，后面还有继续推进的余地。" if len(scenes) >= 3 else "地点会连续变化，戏路层次更明显。"
+    if _chain_has_progressive_drive(scenes):
+        return "每一幕的推进方向都比较明确，适合顺着往下压。"
+    first_title = str(scenes[0].get("title", "")).strip() or "这条线"
+    return f"可以先接「{first_title}」，后面还有顺势承接的下一拍。"
+
+
+def _trim_transition_text(text: str, limit: int) -> str:
+    """Return the stripped text, cut to max(1, limit - 1) characters plus "…" when longer than limit."""
+    stripped = str(text or "").strip()
+    keep = max(1, limit - 1)
+    return stripped if len(stripped) <= limit else f"{stripped[:keep]}…"
+
+
+def _transcript_to_recent_text(transcript: Any) -> str:
+    """Join the non-empty "message" values of the last six transcript entries with newlines.
+
+    Entries that are not dicts are skipped.
+    """
+    # Slice first, so skipped entries still count toward the six.
+    tail = list(transcript or [])[-6:]
+    messages = (str(entry.get("message", "")).strip() for entry in tail if isinstance(entry, dict))
+    return "\n".join(message for message in messages if message)
diff --git a/src/web/chat/helpers.py b/src/web/chat/helpers.py
index e13d905..3065e6f 100644
--- a/src/web/chat/helpers.py
+++ b/src/web/chat/helpers.py
@@ -5,6 +5,7 @@
 from typing import Any, Callable
 
 from src.core.exceptions import LLMRequestError
+from src.skill_support.scene_recommendations import build_scene_opening_message
 
 
 def _session_state(session: dict[str, Any]) -> dict[str, Any]:
@@ -57,40 +58,12 @@ def _canonical_event_signals(session: dict[str, Any]) -> dict[str, Any]:
 
 
 def build_dialogue_opening_message(session: dict[str, Any]) -> str:
-    mode = str(session.get("mode", "observe")).strip() or "observe"
-    participants = [str(item).strip() for item in session.get("participants", []) if str(item).strip()]
-    cast = "、".join(participants) or "当前角色"
-    scene_card = dict(session.get("scene_card", {}) or {})
-    scene_title = str(scene_card.get("title", "")).strip()
-    location = str(scene_card.get("location", "")).strip()
-    atmosphere = str(scene_card.get("atmosphere", "")).strip()
-    opening = str(scene_card.get("opening_situation", "")).strip()
-    drive = str(scene_card.get("scene_drive", "")).strip()
-    scene_prefix_bits = [bit for bit in (scene_title, location, atmosphere) if bit]
-    scene_prefix = f"场景设定：{' / '.join(scene_prefix_bits)}。" if scene_prefix_bits else ""
-    opening_suffix = f" 开场局面是：{opening}。" if opening else ""
-    drive_suffix = f" 推进方向优先朝这边走：{drive}。" if drive else ""
-    if mode == "act":
-        controlled = str(session.get("controlled_character", "")).strip() or "该角色"
-        return (
-            f"{scene_prefix}请先为 {controlled} 与 {cast} 生成一个自然开场。"
-            f"{opening_suffix}{drive_suffix}"
-            "先给 1 条简短的场景提示或旁白，再让其他角色先接出第一轮对话，不要等待用户补充。"
-        )
-    if mode == "insert":
-        self_profile = dict(session.get("self_insert", {}) or {})
-        display_name = str(self_profile.get("display_name", "")).strip() or "我"
-        scene_identity = str(self_profile.get("scene_identity", "")).strip() or str(self_profile.get("core_identity", "")).strip()
-        identity_suffix = f"，身份是{scene_identity}" if scene_identity else ""
-        return (
-            f"{scene_prefix}请先为 {display_name}{identity_suffix} 与 {cast} 生成一个自然开场。"
-            f"{opening_suffix}{drive_suffix}"
-            "先给 1 条简短的场景提示或旁白，再让角色们先开口，对这个进入场景的人作出第一轮反应。"
-        )
-    return (
-        f"{scene_prefix}请先为 {cast} 生成一个自然开场。"
-        f"{opening_suffix}{drive_suffix}"
-        "先给 1 条简短的场景提示或旁白，再让角色们开始第一轮对话，让场景自己动起来。"
+    return build_scene_opening_message(
+        mode=str(session.get("mode", "observe")).strip() or "observe",
+        participants=[str(item).strip() for item in session.get("participants", []) if str(item).strip()],
+        scene_card=dict(session.get("scene_card", {}) or {}),
+        controlled_character=str(session.get("controlled_character", "")).strip(),
+        self_profile=dict(session.get("self_insert", {}) or {}),
     )
 
 
diff --git a/src/web/review/scene_cards.py b/src/web/review/scene_cards.py
index d9b872a..063d0ee 100644
--- a/src/web/review/scene_cards.py
+++ b/src/web/review/scene_cards.py
@@ -7,6 +7,8 @@
 from typing import Any, Callable
 from uuid import uuid4
 
+from src.skill_support.scene_recommendations import recommend_scene_cards_base
+
 
 SCENE_CARD_FIELDS = (
     "title",
@@ -43,12 +45,6 @@
     "forbidden_topics": "不想碰的话头",
 }
 
-_GROUP_SCENE_TOKENS = ("众人", "席间", "满座", "同席", "众目", "围坐", "宴", "厅", "堂", "多人")
-_DUO_SCENE_TOKENS = ("二人", "对坐", "独处", "檐下", "私谈", "夜谈", "回廊", "亭中", "单独")
-_INSERT_SCENE_TOKENS = ("来客", "访客", "外客", "误入", "新到", "初来", "借住", "入席", "登门")
-_PLOT_PUSH_TOKENS = ("试探", "摊牌", "转折", "打断", "逼问", "推", "揭", "撞破", "失手", "变局")
-
-
 def blank_scene_card_fields() -> dict[str, str]:
     return {field: "" for field in SCENE_CARD_FIELDS}
 
@@ -230,39 +226,7 @@ def recommend_scene_cards(
     mode: str,
     participants: list[str] | None = None,
 ) -> dict[str, Any]:
-    normalized_mode = str(mode or "observe").strip() or "observe"
-    participant_list = [str(item).strip() for item in (participants or []) if str(item).strip()]
-    scored_items: list[dict[str, Any]] = []
-    for item in cards:
-        score, reasons = _score_scene_card(
-            dict(item.get("fields", {}) or {}),
-            mode=normalized_mode,
-            participants=participant_list,
-        )
-        scored_items.append(
-            {
-                **item,
-                "recommendation": {
-                    "score": score,
-                    "reasons": reasons,
-                },
-            }
-        )
-    scored_items.sort(
-        key=lambda item: (
-            int(item.get("recommendation", {}).get("score", 0) or 0),
-            str(item.get("updated_at", "")),
-            str(item.get("card_id", "")),
-        ),
-        reverse=True,
-    )
-    recommended_card_id = str(scored_items[0].get("card_id", "")).strip() if scored_items else ""
-    return {
-        "mode": normalized_mode,
-        "participants": participant_list,
-        "recommended_card_id": recommended_card_id,
-        "items": scored_items,
-    }
+    return recommend_scene_cards_base(cards, mode=mode, participants=participants)
 
 
 def _extract_json_object(text: str) -> dict[str, Any] | None:
@@ -292,74 +256,6 @@ def _load_card_meta(card_dir: Path) -> dict[str, Any]:
     return json.loads(meta_path.read_text(encoding="utf-8"))
 
 
-def _score_scene_card(
-    fields: dict[str, Any],
-    *,
-    mode: str,
-    participants: list[str],
-) -> tuple[int, list[str]]:
-    normalized = normalize_scene_card_fields(fields)
-    combined_text = "\n".join(str(normalized.get(field, "")).strip() for field in SCENE_CARD_FIELDS)
-    participant_count = len(participants)
-    score = 0
-    reasons: list[str] = []
-
-    if normalized["scene_drive"]:
-        score += 3
-        reasons.append("推进方向明确")
-    if normalized["opening_situation"]:
-        score += 2
-        reasons.append("开场局面具体")
-    if normalized["atmosphere"]:
-        score += 1
-        reasons.append("气氛落点清楚")
-
-    if participant_count >= 3:
-        hit = _count_hits(combined_text, _GROUP_SCENE_TOKENS)
-        if hit:
-            score += 3 + min(2, hit - 1)
-            reasons.append("更像多人同席场")
-    elif participant_count == 2:
-        hit = _count_hits(combined_text, _DUO_SCENE_TOKENS)
-        if hit:
-            score += 3 + min(1, hit - 1)
-            reasons.append("更适合双人拉扯")
-
-    if mode == "insert":
-        hit = _count_hits(combined_text, _INSERT_SCENE_TOKENS)
-        if hit:
-            score += 4 + min(1, hit - 1)
-            reasons.append("适合来客/自我入场")
-    elif mode == "observe":
-        hit = _count_hits(combined_text, _PLOT_PUSH_TOKENS)
-        if hit:
-            score += 3 + min(2, hit - 1)
-            reasons.append("更利于旁观推动剧情")
-    elif mode == "act":
-        duo_hit = _count_hits(combined_text, _DUO_SCENE_TOKENS)
-        if duo_hit:
-            score += 2
-            reasons.append("留有角色正面接戏空间")
-
-    if normalized["public_goal"]:
-        score += 1
-    if normalized["hidden_tension"]:
-        score += 1
-    if normalized["expected_rhythm"]:
-        score += 1
-
-    if not reasons:
-        reasons.append("信息比较完整，能直接开场")
-    return score, reasons[:3]
-
-
-def _count_hits(text: str, tokens: tuple[str, ...]) -> int:
-    compact = str(text or "").strip()
-    if not compact:
-        return 0
-    return sum(1 for token in tokens if token and token in compact)
-
-
 def _load_scene_card_fields(
     card_dir: Path,
     *,
diff --git a/src/web/service_facades/scene_cards.py b/src/web/service_facades/scene_cards.py
index 33bfea0..ff676b4 100644
--- a/src/web/service_facades/scene_cards.py
+++ b/src/web/service_facades/scene_cards.py
@@ -1,9 +1,9 @@
 from __future__ import annotations
 
 from datetime import UTC, datetime
-import re
 from typing import Any
 
+from src.skill_support.scene_recommendations import build_scene_recommendation_bundle
 from src.web.artifacts import load_profile_source, render_profile_md
 from src.web.review import (
     build_random_scene_card_messages,
@@ -83,382 +83,23 @@ def recommend_dialogue_scene_card(self, run_id: str, *, session_id: str) -> dict
         participants = list(session.get("session_card", {}).get("participants", []) or [])
         current_scene = dict(session.get("session_card", {}).get("scene_card", {}) or {})
         runtime_overview = dict(session.get("runtime_state_overview", {}) or {})
-        current_scene_snapshot = _merge_current_scene_snapshot(current_scene, runtime_overview)
         current_scene_id = str(session.get("session_card", {}).get("scene_card_id", "")).strip()
         recent_text = "\n".join(
             str(item.get("message", "")).strip()
             for item in list(session.get("transcript", []) or [])[-6:]
             if str(item.get("message", "")).strip()
         )
-        payload = recommend_scene_cards(cards, mode=mode, participants=participants)
-        reranked_items: list[dict[str, Any]] = []
-        for item in list(payload.get("items", []) or []):
-            recommendation = dict(item.get("recommendation", {}) or {})
-            score = int(recommendation.get("score", 0) or 0)
-            reasons = [str(reason).strip() for reason in list(recommendation.get("reasons", []) or []) if str(reason).strip()]
-            item_card_id = str(item.get("card_id", "")).strip()
-            fields = dict(item.get("fields", {}) or {})
-
-            if current_scene_id and item_card_id == current_scene_id:
-                score -= 5
-                reasons.insert(0, "当前已经在这幕里，优先换一拍")
-            else:
-                current_location = str(current_scene_snapshot.get("location", "")).strip()
-                candidate_location = str(fields.get("location", "")).strip()
-                if current_location and candidate_location and candidate_location != current_location:
-                    score += 1
-                    reasons.append("地点切换更明显，适合转场")
-
-                overlap = _scene_text_overlap_score(fields, recent_text)
-                if overlap:
-                    score += overlap
-                    reasons.append("和最近这几句的气口更接")
-
-                state_bonus, state_reasons = _score_scene_card_with_runtime_state(
-                    fields,
-                    runtime_overview=runtime_overview,
-                    current_scene=current_scene_snapshot,
-                    participants=participants,
-                    recent_text=recent_text,
-                )
-                score += state_bonus
-                reasons.extend(state_reasons)
-
-            reranked_items.append(
-                {
-                    **item,
-                    "recommendation": {
-                        "score": score,
-                        "reasons": reasons[:4] or ["适合承接当前会话"],
-                    },
-                }
-            )
-
-        reranked_items.sort(
-            key=lambda item: (
-                int(item.get("recommendation", {}).get("score", 0) or 0),
-                str(item.get("updated_at", "")),
-                str(item.get("card_id", "")),
-            ),
-            reverse=True,
-        )
-        recommended_card_id = str(reranked_items[0].get("card_id", "")).strip() if reranked_items else ""
-        top_fields = dict(reranked_items[0].get("fields", {}) or {}) if reranked_items else {}
-        chain_suggestions = _build_scene_chain_suggestions(
-            current_scene=current_scene_snapshot,
-            current_scene_id=current_scene_id,
-            reranked_items=reranked_items,
-            recent_text=recent_text,
-            runtime_overview=runtime_overview,
-        )
-        return {
-            "mode": mode,
-            "participants": participants,
-            "current_scene_card_id": current_scene_id,
-            "recommended_card_id": recommended_card_id,
-            "recommended_transition_message": _build_transition_message_hint(
-                current_scene=current_scene_snapshot,
-                next_scene=top_fields,
-                recent_text=recent_text,
-                runtime_overview=runtime_overview,
-            ),
-            "chain_suggestions": chain_suggestions,
-            "items": reranked_items,
-        }
-
-
-def _merge_current_scene_snapshot(current_scene: dict[str, Any], runtime_overview: dict[str, Any]) -> dict[str, Any]:
-    merged = dict(current_scene or {})
-    if str(runtime_overview.get("location", "")).strip():
-        merged["location"] = str(runtime_overview.get("location", "")).strip()
-    if str(runtime_overview.get("time_hint", "")).strip():
-        merged["time_hint"] = str(runtime_overview.get("time_hint", "")).strip()
-    if str(runtime_overview.get("atmosphere", "")).strip():
-        merged["atmosphere"] = str(runtime_overview.get("atmosphere", "")).strip()
-    return merged
-
-
-def _scene_text_overlap_score(fields: dict[str, Any], recent_text: str) -> int:
-    compact_recent = str(recent_text or "").strip()
-    if not compact_recent:
-        return 0
-    phrases: list[str] = []
-    for key in ("location", "atmosphere", "opening_situation", "scene_drive", "public_goal", "hidden_tension"):
-        raw = str(fields.get(key, "") or "").strip()
-        if not raw:
-            continue
-        for part in re.split(r"[，,。；;、：:\s]+", raw):
-            text = part.strip()
-            if 2 <= len(text) <= 8 and text not in phrases:
-                phrases.append(text)
-    overlap = sum(1 for phrase in phrases[:12] if phrase in compact_recent)
-    return min(3, overlap)
-
-
-def _score_scene_card_with_runtime_state(
-    fields: dict[str, Any],
-    *,
-    runtime_overview: dict[str, Any],
-    current_scene: dict[str, Any],
-    participants: list[str],
-    recent_text: str,
-) -> tuple[int, list[str]]:
-    score = 0
-    reasons: list[str] = []
-    current_location = str(current_scene.get("location", "")).strip()
-    candidate_location = str(fields.get("location", "")).strip()
-    current_time = str(runtime_overview.get("time_hint", "") or current_scene.get("time_hint", "")).strip()
-    candidate_time = str(fields.get("time_hint", "")).strip()
-    beat_maturity = max(0, min(100, int(runtime_overview.get("beat_maturity", 0) or 0)))
-    should_shift = bool(runtime_overview.get("should_offer_scene_shift", False))
-    shift_reason = str(runtime_overview.get("scene_shift_reason", "")).strip()
-    tension = str(runtime_overview.get("tension", "")).strip()
-    next_hint = str(runtime_overview.get("next_hint", "")).strip()
-    atmosphere = str(runtime_overview.get("atmosphere", "")).strip()
-    event_rows = list(runtime_overview.get("event_rows", []) or [])
-    recent_event = str((event_rows[-1] or {}).get("copy", "")).strip() if event_rows else ""
-
-    if should_shift:
-        if current_location and candidate_location and candidate_location != current_location:
-            score += 4
-            reasons.append("这一拍已接近收束，更适合换场推进")
-        elif current_location and candidate_location and candidate_location == current_location:
-            score -= 2
-            reasons.append("这一拍已经该收住了，不必继续原地打转")
-        elif candidate_location:
-            score += 1
-            reasons.append("当前已经适合往下一拍走")
-    elif beat_maturity and beat_maturity < 45 and current_location and candidate_location == current_location:
-        score += 2
-        reasons.append("这一拍还没聊满，先在同场景续火更顺")
-
-    if current_time and candidate_time:
-        if candidate_time == current_time:
-            score += 1
-            reasons.append("时间承接自然")
-        elif should_shift or beat_maturity >= 55:
-            score += 2
-            reasons.append("时间推进能带出下一拍")
-
-    state_overlap = _state_overlap_score(
-        fields,
-        state_texts=[atmosphere, tension, next_hint, recent_event, recent_text],
-    )
-    if state_overlap:
-        score += state_overlap
-        reasons.append("能接住本局气氛和悬念")
-
-    if len(participants) >= 3 and candidate_location and any(token in candidate_location for token in ("厅", "堂", "席", "园", "院")):
-        score += 1
-        reasons.append("多人局切到这个场面更容易铺开")
-
-    if shift_reason:
-        shift_tokens = [part for part in re.split(r"[，,。；;、：:\s]+", shift_reason) if 2 <= len(part.strip()) <= 8]
-        if any(token and token in "\n".join(str(fields.get(key, "")).strip() for key in ("opening_situation", "scene_drive", "hidden_tension")) for token in shift_tokens[:4]):
-            score += 2
-            reasons.append("和当前这拍的收束理由接得上")
-
-    return score, reasons
-
-
-def _state_overlap_score(fields: dict[str, Any], *, state_texts: list[str]) -> int:
-    compact_state = "\n".join(text.strip() for text in state_texts if str(text).strip())
-    if not compact_state:
-        return 0
-    phrases: list[str] = []
-    for key in ("atmosphere", "opening_situation", "public_goal", "hidden_tension", "scene_drive"):
-        raw = str(fields.get(key, "")).strip()
-        if not raw:
-            continue
-        for part in re.split(r"[，,。；;、：:\s]+", raw):
-            text = part.strip()
-            if 2 <= len(text) <= 8 and text not in phrases:
-                phrases.append(text)
-    overlap = sum(1 for phrase in phrases[:14] if phrase in compact_state)
-    return min(4, overlap)
-
-
-def _build_transition_message_hint(
-    *,
-    current_scene: dict[str, Any],
-    next_scene: dict[str, Any],
-    recent_text: str,
-    runtime_overview: dict[str, Any] | None = None,
-) -> str:
-    runtime_overview = dict(runtime_overview or {})
-    next_location = str(next_scene.get("location", "")).strip()
-    next_title = str(next_scene.get("title", "")).strip()
-    next_opening = str(next_scene.get("opening_situation", "")).strip()
-    next_atmosphere = str(next_scene.get("atmosphere", "")).strip()
-    current_location = str(current_scene.get("location", "")).strip()
-    next_time = str(next_scene.get("time_hint", "")).strip()
-    current_time = str(runtime_overview.get("time_hint", "") or current_scene.get("time_hint", "")).strip()
-    shift_reason = str(runtime_overview.get("scene_shift_reason", "")).strip()
-    tension = str(runtime_overview.get("tension", "")).strip()
-    should_shift = bool(runtime_overview.get("should_offer_scene_shift", False))
-
-    if shift_reason and should_shift and current_location and next_location and current_location != next_location:
-        anchor = next_title or next_location
-        return f"{shift_reason}，场面顺势从{current_location}转到{anchor}。"
-
-    if next_time and current_time and next_time != current_time:
-        destination = next_location or next_title or "下一幕"
-        if tension:
-            return f"带着这股{_trim_transition_text(tension, 18)}，时间已经推到{next_time}，场面也转进了{destination}。"
-        return f"这一拍不知不觉拖到了{next_time}，场面也顺势转进了{destination}。"
-
-    if next_opening:
-        first_sentence = re.split(r"[。！？!?]", next_opening, maxsplit=1)[0].strip()
-        if first_sentence:
-            if not re.search(r"[。！？!?]$", first_sentence):
-                first_sentence = f"{first_sentence}。"
-            return first_sentence
-
-    if current_location and next_location and current_location != next_location:
-        anchor = next_title or next_location
-        return f"局面一转，众人从{current_location}挪到{anchor}，气氛也跟着变了。"
-
-    compact_recent = str(recent_text or "").strip()
-    if tension and next_atmosphere:
-        return f"刚才那股{_trim_transition_text(tension, 18)}还吊着，场面已经慢慢转成了{next_atmosphere}。"
-    if compact_recent and next_atmosphere:
-        return f"刚才那股{compact_recent[-12:]}的余波还没散，场面已经转成了{next_atmosphere}。"
-
-    if next_location and next_atmosphere:
-        return f"这一拍顺势转到{next_location}，场面也慢慢收成了{next_atmosphere}。"
-    if next_location:
-        return f"这一拍顺势转到{next_location}。"
-    if next_title:
-        return f"这一拍顺势转入「{next_title}」。"
-    return ""
-
-
-def _build_scene_chain_suggestions(
-    *,
-    current_scene: dict[str, Any],
-    current_scene_id: str,
-    reranked_items: list[dict[str, Any]],
-    recent_text: str,
-    runtime_overview: dict[str, Any] | None = None,
-) -> list[dict[str, Any]]:
-    candidates = [
-        item
-        for item in reranked_items
-        if str(item.get("card_id", "")).strip() and str(item.get("card_id", "")).strip() != current_scene_id
-    ][:5]
-    chains: list[dict[str, Any]] = []
-    for first_index, first in enumerate(candidates):
-        for second_index, second in enumerate(candidates):
-            if second_index == first_index:
-                continue
-            chain_items = [first, second]
-            chains.append(
-                _build_chain_payload(
-                    current_scene=current_scene,
-                    items=chain_items,
-                    recent_text=recent_text,
-                    runtime_overview=runtime_overview,
-                )
-            )
-            for third_index, third in enumerate(candidates):
-                if third_index in {first_index, second_index}:
-                    continue
-                chains.append(
-                    _build_chain_payload(
-                        current_scene=current_scene,
-                        items=[first, second, third],
-                        recent_text=recent_text,
-                        runtime_overview=runtime_overview,
-                    )
-                )
-    chains.sort(key=lambda item: (int(item.get("score", 0) or 0), len(item.get("scenes", []) or [])), reverse=True)
-    deduped: list[dict[str, Any]] = []
-    seen_keys: set[str] = set()
-    for chain in chains:
-        scene_ids = [str(scene.get("card_id", "")).strip() for scene in list(chain.get("scenes", []) or [])]
-        key = "->".join(scene_ids)
-        if not key or key in seen_keys:
-            continue
-        seen_keys.add(key)
-        deduped.append(chain)
-        if len(deduped) >= 3:
-            break
-    return deduped
-
-
-def _build_chain_payload(
-    *,
-    current_scene: dict[str, Any],
-    items: list[dict[str, Any]],
-    recent_text: str,
-    runtime_overview: dict[str, Any] | None = None,
-) -> dict[str, Any]:
-    scenes: list[dict[str, str]] = []
-    previous_scene = dict(current_scene or {})
-    current_runtime = dict(runtime_overview or {})
-    total_score = 0
-    locations: list[str] = []
-    for index, item in enumerate(items):
-        fields = dict(item.get("fields", {}) or {})
-        score = int(dict(item.get("recommendation", {}) or {}).get("score", 0) or 0)
-        total_score += max(0, score) * max(1, 4 - index)
-        location = str(fields.get("location", "")).strip()
-        if location:
-            locations.append(location)
-        scenes.append(
+        bundle = build_scene_recommendation_bundle(
             {
-                "card_id": str(item.get("card_id", "")).strip(),
-                "title": str(item.get("preview", {}).get("title", "") or fields.get("title", "")).strip(),
-                "location": location,
-                "atmosphere": str(fields.get("atmosphere", "")).strip(),
-                "scene_drive": str(fields.get("scene_drive", "")).strip(),
-                "transition_message": _build_transition_message_hint(
-                    current_scene=previous_scene,
-                    next_scene=fields,
-                    recent_text=recent_text if index == 0 else str(previous_scene.get("scene_drive", "")).strip(),
-                    runtime_overview=current_runtime if index == 0 else None,
-                ),
+                "mode": mode,
+                "participants": participants,
+                "scene_cards": cards,
+                "current_scene": current_scene,
+                "current_scene_card_id": current_scene_id,
+                "runtime_state_overview": runtime_overview,
+                "recent_text": recent_text,
+                "controlled_character": str(session.get("controlled_character", "")).strip(),
+                "self_profile": dict(session.get("self_insert", {}) or {}),
             }
         )
-        previous_scene = fields
-        current_runtime = {}
-    if len(set(locations)) >= 2:
-        total_score += 4
-    if _chain_has_progressive_drive(scenes):
-        total_score += 3
-    return {
-        "chain_id": " -> ".join(scene.get("card_id", "") for scene in scenes),
-        "score": total_score,
-        "reason": _build_chain_reason(scenes),
-        "scenes": scenes,
-    }
-
-
-def _chain_has_progressive_drive(scenes: list[dict[str, str]]) -> bool:
-    drives = [str(scene.get("scene_drive", "")).strip() for scene in scenes if str(scene.get("scene_drive", "")).strip()]
-    if len(drives) < 2:
-        return False
-    strong_tokens = ("试探", "转折", "摊牌", "揭", "逼", "变局", "收紧")
-    hit_count = sum(1 for drive in drives if any(token in drive for token in strong_tokens))
-    return hit_count >= 2
-
-
-def _build_chain_reason(scenes: list[dict[str, str]]) -> str:
-    if not scenes:
-        return "这条线能顺着往下接。"
-    locations = [scene.get("location", "") for scene in scenes if scene.get("location", "")]
-    if len(scenes) >= 3 and len(set(locations)) >= 2:
-        return "先换场再收紧，后面还有继续推进的余地。"
-    if len(scenes) >= 2 and len(set(locations)) >= 2:
-        return "地点会连续变化，戏路层次更明显。"
-    if _chain_has_progressive_drive(scenes):
-        return "每一幕的推进方向都比较明确，适合顺着往下压。"
-    first_title = str(scenes[0].get("title", "")).strip() or "这条线"
-    return f"可以先接「{first_title}」，后面还有顺势承接的下一拍。"
-
-
-def _trim_transition_text(text: str, limit: int) -> str:
-    compact = str(text or "").strip()
-    if len(compact) <= limit:
-        return compact
-    return f"{compact[: max(1, limit - 1)]}…"
+        return dict(bundle.get("payload", {}) or {})
diff --git a/src/web/static/js/dialogue.js b/src/web/static/js/dialogue.js
index 467f3c5..1d8cb1e 100644
--- a/src/web/static/js/dialogue.js
+++ b/src/web/static/js/dialogue.js
@@ -821,7 +821,7 @@ function latestSessionSnippetFromTranscript(items) {
 }
 
 async function maybeAutoRecommendNextScene(session) {
-  const progress = session?.scene_progress || {};
+  const progress = session?.runtime_state_overview || session?.scene_progress || {};
   const sessionId = String(session?.session_id || "").trim();
   if (!sessionId || !progress?.should_offer_scene_shift) return;
   const button = el("dialogue-live-scene-recommend");
@@ -830,10 +830,10 @@ async function maybeAutoRecommendNextScene(session) {
   if ((select?.options?.length || 0) < 3) return;
   const marker = [
     sessionId,
-    String(progress.updated_at || "").trim(),
+    String(progress.updated_at || session?.updated_at || "").trim(),
     String(progress.time_hint || "").trim(),
     String(progress.location || "").trim(),
-    String(progress.scene_shift_reason || "").trim(),
+    String(progress.scene_shift_reason || progress.next_hint || "").trim(),
   ].join("::");
   if (!marker || marker === lastAutoSceneRecommendationKey) return;
   lastAutoSceneRecommendationKey = marker;
diff --git a/src/web/static/js/main.js b/src/web/static/js/main.js
index e57d467..d48b446 100644
--- a/src/web/static/js/main.js
+++ b/src/web/static/js/main.js
@@ -2436,6 +2436,7 @@ function renderDialogueSceneRecommendationSummary(session = currentDialogueSessi
   const title = String(topItem?.preview?.title || topItem?.fields?.title || recommendedCardId).trim();
   const location = String(topItem?.preview?.location || topItem?.fields?.location || "").trim();
   const transition = String(payload?.recommended_transition_message || "").trim();
+  const autoContinueMessage = String(payload?.recommended_auto_continue_message || "").trim();
   const reasons = Array.isArray(topItem?.recommendation?.reasons) ? topItem.recommendation.reasons.filter(Boolean).slice(0, 4) : [];
   const firstChain = Array.isArray(payload?.chain_suggestions) ? payload.chain_suggestions[0] : null;
   const chainReason = String(firstChain?.reason || "").trim();
@@ -2475,6 +2476,12 @@ function renderDialogueSceneRecommendationSummary(session = currentDialogueSessi
     root.appendChild(chainCopy);
   }
 
+  if (autoContinueMessage) {
+    const openingCopy = document.createElement("p");
+    openingCopy.textContent = `自动起拍提示：${autoContinueMessage}`;
+    root.appendChild(openingCopy);
+  }
+
   const autoCopy = document.createElement("p");
   autoCopy.textContent = "顺手切到下一幕会直接把新一拍接起来，不会停在空场。";
   root.appendChild(autoCopy);
diff --git a/tests/test_install_skill.py b/tests/test_install_skill.py
index 2de5920..33ef456 100644
--- a/tests/test_install_skill.py
+++ b/tests/test_install_skill.py
@@ -36,16 +36,19 @@ def test_copy_skill_bundle_installs_prompt_first_payload_by_default(self):
             self.assertTrue((dst / "tools" / "build_prompt_payload.py").exists())
             self.assertTrue((dst / "tools" / "build_persona_autofill_payload.py").exists())
             self.assertTrue((dst / "tools" / "build_dialogue_suggestion_payload.py").exists())
+            self.assertTrue((dst / "tools" / "build_scene_recommendation_payload.py").exists())
             self.assertTrue((dst / "tools" / "manage_self_card.py").exists())
             self.assertTrue((dst / "tools" / "export_relation_graph.py").exists())
             self.assertTrue((dst / "tools" / "init_host_run.py").exists())
             self.assertTrue((dst / "tools" / "materialize_persona_bundle.py").exists())
             self.assertTrue((dst / "tools" / "update_run_progress.py").exists())
             self.assertTrue((dst / "tools" / "verify_host_workflow.py").exists())
+            self.assertTrue((dst / "examples" / "scene_recommendation_context.example.json").exists())
             self.assertTrue((dst / "tools" / "_skill_support" / "novel_preparation.py").exists())
             self.assertTrue((dst / "tools" / "_skill_support" / "persona_bundle.py").exists())
             self.assertTrue((dst / "tools" / "_skill_support" / "persona_review.py").exists())
             self.assertTrue((dst / "tools" / "_skill_support" / "dialogue_payloads.py").exists())
+            self.assertTrue((dst / "tools" / "_skill_support" / "scene_recommendations.py").exists())
             self.assertTrue((dst / "tools" / "_skill_support" / "workflow_completion.py").exists())
             self.assertFalse((dst / "runtime").exists())
 
@@ -367,6 +370,88 @@ def test_installed_dialogue_suggestion_tool_rejects_invalid_mode(self):
             self.assertNotEqual(result.returncode, 0)
             self.assertIn("Unsupported dialogue suggestion mode", result.stderr)
 
+    def test_installed_scene_recommendation_tool_builds_bundle(self):
+        repo_root = Path(__file__).resolve().parents[1]
+        packaged_src = repo_root / "zaomeng-skill"
+        # End-to-end check: copy the packaged skill into a temp dir and run the installed tool from there.
+        with tempfile.TemporaryDirectory() as tmpdir:
+            tmp_root = Path(tmpdir)
+            dst = copy_skill_bundle(packaged_src, tmp_root, "zaomeng-skill")
+            context_path = tmp_root / "scene_context.json"
+            context_path.write_text(
+                json.dumps(
+                    {
+                        "mode": "observe",
+                        "participants": ["魏无羡", "蓝忘机", "江澄"],
+                        "current_scene_card_id": "garden",
+                        "current_scene": {
+                            "title": "后园僵持",
+                            "location": "后园",
+                            "time_hint": "傍晚",
+                            "atmosphere": "气氛发紧",
+                        },
+                        "runtime_state_overview": {
+                            "location": "后园",
+                            "time_hint": "傍晚",
+                            "beat_maturity": 82,
+                            "should_offer_scene_shift": True,
+                            "scene_shift_reason": "这边该说的话已经说尽了",
+                        },
+                        "transcript": [
+                            {"message": "魏无羡没再笑。"},
+                            {"message": "江澄也没继续留人。"},
+                        ],
+                        "scene_cards": [
+                            {
+                                "card_id": "garden",
+                                "fields": {
+                                    "title": "后园僵持",
+                                    "location": "后园",
+                                    "time_hint": "傍晚",
+                                    "atmosphere": "气氛发紧",
+                                    "opening_situation": "人都站着没动。",
+                                    "scene_drive": "继续僵持",
+                                },
+                            },
+                            {
+                                "card_id": "hall",
+                                "fields": {
+                                    "title": "回厅再坐",
+                                    "location": "前厅",
+                                    "time_hint": "入夜",
+                                    "atmosphere": "表面平静，底下仍压着话头",
+                                    "opening_situation": "人重新入席，谁都没先开口。",
+                                    "scene_drive": "借换场逼近摊牌",
+                                },
+                            },
+                        ],
+                    },
+                    ensure_ascii=False,
+                ),
+                encoding="utf-8",
+            )
+            # Run with cwd set to the installed bundle; check=True fails the test on a non-zero exit code.
+            bundle_path = tmp_root / "scene_bundle.json"
+            subprocess.run(
+                [
+                    sys.executable,
+                    str(dst / "tools" / "build_scene_recommendation_payload.py"),
+                    "--context-file",
+                    str(context_path),
+                    "--output",
+                    str(bundle_path),
+                ],
+                cwd=dst,
+                check=True,
+                capture_output=True,
+            )
+            # "garden" is the current card and a scene shift is flagged, so "hall" is the expected pick.
+            bundle = json.loads(bundle_path.read_text(encoding="utf-8"))
+            self.assertEqual(bundle["kind"], "dialogue_scene_recommendation_bundle")
+            self.assertEqual(bundle["payload"]["recommended_card_id"], "hall")
+            self.assertTrue(bundle["payload"]["recommended_transition_message"])
+            self.assertTrue(bundle["payload"]["recommended_auto_continue_message"])
+
     def test_installed_prepare_excerpt_tool_runs_without_repo_src(self):
         repo_root = Path(__file__).resolve().parents[1]
         packaged_src = repo_root / "zaomeng-skill"
diff --git a/tests/test_packaging_docs.py b/tests/test_packaging_docs.py
index 6407ae8..5b8783a 100644
--- a/tests/test_packaging_docs.py
+++ b/tests/test_packaging_docs.py
@@ -20,6 +20,8 @@ def test_manifest_describes_prompt_first_bundle(self):
         self.assertIn("tools/build_prompt_payload.py", manifest_text)
         self.assertIn("tools/materialize_persona_bundle.py", manifest_text)
         self.assertIn("tools/export_relation_graph.py", manifest_text)
+        self.assertIn("tools/build_scene_recommendation_payload.py", manifest_text)
+        self.assertIn("examples/scene_recommendation_context.example.json", manifest_text)
         self.assertIn("tools/verify_host_workflow.py", manifest_text)
         self.assertNotIn("runtime/zaomeng_cli.py", manifest_text)
         self.assertNotIn("runtime/src", manifest_text)
@@ -52,6 +54,8 @@ def test_readmes_describe_prompt_first_helpers(self):
         self.assertIn("tools/prepare_novel_excerpt.py", skill_readme)
         self.assertIn("tools/build_prompt_payload.py", skill_readme)
         self.assertIn("tools/export_relation_graph.py", skill_readme)
+        self.assertIn("tools/build_scene_recommendation_payload.py", skill_readme)
+        self.assertIn("examples/scene_recommendation_context.example.json", skill_readme)
         self.assertIn("requirements.txt", skill_readme)
         self.assertIn("references/chat_contract.md", skill_readme)
         self.assertIn("references/capability_index.md", skill_readme)
@@ -59,6 +63,8 @@ def test_readmes_describe_prompt_first_helpers(self):
         self.assertIn("tools/prepare_novel_excerpt.py", skill_readme_en)
         self.assertIn("tools/build_prompt_payload.py", skill_readme_en)
         self.assertIn("tools/export_relation_graph.py", skill_readme_en)
+        self.assertIn("tools/build_scene_recommendation_payload.py", skill_readme_en)
+        self.assertIn("examples/scene_recommendation_context.example.json", skill_readme_en)
         self.assertIn("requirements.txt", skill_readme_en)
         self.assertIn("references/chat_contract.md", skill_readme_en)
         self.assertIn("references/capability_index.md", skill_readme_en)
@@ -99,6 +105,7 @@ def test_skill_docs_prioritize_host_llm_and_run_manifest_contract(self):
         self.assertIn("act", clawhub_skill)
         self.assertIn("insert", clawhub_skill)
         self.assertIn("observe", clawhub_skill)
+        self.assertIn("scene_recommendation", clawhub_skill)
         self.assertNotIn("src.cli.app chat", clawhub_skill)
         self.assertNotIn("src.cli.app chat", skill_readme)
         self.assertNotIn("src.cli.app chat", skill_readme_en)
@@ -115,6 +122,8 @@ def test_chat_contract_reference_is_present(self):
         self.assertIn("act", contract_text)
         self.assertIn("insert", contract_text)
         self.assertIn("observe", contract_text)
+        self.assertIn("build_scene_recommendation_payload.py", contract_text)
+        self.assertIn("scene_recommendation_context.example.json", contract_text)
         self.assertIn("PROFILE.md", contract_text)
         self.assertIn("MEMORY.md", contract_text)
         self.assertIn("run_manifest.json", contract_text)
@@ -128,6 +137,8 @@ def test_capability_index_reference_is_present(self):
         self.assertIn("export_graph", capability_text)
         self.assertIn("verify_workflow", capability_text)
         self.assertIn("Dialogue Stage", capability_text)
+        self.assertIn("build_scene_recommendation_payload.py", capability_text)
+        self.assertIn("scene_recommendation_context.example.json", capability_text)
         self.assertIn("references/chat_contract.md", capability_text)
         self.assertIn("examples/host_workflow_example.md", capability_text)
         self.assertNotIn("src.cli.app chat", capability_text)
@@ -141,6 +152,7 @@ def test_host_workflow_example_is_present(self):
         self.assertIn("tools/verify_host_workflow.py", workflow_text)
         self.assertIn("Hand Off To Dialogue", workflow_text)
         self.assertIn("run_manifest.json", workflow_text)
+        self.assertIn("scene_recommendation_context.example.json", workflow_text)
         self.assertNotIn("src.cli.app chat", workflow_text)
 
     def test_distillation_docs_require_multi_character_differentiation(self):
diff --git a/tests/test_prompt_payloads.py b/tests/test_prompt_payloads.py
index e705f7e..19b5e96 100644
--- a/tests/test_prompt_payloads.py
+++ b/tests/test_prompt_payloads.py
@@ -5,6 +5,7 @@
 from pathlib import Path
 
 from src.skill_support.prompt_payloads import build_distill_prompt_payload, build_relation_prompt_payload
+from src.skill_support.scene_recommendations import build_scene_recommendation_bundle
 
 
 class PromptPayloadTests(unittest.TestCase):
@@ -143,6 +144,91 @@ def test_build_distill_prompt_payload_emits_warning_when_no_requested_character_
         self.assertTrue(payload["meta"]["warnings"])
         self.assertIn("未匹配到任何目标角色", payload["meta"]["warnings"][0])
 
+    def test_build_scene_recommendation_bundle_prefers_shifted_scene_when_current_beat_is_mature(self):
+        bundle = build_scene_recommendation_bundle(
+            {
+                "mode": "observe",
+                "participants": ["魏无羡", "蓝忘机", "江澄"],
+                "current_scene_card_id": "scene-garden",
+                "current_scene": {
+                    "title": "园中僵持",
+                    "location": "后园",
+                    "time_hint": "傍晚",
+                    "atmosphere": "气氛发紧",
+                },
+                "runtime_state_overview": {
+                    "location": "后园",
+                    "time_hint": "傍晚",
+                    "beat_maturity": 78,
+                    "should_offer_scene_shift": True,
+                    "scene_shift_reason": "这边该说的话已经说到头了",
+                    "tension": "僵着的一口气",
+                },
+                "transcript": [
+                    {"message": "魏无羡笑意收了，没再接话。"},
+                    {"message": "江澄看了他一眼，气口越发僵。"},
+                ],
+                "scene_cards": [
+                    {
+                        "card_id": "scene-garden",
+                        "fields": {
+                            "title": "园中僵持",
+                            "location": "后园",
+                            "time_hint": "傍晚",
+                            "atmosphere": "气氛发紧",
+                            "opening_situation": "几个人都还站在原地，谁也不肯先退。",
+                            "scene_drive": "继续僵住，看谁先摊牌",
+                        },
+                    },
+                    {
+                        "card_id": "scene-hall",
+                        "fields": {
+                            "title": "回厅再坐",
+                            "location": "前厅",
+                            "time_hint": "入夜",
+                            "atmosphere": "表面平静，底下还压着火",
+                            "opening_situation": "人都重新入席，话题却没人肯先挑明。",
+                            "scene_drive": "借换场把话逼到桌面上",
+                        },
+                    },
+                ],
+            }
+        )
+        # Expect the non-current card, and transition text that names the current location (后园).
+        payload = bundle["payload"]
+        self.assertEqual(bundle["kind"], "dialogue_scene_recommendation_bundle")
+        self.assertEqual(payload["recommended_card_id"], "scene-hall")
+        self.assertIn("后园", payload["recommended_transition_message"])
+        self.assertTrue(payload["recommended_auto_continue_message"])
+
+    def test_build_scene_recommendation_bundle_uses_self_insert_identity_for_opening_hint(self):
+        bundle = build_scene_recommendation_bundle(
+            {
+                "mode": "insert",
+                "participants": ["林黛玉", "贾宝玉"],
+                "self_profile": {
+                    "display_name": "沈拂衣",
+                    "scene_identity": "初到贾府的借宿客",
+                },
+                "scene_cards": [
+                    {
+                        "card_id": "scene-arrival",
+                        "fields": {
+                            "title": "初见偏厅",
+                            "location": "偏厅",
+                            "atmosphere": "初见微妙",
+                            "opening_situation": "你刚被丫鬟领进门，众人的目光都落过来。",
+                            "scene_drive": "先试探来意，再看彼此反应",
+                        },
+                    }
+                ],
+            }
+        )
+        # In insert mode the opening cue must carry the self_profile display name and scene identity.
+        opening = bundle["payload"]["recommended_auto_continue_message"]
+        self.assertIn("沈拂衣", opening)
+        self.assertIn("初到贾府的借宿客", opening)
+
 
 if __name__ == "__main__":
     unittest.main()
diff --git a/tests/test_web_app.py b/tests/test_web_app.py
index efb098e..02557bc 100644
--- a/tests/test_web_app.py
+++ b/tests/test_web_app.py
@@ -151,6 +151,7 @@ def test_dialogue_scene_card_recommendation_prefers_next_scene_not_current_one(s
             self.assertNotEqual(payload["recommended_card_id"], current_scene["card_id"])
             self.assertTrue(payload["items"][0]["recommendation"]["reasons"])
             self.assertTrue(str(payload.get("recommended_transition_message", "")).strip())
+            self.assertTrue(str(payload.get("recommended_auto_continue_message", "")).strip())
             self.assertTrue(payload["chain_suggestions"])
             self.assertGreaterEqual(len(payload["chain_suggestions"][0]["scenes"]), 2)
             self.assertTrue(str(payload["chain_suggestions"][0]["reason"]).strip())
@@ -249,6 +250,7 @@ def test_dialogue_scene_card_recommendation_stays_in_same_location_when_beat_is_
             payload = service.recommend_dialogue_scene_card(run["run_id"], session_id=session["session_id"])
 
             self.assertEqual(payload["recommended_card_id"], same_location["card_id"])
+            self.assertIn("生成一个自然开场", str(payload.get("recommended_auto_continue_message", "")).strip())
 
     def test_dialogue_scene_card_recommendation_uses_runtime_shift_reason_in_transition_hint(self):
         with tempfile.TemporaryDirectory() as tmp:
@@ -345,6 +347,7 @@ def test_dialogue_scene_card_recommendation_uses_runtime_shift_reason_in_transit
 
             self.assertEqual(payload["recommended_card_id"], next_scene["card_id"])
             self.assertIn("雨势压得两人都没法再站在回廊里装作无事", payload["recommended_transition_message"])
+            self.assertTrue(str(payload.get("recommended_auto_continue_message", "")).strip())
 
     def test_dialogue_scene_history_tracks_initial_scene_and_switches(self):
         with tempfile.TemporaryDirectory() as tmp:
diff --git a/zaomeng-skill/MANIFEST.md b/zaomeng-skill/MANIFEST.md
index 418732b..5612772 100644
--- a/zaomeng-skill/MANIFEST.md
+++ b/zaomeng-skill/MANIFEST.md
@@ -19,6 +19,7 @@
 - `tools/materialize_persona_bundle.py`
 - `tools/export_relation_graph.py`
 - `tools/verify_host_workflow.py`
+- `tools/build_scene_recommendation_payload.py`
 
 ## Prompt 模板
 
@@ -42,6 +43,7 @@
 - `examples/sample_character_profile.md`
 - `examples/sample_relations.md`
 - `examples/test-prompts.json`
+- `examples/scene_recommendation_context.example.json`
 - `examples/host_workflow_example.md`
 
 ## 打包目标
diff --git a/zaomeng-skill/README.md b/zaomeng-skill/README.md
index 4bb2b43..ed2ceb2 100644
--- a/zaomeng-skill/README.md
+++ b/zaomeng-skill/README.md
@@ -151,6 +151,14 @@
 - `insert`：用户以自己身份进入场景
 - `observe`：用户只观察角色推进群聊
 
+如果宿主想把“下一幕推荐 + 自动转场 + 自动起拍”也接进来，可以额外调用：
+
+- `python tools/build_scene_recommendation_payload.py --context-file <context.json>`
+
+可直接参考：
+
+- `examples/scene_recommendation_context.example.json`
+
 ## 安装方式
 
 ### OpenClaw
@@ -182,6 +190,7 @@ python tools/build_prompt_payload.py --mode distill|relation --novel <路径> [-
 python tools/materialize_persona_bundle.py --profile-file <角色目录/PROFILE.generated.md>
 python tools/export_relation_graph.py --relations-file <关系结果.md>
 python tools/verify_host_workflow.py --characters-root <characters/<novel_id>> [--relations-file <关系结果.md>]
+python tools/build_scene_recommendation_payload.py --context-file <context.json>
 ```
 
 ```bash
diff --git a/zaomeng-skill/README_EN.md b/zaomeng-skill/README_EN.md
index 764e9a3..4682240 100644
--- a/zaomeng-skill/README_EN.md
+++ b/zaomeng-skill/README_EN.md
@@ -151,6 +151,14 @@ Host mode interpretation:
 - `insert`: the user enters the scene as themselves
 - `observe`: the user watches the cast continue the scene
 
+If the host also wants next-beat recommendation, scene-shift text, and auto-opening hints, it can additionally call:
+
+- `python tools/build_scene_recommendation_payload.py --context-file <context.json>`
+
+Reference example:
+
+- `examples/scene_recommendation_context.example.json`
+
 ## Installation
 
 ### OpenClaw
@@ -182,6 +190,7 @@ python tools/build_prompt_payload.py --mode distill|relation --novel <path> [--c
 python tools/materialize_persona_bundle.py --profile-file <character-dir/PROFILE.generated.md>
 python tools/export_relation_graph.py --relations-file <relation-result.md>
 python tools/verify_host_workflow.py --characters-root <characters/<novel_id>> [--relations-file <relation-result.md>]
+python tools/build_scene_recommendation_payload.py --context-file <context.json>
 ```
 
 ```bash
diff --git a/zaomeng-skill/SKILL.md b/zaomeng-skill/SKILL.md
index 4ac80cc..6e6966a 100644
--- a/zaomeng-skill/SKILL.md
+++ b/zaomeng-skill/SKILL.md
@@ -30,7 +30,7 @@ metadata:
 
 ## 2. 宿主能力契约
 
-宿主侧只需要理解四个标准能力，以及三组对话 helper：
+宿主侧只需要理解四个标准能力，以及四组对话 helper：
 
 | 能力 | 入口 | 作用 | 标准成功标记 |
 | --- | --- | --- | --- |
@@ -46,6 +46,7 @@ metadata:
 | `self_card` | `tools/manage_self_card.py` | 创建 / 保存 / 读取 / 删除 self-insert 角色卡，并生成随机角色卡 prompt payload |
 | `persona_autofill` | `tools/build_persona_autofill_payload.py` | 为人物校对单字段生成宿主可调用的补全 payload，并解析模型返回 |
 | `dialogue_suggestion` | `tools/build_dialogue_suggestion_payload.py` | 为 `act` / `insert` / `observe` 生成自动回复建议 payload，并提供压缩重试版本 |
+| `scene_recommendation` | `tools/build_scene_recommendation_payload.py` | 为当前会话生成下一幕场景推荐、转场提示、多拍链路建议，以及可直接用于自动起拍的 opening cue |
 
 所有能力都应该满足：
 
@@ -233,11 +234,16 @@ python tools/verify_host_workflow.py --characters-root <characters/<novel_id>> -
 - `run_manifest.json`
 - `references/output_schema.md`、`references/style_differ.md`、`references/logic_constraint.md`
 
-如果宿主需要角色卡、人物字段补全或对话建议 helper，可直接调用：
+如果宿主需要角色卡、人物字段补全、对话建议或下一幕推荐 helper，可直接调用：
 
 - `python tools/manage_self_card.py --mode blank|list|get|save|delete|build-random-payload|parse-random-response`
 - `python tools/build_persona_autofill_payload.py --persona-dir <角色目录> --field <字段名> --strategy auto|model_knowledge`
 - `python tools/build_dialogue_suggestion_payload.py --context-file <context.json>`
+- `python tools/build_scene_recommendation_payload.py --context-file <context.json>`
+
+其中 `scene_recommendation` 的上下文字段可直接参考：
+
+- `examples/scene_recommendation_context.example.json`
 
 宿主结束提示建议直接说清楚：
 
diff --git a/zaomeng-skill/examples/host_workflow_example.md b/zaomeng-skill/examples/host_workflow_example.md
index 615ad35..48ca890 100644
--- a/zaomeng-skill/examples/host_workflow_example.md
+++ b/zaomeng-skill/examples/host_workflow_example.md
@@ -10,6 +10,7 @@ This example shows one complete host-side flow:
 6. generate / merge the relationship result and export the graph
 7. verify workflow completeness
 8. hand off to host-driven dialogue
+9. optionally ask the packaged scene helper to recommend the next beat during dialogue
 
 ## 1. Initialize The Run
 
@@ -163,6 +164,22 @@ At this point, the host already has everything needed to enter `act`, `insert`,
 
 The host now drives the dialogue directly with its own LLM.
 
+If the host wants packaged help choosing the next beat for the current session, it can also call:
+
+```bash
+python tools/build_scene_recommendation_payload.py --context-file runtime/scene_recommendation_context.json --output runtime/scene_recommendation_bundle.json
+```
+
+You can bootstrap that context shape from:
+
+- `examples/scene_recommendation_context.example.json`
+
+The host can then:
+
+- apply `payload.recommended_card_id`
+- surface `payload.recommended_transition_message`
+- feed `payload.recommended_auto_continue_message` back into its dialogue engine to auto-open the next beat immediately
+
 ## Recommended UI / Agent Surfacing
 
 After the workflow completes, a host can safely surface:
diff --git a/zaomeng-skill/examples/scene_recommendation_context.example.json b/zaomeng-skill/examples/scene_recommendation_context.example.json
new file mode 100644
index 0000000..28ffd6f
--- /dev/null
+++ b/zaomeng-skill/examples/scene_recommendation_context.example.json
@@ -0,0 +1,95 @@
+{
+  "mode": "observe",
+  "participants": ["林黛玉", "贾宝玉", "薛宝钗"],
+  "current_scene_card_id": "scene-garden-evening",
+  "current_scene": {
+    "title": "园中晚坐",
+    "time_hint": "傍晚",
+    "location": "沁芳桥边",
+    "atmosphere": "话里都还留着分寸",
+    "opening_situation": "三人刚把一桩旧事说到半明半暗，谁也没先彻底挑破。",
+    "public_goal": "先把表面体面撑住。",
+    "hidden_tension": "再往下说，就会碰到真正不愿提起的话。",
+    "scene_drive": "让这口气慢慢收紧，再看该不该换场。"
+  },
+  "runtime_state_overview": {
+    "location": "沁芳桥边",
+    "time_hint": "傍晚",
+    "atmosphere": "表面还是平静，底下已经发紧",
+    "beat_maturity": 78,
+    "should_offer_scene_shift": true,
+    "scene_shift_reason": "这一拍已经说到边上，再留在原地只会空转，不如顺势换到下一幕。",
+    "tension": "几个人都知道下一句会更难接",
+    "next_hint": "不如借天色和走动，把人带进更适合把话说开的地方。",
+    "event_rows": [
+      {
+        "title": "气氛变化",
+        "copy": "笑意还在，真正的话头却已经沉下去了。"
+      }
+    ]
+  },
+  "transcript": [
+    {"speaker": "林黛玉", "message": "话既说到这儿，再绕也没什么意思了。"},
+    {"speaker": "贾宝玉", "message": "我不是要逼你，只是有些话总不能一直搁着。"},
+    {"speaker": "薛宝钗", "message": "桥边风凉，真要说开，不如先回去坐下。"}
+  ],
+  "scene_cards": [
+    {
+      "card_id": "scene-garden-evening",
+      "fields": {
+        "title": "园中晚坐",
+        "time_hint": "傍晚",
+        "location": "沁芳桥边",
+        "atmosphere": "话里都还留着分寸",
+        "opening_situation": "三人还站在桥边，谁也没先走。",
+        "public_goal": "先把局面维持住。",
+        "hidden_tension": "真正的话已经快藏不住了。",
+        "scene_drive": "继续原地试探。",
+        "expected_rhythm": "慢压"
+      },
+      "preview": {
+        "title": "园中晚坐",
+        "location": "沁芳桥边",
+        "atmosphere": "话里都还留着分寸"
+      }
+    },
+    {
+      "card_id": "scene-hall-night",
+      "fields": {
+        "title": "回厅夜坐",
+        "time_hint": "入夜",
+        "location": "花厅",
+        "atmosphere": "灯下更难回避彼此",
+        "opening_situation": "众人重新落座，谁也没急着碰茶。",
+        "public_goal": "把表面话撑到头。",
+        "hidden_tension": "下一句就可能把真正心思挑明。",
+        "scene_drive": "借换场把话逼到桌面上。",
+        "expected_rhythm": "越聊越紧"
+      },
+      "preview": {
+        "title": "回厅夜坐",
+        "location": "花厅",
+        "atmosphere": "灯下更难回避彼此"
+      }
+    },
+    {
+      "card_id": "scene-corridor-private",
+      "fields": {
+        "title": "回廊私话",
+        "time_hint": "夜里",
+        "location": "回廊",
+        "atmosphere": "两个人终于能把声音压低",
+        "opening_situation": "人群散开后，只剩两个人还没把那句话说完。",
+        "public_goal": "试着把真正想问的话说出口。",
+        "hidden_tension": "谁先软下来，谁就先露底。",
+        "scene_drive": "让关系从多人局转到双人拉扯。",
+        "expected_rhythm": "缓慢逼近"
+      },
+      "preview": {
+        "title": "回廊私话",
+        "location": "回廊",
+        "atmosphere": "两个人终于能把声音压低"
+      }
+    }
+  ]
+}
diff --git a/zaomeng-skill/examples/test-prompts.json b/zaomeng-skill/examples/test-prompts.json
index 492c17f..4618efb 100644
--- a/zaomeng-skill/examples/test-prompts.json
+++ b/zaomeng-skill/examples/test-prompts.json
@@ -53,6 +53,25 @@
           "needs_revision_on_repeat_mismatch"
         ]
       }
+    },
+    {
+      "id": "scene-recommend-01",
+      "task": "scene_recommendation",
+      "input": "请根据当前会话状态推荐下一幕场景，并给出转场起句与自动起拍提示。",
+      "expect": {
+        "required_keys": [
+          "recommended_card_id",
+          "recommended_transition_message",
+          "recommended_auto_continue_message",
+          "chain_suggestions",
+          "items"
+        ],
+        "validation": [
+          "scene_progress_alignment",
+          "transition_quality",
+          "opening_cue_available"
+        ]
+      }
     }
   ]
 }
diff --git a/zaomeng-skill/references/capability_index.md b/zaomeng-skill/references/capability_index.md
index 0c5343f..a8b2517 100644
--- a/zaomeng-skill/references/capability_index.md
+++ b/zaomeng-skill/references/capability_index.md
@@ -153,6 +153,10 @@ Optional helpers for the dialogue stage:
 - `tools/build_dialogue_suggestion_payload.py`
   - build one-line suggestion payloads for `act` / `insert` / `observe`
   - provide compact retry payloads for long-context fallback
+- `tools/build_scene_recommendation_payload.py`
+  - build next-scene recommendation bundles for the current dialogue state
+  - provide transition text, chain suggestions, and an auto-continue opening cue
+  - see `examples/scene_recommendation_context.example.json` for a starter context shape
 
 ## Read Order
 
diff --git a/zaomeng-skill/references/chat_contract.md b/zaomeng-skill/references/chat_contract.md
index 1368a6e..7ea0b30 100644
--- a/zaomeng-skill/references/chat_contract.md
+++ b/zaomeng-skill/references/chat_contract.md
@@ -114,6 +114,21 @@ The tool returns:
 - retry messages
 - parser contract for model output
 
+If the host wants the skill to help decide what the next beat should be, call:
+
+- `tools/build_scene_recommendation_payload.py --context-file <context.json>`
+
+The tool returns:
+
+- ranked next-scene candidates
+- a recommended transition message
+- scene chain suggestions for follow-up beats
+- a `recommended_auto_continue_message` the host can feed back into its dialogue engine immediately after switching scenes
+
+Recommended starter context:
+
+- `examples/scene_recommendation_context.example.json`
+
 ## Recommended Artifact Read Order
 
 1. `run_manifest.json`
diff --git a/zaomeng-skill/tools/_skill_support/__init__.py b/zaomeng-skill/tools/_skill_support/__init__.py
index 65b324d..44a74d3 100644
--- a/zaomeng-skill/tools/_skill_support/__init__.py
+++ b/zaomeng-skill/tools/_skill_support/__init__.py
@@ -12,6 +12,13 @@
     normalize_dialogue_suggestion_context,
     parse_dialogue_suggestion,
 )
+from .scene_recommendations import (
+    build_scene_opening_message,
+    build_scene_recommendation_bundle,
+    normalize_scene_recommendation_context,
+    recommend_dialogue_scene_cards,
+    recommend_scene_cards_base,
+)
 from .persona_review import (
     PERSONA_AUTOFILLABLE_FIELDS,
     PERSONA_REVIEW_ADVANCED_GROUPS,
@@ -77,17 +84,22 @@
     "build_random_self_card_messages",
     "build_dialogue_suggestion_llm_messages",
     "build_dialogue_suggestion_payload",
+    "build_scene_opening_message",
+    "build_scene_recommendation_bundle",
     "compact_dialogue_suggestion_payload",
     "delete_self_card_payload",
     "list_self_cards_payload",
     "load_persona_review_payload",
     "load_self_card_payload",
     "normalize_dialogue_suggestion_context",
+    "normalize_scene_recommendation_context",
     "normalize_self_card_fields",
     "parse_dialogue_suggestion",
     "parse_persona_field_completion_response",
     "parse_random_self_card_response",
     "read_persona_review_fields",
+    "recommend_dialogue_scene_cards",
+    "recommend_scene_cards_base",
     "resolve_persona_review_source",
     "save_persona_review_profile",
     "save_self_card_payload",
diff --git a/zaomeng-skill/tools/_skill_support/scene_recommendations.py b/zaomeng-skill/tools/_skill_support/scene_recommendations.py
new file mode 100644
index 0000000..f66b8af
--- /dev/null
+++ b/zaomeng-skill/tools/_skill_support/scene_recommendations.py
@@ -0,0 +1,641 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+from __future__ import annotations
+
+import re
+from typing import Any
+
+_GROUP_SCENE_TOKENS = ("众人", "席间", "满座", "同席", "众目", "围坐", "宴", "厅", "堂", "多人")  # many-people cues; checked when there are 3+ participants
+_DUO_SCENE_TOKENS = ("二人", "对坐", "独处", "檐下", "私谈", "夜谈", "回廊", "亭中", "单独")  # two-person cues; checked for exactly 2 participants and in "act" mode
+_INSERT_SCENE_TOKENS = ("来客", "访客", "外客", "误入", "新到", "初来", "借住", "入席", "登门")  # newcomer-arrival cues; checked in "insert" mode
+_PLOT_PUSH_TOKENS = ("试探", "摊牌", "转折", "打断", "逼问", "推", "揭", "撞破", "失手", "变局")  # plot-pressure cues; checked in "observe" mode
+_SCENE_FIELDS = (  # the only scene-card keys kept by _normalize_scene_fields
+    "title",
+    "time_hint",
+    "location",
+    "atmosphere",
+    "opening_situation",
+    "public_goal",
+    "hidden_tension",
+    "scene_drive",
+    "expected_rhythm",
+    "forbidden_topics",
+)
+
+
+def build_scene_recommendation_bundle(context: dict[str, Any]) -> dict[str, Any]:
+    """Rank the context's scene cards and wrap the result, plus an auto-continue cue, for the host."""
+    ctx = normalize_scene_recommendation_context(context)
+    mode = str(ctx.get("mode", "observe")).strip() or "observe"
+    cast = list(ctx.get("participants", []) or [])
+    payload = recommend_dialogue_scene_cards(
+        cards=list(ctx.get("scene_cards", []) or []),
+        mode=mode,
+        participants=cast,
+        current_scene=dict(ctx.get("current_scene", {}) or {}),
+        current_scene_id=str(ctx.get("current_scene_card_id", "")).strip(),
+        runtime_overview=dict(ctx.get("runtime_state_overview", {}) or {}),
+        recent_text=str(ctx.get("recent_text", "")).strip(),
+    )
+    wanted_id = str(payload.get("recommended_card_id", "")).strip()
+    top_card: dict[str, Any] = {}
+    for candidate in list(payload.get("items", []) or []):
+        if str(candidate.get("card_id", "")).strip() == wanted_id:
+            top_card = candidate
+            break
+    payload["recommended_auto_continue_message"] = build_scene_opening_message(
+        mode=mode,
+        participants=list(cast),
+        scene_card=dict(top_card.get("fields", {}) or {}),
+        controlled_character=str(ctx.get("controlled_character", "")).strip(),
+        self_profile=dict(ctx.get("self_profile", {}) or {}),
+    )
+    return {
+        "kind": "dialogue_scene_recommendation_bundle",
+        "payload": payload,
+        "host_hint": (
+            "The host may directly apply recommended_card_id + recommended_transition_message. "
+            "If it wants to auto-continue the new beat immediately, it can feed recommended_auto_continue_message "
+            "back into its dialogue engine as the next opening cue."
+        ),
+    }
+
+
+def normalize_scene_recommendation_context(context: dict[str, Any]) -> dict[str, Any]:
+    """Coerce a raw host context into trimmed, typed fields; raise ValueError if no dict scene card is given."""
+    participants = list(filter(None, (str(entry).strip() for entry in list(context.get("participants", []) or []))))
+    scene_cards = [_normalize_scene_card_entry(card) for card in list(context.get("scene_cards", []) or []) if isinstance(card, dict)]
+    if not scene_cards:
+        raise ValueError("Scene recommendation context requires non-empty scene_cards.")
+    return {
+        "mode": str(context.get("mode", "observe")).strip() or "observe",
+        "participants": participants,
+        "scene_cards": scene_cards,
+        "current_scene_card_id": str(context.get("current_scene_card_id", "")).strip(),
+        "current_scene": _normalize_scene_fields(dict(context.get("current_scene", {}) or {})),
+        "runtime_state_overview": dict(context.get("runtime_state_overview", {}) or {}),
+        "recent_text": str(context.get("recent_text", "")).strip() or _transcript_to_recent_text(context.get("transcript", [])),
+        "controlled_character": str(context.get("controlled_character", "")).strip(),
+        "self_profile": dict(context.get("self_profile", {}) or {}),
+    }
+
+
+def recommend_dialogue_scene_cards(  # Re-rank the base-scored cards against the live session and attach transition/chain hints.
+    *,
+    cards: list[dict[str, Any]],
+    mode: str,
+    participants: list[str],
+    current_scene: dict[str, Any],
+    current_scene_id: str,
+    runtime_overview: dict[str, Any] | None = None,
+    recent_text: str = "",
+) -> dict[str, Any]:
+    normalized_mode = str(mode or "observe").strip() or "observe"
+    participant_list = [str(item).strip() for item in participants if str(item).strip()]
+    current_scene_snapshot = _merge_current_scene_snapshot(current_scene, dict(runtime_overview or {}))  # runtime values override the card's
+    base = recommend_scene_cards_base(cards, mode=normalized_mode, participants=participant_list)
+    reranked_items: list[dict[str, Any]] = []
+    for item in list(base.get("items", []) or []):
+        recommendation = dict(item.get("recommendation", {}) or {})
+        score = int(recommendation.get("score", 0) or 0)
+        reasons = [str(reason).strip() for reason in list(recommendation.get("reasons", []) or []) if str(reason).strip()]
+        item_card_id = str(item.get("card_id", "")).strip()
+        fields = dict(item.get("fields", {}) or {})
+        # The scene already in play is penalized and receives none of the contextual bonuses below.
+        if current_scene_id and item_card_id == current_scene_id:
+            score -= 5
+            reasons.insert(0, "当前已经在这幕里，优先换一拍")
+        else:
+            current_location = str(current_scene_snapshot.get("location", "")).strip()
+            candidate_location = str(fields.get("location", "")).strip()
+            if current_location and candidate_location and candidate_location != current_location:
+                score += 1
+                reasons.append("地点切换更明显，适合转场")
+            # Up to +3 for short phrases of the card that also occur in the recent dialogue text.
+            overlap = _scene_text_overlap_score(fields, recent_text)
+            if overlap:
+                score += overlap
+                reasons.append("和最近这几句的气口更接")
+            # Bonus or penalty derived from the runtime overview (see _score_scene_card_with_runtime_state).
+            state_bonus, state_reasons = _score_scene_card_with_runtime_state(
+                fields,
+                runtime_overview=dict(runtime_overview or {}),
+                current_scene=current_scene_snapshot,
+                participants=participant_list,
+                recent_text=recent_text,
+            )
+            score += state_bonus
+            reasons.extend(state_reasons)
+        # Keep at most four reasons; fall back to a generic one when none were recorded.
+        reranked_items.append(
+            {
+                **item,
+                "recommendation": {
+                    "score": score,
+                    "reasons": reasons[:4] or ["适合承接当前会话"],
+                },
+            }
+        )
+    # Best score first; ties are broken by updated_at, then card_id (both compared as strings, descending).
+    reranked_items.sort(
+        key=lambda item: (
+            int(item.get("recommendation", {}).get("score", 0) or 0),
+            str(item.get("updated_at", "")),
+            str(item.get("card_id", "")),
+        ),
+        reverse=True,
+    )
+    recommended_card_id = str(reranked_items[0].get("card_id", "")).strip() if reranked_items else ""
+    top_fields = dict(reranked_items[0].get("fields", {}) or {}) if reranked_items else {}
+    return {
+        "mode": normalized_mode,
+        "participants": participant_list,
+        "current_scene_card_id": str(current_scene_id or "").strip(),
+        "recommended_card_id": recommended_card_id,
+        "recommended_transition_message": _build_transition_message_hint(
+            current_scene=current_scene_snapshot,
+            next_scene=top_fields,
+            recent_text=recent_text,
+            runtime_overview=dict(runtime_overview or {}),
+        ),
+        "chain_suggestions": _build_scene_chain_suggestions(
+            current_scene=current_scene_snapshot,
+            current_scene_id=str(current_scene_id or "").strip(),
+            reranked_items=reranked_items,
+            recent_text=recent_text,
+            runtime_overview=dict(runtime_overview or {}),
+        ),
+        "items": reranked_items,
+    }
+
+
+def recommend_scene_cards_base(
+    cards: list[dict[str, Any]],
+    *,
+    mode: str,
+    participants: list[str] | None = None,
+) -> dict[str, Any]:
+    """Score each card on its own merits and return the cards ranked best-first.
+
+    Every returned item is a copy of the input card with normalized ``fields`` and a
+    ``recommendation`` dict (``score`` + ``reasons``). ``recommended_card_id`` is the
+    top-ranked card's id, or "" when ``cards`` is empty.
+    """
+    mode_name = str(mode or "observe").strip() or "observe"
+    cast = [name for name in (str(entry).strip() for entry in (participants or [])) if name]
+
+    def _rank_key(entry: dict[str, Any]) -> tuple[int, str, str]:
+        # Score first; ties fall back to updated_at, then card_id (all sorted descending).
+        rating = int(entry.get("recommendation", {}).get("score", 0) or 0)
+        return rating, str(entry.get("updated_at", "")), str(entry.get("card_id", ""))
+
+    ranked: list[dict[str, Any]] = []
+    for card in cards:
+        clean_fields = _normalize_scene_fields(dict(card.get("fields", {}) or {}))
+        points, why = _score_scene_card(clean_fields, mode=mode_name, participants=cast)
+        entry = dict(card)
+        entry["fields"] = clean_fields
+        entry["recommendation"] = {"score": points, "reasons": why}
+        ranked.append(entry)
+    ranked.sort(key=_rank_key, reverse=True)
+    top_id = str(ranked[0].get("card_id", "")).strip() if ranked else ""
+    return {
+        "mode": mode_name,
+        "participants": cast,
+        "recommended_card_id": top_id,
+        "items": ranked,
+    }
+
+
+def build_scene_opening_message(
+    *,
+    mode: str,
+    participants: list[str],
+    scene_card: dict[str, Any],
+    controlled_character: str = "",
+    self_profile: dict[str, Any] | None = None,
+) -> str:
+    """Compose the opening cue for a scene, worded for "act", "insert" or (by default) observe mode."""
+    which = str(mode or "observe").strip() or "observe"
+    cast = "、".join(filter(None, (str(name).strip() for name in participants))) or "当前角色"
+    scene = _normalize_scene_fields(scene_card)
+    scene_prefix_bits = list(filter(None, (scene.get("title", ""), scene.get("location", ""), scene.get("atmosphere", ""))))
+    scene_prefix = ""
+    if scene_prefix_bits:
+        scene_prefix = f"场景设定：{' / '.join(scene_prefix_bits)}。"
+    opening_suffix = ""
+    if str(scene.get("opening_situation", "")).strip():
+        opening_suffix = f" 开场局面是：{scene.get('opening_situation', '')}。"
+    drive_suffix = ""
+    if str(scene.get("scene_drive", "")).strip():
+        drive_suffix = f" 推进方向优先朝这边走：{scene.get('scene_drive', '')}。"
+    tail = f"{opening_suffix}{drive_suffix}"
+    if which == "act":
+        controlled = str(controlled_character or "").strip() or "该角色"
+        lead = f"{scene_prefix}请先为 {controlled} 与 {cast} 生成一个自然开场。"
+        return lead + tail + "先给 1 条简短的场景提示或旁白，再让其他角色先接出第一轮对话，不要等待用户补充。"
+    # Any mode other than "act" / "insert" gets the observer wording.
+    if which != "insert":
+        lead = f"{scene_prefix}请先为 {cast} 生成一个自然开场。"
+        return lead + tail + "先给 1 条简短的场景提示或旁白，再让角色们开始第一轮对话，让场景自己动起来。"
+    profile = dict(self_profile or {})
+    display_name = str(profile.get("display_name", "")).strip() or "我"
+    scene_identity = str(profile.get("scene_identity", "")).strip() or str(profile.get("core_identity", "")).strip()
+    identity_suffix = f"，身份是{scene_identity}" if scene_identity else ""
+    lead = f"{scene_prefix}请先为 {display_name}{identity_suffix} 与 {cast} 生成一个自然开场。"
+    return lead + tail + "先给 1 条简短的场景提示或旁白，再让角色们先开口，对这个进入场景的人作出第一轮反应。"
+
+
+def _normalize_scene_card_entry(item: dict[str, Any]) -> dict[str, Any]:
+    """Reduce a raw card to card_id / fields / preview / updated_at, synthesizing a preview if absent."""
+    clean = _normalize_scene_fields(dict(item.get("fields", {}) or {}))
+    summary = dict(item.get("preview", {}) or {})
+    if not summary:
+        # No host-supplied preview: derive one from the normalized fields.
+        preview_keys = (
+            "title",
+            "time_hint",
+            "location",
+            "atmosphere",
+            "opening_situation",
+            "scene_drive",
+            "expected_rhythm",
+        )
+        summary = {key: str(clean.get(key, "")).strip() for key in preview_keys}
+    entry = {"card_id": str(item.get("card_id", "")).strip(), "fields": clean, "preview": summary}
+    entry["updated_at"] = str(item.get("updated_at", "")).strip()
+    return entry
+
+
+def _normalize_scene_fields(fields: dict[str, Any]) -> dict[str, str]:
+    return dict((name, str(fields.get(name, "") or "").strip()) for name in _SCENE_FIELDS)  # known keys only, as trimmed strings ("" if missing/falsy)
+
+
+def _score_scene_card(fields: dict[str, Any], *, mode: str, participants: list[str]) -> tuple[int, list[str]]:  # context-free score for one card; returns (score, at most 3 reasons)
+    normalized = _normalize_scene_fields(fields)
+    combined_text = "\n".join(str(normalized.get(field, "")).strip() for field in _SCENE_FIELDS)
+    participant_count = len(participants)
+    score = 0
+    reasons: list[str] = []
+    # Completeness of the core dramatic fields.
+    if normalized["scene_drive"]:
+        score += 3
+        reasons.append("推进方向明确")
+    if normalized["opening_situation"]:
+        score += 2
+        reasons.append("开场局面具体")
+    if normalized["atmosphere"]:
+        score += 1
+        reasons.append("气氛落点清楚")
+    # Cast-size fit: group tokens for 3+ participants, duo tokens for exactly 2.
+    if participant_count >= 3:
+        hit = _count_hits(combined_text, _GROUP_SCENE_TOKENS)
+        if hit:
+            score += 3 + min(2, hit - 1)
+            reasons.append("更像多人同席场")
+    elif participant_count == 2:
+        hit = _count_hits(combined_text, _DUO_SCENE_TOKENS)
+        if hit:
+            score += 3 + min(1, hit - 1)
+            reasons.append("更适合双人拉扯")
+    # Mode fit: "insert" looks for arrival tokens, "observe" for plot-push tokens, "act" for duo tokens.
+    if mode == "insert":
+        hit = _count_hits(combined_text, _INSERT_SCENE_TOKENS)
+        if hit:
+            score += 4 + min(1, hit - 1)
+            reasons.append("适合来客/自我入场")
+    elif mode == "observe":
+        hit = _count_hits(combined_text, _PLOT_PUSH_TOKENS)
+        if hit:
+            score += 3 + min(2, hit - 1)
+            reasons.append("更利于旁观推动剧情")
+    elif mode == "act":
+        duo_hit = _count_hits(combined_text, _DUO_SCENE_TOKENS)
+        if duo_hit:
+            score += 2
+            reasons.append("留有角色正面接戏空间")
+    # Secondary fields add one point each but contribute no reason text.
+    if normalized["public_goal"]:
+        score += 1
+    if normalized["hidden_tension"]:
+        score += 1
+    if normalized["expected_rhythm"]:
+        score += 1
+    # Always return at least one reason.
+    if not reasons:
+        reasons.append("信息比较完整，能直接开场")
+    return score, reasons[:3]
+
+
+def _count_hits(text: str, tokens: tuple[str, ...]) -> int:
+    """Count how many of the non-empty tokens occur in the stripped text (each token counted once)."""
+    haystack = str(text or "").strip()
+    matched = [token for token in tokens if token and token in haystack]
+    return len(matched) if haystack else 0
+
+
+def _merge_current_scene_snapshot(current_scene: dict[str, Any], runtime_overview: dict[str, Any]) -> dict[str, Any]:
+    """Normalize the current scene, letting non-blank runtime location/time_hint/atmosphere override it."""
+    snapshot = _normalize_scene_fields(current_scene)
+    # Blank runtime values never overwrite what the scene card already says.
+    for key in ("location", "time_hint", "atmosphere"):
+        live_value = str(runtime_overview.get(key, "")).strip()
+        if live_value:
+            snapshot[key] = live_value
+    return snapshot
+
+
+def _scene_text_overlap_score(fields: dict[str, Any], recent_text: str) -> int:
+    """Return 0-3: how many short phrases (2-8 chars) taken from the card's text occur in recent_text."""
+    haystack = str(recent_text or "").strip()
+    if not haystack:
+        return 0
+    keys = ("location", "atmosphere", "opening_situation", "scene_drive", "public_goal", "hidden_tension")
+    seen: dict[str, None] = {}  # dict used as an insertion-ordered set of unique phrases
+    for key in keys:
+        pieces = re.split(r"[，,。；;、：:\s]+", str(fields.get(key, "") or "").strip())
+        for piece in (chunk.strip() for chunk in pieces):
+            if 2 <= len(piece) <= 8:
+                seen.setdefault(piece, None)
+    candidates = list(seen)[:12]
+    hits = [phrase for phrase in candidates if phrase in haystack]
+    return min(3, len(hits))
+
+
+def _score_scene_card_with_runtime_state(  # score delta for one candidate card given the runtime overview; returns (delta, reasons)
+    fields: dict[str, Any],
+    *,
+    runtime_overview: dict[str, Any],
+    current_scene: dict[str, Any],
+    participants: list[str],
+    recent_text: str,
+) -> tuple[int, list[str]]:
+    score = 0
+    reasons: list[str] = []
+    current_location = str(current_scene.get("location", "")).strip()
+    candidate_location = str(fields.get("location", "")).strip()
+    current_time = str(runtime_overview.get("time_hint", "") or current_scene.get("time_hint", "")).strip()
+    candidate_time = str(fields.get("time_hint", "")).strip()
+    beat_maturity = max(0, min(100, int(runtime_overview.get("beat_maturity", 0) or 0)))  # clamped to 0..100
+    should_shift = bool(runtime_overview.get("should_offer_scene_shift", False))
+    shift_reason = str(runtime_overview.get("scene_shift_reason", "")).strip()
+    tension = str(runtime_overview.get("tension", "")).strip()
+    next_hint = str(runtime_overview.get("next_hint", "")).strip()
+    atmosphere = str(runtime_overview.get("atmosphere", "")).strip()
+    event_rows = list(runtime_overview.get("event_rows", []) or [])
+    recent_event = str((event_rows[-1] or {}).get("copy", "")).strip() if event_rows else ""  # "copy" text of the last event row
+    # Shift readiness: reward a different location when a shift is due; otherwise favor staying put while maturity < 45.
+    if should_shift:
+        if current_location and candidate_location and candidate_location != current_location:
+            score += 4
+            reasons.append("这一拍已接近收束，更适合换场推进")
+        elif current_location and candidate_location and candidate_location == current_location:
+            score -= 2
+            reasons.append("这一拍已经该收住了，不必继续原地打转")
+        elif candidate_location:
+            score += 1
+            reasons.append("当前已经适合往下一拍走")
+    elif beat_maturity and beat_maturity < 45 and current_location and candidate_location == current_location:
+        score += 2
+        reasons.append("这一拍还没聊满，先在同场景续火更顺")
+    # Time continuity: +1 for the same time hint; +2 for a different one once a shift is due or maturity >= 55.
+    if current_time and candidate_time:
+        if candidate_time == current_time:
+            score += 1
+            reasons.append("时间承接自然")
+        elif should_shift or beat_maturity >= 55:
+            score += 2
+            reasons.append("时间推进能带出下一拍")
+    # Up to +4 for card phrases that occur in the runtime atmosphere/tension/next hint, last event or recent text.
+    state_overlap = _state_overlap_score(
+        fields,
+        state_texts=[atmosphere, tension, next_hint, recent_event, recent_text],
+    )
+    if state_overlap:
+        score += state_overlap
+        reasons.append("能接住本局气氛和悬念")
+    # +1 for casts of three or more when the candidate location contains one of 厅/堂/席/园/院.
+    if len(participants) >= 3 and candidate_location and any(token in candidate_location for token in ("厅", "堂", "席", "园", "院")):
+        score += 1
+        reasons.append("多人局切到这个场面更容易铺开")
+    # +2 when one of the first four 2-8 char fragments of the shift reason occurs in the card's opening/drive/tension text.
+    if shift_reason:
+        shift_tokens = [part for part in re.split(r"[，,。；;、：:\s]+", shift_reason) if 2 <= len(part.strip()) <= 8]
+        if any(token and token in "\n".join(str(fields.get(key, "")).strip() for key in ("opening_situation", "scene_drive", "hidden_tension")) for token in shift_tokens[:4]):
+            score += 2
+            reasons.append("和当前这拍的收束理由接得上")
+    # Reasons are returned untruncated; recommend_dialogue_scene_cards caps the merged list.
+    return score, reasons
+
+
+def _state_overlap_score(fields: dict[str, Any], *, state_texts: list[str]) -> int:
+    """Return 0-4: how many short phrases (2-8 chars) from the card occur in the joined state texts."""
+    # Coerce every entry before stripping so None / non-str entries are skipped instead of raising.
+    cleaned = [str(text or "").strip() for text in state_texts]
+    compact_state = "\n".join(text for text in cleaned if text)
+    if not compact_state:
+        return 0
+    phrases: list[str] = []
+    for key in ("atmosphere", "opening_situation", "public_goal", "hidden_tension", "scene_drive"):
+        for part in re.split(r"[，,。；;、：:\s]+", str(fields.get(key, "") or "").strip()):  # `or ""`: a None field must not become the phrase "None"
+            text = part.strip()
+            if 2 <= len(text) <= 8 and text not in phrases:
+                phrases.append(text)
+    overlap = sum(1 for phrase in phrases[:14] if phrase in compact_state)
+    return min(4, overlap)
+
+
+def _build_transition_message_hint(
+    *,
+    current_scene: dict[str, Any],
+    next_scene: dict[str, Any],
+    recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
+) -> str:
+    """Return a one-sentence narration bridging current_scene into next_scene, or "" if nothing fits."""
+    runtime = dict(runtime_overview or {})
+    next_location = str(next_scene.get("location", "")).strip()
+    next_title = str(next_scene.get("title", "")).strip()
+    next_opening = str(next_scene.get("opening_situation", "")).strip()
+    next_atmosphere = str(next_scene.get("atmosphere", "")).strip()
+    current_location = str(current_scene.get("location", "")).strip()
+    next_time = str(next_scene.get("time_hint", "")).strip()
+    current_time = str(runtime.get("time_hint", "") or current_scene.get("time_hint", "")).strip()
+    shift_reason = str(runtime.get("scene_shift_reason", "")).strip()
+    tension = str(runtime.get("tension", "")).strip()
+    should_shift = bool(runtime.get("should_offer_scene_shift", False))
+    # 1) An explicit shift reason combined with a real change of location.
+    if shift_reason and should_shift and current_location and next_location and current_location != next_location:
+        anchor = next_title or next_location
+        return f"{shift_reason}，场面顺势从{current_location}转到{anchor}。"
+    # 2) A change of time hint, optionally carrying the current tension along.
+    if next_time and current_time and next_time != current_time:
+        destination = next_location or next_title or "下一幕"
+        if tension:
+            return f"带着这股{_trim_transition_text(tension, 18)}，时间已经推到{next_time}，场面也转进了{destination}。"
+        return f"这一拍不知不觉拖到了{next_time}，场面也顺势转进了{destination}。"
+    # 3) First sentence of the next opening; the split drops its terminator, so always close with "。".
+    if next_opening:
+        first_sentence = re.split(r"[。！？!?]", next_opening, maxsplit=1)[0].strip()
+        if first_sentence:
+            return f"{first_sentence}。"
+    # 4) A plain change of location.
+    if current_location and next_location and current_location != next_location:
+        anchor = next_title or next_location
+        return f"局面一转，众人从{current_location}挪到{anchor}，气氛也跟着变了。"
+    # 5) Lingering tension, else the tail of the latest line only (so no newline leaks into the sentence).
+    compact_recent = str(recent_text or "").strip()
+    if tension and next_atmosphere:
+        return f"刚才那股{_trim_transition_text(tension, 18)}还吊着，场面已经慢慢转成了{next_atmosphere}。"
+    if compact_recent and next_atmosphere:
+        recent_tail = compact_recent.splitlines()[-1].strip()[-12:]
+        return f"刚才那股{recent_tail}的余波还没散，场面已经转成了{next_atmosphere}。"
+    # 6) Bare destination fallbacks.
+    if next_location and next_atmosphere:
+        return f"这一拍顺势转到{next_location}，场面也慢慢收成了{next_atmosphere}。"
+    if next_location:
+        return f"这一拍顺势转到{next_location}。"
+    if next_title:
+        return f"这一拍顺势转入「{next_title}」。"
+    return ""
+
+
+def _build_scene_chain_suggestions(
+    *,
+    current_scene: dict[str, Any],
+    current_scene_id: str,
+    reranked_items: list[dict[str, Any]],
+    recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
+) -> list[dict[str, Any]]:
+    """Propose up to three 2- or 3-scene chains built from the top five cards other than the current one.
+
+    Every ordered pair and ordered triple of distinct candidates is turned into a
+    payload by ``_build_chain_payload``; chains are ranked by score, then by length,
+    and de-duplicated on their card-id sequence.
+    """
+    pool: list[dict[str, Any]] = []
+    for entry in reranked_items:
+        entry_id = str(entry.get("card_id", "")).strip()
+        if entry_id and entry_id != current_scene_id:
+            pool.append(entry)
+    indexed = list(enumerate(pool[:5]))
+
+    def _chain(members: list[dict[str, Any]]) -> dict[str, Any]:
+        return _build_chain_payload(
+            current_scene=current_scene,
+            items=members,
+            recent_text=recent_text,
+            runtime_overview=runtime_overview,
+        )
+
+    chains: list[dict[str, Any]] = []
+    for a, first in indexed:
+        for b, second in indexed:
+            if b == a:
+                continue
+            chains.append(_chain([first, second]))
+            chains.extend(_chain([first, second, third]) for c, third in indexed if c not in (a, b))
+    # Highest score first; longer chains win score ties.
+    chains.sort(key=lambda chain: (int(chain.get("score", 0) or 0), len(chain.get("scenes", []) or [])), reverse=True)
+
+    picked: list[dict[str, Any]] = []
+    used: set[str] = set()
+    for chain in chains:
+        signature = "->".join(str(scene.get("card_id", "")).strip() for scene in list(chain.get("scenes", []) or []))
+        if not signature or signature in used:
+            continue
+        used.add(signature)
+        picked.append(chain)
+        if len(picked) >= 3:
+            break
+    return picked
+
+
+def _build_chain_payload(
+    *,
+    current_scene: dict[str, Any],
+    items: list[dict[str, Any]],
+    recent_text: str,
+    runtime_overview: dict[str, Any] | None = None,
+) -> dict[str, Any]:
+    """Score an ordered run of scene cards and describe each hop with a transition message."""
+    scenes: list[dict[str, str]] = []
+    previous_scene = dict(current_scene or {})
+    total_score = 0
+    locations: list[str] = []
+    for index, item in enumerate(items):
+        fields = dict(item.get("fields", {}) or {})
+        preview = dict(item.get("preview", {}) or {})  # tolerate an explicit null preview, like the other lookups here
+        score = int(dict(item.get("recommendation", {}) or {}).get("score", 0) or 0)
+        # Earlier hops weigh more (x4, x3, x2, then x1); negative card scores contribute nothing.
+        total_score += max(0, score) * max(1, 4 - index)
+        location = str(fields.get("location", "")).strip()
+        if location:
+            locations.append(location)
+        # Only the first hop sees the live recent_text / runtime overview; later hops chain off the previous card.
+        scenes.append(
+            {
+                "card_id": str(item.get("card_id", "")).strip(),
+                "title": str(preview.get("title", "") or fields.get("title", "")).strip(),
+                "location": location,
+                "atmosphere": str(fields.get("atmosphere", "")).strip(),
+                "scene_drive": str(fields.get("scene_drive", "")).strip(),
+                "transition_message": _build_transition_message_hint(
+                    current_scene=previous_scene,
+                    next_scene=fields,
+                    recent_text=recent_text if index == 0 else str(previous_scene.get("scene_drive", "")).strip(),
+                    runtime_overview=dict(runtime_overview or {}) if index == 0 else None,
+                ),
+            }
+        )
+        previous_scene = fields
+    total_score += 4 if len(set(locations)) >= 2 else 0  # bonus: the chain visits at least two distinct locations
+    total_score += 3 if _chain_has_progressive_drive(scenes) else 0  # bonus: two or more strongly driven scenes
+    return {
+        "chain_id": " -> ".join(scene.get("card_id", "") for scene in scenes),
+        "score": total_score,
+        "reason": _build_chain_reason(scenes),
+        "scenes": scenes,
+    }
+
+
+def _chain_has_progressive_drive(scenes: list[dict[str, str]]) -> bool:
+    """Return True when at least two scenes have a scene_drive containing a strong plot-push token."""
+    strong_tokens = ("试探", "转折", "摊牌", "揭", "逼", "变局", "收紧")
+    drives = [str(scene.get("scene_drive", "")).strip() for scene in scenes]
+    forceful = [drive for drive in drives if drive and any(token in drive for token in strong_tokens)]
+    return len(forceful) >= 2
+
+
+def _build_chain_reason(scenes: list[dict[str, str]]) -> str:
+    """Pick the one-line rationale shown for a chain, based on its length, locations and drives."""
+    if not scenes:
+        return "这条线能顺着往下接。"
+    places = {scene.get("location", "") for scene in scenes if scene.get("location", "")}
+    if len(places) >= 2:
+        # Two distinct locations imply at least two scenes, so only the 3+ case needs its own wording.
+        return "先换场再收紧，后面还有继续推进的余地。" if len(scenes) >= 3 else "地点会连续变化，戏路层次更明显。"
+    if _chain_has_progressive_drive(scenes):
+        return "每一幕的推进方向都比较明确，适合顺着往下压。"
+    first_title = str(scenes[0].get("title", "")).strip() or "这条线"
+    return f"可以先接「{first_title}」，后面还有顺势承接的下一拍。"
+
+
+def _trim_transition_text(text: str, limit: int) -> str:
+    """Strip the text and, if longer than limit, cut it to limit-1 chars (at least 1) plus an ellipsis."""
+    cleaned = str(text or "").strip()
+    keep = max(1, limit - 1)
+    return cleaned if len(cleaned) <= limit else cleaned[:keep] + "…"
+
+
+def _transcript_to_recent_text(transcript: Any) -> str:
+    """Join the non-blank ``message`` strings of the last six transcript entries, one per line.
+
+    Entries that are not dicts are ignored.
+    """
+    # The six-entry window is taken before filtering, so skipped entries still count toward it.
+    tail = list(transcript or [])[-6:]
+    messages = (str(entry.get("message", "")).strip() for entry in tail if isinstance(entry, dict))
+    return "\n".join(message for message in messages if message)
diff --git a/zaomeng-skill/tools/build_scene_recommendation_payload.py b/zaomeng-skill/tools/build_scene_recommendation_payload.py
new file mode 100644
index 0000000..511c1ef
--- /dev/null
+++ b/zaomeng-skill/tools/build_scene_recommendation_payload.py
@@ -0,0 +1,40 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+from __future__ import annotations
+
+import argparse
+import json
+from pathlib import Path
+import sys
+
+TOOLS_ROOT = Path(__file__).resolve().parent  # directory that contains this script
+sys.path.insert(0, str(TOOLS_ROOT))  # put it first on sys.path so the `_skill_support` import below resolves from here
+
+from _skill_support.scene_recommendations import build_scene_recommendation_bundle  # noqa: E402
+
+
+def _write_output(payload: dict[str, object], output: str) -> None:
+    """Write payload as indented JSON to the output path (UTF-8), or print it when no path is given."""
+    if output:
+        Path(output).write_text(json.dumps(payload, ensure_ascii=False, indent=2) + "\n", encoding="utf-8")
+    else:
+        print(json.dumps(payload, ensure_ascii=False, indent=2))
+
+
+def main() -> int:
+    """Parse CLI arguments, build the bundle from the JSON context file, emit it, and return exit code 0."""
+    cli = argparse.ArgumentParser(
+        description="Build a host-managed dialogue scene recommendation bundle with transition and auto-continue hints."
+    )
+    cli.add_argument("--context-file", required=True, help="JSON context file for building a scene recommendation bundle")
+    cli.add_argument("--output", default="", help="Optional JSON output path")
+    options = cli.parse_args()
+
+    context_path = Path(options.context_file)
+    _write_output(build_scene_recommendation_bundle(json.loads(context_path.read_text(encoding="utf-8"))), options.output)
+    return 0
+
+
+if __name__ == "__main__":  # only when executed directly, not when imported
+    raise SystemExit(main())  # main()'s return value becomes the process exit status