diff --git a/pyproject.toml b/pyproject.toml
index 76bf47d1..33ccbb57 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -74,6 +74,7 @@ dev = [
     "setuptools>=68.0",
     "wheel",
     "tomli>=2.0; python_version<\"3.11\"",
+    "pexpect>=4.9.0",
 ]
 
 [build-system]
diff --git a/scripts/README.md b/scripts/README.md
index e793b335..2217ca32 100644
--- a/scripts/README.md
+++ b/scripts/README.md
@@ -9,6 +9,8 @@ repository root with `uv run python ...` unless a script-specific README says ot
 | --- | --- |
 | `a2a/debugger.py` | Web debugger/client for A2A pipeline streams. |
 | `a2a/debugger.md` | Manual usage notes for the A2A debugger. |
+| `a2a/selling_console.py` | Selling pipeline console local HTTP server; proxies text-only UI requests to an A2A server. |
+| `a2a/selling_console_web/` | Static Selling Console frontend. It renders pipeline progress, candidate cards, chat, and debug panels; image input coverage belongs to `a2a/debugger.py`. |
 | `a2a/e2e/` | A2A session recovery end-to-end scenario runner, shared helpers, and result notes. |
 | `a2a/smoke/test_a2a_vpc.py` | Small manual smoke script for A2A VPC/pipeline behavior. |
 | `acp/smoke/test_acp_vpc.py` | Small manual smoke script for ACP VPC behavior. |
@@ -17,14 +19,26 @@ repository root with `uv run python ...` unless a script-specific README says ot
 | `observability/local_observe/` | Local observe server implementation and static web UI. |
 | `observability/local_observe.md` | Manual usage notes for the local observe tool. |
 | `rendering/test_diagram_render.py` | Manual diagram rendering check. |
+| `repl/e2e/` | Real PTY-driven REPL pipeline end-to-end scenario runner. POSIX-only because it uses `pexpect`. |
 
 ## Common Commands
 
 ```bash
 uv run python scripts/a2a/debugger.py --help
+PATH="$HOME/.local/bin:$PATH" \
+uv run python scripts/a2a/selling_console.py --port 41980 \
+  --default-server-url http://127.0.0.1:41299 \
+  --default-cwd "$PWD"
 uv run python scripts/a2a/e2e/run_recovery_scenarios.py --help
 uv run python scripts/observability/local_observe.py --help
+uv run python scripts/repl/e2e/run_pipeline_scenarios.py --help
 ```
 
+`scripts/repl/e2e/run_pipeline_scenarios.py` writes artifacts under the system temporary directory by default and is intended for manual or smoke validation. It is not part of `make test`; the unit tests only cover helper behavior. The real PTY runner depends on the POSIX-only `pexpect` development dependency.
+
+The root `conftest.py` includes a tiktoken isolation fixture so tests do not read or write the developer's real encoding cache. New tests should rely on that fixture instead of accessing the user's cache directory directly.
+
+Cleanup ledger temporary files use a leading dot in their generated names only as a cosmetic convention. Correctness relies on atomic replace, retries, and ledger validation, not on Unix hidden-file behavior.
+
 Pytest tests for these helpers live under `tests/`; the executable scripts here are kept for local debugging,
 manual validation, and real end-to-end runs.
diff --git a/scripts/a2a/debugger.md b/scripts/a2a/debugger.md
index c03b96df..621f6ddf 100644
--- a/scripts/a2a/debugger.md
+++ b/scripts/a2a/debugger.md
@@ -30,6 +30,33 @@ uv run python scripts/a2a/debugger.py --port 41880 \
   --default-cwd "$PWD"
 ```
 
+`--default-cwd` is sent to the A2A server as `metadata.iac_code.cwd` on each
+message. It is the server-side workspace for the task, not merely the debugger's
+own working directory.
+
+The A2A server validates this path before running the agent. By default, the
+server accepts its own startup directory and Python's temp directory. If
+`--default-cwd` points inside an allowed root and the directory does not exist
+yet, the server may create it. The request is rejected with
+`Invalid A2A workspace metadata.` when the resolved path escapes the allowed
+root, cannot be created, or cannot be used as a directory.
+
+Use one of these patterns:
+
+```bash
+# Start the debugger with a cwd accepted by the already-running server.
+uv run python scripts/a2a/debugger.py --port 41880 \
+  --default-server-url http://127.0.0.1:41299 \
+  --default-cwd "/path/to/server/workspace"
+```
+
+```bash
+# Or explicitly allow the debugger/client workspace when starting the server.
+IACCODE_A2A_ALLOWED_CWDS="/path/to/server/workspace:/path/to/client/workspace" \
+IAC_CODE_MODE=pipeline \
+uv run iac-code a2a --transport http --host 127.0.0.1 --port 41299
+```
+
 Open:
 
 ```text
@@ -67,3 +94,7 @@ uv run python scripts/a2a/debugger.py --port 41880 \
 - The debugger is a local development tool and does not provide authentication.
 - `contextId` identifies the conversation; `taskId` identifies one A2A task.
 - After `pipeline_handoff_ready`, follow-up messages normally start a new normal-chat task in the same context.
+- Image input accepts supported image MIME types only: `image/png`, `image/jpeg`, `image/webp`, and `image/gif`.
+- A2A part parser limits: text inline/raw and text `file://` parts are limited to 1 MiB; binary inline/raw/data parts are limited to 5 MiB; binary `file://` parts are limited to 25 MiB. Debugger uploads are limited to 5 MiB per image.
+- `file://` image inputs must resolve to an existing local file that is both under the request cwd and under a configured A2A allowed cwd root. Local URLs outside either boundary are rejected.
+- The A2A debugger sends image parts. The Selling Console web UI currently sends text input only.
diff --git a/scripts/a2a/debugger.py b/scripts/a2a/debugger.py
index 8eb94386..2bfbfc79 100644
--- a/scripts/a2a/debugger.py
+++ b/scripts/a2a/debugger.py
@@ -1,6 +1,7 @@
 from __future__ import annotations
 
 import argparse
+import base64
 import errno
 import html
 import json
@@ -20,6 +21,8 @@
 A2A_VERSION_HEADERS = {"A2A-Version": "1.0"}
 DEBUG_LOG_ROOT_NAME = "iac-code-a2a-debugger-runs"
 _DEBUG_LOG_LOCK = threading.Lock()
+DEBUGGER_SUPPORTED_IMAGE_MEDIA_TYPES = frozenset(("image/png", "image/jpeg", "image/webp", "image/gif"))
+DEBUGGER_MAX_IMAGE_BYTES = 5 * 1024 * 1024
 
 
 @dataclass(frozen=True)
@@ -130,6 +133,41 @@ def fetch_json(
         return ProxyResult(status_code=0, data=None, text="", headers={}, error=str(exc))
 
 
+def _normalize_image_part(raw: Any) -> dict[str, Any]:
+    """Validate one debugger image upload and return it as a message part dict.
+
+    Raises ValueError for a non-dict entry, an unsupported media type, missing or
+    invalid base64 data, or a decoded payload above DEBUGGER_MAX_IMAGE_BYTES.
+    """
+    if not isinstance(raw, dict):
+        raise ValueError("images entries must be objects")
+    declared_type = raw.get("mediaType") or raw.get("media_type") or raw.get("mimeType") or raw.get("type") or ""
+    media_type = str(declared_type).lower()
+    if media_type not in DEBUGGER_SUPPORTED_IMAGE_MEDIA_TYPES:
+        supported = ", ".join(sorted(DEBUGGER_SUPPORTED_IMAGE_MEDIA_TYPES))
+        raise ValueError(f"images must use one of these mediaType values: {supported}")
+    encoded = raw.get("bytes") or raw.get("base64")
+    if not isinstance(encoded, str) or not encoded:
+        raise ValueError("images entries must include base64 bytes")
+    try:
+        decoded = base64.b64decode(encoded.encode("ascii"), validate=True)
+    except (ValueError, UnicodeEncodeError) as exc:
+        raise ValueError("images entries must include valid base64 bytes") from exc
+    if len(decoded) > DEBUGGER_MAX_IMAGE_BYTES:
+        raise ValueError("images entries must be 5 MiB or smaller")
+    # os.path.basename only splits on the host separator, so fold "\" into "/" first.
+    filename = os.path.basename(str(raw.get("filename") or raw.get("name") or "image").replace("\\", "/"))
+    return {"data": {"filename": filename or "image", "bytes": encoded}, "mediaType": media_type}
+
+
+def _normalize_image_parts(images: Any) -> list[dict[str, Any]]:
+    """Normalize the optional ``images`` request field into a list of image parts."""
+    # None and "" both mean "no images"; any other non-list value is a client error.
+    if not isinstance(images, list) and images not in (None, ""):
+        raise ValueError("images must be a list")
+    return list(map(_normalize_image_part, images or []))
+
+
 def build_message_stream_payload(
     *,
     cwd: str,
@@ -138,11 +176,16 @@ def build_message_stream_payload(
     task_id: str,
     request_id: str,
     message_id: str,
+    images: Any = None,
 ) -> dict[str, Any]:
+    parts = []
+    if prompt:
+        parts.append({"text": prompt})
+    parts.extend(_normalize_image_parts(images))
     message: dict[str, Any] = {
         "messageId": message_id,
         "role": "ROLE_USER",
-        "parts": [{"text": prompt}],
+        "parts": parts,
         "metadata": {"iac_code": {"cwd": cwd}},
     }
     if context_id:
@@ -206,6 +249,9 @@ def _extract_pipeline_envelope(payload: Any) -> dict[str, Any] | None:
                 return envelope
         return None
 
+    if isinstance(payload.get("eventType") or payload.get("event_type"), str):
+        return payload
+
     for key in ("pipeline", "pipelineEvent", "pipelineSnapshot"):
         if isinstance(payload.get(key), dict):
             return payload[key]
@@ -322,11 +368,27 @@ def load_debug_log_export(log_dir: str | Path) -> dict[str, Any]:
     snapshots = _load_debug_log_raw_values(path / "snapshots.jsonl")
     requests = _load_debug_log_raw_values(path / "requests.jsonl")
     latest_snapshot = snapshots[-1] if snapshots else None
+    snapshot_events = [
+        event
+        for snapshot in snapshots
+        if isinstance(snapshot, dict) and isinstance(snapshot.get("events"), list)
+        for event in snapshot["events"]
+    ]
+    replay_events = [*sse_events, *snapshot_events]
     latest_pipeline = None
     active_task_id = ""
     task_history: dict[str, dict[str, str]] = {}
     last_sequence = 0
 
+    def sequence_value(value: Any) -> int | None:
+        # NaN/Infinity floats make int() raise; treat them like a missing sequence number.
+        numeric = isinstance(value, int | float) and not isinstance(value, bool)
+        return int(value) if numeric and value == value and abs(value) != float("inf") else None
+
+    def terminal_pipeline_status(value: Any) -> bool:
+        state = str(value or "").lower().removeprefix("task_state_").replace("-", "_")  # leading prefix only
+        return state in {"canceled", "cancelled", "failed", "denied", "completed"}
+
     def remember_task(*, task_id: Any, context_id: Any = "", state: Any = "", role: str = "active") -> None:
         normalized_task_id = str(task_id or "")
         if not normalized_task_id:
@@ -339,7 +401,7 @@ def remember_task(*, task_id: Any, context_id: Any = "", state: Any = "", role:
             "role": role or existing.get("role") or "active",
         }
 
-    for item in sse_events:
+    for item in replay_events:
         identity = _a2a_task_identity(item)
         if identity is not None:
             active_task_id = str(identity.get("taskId") or active_task_id)
@@ -359,9 +421,13 @@ def remember_task(*, task_id: Any, context_id: Any = "", state: Any = "", role:
             state=envelope.get("state") or envelope.get("status"),
             role="pipeline",
         )
-        sequence = envelope.get("sequence")
-        if isinstance(sequence, int) and not isinstance(sequence, bool):
+        sequence = sequence_value(envelope.get("sequence"))
+        if sequence is not None:
             last_sequence = max(last_sequence, sequence)
+        if terminal_pipeline_status(envelope.get("state") or envelope.get("status")) and active_task_id == str(
+            envelope.get("taskId") or ""
+        ):
+            active_task_id = ""
     return {
         "schemaVersion": "iac-code-a2a-debugger-export-v1",
         "exportedAt": _utc_now(),
@@ -378,7 +444,7 @@ def remember_task(*, task_id: Any, context_id: Any = "", state: Any = "", role:
         "waitingInput": "",
         "latestPermission": None,
         "snapshot": latest_snapshot,
-        "sseEvents": sse_events,
+        "sseEvents": replay_events,
         "requests": requests,
         "executionTree": {"rootIds": [], "nodes": {}},
         "uiState": {},
@@ -504,6 +570,10 @@ def render_index_html(config: DebuggerConfig) -> str:
       outline: none;
     }
 
+    input[type="file"] {
+      padding: 7px 10px;
+    }
+
     input:focus,
     textarea:focus {
       border-color: var(--accent);
@@ -568,6 +638,18 @@ def render_index_html(config: DebuggerConfig) -> str:
       gap: 12px;
     }
 
+    .prompt-stack {
+      display: grid;
+      gap: 10px;
+    }
+
+    .image-summary {
+      min-height: 18px;
+      color: var(--muted);
+      font-size: 12px;
+      overflow-wrap: anywhere;
+    }
+
     .debug-log-line {
       display: flex;
       align-items: center;
@@ -890,6 +972,11 @@ def render_index_html(config: DebuggerConfig) -> str:
       background: #fef2f2;
     }
 
+    .timeline-canceled {
+      border-color: #fecaca;
+      background: #fff1f2;
+    }
+
     .pill {
       display: inline-flex;
       align-items: center;
@@ -1315,9 +1402,15 @@ def render_index_html(config: DebuggerConfig) -> str:
       </div>
       <div id="task-history" class="task-history" aria-label="Task history"></div>
       <div class="prompt-row">
-        <label for="prompt">Prompt
-          <textarea id="prompt" spellcheck="false"></textarea>
-        </label>
+        <div class="prompt-stack">
+          <label for="prompt">Prompt
+            <textarea id="prompt" spellcheck="false"></textarea>
+          </label>
+          <label for="image-input">Images
+            <input id="image-input" type="file" accept="image/png,image/jpeg,image/webp,image/gif" multiple>
+          </label>
+          <div id="image-summary" class="image-summary">No images selected.</div>
+        </div>
         <div class="button-row" aria-label="Actions">
           <button id="health-button" type="button">Health</button>
           <button id="stream-button" class="primary" type="button">Stream</button>
@@ -1400,6 +1493,8 @@ def render_index_html(config: DebuggerConfig) -> str:
     };
 
     const byId = (id) => document.getElementById(id);
+    const supportedImageMediaTypes = new Set(["image/png", "image/jpeg", "image/webp", "image/gif"]);
+    const maxImageBytes = 5 * 1024 * 1024;
 
     function createExecutionTree() {
       return {
@@ -1495,6 +1590,78 @@ def render_index_html(config: DebuggerConfig) -> str:
       };
     }
 
+    function selectedImageFiles() {
+      const input = byId("image-input");
+      if (!input || !input.files) {
+        return [];
+      }
+      return Array.from(input.files);
+    }
+
+    function formatBytes(value) {
+      const bytes = Number(value) || 0;
+      if (bytes < 1024) {
+        return `${bytes} B`;
+      }
+      if (bytes < 1024 * 1024) {
+        return `${(bytes / 1024).toFixed(1)} KiB`;
+      }
+      return `${(bytes / (1024 * 1024)).toFixed(1)} MiB`;
+    }
+
+    function updateImageSummary() {
+      const summary = byId("image-summary");
+      if (!summary) {
+        return;
+      }
+      const files = selectedImageFiles();
+      if (!files.length) {
+        summary.textContent = "No images selected.";
+        return;
+      }
+      summary.textContent = files
+        .map((file) => `${file.name || "image"} (${formatBytes(file.size)})`)
+        .join(", ");
+    }
+
+    function readFileAsDataUrl(file) {
+      return new Promise((resolve, reject) => {
+        const reader = new FileReader();
+        reader.addEventListener("load", () => resolve(String(reader.result || "")));
+        reader.addEventListener("error", () => reject(reader.error || new Error("Failed to read image file.")));
+        reader.readAsDataURL(file);
+      });
+    }
+
+    function imageBase64FromDataUrl(dataUrl) {
+      const commaIndex = dataUrl.indexOf(",");
+      if (commaIndex < 0) {
+        throw new Error("Image file did not produce a valid data URL.");
+      }
+      return dataUrl.slice(commaIndex + 1);
+    }
+
+    async function readSelectedImages() {
+      const files = selectedImageFiles();
+      const images = [];
+      for (const file of files) {
+        const mediaType = String(file.type || "").toLowerCase();
+        if (!supportedImageMediaTypes.has(mediaType)) {
+          throw new Error(`${file.name || "Selected image"} uses unsupported image type ${mediaType || "unknown"}.`);
+        }
+        if (file.size > maxImageBytes) {
+          throw new Error(`${file.name || "Selected image"} is larger than 5 MiB.`);
+        }
+        const dataUrl = await readFileAsDataUrl(file);
+        images.push({
+          filename: file.name || "image",
+          mediaType,
+          bytes: imageBase64FromDataUrl(dataUrl)
+        });
+      }
+      return images;
+    }
+
     function appendRawEvent(kind, value) {
       let row = null;
       if (kind === "snapshot") {
@@ -1647,18 +1814,30 @@ def render_index_html(config: DebuggerConfig) -> str:
         const status = statusUpdate.status && typeof statusUpdate.status === "object" ? statusUpdate.status : {};
         return {
           kind: "status_update",
-          taskId: statusUpdate.taskId || statusUpdate.task_id || "",
-          contextId: statusUpdate.contextId || statusUpdate.context_id || "",
+          taskId: (
+            statusUpdate.deliveryTaskId ||
+            statusUpdate.delivery_task_id ||
+            statusUpdate.taskId ||
+            statusUpdate.task_id ||
+            ""
+          ),
+          contextId: (
+            statusUpdate.deliveryContextId ||
+            statusUpdate.delivery_context_id ||
+            statusUpdate.contextId ||
+            statusUpdate.context_id ||
+            ""
+          ),
           state: status.state || ""
         };
       }
       const task = payload.task && typeof payload.task === "object" ? payload.task : payload;
-      if (task.id || task.taskId || task.task_id) {
+      if (task.id || task.taskId || task.task_id || task.deliveryTaskId || task.delivery_task_id) {
         const status = task.status && typeof task.status === "object" ? task.status : {};
         return {
           kind: "task_submitted",
-          taskId: task.id || task.taskId || task.task_id || "",
-          contextId: task.contextId || task.context_id || "",
+          taskId: task.deliveryTaskId || task.delivery_task_id || task.id || task.taskId || task.task_id || "",
+          contextId: task.deliveryContextId || task.delivery_context_id || task.contextId || task.context_id || "",
           state: status.state || ""
         };
       }
@@ -1672,11 +1851,31 @@ def render_index_html(config: DebuggerConfig) -> str:
     }
 
     function recordTaskIdentity(identity, role = "active") {
-      const taskId = String(identity && (identity.taskId || identity.task_id || identity.id) || "");
+      const taskId = String(
+        identity &&
+          (
+            identity.deliveryTaskId ||
+            identity.delivery_task_id ||
+            identity.taskId ||
+            identity.task_id ||
+            identity.id
+          ) ||
+          ""
+      );
       if (!taskId) {
         return null;
       }
-      const contextId = String(identity && (identity.contextId || identity.context_id || state.contextId) || "");
+      const contextId = String(
+        identity &&
+          (
+            identity.deliveryContextId ||
+            identity.delivery_context_id ||
+            identity.contextId ||
+            identity.context_id ||
+            state.contextId
+          ) ||
+          ""
+      );
       const taskState = String(identity && (identity.state || identity.status || "") || "");
       const existing = state.taskHistory.find((item) => item.taskId === taskId);
       const next = {
@@ -1726,6 +1925,14 @@ def render_index_html(config: DebuggerConfig) -> str:
       return stateValue === "TASK_STATE_SUBMITTED" || stateValue === "TASK_STATE_WORKING";
     }
 
+    function isTerminalPipelineTaskState(value) {
+      const stateValue = String(value || "")
+        .toLowerCase()
+        .replace(/^task_state_/, "")
+        .replace(/-/g, "_");
+      return ["canceled", "cancelled", "failed", "denied", "completed"].includes(stateValue);
+    }
+
     function shouldKeepActiveTaskId(identity) {
       return identity && isWorkingA2ATaskState(identity.state);
     }
@@ -1769,14 +1976,12 @@ def render_index_html(config: DebuggerConfig) -> str:
       if (activeTaskInput && state.activeTaskId && activeTaskInput.value.trim() !== state.activeTaskId) {
         activeTaskInput.value = state.activeTaskId;
       }
-      if (activeTaskInput && !state.activeTaskId && state.normalHandoffReady && activeTaskInput.value.trim()) {
-        activeTaskInput.value = "";
-      }
       if (
         activeTaskInput &&
         !state.activeTaskId &&
-        state.normalHandoffReady &&
-        activeTaskInput.value.trim() === state.taskId
+        activeTaskInput.value.trim() &&
+        (state.normalHandoffReady ||
+          (isTerminalPipelineTaskState(state.status) && activeTaskInput.value.trim() === state.taskId))
       ) {
         activeTaskInput.value = "";
       }
@@ -1815,10 +2020,15 @@ def render_index_html(config: DebuggerConfig) -> str:
     }
 
     function streamTaskIdForControls(controls) {
-      if (state.normalHandoffReady && !controls.activeTaskId) {
+      const activeTaskId = controls.activeTaskId || state.activeTaskId;
+      const pipelineTaskId = controls.taskId || state.taskId;
+      if (activeTaskId && !(isTerminalPipelineTaskState(state.status) && activeTaskId === pipelineTaskId)) {
+        return activeTaskId;
+      }
+      if (state.normalHandoffReady || isTerminalPipelineTaskState(state.status)) {
         return "";
       }
-      return controls.activeTaskId || state.activeTaskId || controls.taskId || state.taskId;
+      return pipelineTaskId;
     }
 
     function cancelTaskIdForControls(controls) {
@@ -2598,6 +2808,13 @@ def render_index_html(config: DebuggerConfig) -> str:
       if (type === "input_required") {
         return {label: "input required", text: summarizeValue(data), className: "timeline-permission"};
       }
+      if (type === "pipeline_canceled") {
+        return {
+          label: "pipeline canceled",
+          text: data.reason || summarizeValue(data),
+          className: "timeline-canceled"
+        };
+      }
       if (type.endsWith("_completed") && Object.prototype.hasOwnProperty.call(data, "conclusion")) {
         return {
           label: type.replace(/_/g, " "),
@@ -2848,8 +3065,22 @@ def render_index_html(config: DebuggerConfig) -> str:
       }
 
       state.status = String(envelope.status || envelope.state || envelope.pipelineStatus || state.status || "running");
-      state.taskId = String(envelope.taskId || envelope.task_id || state.taskId || "");
-      state.contextId = String(envelope.contextId || envelope.context_id || state.contextId || "");
+      state.taskId = String(
+        envelope.deliveryTaskId ||
+          envelope.delivery_task_id ||
+          envelope.taskId ||
+          envelope.task_id ||
+          state.taskId ||
+          ""
+      );
+      state.contextId = String(
+        envelope.deliveryContextId ||
+          envelope.delivery_context_id ||
+          envelope.contextId ||
+          envelope.context_id ||
+          state.contextId ||
+          ""
+      );
       if (state.taskId) {
         if (!state.normalHandoffReady && !state.activeTaskId) {
           state.activeTaskId = state.taskId;
@@ -3340,7 +3571,8 @@ def render_index_html(config: DebuggerConfig) -> str:
     }
 
     function snapshotNormalHandoff(snapshot) {
-      return snapshotObject(snapshot && (snapshot.normalHandoff || snapshot.normal_handoff));
+      const envelope = snapshotEnvelope(snapshot);
+      return snapshotObject(envelope && (envelope.normalHandoff || envelope.normal_handoff));
     }
 
     function normalHandoffSummary(snapshot) {
@@ -4021,6 +4253,7 @@ def render_index_html(config: DebuggerConfig) -> str:
         updateRawRequest(requestRow, {status: "ok", response: body});
         appendRawEvent("sse", {type: "cancel", body});
         applyPipelineEvent(body);
+        await fetchStateIfAvailable();
       } catch (error) {
         updateRawRequest(requestRow, {
           status: "error",
@@ -4034,6 +4267,7 @@ def render_index_html(config: DebuggerConfig) -> str:
 
     async function streamMessage() {
       const controls = readControls();
+      const images = await readSelectedImages();
       const payload = {
         serverUrl: controls.serverUrl,
         cwd: controls.cwd,
@@ -4041,6 +4275,9 @@ def render_index_html(config: DebuggerConfig) -> str:
         taskId: streamTaskIdForControls(controls),
         prompt: controls.prompt
       };
+      if (images.length) {
+        payload.images = images;
+      }
       const requestRow = appendRawEvent("request", {method: "POST", path: "/api/message/stream", payload});
       state.streamsInFlight += 1;
       state.status = "streaming";
@@ -4100,6 +4337,9 @@ def render_index_html(config: DebuggerConfig) -> str:
             } catch {
               parsed = raw;
             }
+            if (parsed && typeof parsed === "object" && (parsed.type === "error" || parsed.error)) {
+              state.status = "error";
+            }
             const rawRow = appendRawEvent("sse", parsed);
             if (rawRow) {
               applyPipelineEvent(parsed, rawRow, {alreadyRecorded: true});
@@ -4308,6 +4548,10 @@ def render_index_html(config: DebuggerConfig) -> str:
           element.readOnly = true;
         }
       });
+      const imageInput = byId("image-input");
+      if (imageInput) {
+        imageInput.disabled = true;
+      }
       ["health-button", "stream-button", "fetch-state-button", "cancel-button"].forEach((id) => {
         const button = byId(id);
         if (button) {
@@ -4351,6 +4595,10 @@ def render_index_html(config: DebuggerConfig) -> str:
           element.setAttribute("readonly", "readonly");
         }
       });
+      const imageInput = clone.querySelector("#image-input");
+      if (imageInput) {
+        imageInput.setAttribute("disabled", "disabled");
+      }
       ["health-button", "stream-button", "fetch-state-button", "cancel-button"].forEach((id) => {
         const button = clone.querySelector(`#${cssEscape(id)}`);
         if (button) {
@@ -4435,11 +4683,13 @@ def render_index_html(config: DebuggerConfig) -> str:
     byId("cancel-button").addEventListener("click", (event) => withButtonState(event.currentTarget, cancelTask));
     byId("stream-button").addEventListener("click", (event) => withStreamAction(event.currentTarget, streamMessage));
     byId("export-html-button").addEventListener("click", exportCurrentHtmlSnapshot);
+    byId("image-input").addEventListener("change", updateImageSummary);
 
     if (isExportMode) {
       restoreExportState(exportPayload);
       configureExportMode();
     }
+    updateImageSummary();
     renderPipeline();
     renderRaw();
   </script>
@@ -4595,8 +4845,8 @@ def _message_stream_body(body: dict[str, Any]) -> tuple[str, dict[str, Any]]:
     task_id = str(body.get("taskId", ""))
     if not cwd:
         raise ValueError("cwd is required")
-    if not prompt:
-        raise ValueError("prompt is required")
+    if not prompt and not body.get("images"):
+        raise ValueError("prompt or image is required")
     payload = build_message_stream_payload(
         cwd=cwd,
         prompt=prompt,
@@ -4604,6 +4854,7 @@ def _message_stream_body(body: dict[str, Any]) -> tuple[str, dict[str, Any]]:
         task_id=task_id,
         request_id=str(uuid.uuid4()),
         message_id=str(uuid.uuid4()),
+        images=body.get("images"),
     )
     return server_url, payload
 
@@ -4634,6 +4885,58 @@ def _send_sse_error(handler: BaseHTTPRequestHandler, status: int, message: str)
         raise
 
 
+def _send_sse_event(handler: BaseHTTPRequestHandler, status: int, event: dict[str, Any]) -> None:
+    """Write ``event`` as a complete one-frame SSE response; a client disconnect is ignored."""
+    payload = ("data: " + json.dumps(event, ensure_ascii=False) + "\n\n").encode("utf-8")
+    try:
+        handler.send_response(status)
+        handler.send_header("Content-Type", "text/event-stream; charset=utf-8")
+        handler.send_header("Content-Length", str(len(payload)))
+        handler.end_headers()
+        handler.wfile.write(payload)
+    except OSError as exc:
+        if not _is_client_disconnect_error(exc):
+            raise
+
+
+def _jsonrpc_error_message(value: Any) -> str | None:
+    """Return a display message for a JSON-RPC error payload, or None when it carries no error."""
+    error = value.get("error") if isinstance(value, dict) else None
+    if isinstance(error, str):
+        return error or None
+    if not isinstance(error, dict):
+        return None
+    text = error.get("message")
+    task_id = _recoverable_task_id_from_jsonrpc_error(error)
+    if not isinstance(text, str) or not text:
+        # No usable message: fall back to the serialized error object.
+        return json.dumps(error, ensure_ascii=False)
+    if task_id and not _message_has_resume_guidance(text, task_id):
+        return f"{text} Resume task {task_id}."
+    return text
+
+
+def _message_has_resume_guidance(message: str, task_id: str) -> bool:
+    return f"resume task {task_id}".casefold() in message.casefold()  # case-insensitive "resume task <id>" check
+
+
+def _recoverable_task_id_from_jsonrpc_error(error: dict[str, Any]) -> str | None:
+    """Return the non-empty string ``recoverableTaskId`` carried in ``error["data"]``, if any.
+
+    A dict ``data`` is read directly; a list ``data`` is scanned for the first item
+    whose ``metadata`` dict holds one.
+    """
+    data = error.get("data")
+    if isinstance(data, dict):
+        holders = [data]
+    elif isinstance(data, list):
+        holders = [item.get("metadata") for item in data if isinstance(item, dict)]
+    else:
+        holders = []
+    found = (holder.get("recoverableTaskId") for holder in holders if isinstance(holder, dict))
+    return next((task_id for task_id in found if isinstance(task_id, str) and task_id), None)
+
+
 def create_server(config: DebuggerConfig) -> ThreadingHTTPServer:
     class A2APipelineDebuggerHandler(BaseHTTPRequestHandler):
         def log_message(self, format: str, *args: object) -> None:
@@ -4679,6 +4982,32 @@ def do_POST(self) -> None:
                     server_url, payload = _message_stream_body(body)
                     try:
                         with _open_sse_stream(server_url, payload) as response:
+                            content_type = str(response.headers.get("Content-Type", "")).lower()
+                            if "text/event-stream" not in content_type:
+                                raw = response.read()
+                                data, _text = _decode_json_text(raw)
+                                message = _jsonrpc_error_message(data)
+                                if message:
+                                    event = {
+                                        "type": "error",
+                                        "error": message,
+                                        "statusCode": response.status,
+                                        "body": data,
+                                    }
+                                    append_debug_log(config, "sse", event)
+                                    _send_sse_event(self, 200, event)
+                                    return
+                                append_debug_log(
+                                    config,
+                                    "error",
+                                    {
+                                        "ok": False,
+                                        "error": "Target server returned a non-SSE response",
+                                        "statusCode": response.status,
+                                    },
+                                )
+                                _send_sse_error(self, 502, "Target server returned a non-SSE response")
+                                return
                             self.send_response(response.status)
                             self.send_header("Content-Type", "text/event-stream; charset=utf-8")
                             self.end_headers()
@@ -4738,7 +5067,7 @@ def main(argv: list[str] | None = None) -> None:
         replay_export=load_debug_log_export(args.load_log_dir) if args.load_log_dir else None,
     )
     server = create_server(config)
-    host, port = server.server_address
+    host, port = server.server_address[:2]
     print(f"A2A pipeline debugger listening on http://{host}:{port}", flush=True)
     print(f"A2A pipeline debugger logs: {config.log_dir}", flush=True)
     try:
diff --git a/scripts/a2a/e2e/README.md b/scripts/a2a/e2e/README.md
index 1e158d52..0898ba5d 100644
--- a/scripts/a2a/e2e/README.md
+++ b/scripts/a2a/e2e/README.md
@@ -60,6 +60,11 @@ uv run python scripts/a2a/e2e/run_recovery_scenarios.py \
   --scenario scenario1 \
   --scenario selection-waiting \
   --scenario ask-waiting \
+  --scenario image-initial \
+  --scenario image-ask-waiting \
+  --scenario image-selection-waiting \
+  --scenario image-normal-handoff \
+  --scenario image-interrupt \
   --scenario step1-running \
   --scenario step2-running \
   --scenario step3-running \
@@ -75,12 +80,17 @@ uv run python scripts/a2a/e2e/run_recovery_scenarios.py \
   --scenario rollback-step2 \
   --scenario rollback-step3 \
   --scenario rollback-step4 \
-  --scenario rollback-step5
+  --scenario rollback-step5 \
+  --scenario rollback-step5-cleanup \
+  --scenario rollback-step5-cleanup-recovery
 ```
 
 Provider, tool, and cloud execution scenarios are guarded by default. Use
 `--allow-real-cloud` only when you intentionally want to run against real
 providers and Alibaba Cloud credentials.
+The rollback step5 cleanup scenarios intentionally leave the second stack in
+ROS as proof that cleanup only removed the rollback leftover; delete that stack
+after you finish inspecting the run.
 
 ## What Each Scenario Covers
 
@@ -88,11 +98,16 @@ providers and Alibaba Cloud credentials.
 not a separate runner or a special mode; it lives in the same scenario matrix as
 the rest of the tests.
 
-| Scenario | Where the server is killed | Recovery input | Main assertion |
+| Scenario | Cut point / special condition | Recovery input | Main assertion |
 | --- | --- | --- | --- |
 | `scenario1` | After pipeline completion and one normal-chat follow-up | Ask what the previous normal-chat question was | Normal-chat history survives restart; VSwitch evidence exists. |
 | `selection-waiting` | Step 4 waits for candidate selection | `你随便选一个方案。` without `taskId` | Waiting step4 task is recovered and selected; VSwitch evidence exists. |
 | `ask-waiting` | `ask_user_question` waits for user input | Clarification answers without `taskId` | Pending ask input is recovered and pipeline completes; VSwitch evidence exists. |
+| `image-initial` | Initial user message is the static `initial.png` image fixture | Candidate selection text | The image starts the pipeline, reaches step4 selection, completes, and produces VSwitch evidence. |
+| `image-ask-waiting` | `ask_user_question` waits for user input, then the server restarts | Static `ask-first-answer.png` / `ask-second-answer.png` image fixtures without `taskId` | Pending ask input is recovered, image answers hydrate the recovered task, and the pipeline completes with VSwitch evidence. |
+| `image-selection-waiting` | Step 4 waits for candidate selection, then the server restarts | Static `selection.png` image fixture without `taskId` | Waiting step4 task is recovered, the image selection is accepted, and VSwitch evidence exists. |
+| `image-normal-handoff` | Pipeline completes and hands off to normal chat; the normal follow-up is static `normal-followup.png`, then the server restarts | Normal-chat recovery question without `taskId` | Image follow-up stays in the same `contextId`, uses a new normal-chat task, and completed handoff state survives restart. |
+| `image-interrupt` | Step 3 receives static `rollback-interrupt.png` as an image rollback to `intent_parsing`, then the server restarts | `继续`, plus selection when needed | The image interrupt is recognized, the pipeline completes as a security-group task, and final deployment evidence is not VSwitch. |
 | `step1-running` | `intent_parsing` running | `继续` | Running pipeline task is recovered and completes; VSwitch evidence exists. |
 | `step2-running` | `architecture_planning` running | `继续` | Running pipeline task is recovered and completes; VSwitch evidence exists. |
 | `step3-running` | `evaluate_candidates` candidate/sub-pipeline running | `继续` | Sub-pipeline state is recovered and completes; VSwitch evidence exists. |
@@ -101,6 +116,8 @@ the rest of the tests.
 | `normal-running` | Normal-chat response streaming after pipeline handoff | `继续`, then history check | Normal-chat task recovery keeps same `contextId` history. |
 | `cancel-step1` ... `cancel-step5` | Active pipeline task is canceled at the named step | Normal-chat follow-up after cancel, then restart and history check | Canceled snapshot stays canceled; normal-chat history survives restart. |
 | `rollback-step1` ... `rollback-step5` | Step 3 receives rollback to `intent_parsing`, then the named post-rollback step is killed | `继续`, plus selection when needed | Post-rollback pipeline completes as a security-group task, not VSwitch. |
+| `rollback-step5-cleanup` | First step5 stack is observed, then a rollback is triggered; the second step5 run creates a new stack and hands off to normal chat | A normal-chat follow-up triggers cleanup | The first stack (the rollback leftover) is marked complete in the cleanup snapshot and is deleted in ROS; the second stack remains. |
+| `rollback-step5-cleanup-recovery` | Same as `rollback-step5-cleanup`, then the server is killed after cleanup starts | `继续` in normal chat after restart | Cleanup is triggered again after restart; first stack is deleted and second stack remains. |
 | `fault-after-snapshot` | Deterministic crash after A2A pipeline snapshot persistence | `继续`, plus selection when needed | `GetTask` / `ListTasks` expose the recovered task and the pipeline completes. |
 
 ## Representative Inputs
@@ -136,6 +153,12 @@ Rollback scenarios interrupt step 3 with:
 回退到 intent_parsing，选择一个已有vpc，创建一个安全组
 ```
 
+Image scenarios send a short image-reading text prompt plus static PNG fixtures from
+`scripts/a2a/e2e/fixtures/text-images/`. The fixture manifest pins the text,
+file name, media type, byte size, and SHA-256 hash. A scenario run also writes
+`image-fixtures/manifest.json`; fixed prompts should show `source: static`.
+Only ad-hoc or CLI-overridden text falls back to runtime image rendering.
+
 ## Recommended Order
 
 When stabilizing changes, run the smaller or more diagnostic cases first:
@@ -144,10 +167,13 @@ When stabilizing changes, run the smaller or more diagnostic cases first:
 2. `scenario1`
 3. `selection-waiting`
 4. `ask-waiting`
-5. `step1-running` through `step5-running`
-6. `normal-running`
-7. `cancel-step1` through `cancel-step5`
-8. `rollback-step1` through `rollback-step5`
+5. `image-initial`, `image-ask-waiting`, and `image-selection-waiting`
+6. `image-normal-handoff` and `image-interrupt`
+7. `step1-running` through `step5-running`
+8. `normal-running`
+9. `cancel-step1` through `cancel-step5`
+10. `rollback-step1` through `rollback-step5`
+11. `rollback-step5-cleanup`, then `rollback-step5-cleanup-recovery`
 
 ## Preflight
 
@@ -224,6 +250,7 @@ Important files:
 - `*.task-get.json` and `*.task-list.json`: redacted `GetTask` / `ListTasks` artifacts when captured by the scenario.
 - `server-1.*.log` and `server-2.*.log`: server logs before and after restart.
 - `a2a-server.yml`: generated server config.
+- `image-fixtures/manifest.json`: image input fixture usage for image scenarios, including whether each image came from a static repository fixture or runtime rendering.
 - `workspace/`: default A2A metadata cwd and generated tool outputs unless `--cwd` is provided.
 - `preflight.json`: provider preflight result unless `--skip-preflight` is used.
 
diff --git a/scripts/a2a/e2e/README.zh-CN.md b/scripts/a2a/e2e/README.zh-CN.md
index 76aa4727..0fa7c431 100644
--- a/scripts/a2a/e2e/README.zh-CN.md
+++ b/scripts/a2a/e2e/README.zh-CN.md
@@ -56,6 +56,11 @@ uv run python scripts/a2a/e2e/run_recovery_scenarios.py \
   --scenario scenario1 \
   --scenario selection-waiting \
   --scenario ask-waiting \
+  --scenario image-initial \
+  --scenario image-ask-waiting \
+  --scenario image-selection-waiting \
+  --scenario image-normal-handoff \
+  --scenario image-interrupt \
   --scenario step1-running \
   --scenario step2-running \
   --scenario step3-running \
@@ -71,22 +76,31 @@ uv run python scripts/a2a/e2e/run_recovery_scenarios.py \
   --scenario rollback-step2 \
   --scenario rollback-step3 \
   --scenario rollback-step4 \
-  --scenario rollback-step5
+  --scenario rollback-step5 \
+  --scenario rollback-step5-cleanup \
+  --scenario rollback-step5-cleanup-recovery
 ```
 
 provider、tool、真实云调用场景默认会被保护住。只有确认要使用真实 provider 和阿里云凭证
 时，才加 `--allow-real-cloud`。
+`rollback-step5-cleanup` 和 `rollback-step5-cleanup-recovery` 这两个场景会故意保留第 2 个 stack，作为“只清理回滚
+残留”的验收证据；检查完 run 产物后请再手工或通过后续流程删除它。
 
 ## 每个场景覆盖什么
 
 `scenario1` 是历史遗留名称，表示“pipeline 完成后恢复 normal chat”的基线场景。它不是
 单独 runner，也不是特殊模式，而是完整场景矩阵中的一个场景。
 
-| 场景 | kill server 的位置 | 恢复时输入 | 主要验收 |
+| 场景 | 切点 / 特殊条件 | 恢复时输入 | 主要验收 |
 | --- | --- | --- | --- |
 | `scenario1` | pipeline 完成并完成一轮 normal-chat follow-up 后 | 询问上一条 normal-chat 问题是什么 | normal-chat 历史重启后仍可用；存在 VSwitch 证据。 |
 | `selection-waiting` | step4 等待候选方案选择时 | 不带 `taskId` 发送 `你随便选一个方案。` | 能恢复等待中的 step4 task 并完成选择；存在 VSwitch 证据。 |
 | `ask-waiting` | `ask_user_question` 等待用户输入时 | 不带 `taskId` 发送澄清回答 | 能恢复 pending ask 输入并完成 pipeline；存在 VSwitch 证据。 |
+| `image-initial` | 首轮用户消息就是静态 `initial.png` 图片 fixture | 文本选择候选方案 | 图片能启动 pipeline，进入 step4 选择，最终完成并产生 VSwitch 证据。 |
+| `image-ask-waiting` | `ask_user_question` 等待用户输入，随后重启 server | 不带 `taskId` 发送静态 `ask-first-answer.png` / `ask-second-answer.png` 图片 fixture | pending ask 输入能恢复，图片回答能 hydrate 到恢复后的 task，最终完成并产生 VSwitch 证据。 |
+| `image-selection-waiting` | step4 等待候选方案选择，随后重启 server | 不带 `taskId` 发送静态 `selection.png` 图片 fixture | 能恢复等待中的 step4 task，图片选择被接受，并产生 VSwitch 证据。 |
+| `image-normal-handoff` | pipeline 完成并 handoff 到 normal chat；normal follow-up 是静态 `normal-followup.png`，随后重启 server | 不带 `taskId` 发送 normal-chat 恢复问题 | 图片 follow-up 保持同一个 `contextId`，使用新的 normal-chat task；completed handoff 状态重启后仍可恢复。 |
+| `image-interrupt` | step3 收到静态 `rollback-interrupt.png` 图片，表示回滚到 `intent_parsing`，随后重启 server | `继续`，必要时再选择方案 | 图片 interrupt 能被识别；pipeline 以安全组任务完成，最终部署证据不是 VSwitch。 |
 | `step1-running` | `intent_parsing` 运行中 | `继续` | running pipeline task 能恢复并完成；存在 VSwitch 证据。 |
 | `step2-running` | `architecture_planning` 运行中 | `继续` | running pipeline task 能恢复并完成；存在 VSwitch 证据。 |
 | `step3-running` | `evaluate_candidates` 的 candidate/sub-pipeline 运行中 | `继续` | sub-pipeline 状态能恢复并完成；存在 VSwitch 证据。 |
@@ -95,6 +109,8 @@ provider、tool、真实云调用场景默认会被保护住。只有确认要
 | `normal-running` | pipeline handoff 后的 normal-chat 响应流式输出中 | `继续`，随后检查历史 | normal-chat task 恢复后仍保持同一个 `contextId` 历史。 |
 | `cancel-step1` ... `cancel-step5` | 在指定 step cancel 活跃 pipeline task | cancel 后 normal-chat follow-up，重启后检查历史 | canceled snapshot 保持 canceled；normal-chat 历史重启后仍可用。 |
 | `rollback-step1` ... `rollback-step5` | step3 收到回滚到 `intent_parsing`，随后在回滚后的指定 step kill | `继续`，必要时再选择方案 | 回滚后的 pipeline 以安全组任务完成，不再是 VSwitch。 |
+| `rollback-step5-cleanup` | 第一次 step5 stack 已被观测后触发回滚，随后第二次 step5 创建新 stack 并进入 normal chat | normal-chat follow-up 触发 cleanup | 第 1 个回滚残留 stack 在 cleanup snapshot 中完成，且 ROS 中已删除；第 2 个 stack 仍保留。 |
+| `rollback-step5-cleanup-recovery` | 基于 `rollback-step5-cleanup`，在第 1 个 stack cleanup 开始后 kill server | 重启后在 normal chat 发送 `继续` | 恢复后重新触发 cleanup；第 1 个 stack 被删除，第 2 个 stack 仍保留。 |
 | `fault-after-snapshot` | A2A pipeline snapshot 持久化后确定性 crash | `继续`，必要时再选择方案 | `GetTask` / `ListTasks` 能看到恢复 task，pipeline 能完成。 |
 
 ## 代表输入
@@ -129,6 +145,12 @@ rollback 场景会在 step3 发送：
 回退到 intent_parsing，选择一个已有vpc，创建一个安全组
 ```
 
+图片场景会发送一个很短的读图提示词，并附带
+`scripts/a2a/e2e/fixtures/text-images/` 下的静态 PNG fixture。fixture manifest 会固化
+文本、文件名、媒体类型、字节数和 SHA-256。每次场景运行还会写
+`image-fixtures/manifest.json`；固定 prompt 应显示 `source: static`。只有临时输入或通过
+CLI 覆盖后的文本，才会回退到运行时渲染图片。
+
 ## 推荐执行顺序
 
 稳定或回归时，建议从更小、更容易定位问题的场景开始：
@@ -137,10 +159,13 @@ rollback 场景会在 step3 发送：
 2. `scenario1`
 3. `selection-waiting`
 4. `ask-waiting`
-5. `step1-running` 到 `step5-running`
-6. `normal-running`
-7. `cancel-step1` 到 `cancel-step5`
-8. `rollback-step1` 到 `rollback-step5`
+5. `image-initial`、`image-ask-waiting` 和 `image-selection-waiting`
+6. `image-normal-handoff` 和 `image-interrupt`
+7. `step1-running` 到 `step5-running`
+8. `normal-running`
+9. `cancel-step1` 到 `cancel-step5`
+10. `rollback-step1` 到 `rollback-step5`
+11. `rollback-step5-cleanup`，再跑 `rollback-step5-cleanup-recovery`
 
 ## Preflight
 
@@ -215,6 +240,7 @@ uv run python scripts/a2a/e2e/run_recovery_scenarios.py \
 - `*.task-get.json` 和 `*.task-list.json`：场景捕获到的、经过脱敏的 `GetTask` / `ListTasks` artifact。
 - `server-1.*.log` 和 `server-2.*.log`：重启前后的 server 日志。
 - `a2a-server.yml`：生成的 server 配置。
+- `image-fixtures/manifest.json`：图片场景的图片输入 fixture 使用情况，包括每张图来自仓库静态 fixture 还是运行时渲染。
 - `workspace/`：默认 A2A metadata cwd；除非指定 `--cwd`，工具输出和生成模板会写到这里。
 - `preflight.json`：provider preflight 结果；使用 `--skip-preflight` 时不会生成。
 
diff --git a/scripts/a2a/e2e/common.py b/scripts/a2a/e2e/common.py
index f881daf9..5438e06b 100644
--- a/scripts/a2a/e2e/common.py
+++ b/scripts/a2a/e2e/common.py
@@ -172,6 +172,7 @@ def stream_message(
     timeout: float,
     context_id: str = "",
     task_id: str = "",
+    images: list[dict[str, Any]] | None = None,
     redaction_env: dict[str, str] | None = None,
 ) -> StreamSummary:
     payload = build_message_stream_payload(
@@ -181,6 +182,7 @@ def stream_message(
         task_id=task_id,
         request_id=str(uuid.uuid4()),
         message_id=str(uuid.uuid4()),
+        images=images,
     )
     _append_jsonl(run_dir / "requests.jsonl", {"name": name, "payload": payload, "at": _utc_now()}, redaction_env)
     request = Request(
@@ -253,14 +255,16 @@ def run_llm_preflight(
         }
     except subprocess.TimeoutExpired as exc:
         elapsed = time.monotonic() - started
-        output = _redact_sensitive_text("\n".join(part for part in [exc.stdout, exc.stderr] if part), preflight_env)
+        stdout = _subprocess_output_text(exc.stdout)
+        stderr = _subprocess_output_text(exc.stderr)
+        output = _redact_sensitive_text("\n".join(part for part in [stdout, stderr] if part), preflight_env)
         payload = {
             "ok": False,
             "returnCode": None,
             "elapsedSeconds": round(elapsed, 3),
             "summary": f"timed out after {timeout:.0f}s" + (f": {_compact_text(output)}" if output else ""),
-            "stdout": _redact_sensitive_text(exc.stdout or "", preflight_env),
-            "stderr": _redact_sensitive_text(exc.stderr or "", preflight_env),
+            "stdout": _redact_sensitive_text(stdout, preflight_env),
+            "stderr": _redact_sensitive_text(stderr, preflight_env),
         }
     _write_json(run_dir / "preflight.json", payload)
     return payload
@@ -452,6 +456,14 @@ def _split_python_command(value: str) -> list[str]:
     return parts
 
 
+def _subprocess_output_text(value: str | bytes | None) -> str:
+    """Return captured subprocess output as text: ``None`` -> ``""``, bytes decoded as UTF-8."""
+    if isinstance(value, bytes):
+        # errors="replace" keeps undecodable bytes from raising.
+        return value.decode("utf-8", errors="replace")
+    return "" if value is None else value
+
+
 def _redact_sensitive_text(text: str, env: dict[str, str] | None) -> str:
     redacted = text
     for name, value in (env or {}).items():
diff --git a/scripts/a2a/e2e/fixtures/text-images/ask-first-answer.png b/scripts/a2a/e2e/fixtures/text-images/ask-first-answer.png
new file mode 100644
index 00000000..92c5a9e1
Binary files /dev/null and b/scripts/a2a/e2e/fixtures/text-images/ask-first-answer.png differ
diff --git a/scripts/a2a/e2e/fixtures/text-images/ask-second-answer.png b/scripts/a2a/e2e/fixtures/text-images/ask-second-answer.png
new file mode 100644
index 00000000..c776f80e
Binary files /dev/null and b/scripts/a2a/e2e/fixtures/text-images/ask-second-answer.png differ
diff --git a/scripts/a2a/e2e/fixtures/text-images/initial.png b/scripts/a2a/e2e/fixtures/text-images/initial.png
new file mode 100644
index 00000000..a4fae552
Binary files /dev/null and b/scripts/a2a/e2e/fixtures/text-images/initial.png differ
diff --git a/scripts/a2a/e2e/fixtures/text-images/manifest.json b/scripts/a2a/e2e/fixtures/text-images/manifest.json
new file mode 100644
index 00000000..d8586e39
--- /dev/null
+++ b/scripts/a2a/e2e/fixtures/text-images/manifest.json
@@ -0,0 +1,44 @@
+{
+  "initial": {
+    "filename": "initial.png",
+    "text": "选择一个已有vpc，创建一个vswitch",
+    "mediaType": "image/png",
+    "byteSize": 12697,
+    "sha256": "2f773773c5b528cb7fdafde969d464b19d4d3022c1e6f2ad85b162f98f7ff82e"
+  },
+  "selection": {
+    "filename": "selection.png",
+    "text": "你随便选一个方案。",
+    "mediaType": "image/png",
+    "byteSize": 9907,
+    "sha256": "3aa92a48eed5c37115f18dc89a058ebbb06ac5eeea59f2870d4d58b355ac924b"
+  },
+  "normal-followup": {
+    "filename": "normal-followup.png",
+    "text": "你刚才创建了什么",
+    "mediaType": "image/png",
+    "byteSize": 8684,
+    "sha256": "03a9b1006f840c0bb8ef4f2bd75819033489f4e4f14d92abd7e12b591dd9c26d"
+  },
+  "ask-first-answer": {
+    "filename": "ask-first-answer.png",
+    "text": "我要创建云网络资源；本次只选择已有 VPC 创建一个 VSwitch，不部署 ECS、EIP、SLB 或 Nginx。",
+    "mediaType": "image/png",
+    "byteSize": 35073,
+    "sha256": "499fd5648baafe7d9904259a1eb3408b65556a39a778b2a2a89b89058bcd61b0"
+  },
+  "ask-second-answer": {
+    "filename": "ask-second-answer.png",
+    "text": "选择一个已有 VPC，创建一个 VSwitch；地域、可用区和网段你按低成本默认值推荐。",
+    "mediaType": "image/png",
+    "byteSize": 32302,
+    "sha256": "0fdb1c4d4fce2038f9e5a4107ba8a7e96658a3ca2c705c834c4c93ca23b93dc5"
+  },
+  "rollback-interrupt": {
+    "filename": "rollback-interrupt.png",
+    "text": "回退到 intent_parsing，选择一个已有vpc，创建一个安全组",
+    "mediaType": "image/png",
+    "byteSize": 20967,
+    "sha256": "1dfa25bba58757704b27a7ee8f44a42f4e69045730bba5320986194c873a5937"
+  }
+}
diff --git a/scripts/a2a/e2e/fixtures/text-images/normal-followup.png b/scripts/a2a/e2e/fixtures/text-images/normal-followup.png
new file mode 100644
index 00000000..2f9864a7
Binary files /dev/null and b/scripts/a2a/e2e/fixtures/text-images/normal-followup.png differ
diff --git a/scripts/a2a/e2e/fixtures/text-images/rollback-interrupt.png b/scripts/a2a/e2e/fixtures/text-images/rollback-interrupt.png
new file mode 100644
index 00000000..50512a84
Binary files /dev/null and b/scripts/a2a/e2e/fixtures/text-images/rollback-interrupt.png differ
diff --git a/scripts/a2a/e2e/fixtures/text-images/selection.png b/scripts/a2a/e2e/fixtures/text-images/selection.png
new file mode 100644
index 00000000..cf8f0407
Binary files /dev/null and b/scripts/a2a/e2e/fixtures/text-images/selection.png differ
diff --git a/scripts/a2a/e2e/run_recovery_scenarios.py b/scripts/a2a/e2e/run_recovery_scenarios.py
index 52bea6b6..82c782d3 100644
--- a/scripts/a2a/e2e/run_recovery_scenarios.py
+++ b/scripts/a2a/e2e/run_recovery_scenarios.py
@@ -11,6 +11,9 @@
 from __future__ import annotations
 
 import argparse
+import base64
+import hashlib
+import io
 import json
 import os
 import signal
@@ -26,6 +29,9 @@
 from urllib.error import HTTPError, URLError
 from urllib.request import Request, urlopen
 
+import yaml
+from PIL import Image, ImageDraw, ImageFont
+
 E2E_SCRIPTS_DIR = Path(__file__).resolve().parent
 A2A_SCRIPTS_DIR = E2E_SCRIPTS_DIR.parent
 for scripts_dir in (E2E_SCRIPTS_DIR, A2A_SCRIPTS_DIR):
@@ -76,10 +82,35 @@
 INTERVENING_ASK_ANSWER = "使用默认配置（可用区和网段自动规划），继续。"
 ROLLBACK_PROMPT = "回退到 intent_parsing，选择一个已有vpc，创建一个安全组"
 CONTINUE_PROMPT = "继续"
+CLEANUP_RECOVERY_PROMPT = (  # "Reply only 'OK, continue'; call no tools, query or delete nothing."
+    "请只回复“OK，继续”。不要调用任何工具，不要查询任何云资源，不要删除任何资源。"
+    "如果系统有后台 cleanup 恢复流程，请让它自行完成。"  # "Let any background cleanup recovery finish by itself."
+)
+CLEANUP_PROMPT_METADATA_TYPE = "pipeline_cleanup_prompt"
+CLEANUP_EVENT_TYPES = frozenset(
+    {
+        "cleanup_started",
+        "cleanup_progress",
+        "cleanup_completed",
+        "cleanup_failed",
+    }
+)
+CLEANUP_ACTIVE_STATUSES = frozenset({"pending", "started", "in_progress", "failed"})  # NOTE(review): confirm "failed" is meant to count as active
+IMAGE_TEXT_PROMPT = "请读取图片中的文字，并将图片中的文字作为本轮用户输入执行。"  # "Read the text in the image and execute it as this turn's user input."
+STATIC_TEXT_IMAGE_FIXTURE_ROOT = E2E_SCRIPTS_DIR / "fixtures" / "text-images"  # static PNG fixtures and their manifest.json
+STATIC_TEXT_IMAGE_FIXTURES = {  # fixture key -> prompt constant; presumably mirrors the manifest "text" fields - verify
+    "initial": DEFAULT_INITIAL_PROMPT,
+    "selection": DEFAULT_SELECTION_PROMPT,
+    "normal-followup": DEFAULT_NORMAL_FOLLOWUP_PROMPT,
+    "ask-first-answer": ASK_FIRST_ANSWER,
+    "ask-second-answer": ASK_SECOND_ANSWER,
+    "rollback-interrupt": ROLLBACK_PROMPT,
+}
 
 VSWITCH_MARKERS = ("ALIYUN::ECS::VSwitch", "VSwitchId", "vsw-", "VSwitch", "交换机")
 SECURITY_GROUP_MARKERS = ("ALIYUN::ECS::SecurityGroup", "SecurityGroupId", "sg-", "安全组")
 TERMINAL_STATES = {"TASK_STATE_COMPLETED", "TASK_STATE_FAILED", "TASK_STATE_CANCELED", "TASK_STATE_INPUT_REQUIRED"}
+ROS_STACK_DELETED_STATUSES = {"DELETE_COMPLETE"}
 
 
 @dataclass
@@ -102,6 +133,127 @@ class EventMatch:
     summary: StreamSummary
 
 
+class TextImageFixtureStore:
+    """Provide PNG image parts for text prompts and log each use in ``<root>/manifest.json``."""
+
+    def __init__(self, root: Path, static_root: Path = STATIC_TEXT_IMAGE_FIXTURE_ROOT) -> None:
+        self.root = root
+        self.root.mkdir(parents=True, exist_ok=True)
+        self.manifest_path = self.root / "manifest.json"
+        self.static_root = static_root
+
+    def part(self, key: str, text: str) -> dict[str, Any]:
+        """Return the base64 image part for *text*: the static fixture if it matches, else a fresh render."""
+        safe_key = _safe_fixture_key(key)
+        path = self._static_fixture_path(safe_key, text)
+        source = "static" if path is not None else "generated"
+        if path is None:
+            # Always re-render: a PNG left under this key by an earlier call may show different text.
+            path = self.root / f"{safe_key}.png"
+            path.write_bytes(_render_text_png(text))
+        raw = path.read_bytes()
+        self._record_manifest(safe_key, text=text, path=path, byte_size=len(raw), source=source)
+        return {
+            "filename": path.name,
+            "mediaType": "image/png",
+            "bytes": base64.b64encode(raw).decode("ascii"),
+        }
+
+    def _static_fixture_path(self, key: str, text: str) -> Path | None:
+        """Return the static fixture PNG whose manifest entry matches *key* and *text*, or ``None``."""
+        try:
+            manifest = json.loads((self.static_root / "manifest.json").read_text(encoding="utf-8"))
+        except (OSError, ValueError):  # ValueError covers JSONDecodeError and UnicodeDecodeError
+            return None
+        entry = manifest.get(key) if isinstance(manifest, dict) else None
+        # A fixture is only usable for the exact text recorded next to it.
+        if not isinstance(entry, dict) or entry.get("text") != text or entry.get("mediaType") != "image/png":
+            return None
+        filename = entry.get("filename")
+        path = self.static_root / filename if isinstance(filename, str) and filename else None
+        return path if path is not None and path.is_file() else None
+
+    def _record_manifest(self, key: str, *, text: str, path: Path, byte_size: int, source: str) -> None:
+        """Upsert the usage entry for *key* in the run manifest; an unreadable manifest is started afresh."""
+        try:
+            manifest = json.loads(self.manifest_path.read_text(encoding="utf-8"))
+        except (OSError, ValueError):  # missing file, invalid UTF-8, or malformed JSON
+            manifest = None
+        entries = manifest if isinstance(manifest, dict) else {}
+        entries[key] = {
+            "text": text,
+            "path": str(path),
+            "mediaType": "image/png",
+            "byteSize": byte_size,
+            "sha256": hashlib.sha256(path.read_bytes()).hexdigest(),
+            "source": source,
+        }
+        _write_json(self.manifest_path, entries)
+
+
+def _safe_fixture_key(value: str) -> str:
+    """Slugify *value*: lower-case, chars outside alnum/-/_ become ``-``, edge dashes trimmed; empty -> ``input``."""
+    return "".join(c if c.isalnum() or c in "-_" else "-" for c in value.strip().lower()).strip("-") or "input"
+
+
+def _render_text_png(text: str) -> bytes:  # Render *text* as dark text on a white RGB canvas; returns PNG bytes.
+    font = _load_text_image_font(size=34)
+    lines = _wrap_text_for_image(text)
+    padding = 40
+    line_spacing = 12
+    probe = Image.new("RGB", (1, 1), "white")  # 1x1 scratch canvas, used only to measure the text
+    draw = ImageDraw.Draw(probe)
+    boxes = [draw.textbbox((0, 0), line, font=font) for line in lines]
+    text_width = int(max((right - left for left, _top, right, _bottom in boxes), default=360))
+    line_heights = [int(bottom - top) for _left, top, _right, bottom in boxes] or [40]
+    width = int(max(760, min(1600, text_width + padding * 2)))  # clamped to 760..1600 px
+    height = int(max(220, sum(line_heights) + line_spacing * max(0, len(lines) - 1) + padding * 2))  # >= 220 px
+    image = Image.new("RGB", (width, height), "white")
+    draw = ImageDraw.Draw(image)  # rebinds draw to the real canvas
+    y = padding
+    for line, line_height in zip(lines, line_heights, strict=False):
+        draw.text((padding, y), line, fill=(16, 24, 39), font=font)
+        y += line_height + line_spacing  # advance by the measured line height plus spacing
+    output = io.BytesIO()
+    image.save(output, format="PNG")
+    return output.getvalue()
+
+
+def _wrap_text_for_image(text: str, *, max_chars: int = 26) -> list[str]:
+    """Hard-wrap *text* into stripped lines of at most *max_chars* characters.
+
+    Blank input lines are kept as ``""``. Raises ``ValueError`` when *max_chars* is below 1.
+    """
+    if max_chars < 1:
+        # A non-positive width would never consume the line; fail fast instead of looping forever.
+        raise ValueError(f"max_chars must be >= 1, got {max_chars}")
+    wrapped: list[str] = []
+    for raw_line in text.splitlines() or [text]:
+        line = raw_line.strip()
+        wrapped.extend([line[start : start + max_chars] for start in range(0, len(line), max_chars)] or [""])
+    return wrapped
+
+
+def _load_text_image_font(*, size: int) -> Any:
+    """Return the first loadable font from a fixed macOS/Linux path list, else Pillow's default font."""
+    for candidate in (
+        "/System/Library/Fonts/PingFang.ttc",
+        "/System/Library/Fonts/Hiragino Sans GB.ttc",
+        "/System/Library/Fonts/STHeiti Light.ttc",
+        "/Library/Fonts/Arial Unicode.ttf",
+        "/usr/share/fonts/opentype/noto/NotoSansCJK-Regular.ttc",
+        "/usr/share/fonts/truetype/noto/NotoSansCJK-Regular.ttc",
+        "/usr/share/fonts/truetype/wqy/wqy-microhei.ttc",
+        "/usr/share/fonts/truetype/dejavu/DejaVuSans.ttf",
+    ):
+        if Path(candidate).is_file():
+            try:
+                return ImageFont.truetype(candidate, size=size)
+            except OSError:
+                continue
+    return ImageFont.load_default()
+
+
 class BackgroundStream:
     def __init__(
         self,
@@ -114,6 +266,7 @@ def __init__(
         timeout: float,
         context_id: str = "",
         task_id: str = "",
+        images: list[dict[str, Any]] | None = None,
         redaction_env: dict[str, str] | None = None,
     ) -> None:
         self.server_url = server_url
@@ -124,6 +277,7 @@ def __init__(
         self.timeout = timeout
         self.context_id = context_id
         self.task_id = task_id
+        self.images = images
         self.redaction_env = redaction_env
         self.summary = StreamSummary(name=name, prompt=prompt, request_task_id=task_id)
         self.events: list[Any] = []
@@ -182,6 +336,7 @@ def _run(self) -> None:
             task_id=self.task_id,
             request_id=str(uuid.uuid4()),
             message_id=str(uuid.uuid4()),
+            images=self.images,
         )
         _append_jsonl(
             self.run_dir / "requests.jsonl",
@@ -230,6 +385,7 @@ def __init__(self, args: argparse.Namespace, *, scenario: str) -> None:
         self.server_cwd = str(Path(args.server_cwd).expanduser().resolve())
         self.run_dir = _scenario_run_dir(args, scenario)
         self.run_dir.mkdir(parents=True, exist_ok=True)
+        self.image_fixtures = TextImageFixtureStore(self.run_dir / "image-fixtures")
         self.workspace_dir = Path(args.cwd).expanduser().resolve() if args.cwd else self.run_dir / "workspace"
         self.workspace_dir.mkdir(parents=True, exist_ok=True)
         self.cwd = str(self.workspace_dir)
@@ -314,6 +470,7 @@ def stream(
         name: str,
         context_id: str | None = None,
         task_id: str | None = None,
+        images: list[dict[str, Any]] | None = None,
     ) -> StreamSummary:
         summary = stream_message(
             server_url=self.server_url,
@@ -324,12 +481,31 @@ def stream(
             name=name,
             run_dir=self.run_dir,
             timeout=self.args.stream_timeout,
+            images=images,
             redaction_env=self.server_env,
         )
         self._remember_identity(summary)
         self.summaries[name] = summary
         return summary
 
+    def stream_image_text(
+        self,
+        *,
+        text: str,
+        image_key: str,
+        name: str,
+        context_id: str | None = None,
+        task_id: str | None = None,
+        prompt: str = IMAGE_TEXT_PROMPT,
+    ) -> StreamSummary:
+        """Send *prompt* with *text* attached as an image part and return the stream summary.
+
+        The image part comes from ``self.image_fixtures.part(image_key, text)``.
+        """
+        # Resolve the image part first; everything else is forwarded to ``stream`` unchanged.
+        image_part = self.image_fixtures.part(image_key, text)
+        return self.stream(prompt=prompt, name=name, context_id=context_id, task_id=task_id, images=[image_part])
+
     def start_stream(
         self,
         *,
@@ -337,6 +513,7 @@ def start_stream(
         name: str,
         context_id: str | None = None,
         task_id: str | None = None,
+        images: list[dict[str, Any]] | None = None,
     ) -> BackgroundStream:
         stream = BackgroundStream(
             server_url=self.server_url,
@@ -347,6 +524,7 @@ def start_stream(
             name=name,
             run_dir=self.run_dir,
             timeout=self.args.stream_timeout,
+            images=images,
             redaction_env=self.server_env,
         )
         stream.start()
@@ -359,6 +537,24 @@ def start_stream(
         self.summaries[name] = stream.summary
         return stream
 
+    def start_stream_image_text(
+        self,
+        *,
+        text: str,
+        image_key: str,
+        name: str,
+        context_id: str | None = None,
+        task_id: str | None = None,
+        prompt: str = IMAGE_TEXT_PROMPT,
+    ) -> BackgroundStream:
+        """Start a background stream that sends *prompt* with *text* attached as an image part.
+
+        The image part comes from ``self.image_fixtures.part(image_key, text)``.
+        """
+        # Resolve the image part first; everything else is forwarded to ``start_stream`` unchanged.
+        image_part = self.image_fixtures.part(image_key, text)
+        return self.start_stream(prompt=prompt, name=name, context_id=context_id, task_id=task_id, images=[image_part])
+
     def fetch_state(self, name: str) -> Any:
         snapshot = fetch_pipeline_state(
             server_url=self.server_url,
@@ -573,6 +769,9 @@ def callback(h: ScenarioHarness) -> None:
             context_id=h.context_id,
             task_id=h.pipeline_task_id,
         )
+        h.checks["after-pipeline state has no cleanup activity"] = not _snapshot_has_cleanup_activity(
+            h.snapshots["after_pipeline"]
+        )
         normal = h.stream(prompt=args.normal_followup_prompt, name="03-normal-followup", task_id="")
         h.checks["normal follow-up stayed in same context"] = normal.context_id == h.context_id
         h.checks["normal follow-up used a new task"] = bool(normal.task_id) and normal.task_id != h.pipeline_task_id
@@ -587,6 +786,9 @@ def callback(h: ScenarioHarness) -> None:
             context_id=h.context_id,
             task_id=h.pipeline_task_id,
         )
+        h.checks["after-restart state has no cleanup activity"] = not _snapshot_has_cleanup_activity(
+            h.snapshots["after_restart"]
+        )
         recovery = h.stream(prompt=args.recovery_prompt, name="04-recovery-question", task_id="")
         h.checks["recovery stayed in same context"] = recovery.context_id == h.context_id
         h.checks["recovery used a new task"] = bool(recovery.task_id) and recovery.task_id not in {
@@ -596,6 +798,9 @@ def callback(h: ScenarioHarness) -> None:
         h.checks["recovery finished turn"] = _normal_turn_finished(recovery)
         h.checks["recovery answer mentions previous question"] = args.expected_text in recovery.text
         h.checks["VSwitch evidence found"] = _has_any_marker(_all_evidence(h), VSWITCH_MARKERS)
+        h.checks["scenario1 emitted no cleanup events"] = not _run_dir_has_cleanup_events(h.run_dir)
+        h.checks["scenario1 persisted no cleanup prompt"] = not _session_has_cleanup_prompt(h)
+        h.checks["scenario1 ledger has no cleanup-required resources"] = not _cleanup_ledger_has_required_resources(h)
 
     return _run_with_harness(args, scenario, callback)
 
@@ -704,6 +909,164 @@ def callback(h: ScenarioHarness) -> None:
     return _run_with_harness(args, scenario, callback)
 
 
+def run_image_initial(args: argparse.Namespace, scenario: str) -> int:
+    """Run the scenario whose opening pipeline turn is sent as an image+text message."""
+
+    def callback(h: ScenarioHarness) -> None:
+        # The opening turn passes empty context/task ids explicitly.
+        opening = h.stream_image_text(
+            text=args.initial_prompt, image_key="initial", name="01-initial-image", context_id="", task_id=""
+        )
+        opening = _answer_intervening_ask_inputs(h, opening, name_prefix="01-initial-image")
+        reached_step4 = opening.last_input_required_step_id == "confirm_and_select"
+        h.checks["image initial reached step4 input_required"] = reached_step4
+        # The selection turn is sent as a plain text stream.
+        picked = h.stream(prompt=args.selection_prompt, name="02-select-candidate")
+        h.checks["image initial selection completed pipeline"] = _pipeline_completed(picked)
+        evidence = _all_evidence(h)
+        h.checks["image initial VSwitch evidence found"] = _has_any_marker(evidence, VSWITCH_MARKERS)
+
+    return _run_with_harness(args, scenario, callback)
+
+
+def run_image_ask_waiting(args: argparse.Namespace, scenario: str) -> int:
+    """Run the scenario that answers a pending ask_user_question with image+text after a restart."""
+
+    def callback(h: ScenarioHarness) -> None:
+        trigger = h.stream(prompt=ASK_TRIGGER_PROMPT, name="01-ask-trigger", context_id="", task_id="")
+        h.checks["initial reached input_required"] = _reached_input_required(trigger)
+        pending_kind = _latest_pending_kind(h.run_dir / "01-ask-trigger.events.jsonl")
+        h.checks["input_required is ask_user_question"] = pending_kind == "ask_user_question"
+
+        # Restart while the question is pending; the snapshot is expected to still be waiting for input.
+        h.kill9_and_restart()
+        restored = h.fetch_state("after-restart")
+        h.checks["snapshot still waiting input"] = _snapshot_value(restored, "status") == "waiting_input"
+        h.checks["pending input is ask_user_question"] = _pending_kind(restored) == "ask_user_question"
+
+        first_answer = h.stream_image_text(
+            text=ASK_FIRST_ANSWER,
+            image_key="ask-first-answer",
+            name="02-answer-first-ask-image",
+            task_id="",
+        )
+        _add_hydrated_task_checks(h, first_answer, "first ask image answer")
+        last_turn = first_answer
+        if first_answer.last_input_required_step_id:
+            # Another input is still pending, so a second image answer is sent (no task_id override).
+            last_turn = h.stream_image_text(
+                text=ASK_SECOND_ANSWER, image_key="ask-second-answer", name="03-answer-second-ask-image"
+            )
+            _add_same_task_checks(h, last_turn, "second ask image answer")
+        _finish_pipeline_after_possible_input(h, last_turn, args)
+        h.checks["pipeline completed after ask image recovery"] = _completed_snapshot_or_stream(h, last_turn)
+        h.checks["VSwitch evidence found"] = _has_any_marker(_all_evidence(h), VSWITCH_MARKERS)
+
+    return _run_with_harness(args, scenario, callback)
+
+
+def run_image_selection_waiting(args: argparse.Namespace, scenario: str) -> int:
+    """Run the scenario that sends the step4 selection as image+text after a restart."""
+
+    def callback(h: ScenarioHarness) -> None:
+        opening = h.stream(prompt=args.initial_prompt, name="01-initial", context_id="", task_id="")
+        opening = _answer_intervening_ask_inputs(h, opening, name_prefix="01-initial")
+        h.checks["initial reached step4 input_required"] = opening.last_input_required_step_id == "confirm_and_select"
+        # Restart while the selection is pending, then confirm the pending step is still reported.
+        h.kill9_and_restart()
+        restored = h.fetch_state("after-restart")
+        h.checks["snapshot still waiting input"] = _snapshot_value(restored, "status") == "waiting_input"
+        h.checks["pending input is confirm_and_select"] = _pending_step_id(restored) == "confirm_and_select"
+        picked = h.stream_image_text(
+            text=args.selection_prompt, image_key="selection", name="02-select-after-restart-image", task_id=""
+        )
+        _add_hydrated_task_checks(h, picked, "selection image answer")
+        h.checks["selection image completed pipeline"] = _pipeline_completed(picked)
+        h.checks["VSwitch evidence found"] = _has_any_marker(_all_evidence(h), VSWITCH_MARKERS)
+
+    return _run_with_harness(args, scenario, callback)
+
+
+def run_image_normal_handoff(args: argparse.Namespace, scenario: str) -> int:
+    """Run the scenario where the post-pipeline normal follow-up is an image+text turn."""
+
+    def callback(h: ScenarioHarness) -> None:
+        _complete_pipeline(h, args)
+        followup = h.stream_image_text(
+            text=args.normal_followup_prompt,
+            image_key="normal-followup",
+            name="03-normal-followup-image",
+            task_id="",
+        )
+        got_new_task = bool(followup.task_id) and followup.task_id != h.pipeline_task_id
+        h.checks["normal image follow-up stayed in same context"] = followup.context_id == h.context_id
+        h.checks["normal image follow-up used a new task"] = got_new_task
+        h.checks["normal image follow-up finished turn"] = _normal_turn_finished(followup)
+        h.checks["normal image follow-up produced text"] = bool(followup.text.strip())
+
+        # Restart, then check the completed pipeline snapshot before asking the recovery question.
+        h.kill9_and_restart()
+        restored = h.fetch_state("after-restart")
+        h.snapshots["after_restart"] = restored
+        _add_completed_snapshot_checks(
+            h.checks, "after-restart state", restored, context_id=h.context_id, task_id=h.pipeline_task_id
+        )
+        recovery = h.stream(prompt=args.recovery_prompt, name="04-recovery-question", task_id="")
+        h.checks["normal image recovery stayed in same context"] = recovery.context_id == h.context_id
+        h.checks["normal image recovery finished turn"] = _normal_turn_finished(recovery)
+
+    return _run_with_harness(args, scenario, callback)
+
+
+def run_image_interrupt(args: argparse.Namespace, scenario: str) -> int:
+    """Run the scenario that interrupts a running pipeline with an image+text rollback, then restarts."""
+
+    def callback(h: ScenarioHarness) -> None:
+        running = h.start_stream(prompt=args.initial_prompt, name="01-initial-running", context_id="", task_id="")
+        observed = _wait_for_with_intervening_ask_inputs(
+            h,
+            [running],
+            _candidate_started,
+            description="candidate started before image interrupt",
+            timeout=args.event_timeout,
+            name_prefix="initial-running",
+        )
+        rollback = h.start_stream_image_text(
+            text=ROLLBACK_PROMPT, image_key="rollback-interrupt", name="02-rollback-image-interrupt"
+        )
+        # Either an already-observed stream or the rollback stream may carry the events waited for below.
+        watched = [*observed, rollback]
+        _wait_any(
+            watched,
+            _event_type("rollback_completed"),
+            description="image rollback_completed",
+            timeout=args.event_timeout,
+        )
+        _wait_any(
+            watched,
+            _step_started("intent_parsing"),
+            description="post-image-rollback step_started(intent_parsing)",
+            timeout=args.event_timeout,
+        )
+        h.fetch_state("before-kill")
+        h.kill9_and_restart()
+        for stream in watched:
+            _join_after_kill(stream, h)
+        restored = h.fetch_state("after-restart")
+        h.checks["state endpoint returned snapshot after image interrupt restart"] = _snapshot(restored) is not None
+        resumed = h.stream(prompt=CONTINUE_PROMPT, name="03-continue-after-restart")
+        _finish_pipeline_after_possible_input(h, resumed, args)
+        h.checks["pipeline completed after image interrupt recovery"] = _completed_snapshot_or_stream(h, resumed)
+
+        # The final deployment evidence is expected to mention a security group rather than a VSwitch.
+        final_deploying = _final_deployment_evidence(h.fetch_state("after-image-interrupt-completion"))
+        has_security_group = _has_any_marker(final_deploying, SECURITY_GROUP_MARKERS)
+        h.checks["final deploying target is security group"] = has_security_group
+        h.checks["final deploying target is not VSwitch"] = not _has_any_marker(final_deploying, VSWITCH_MARKERS)
+
+    return _run_with_harness(args, scenario, callback)
+
+
 def run_rollback(args: argparse.Namespace, scenario: str) -> int:
     target_step = _ROLLBACK_SCENARIOS[scenario]
 
@@ -868,11 +1231,14 @@ def callback(h: ScenarioHarness) -> None:
         _add_hydrated_task_checks(h, resumed, "continue")
         _finish_pipeline_after_possible_input(h, resumed, args)
         after_continue = h.capture_task_snapshots("after-continue")
-        h.checks["task_get_after_continue_completed"] = _task_response_matches(
-            after_continue["task_get"],
-            task_id=h.pipeline_task_id,
-            context_id=h.context_id,
-        ) and _task_status_state(after_continue["task_get"]) == "TASK_STATE_COMPLETED"
+        h.checks["task_get_after_continue_completed"] = (
+            _task_response_matches(
+                after_continue["task_get"],
+                task_id=h.pipeline_task_id,
+                context_id=h.context_id,
+            )
+            and _task_status_state(after_continue["task_get"]) == "TASK_STATE_COMPLETED"
+        )
         h.checks["task_list_after_continue_kept_recovered_task"] = _task_list_contains(
             after_continue["task_list"],
             task_id=h.pipeline_task_id,
@@ -884,6 +1250,138 @@ def callback(h: ScenarioHarness) -> None:
     return _run_with_harness(args, scenario, callback)
 
 
+def run_rollback_step5_cleanup(args: argparse.Namespace, scenario: str) -> int:
+    return _run_rollback_step5_cleanup(args, scenario, kill_during_cleanup=False)  # no restart during cleanup
+
+
+def run_rollback_step5_cleanup_recovery(args: argparse.Namespace, scenario: str) -> int:
+    return _run_rollback_step5_cleanup(args, scenario, kill_during_cleanup=True)  # restart mid-cleanup
+
+
+def _run_rollback_step5_cleanup(
+    args: argparse.Namespace,
+    scenario: str,
+    *,
+    kill_during_cleanup: bool,  # True: restart the server once cleanup has started, then retrigger cleanup
+) -> int:  # shared body of the two step5 rollback-cleanup scenario entry points
+    def callback(h: ScenarioHarness) -> None:
+        initial = h.stream(prompt=args.initial_prompt, name="01-initial", context_id="", task_id="")
+        initial = _answer_intervening_ask_inputs(h, initial, name_prefix="01-initial")
+        h.checks["initial reached step4 selection"] = initial.last_input_required_step_id == "confirm_and_select"
+        # Start the first deployment without joining it and wait for its successful CreateStack event.
+        first_deploy = h.start_stream(
+            prompt=_cleanup_deployment_prompt(args.selection_prompt, h, "first"),
+            name="02-create-first-stack",
+        )
+        first_stack_id = _wait_for_created_stack(
+            first_deploy,
+            exclude=set(),
+            timeout=args.event_timeout,
+        )
+        h.checks["first rollback stack observed before rollback"] = bool(first_stack_id)
+        # Request a rollback, then wait for rollback_completed and a fresh confirm_and_select input request.
+        rollback = h.start_stream(prompt=ROLLBACK_PROMPT, name="03-rollback-after-first-stack")
+        _wait_any(
+            [first_deploy, rollback],
+            _event_type("rollback_completed"),
+            description="rollback_completed after first stack",
+            timeout=args.event_timeout,
+        )
+        _wait_any(
+            [first_deploy, rollback],
+            _input_required_step("confirm_and_select"),
+            description="post-rollback input_required(confirm_and_select)",
+            timeout=_post_rollback_timeout(args),
+        )
+        cleanup_stack_ids = _cleanup_target_stack_ids(h, exclude=set())
+        h.checks["rollback cleanup ledger includes first stack"] = bool(first_stack_id) and (
+            first_stack_id in cleanup_stack_ids
+        )
+        h.checks["rollback cleanup target stacks observed"] = bool(cleanup_stack_ids)
+        # Start the second deployment and wait until its deploying step has started.
+        second_deploy = h.start_stream(
+            prompt=_cleanup_deployment_prompt(args.selection_prompt, h, "second"),
+            name="04-select-second-stack",
+        )
+        _wait_any(
+            [second_deploy],
+            _step_started("deploying"),
+            description="second deployment step_started(deploying)",
+            timeout=args.event_timeout,
+        )
+        for stream in (first_deploy, rollback, second_deploy):
+            _join_stream_or_note(stream, h)
+        # Finish the pipeline from the second deployment, then identify the stack it created.
+        _finish_pipeline_after_possible_input(h, second_deploy.summary, args)
+        h.checks["pipeline completed after second deployment"] = _completed_snapshot_or_stream(h, second_deploy.summary)
+        h.fetch_state("after-second-stack")
+        second_stack_id = _created_stack_id_from_stream(second_deploy, exclude=set(cleanup_stack_ids))
+        h.checks["second stack created after rollback"] = bool(second_stack_id)
+        h.checks["second stack differs from first rollback stack"] = bool(second_stack_id) and (
+            second_stack_id != first_stack_id
+        )
+        cleanup_stack_ids = _cleanup_target_stack_ids(
+            h,
+            exclude={stack_id for stack_id in [second_stack_id] if stack_id},
+        )
+        h.checks["rollback cleanup ledger includes first stack"] = bool(first_stack_id) and (
+            first_stack_id in cleanup_stack_ids
+        )
+        h.checks["rollback cleanup target stacks observed"] = bool(cleanup_stack_ids)
+        # NOTE(review): the two ledger checks above reuse the keys set before the second deployment.
+        if kill_during_cleanup:
+            cleanup_stream = h.start_stream(
+                prompt=args.normal_followup_prompt,
+                name="05-cleanup-running",
+                task_id="",
+            )
+            _wait_for_cleanup_started(h, cleanup_stream, first_stack_id, timeout=args.event_timeout)
+            h.kill9_and_restart()
+            _join_after_kill(cleanup_stream, h)
+            h.snapshots["after_cleanup_restart"] = h.fetch_state("after-cleanup-restart")
+            cleanup_summary = h.stream(prompt=CLEANUP_RECOVERY_PROMPT, name="06-cleanup-after-restart", task_id="")
+            h.checks["cleanup retriggered after restart"] = _events_file_has_cleanup_event(
+                h.run_dir / "06-cleanup-after-restart.events.jsonl",
+                stack_id=first_stack_id,
+                event_types={"cleanup_started", "cleanup_progress", "cleanup_completed"},
+            )
+        else:
+            cleanup_summary = h.stream(
+                prompt=args.normal_followup_prompt,
+                name="05-cleanup-normal-turn",
+                task_id="",
+            )
+        h.checks["cleanup normal turn stayed in same context"] = cleanup_summary.context_id == h.context_id
+        h.checks["cleanup normal turn used normal task"] = cleanup_summary.task_id != h.pipeline_task_id
+        # Inspect the cleanup section of the state snapshot fetched after the cleanup turn.
+        after_cleanup = h.fetch_state("after-cleanup")
+        cleanup_resource = _cleanup_resource_for_stack(after_cleanup, first_stack_id)
+        h.checks["first rollback stack cleanup completed in snapshot"] = _cleanup_resource_completed(cleanup_resource)
+        h.checks["rollback cleanup stacks completed in snapshot"] = bool(cleanup_stack_ids) and all(
+            _cleanup_resource_completed(_cleanup_resource_for_stack(after_cleanup, stack_id))
+            for stack_id in cleanup_stack_ids
+        )
+        h.checks["cleanup snapshot does not target second stack"] = (
+            bool(second_stack_id) and _cleanup_resource_for_stack(after_cleanup, second_stack_id) is None
+        )
+        # Capture ROS stack states for the cleanup targets plus the second stack.
+        ros_stack_ids = _unique_strings([*cleanup_stack_ids, second_stack_id])
+        ros_states = _capture_ros_stack_states(
+            h,
+            ros_stack_ids,
+            "after-cleanup",
+        )
+        h.checks["ROS first rollback stack deleted"] = _ros_stack_deleted(ros_states.get(first_stack_id, {}))
+        h.checks["ROS rollback cleanup stacks deleted"] = bool(cleanup_stack_ids) and all(
+            _ros_stack_deleted(ros_states.get(stack_id, {})) for stack_id in cleanup_stack_ids
+        )
+        h.checks["ROS second stack retained"] = bool(second_stack_id) and _ros_stack_retained(
+            ros_states.get(second_stack_id, {})
+        )
+
+    return _run_with_harness(args, scenario, callback)
+
+
 def _complete_pipeline(h: ScenarioHarness, args: argparse.Namespace) -> None:
     initial = h.stream(prompt=args.initial_prompt, name="01-initial", context_id="", task_id="")
     initial = _answer_intervening_ask_inputs(h, initial, name_prefix="01-initial")
@@ -985,10 +1483,7 @@ def predicate(event: Any, _summary: StreamSummary) -> bool:
         return (
             isinstance(envelope, dict)
             and envelope.get("eventType") == "input_required"
-            and (
-                (isinstance(step, dict) and step.get("id") == step_id)
-                or data_step_id == step_id
-            )
+            and ((isinstance(step, dict) and step.get("id") == step_id) or data_step_id == step_id)
         )
 
     return predicate
@@ -1023,14 +1518,18 @@ def _wait_any(
 ) -> EventMatch:
     deadline = time.monotonic() + timeout
     last_error = ""
+    active_streams = list(streams)
     while time.monotonic() < deadline:
-        for stream in streams:
+        for stream in list(active_streams):
             try:
                 return stream.wait_for(predicate, description=description, timeout=0.25)
             except TimeoutError:
                 continue
             except RuntimeError as exc:
                 last_error = str(exc)
+                active_streams.remove(stream)
+        if not active_streams:
+            break
         time.sleep(0.05)
     raise TimeoutError(f"Timed out waiting for {description}; last_error={last_error}")
 
@@ -1067,9 +1566,7 @@ def _wait_for_with_intervening_ask_inputs(
                 answered_count += 1
                 if answered_count > 4:
                     raise RuntimeError(f"too many intervening ask_user_question inputs before {description}") from exc
-                h.notes.append(
-                    f"answered intervening ask_user_question while waiting for {description}: {stream.name}"
-                )
+                h.notes.append(f"answered intervening ask_user_question while waiting for {description}: {stream.name}")
                 answer = h.start_stream(
                     prompt=INTERVENING_ASK_ANSWER,
                     name=f"{name_prefix}-answer-ask-{answered_count}",
@@ -1265,11 +1762,7 @@ def _jsonrpc_result(response: Any) -> Any:
 def _task_response_matches(response: Any, *, task_id: str, context_id: str) -> bool:
     result = _jsonrpc_result(response)
     identity = _a2a_task_identity(result)
-    return (
-        isinstance(identity, dict)
-        and identity.get("taskId") == task_id
-        and identity.get("contextId") == context_id
-    )
+    return isinstance(identity, dict) and identity.get("taskId") == task_id and identity.get("contextId") == context_id
 
 
 def _task_status_state(response: Any) -> str:
@@ -1286,11 +1779,7 @@ def _task_list_contains(response: Any, *, task_id: str, context_id: str) -> bool
         return False
     for task in tasks:
         identity = _a2a_task_identity(task)
-        if (
-            isinstance(identity, dict)
-            and identity.get("taskId") == task_id
-            and identity.get("contextId") == context_id
-        ):
+        if isinstance(identity, dict) and identity.get("taskId") == task_id and identity.get("contextId") == context_id:
             return True
     return False
 
@@ -1420,6 +1909,560 @@ def _has_any_marker(text: str, markers: Iterable[str]) -> bool:
     return any(marker in text for marker in markers)
 
 
+def _join_stream_or_note(stream: BackgroundStream, h: ScenarioHarness) -> None:
+    try:  # best effort: a join failure is recorded in h.notes instead of being raised
+        stream.join(timeout=h.args.stream_timeout)
+    except Exception as exc:
+        h.notes.append(f"{stream.name} ended while joining: {type(exc).__name__}: {exc}")
+
+
+def _post_rollback_timeout(args: argparse.Namespace) -> float:
+    """Return max(event_timeout, min(stream_timeout, 900.0)); a missing or falsy attribute counts as 0."""
+    event_s, stream_s = (float(getattr(args, name, 0) or 0) for name in ("event_timeout", "stream_timeout"))
+    return max(event_s, min(stream_s, 900.0))
+
+
+def _cleanup_deployment_prompt(base_prompt: str, h: ScenarioHarness, label: str) -> str:  # base prompt + stack rules
+    stack_name = _cleanup_stack_name(h, label)  # the exact StackName the appended rules insist on
+    completion_instruction = (
+        "本轮是回滚窗口验证：CreateStack 成功后不要调用 complete_step，不要结束 deploying step；"
+        "只简短说明新建的 stack_id，并等待用户下一条指令。"
+        if label == "first"  # "first" gets the do-not-complete instruction; any other label the completion rule
+        else "complete_step 前必须在本轮对话中看到一次新的 CreateStack 成功，部署总结的 stack_id 必须来自这次新建。"
+    )
+    return (
+        f"{base_prompt}\n\n"
+        "E2E 强制部署约束：\n"
+        f"- 本轮唯一成功条件是新建一个 ROS stack，StackName 必须精确等于 `{stack_name}`。\n"
+        "- 任何已有 stack（即使是 CREATE_COMPLETE）都必须视为失败结果，不能作为部署成功依据。\n"
+        f"- 调用 ros_stack 或 aliyun_api CreateStack 前，必须复核工具参数里的 StackName 精确等于 `{stack_name}`。\n"
+        f"- 如果模板、文件名、候选方案或默认值给出了其他 StackName，必须覆盖为 `{stack_name}` 后再调用 CreateStack。\n"
+        f"- 如果已经用其他 StackName 调用失败，不能 GetStack 或复用那个 stack，必须改用 `{stack_name}` "
+        "重新 CreateStack。\n"
+        "- 如果无法使用上述 StackName 新建 stack，就停下来说明失败，不要调用 complete_step。\n"
+        f"{completion_instruction}"  # NOTE(review): no separator between this and the next sentence - confirm
+        "创建 VSwitch 时请先检查目标 VPC 已有 VSwitch CIDR，选择未占用且属于 VPC CIDR 的网段；"
+        "如果 CIDR 冲突，请选择另一个未占用网段并继续使用上述指定 StackName。"
+    )
+
+
+def _cleanup_stack_name(h: ScenarioHarness, label: str) -> str:  # per-run StackName used by the deployment prompt
+    suffix = Path(getattr(h, "run_dir", "")).name.rsplit("-", maxsplit=1)[-1] or "stack"
+    safe_label = "".join(ch if ch.isalnum() else "-" for ch in label.lower()).strip("-") or "stack"
+    return f"iac-e2e-{suffix[:12]}-{safe_label}"[:128]  # suffix capped at 12 chars, whole name at 128
+
+
+def _wait_for_observed_cleanup_stack(h: ScenarioHarness, *, exclude: set[str], timeout: float) -> str:
+    """Poll the cleanup ledger once per second until it lists a created ROS stack.
+
+    Returns the first stack id reported by ``_latest_observed_stack_id`` that is not in
+    ``exclude``; raises ``TimeoutError`` when ``timeout`` seconds pass without one.
+    """
+    give_up_at = time.monotonic() + timeout
+    while time.monotonic() < give_up_at:
+        observed = _latest_observed_stack_id(h, exclude=exclude)
+        if observed:
+            return observed
+        time.sleep(1.0)
+    raise TimeoutError("Timed out waiting for rollback cleanup ledger to observe a ROS stack")
+
+
+def _wait_for_created_stack(stream: BackgroundStream, *, exclude: set[str], timeout: float) -> str:
+    """Block until ``stream`` reports a successful ROS CreateStack and return its stack id.
+
+    Raises ``TimeoutError`` (from ``_wait_any``) when no matching event arrives in time, and
+    ``RuntimeError`` when the matching event carries no stack id.
+    """
+    match = _wait_any(
+        [stream],
+        _created_stack_event(exclude),
+        description="successful CreateStack stack_current_changed",
+        timeout=timeout,
+    )
+    envelope = _extract_pipeline_envelope(match.event)
+    payload = envelope.get("data") if isinstance(envelope, dict) else None
+    created_id = _string_from_mapping(payload, "stackId", "stack_id", "StackId")
+    if created_id:
+        return created_id
+    raise RuntimeError("successful CreateStack event did not include a stack id")
+
+
+def _created_stack_id_from_stream(stream: Any, *, exclude: set[str]) -> str | None:
+    """Return the first non-excluded stack id from a successful ROS CreateStack event recorded on ``stream``."""
+    # ``stream.events`` may be missing or None; both are treated as "no events".
+    for event in getattr(stream, "events", []) or []:
+        envelope = _extract_pipeline_envelope(event)
+        data = envelope.get("data") if isinstance(envelope, dict) else None
+        if not isinstance(data, dict) or envelope.get("eventType") != "stack_current_changed":
+            continue
+        if str(data.get("provider") or "").lower() != "ros":
+            continue
+        if data.get("action") != "CreateStack" or data.get("isSuccess") is not True:
+            continue
+        stack_id = _string_from_mapping(data, "stackId", "stack_id", "StackId")
+        if stack_id and stack_id not in exclude:
+            return stack_id
+    return None
+
+
+def _created_stack_event(exclude: set[str]) -> Callable[[Any, StreamSummary], bool]:
+    """Build a stream predicate matching a successful ROS CreateStack whose stack id is not in ``exclude``."""
+
+    def predicate(event: Any, _summary: StreamSummary) -> bool:
+        envelope = _extract_pipeline_envelope(event)
+        if not isinstance(envelope, dict) or envelope.get("eventType") != "stack_current_changed":
+            return False
+        data = envelope.get("data")
+        if not isinstance(data, dict) or str(data.get("provider") or "").lower() != "ros":
+            return False
+        if data.get("action") != "CreateStack" or data.get("isSuccess") is not True:
+            return False
+        stack_id = _string_from_mapping(data, "stackId", "stack_id", "StackId")
+        return bool(stack_id and stack_id not in exclude)
+
+    return predicate
+
+
+def _latest_observed_stack_id(h: ScenarioHarness, *, exclude: set[str]) -> str | None:
+    """Return the last-listed, non-excluded ROS stack id the ledger observed with a CreateStack action, if any."""
+    # The ledger's observed_resources are scanned last-to-first, so the first hit is the latest entry.
+    for resource in reversed(_cleanup_ledger_items(h, "observed_resources")):
+        if not _is_ros_stack_resource(resource):
+            continue
+        action = str(resource.get("observed_action") or resource.get("action") or "")
+        stack_id = _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+        if action == "CreateStack" and stack_id and stack_id not in exclude:
+            return stack_id
+    return None
+
+
+def _cleanup_ledger_items(h: ScenarioHarness, key: str) -> list[dict[str, Any]]:
+    """Return the dict entries stored under ``key`` in the session's cleanup.yaml ledger, or [] if unavailable."""
+    if not getattr(h, "context_id", ""):
+        return []
+    try:
+        from iac_code.services.session_storage import SessionStorage
+
+        cwd, session_id = _pipeline_session_identity(h)
+        session_dir = SessionStorage().session_dir(cwd, session_id)
+        candidates = (session_dir / "pipeline" / "cleanup.yaml", session_dir / "a2a" / "pipeline" / "cleanup.yaml")
+        # Only the first candidate that exists is loaded; the other is ignored.
+        ledger_path = next((path for path in candidates if path.exists()), None)
+        data = yaml.safe_load(ledger_path.read_text(encoding="utf-8")) if ledger_path is not None else None
+    except (OSError, UnicodeDecodeError, yaml.YAMLError):
+        return []
+    # Anything other than a mapping holding a list under ``key`` yields no items.
+    values = data.get(key) if isinstance(data, dict) else None
+    if not isinstance(values, list):
+        return []
+    return [item for item in values if isinstance(item, dict)]
+
+
+def _pipeline_session_identity(h: ScenarioHarness) -> tuple[str, str]:
+    """Return ``(cwd, session_id)``, preferring the persisted context file over ``h.cwd``/``h.context_id``."""
+    context_id = str(getattr(h, "context_id", "") or "")
+    cwd = str(getattr(h, "cwd", "") or "")
+    run_dir = getattr(h, "run_dir", None)
+    if not context_id or run_dir is None:
+        return cwd, context_id
+    record_path = Path(run_dir) / "a2a-persistence" / "contexts" / f"{context_id}.json"
+    try:
+        record = json.loads(record_path.read_text(encoding="utf-8"))
+    except (OSError, UnicodeDecodeError, json.JSONDecodeError):
+        return cwd, context_id
+    session_id, stored = (record.get("session_id"), record.get("cwd")) if isinstance(record, dict) else (None, None)
+    if not (isinstance(session_id, str) and session_id):
+        return cwd, context_id
+    return (stored if isinstance(stored, str) and stored else cwd, session_id)
+
+
+def _wait_for_cleanup_started(h: ScenarioHarness, stream: BackgroundStream, stack_id: str, *, timeout: float) -> None:
+    """Wait for cleanup of ``stack_id`` to start, watching ``stream`` first.
+
+    If that wait fails for any reason, the failure is recorded in ``h.notes`` and the cleanup
+    ledger is polled instead, with a fresh ``timeout``, for a ``started``/``in_progress`` status.
+    """
+    try:
+        _wait_any(
+            [stream],
+            _cleanup_event_for_stack(stack_id, {"cleanup_started", "cleanup_progress"}),
+            description=f"cleanup_started({stack_id})",
+            timeout=timeout,
+        )
+    except Exception as exc:
+        h.notes.append(f"did not observe cleanup_started event before fallback: {exc}")
+    else:
+        return
+    _wait_for_cleanup_ledger_status(h, stack_id, {"started", "in_progress"}, timeout=timeout)
+
+
+def _wait_for_cleanup_ledger_status(
+    h: ScenarioHarness,
+    stack_id: str,
+    statuses: set[str],
+    *,
+    timeout: float,
+) -> None:
+    """Poll the cleanup ledger every 0.5s until ``stack_id`` has one of ``statuses``; else raise TimeoutError."""
+    give_up_at = time.monotonic() + timeout
+    while time.monotonic() < give_up_at:
+        for resource in _cleanup_ledger_items(h, "cleanup_resources"):
+            status = str(resource.get("cleanup_status") or resource.get("cleanupStatus") or "")
+            if _string_from_mapping(resource, "resource_id", "resourceId") == stack_id and status in statuses:
+                return
+        time.sleep(0.5)
+    raise TimeoutError(f"Timed out waiting for cleanup ledger status {sorted(statuses)} on {stack_id}")
+
+
+def _cleanup_event_for_stack(stack_id: str, event_types: set[str]) -> Callable[[Any, StreamSummary], bool]:
+    """Build a predicate matching ``event_types`` events whose data.resourceId equals ``stack_id``."""
+
+    def predicate(event: Any, _summary: StreamSummary) -> bool:
+        envelope = _extract_pipeline_envelope(event)
+        if not isinstance(envelope, dict):
+            return False
+        data = envelope.get("data")
+        type_matches = envelope.get("eventType") in event_types
+        return type_matches and isinstance(data, dict) and data.get("resourceId") == stack_id
+
+    return predicate
+
+
+def _events_file_has_cleanup_event(path: Path, *, stack_id: str, event_types: set[str]) -> bool:
+    """Return True if the JSONL file at ``path`` holds an ``event_types`` event for resource ``stack_id``."""
+    try:
+        lines = path.read_text(encoding="utf-8").splitlines()
+    except (OSError, UnicodeDecodeError):
+        # A missing, unreadable, or non-UTF-8 (e.g. partially written) file counts as "no event".
+        return False
+    for line in lines:
+        try:
+            value = json.loads(line)
+        except json.JSONDecodeError:
+            continue
+        envelope = _extract_pipeline_envelope(value)
+        data = envelope.get("data") if isinstance(envelope, dict) else None
+        if isinstance(data, dict) and envelope.get("eventType") in event_types and data.get("resourceId") == stack_id:
+            return True
+    return False
+
+
+def _run_dir_has_cleanup_events(run_dir: Path) -> bool:  # any *.events.jsonl in run_dir with cleanup activity
+    return any(_events_file_has_cleanup_activity(path) for path in sorted(run_dir.glob("*.events.jsonl")))
+
+
+def _events_file_has_cleanup_activity(path: Path) -> bool:  # True if any JSONL line carries cleanup activity
+    try:
+        lines = path.read_text(encoding="utf-8").splitlines()
+    except (OSError, UnicodeDecodeError):  # unreadable or non-UTF-8 file: treated as no activity
+        return False
+    for line in lines:
+        try:
+            value = json.loads(line)
+        except json.JSONDecodeError:  # skip lines that are not valid JSON
+            continue
+        envelope = _extract_pipeline_envelope(value)
+        if isinstance(envelope, dict) and _pipeline_envelope_has_cleanup_activity(envelope):
+            return True
+    return False
+
+
+def _pipeline_envelope_has_cleanup_activity(envelope: dict[str, Any]) -> bool:
+    """Return True for a cleanup event type/scope, or when data.cleanup carries cleanup targets."""
+    data = envelope.get("data")
+    cleanup = data.get("cleanup") if isinstance(data, dict) else None
+    is_cleanup_event = envelope.get("eventType") in CLEANUP_EVENT_TYPES or envelope.get("scope") == "cleanup"
+    return is_cleanup_event or (isinstance(cleanup, dict) and _cleanup_payload_has_targets(cleanup))
+
+
+def _cleanup_resource_for_stack(response: Any, stack_id: str | None) -> dict[str, Any] | None:
+    """Return the snapshot cleanup resource dict whose resourceId equals ``stack_id``, or None."""
+    if not stack_id:
+        return None
+    cleanup = _snapshot_cleanup(response)
+    resources = cleanup.get("resources") if isinstance(cleanup, dict) else None
+    if not isinstance(resources, list):
+        return None
+    # Non-dict entries are ignored; the first matching entry wins.
+    matching = (item for item in resources if isinstance(item, dict) and item.get("resourceId") == stack_id)
+    return next(matching, None)
+
+
+def _cleanup_target_stack_ids(h: ScenarioHarness, *, exclude: set[str]) -> list[str]:
+    """Return ROS stack ids from the cleanup ledger, skipping excluded ids and cleanup_required=False entries."""
+    found: list[str] = []
+    for resource in _cleanup_ledger_items(h, "cleanup_resources"):
+        opted_out = resource.get("cleanup_required") is False or resource.get("cleanupRequired") is False
+        if not _is_ros_stack_resource(resource) or opted_out:
+            continue
+        stack_id = _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+        if stack_id and stack_id not in exclude:
+            found.append(stack_id)
+    return _unique_strings(found)
+
+
+def _cleanup_resource_completed(resource: dict[str, Any] | None) -> bool:
+    """Return True when a resource reports cleanup "completed" and stack status "DELETE_COMPLETE"."""
+    get = resource.get if isinstance(resource, dict) else (lambda _key: None)
+    cleanup_status = get("cleanupStatus") or get("cleanup_status") or get("status")
+    stack_status = get("stackStatus") or get("progressStatus") or get("progress_status")
+    return cleanup_status == "completed" and stack_status == "DELETE_COMPLETE"
+
+
+def _snapshot_cleanup(response: Any) -> dict[str, Any]:  # the snapshot's "cleanup" entry as a dict, else {}
+    snapshot = _snapshot(response)
+    cleanup = snapshot.get("cleanup") if isinstance(snapshot, dict) else None
+    return cleanup if isinstance(cleanup, dict) else {}
+
+
+def _snapshot_has_cleanup_activity(response: Any) -> bool:  # applies _cleanup_payload_has_targets to the snapshot
+    return _cleanup_payload_has_targets(_snapshot_cleanup(response))
+
+
+def _cleanup_payload_has_targets(cleanup: dict[str, Any]) -> bool:
+    """Return True when a cleanup payload lists resources or history, has a positive count, or an active status."""
+    resources = cleanup.get("resources")
+    history = cleanup.get("history")
+    has_resources = isinstance(resources, list) and any(isinstance(item, dict) for item in resources)
+    has_history = isinstance(history, list) and bool(history)
+    if has_resources or has_history:
+        return True
+    # resourceCount wins whenever that key is present, even if its value is None.
+    if _positive_int(cleanup.get("resourceCount", cleanup.get("resource_count"))):
+        return True
+    return str(cleanup.get("status") or "") in CLEANUP_ACTIVE_STATUSES
+
+
+def _positive_int(value: Any) -> bool:
+    """Return True for a positive int, or a string that ``int()`` parses to a positive value.
+
+    Booleans are rejected even though ``bool`` subclasses ``int``; other types yield False.
+    """
+    if isinstance(value, bool) or not isinstance(value, (int, str)):
+        return False
+    try:
+        return int(value) > 0
+    except ValueError:
+        return False
+
+
+def _cleanup_ledger_has_required_resources(h: ScenarioHarness) -> bool:
+    """Return True if any cleanup-ledger resource is not explicitly flagged as needing no cleanup."""
+    return any(
+        entry.get("cleanup_required") is not False and entry.get("cleanupRequired") is not False
+        for entry in _cleanup_ledger_items(h, "cleanup_resources")
+    )
+
+
+def _session_has_cleanup_prompt(h: ScenarioHarness) -> bool:
+    if not getattr(h, "context_id", ""):  # no context id on the harness: nothing to look up
+        return False
+    try:
+        from iac_code.services.session_storage import SessionStorage  # imported lazily, inside the try
+
+        cwd, session_id = _pipeline_session_identity(h)
+        return _session_file_has_cleanup_prompt(SessionStorage().session_path(cwd, session_id))
+    except OSError:  # only OSError is treated as "no prompt"; other exceptions propagate
+        return False
+
+
+def _session_file_has_cleanup_prompt(path: Path) -> bool:
+    try:
+        lines = path.read_text(encoding="utf-8").splitlines()  # each line is parsed below as its own JSON document
+    except (OSError, UnicodeDecodeError):  # unreadable or non-UTF-8 file: report no prompt
+        return False
+    for line in lines:
+        try:
+            value = json.loads(line)
+        except json.JSONDecodeError:  # lines that are not valid JSON are skipped
+            continue
+        metadata = value.get("metadata") if isinstance(value, dict) else None
+        if isinstance(metadata, dict) and metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE:
+            return True  # the first matching line is enough
+    return False
+
+
+def _snapshot_current_stack_id(response: Any, *, exclude: set[str]) -> str | None:
+    """Return the first active stack id in the snapshot that is not in *exclude*.
+
+    Records are tried in order: ``stacks.current``, then the ``stacks.byId`` values from
+    last to first, then ``stacks.history`` from last to first. None when nothing qualifies.
+    """
+    payload = _snapshot(response)
+    stacks = payload.get("stacks") if isinstance(payload, dict) else None
+    if not isinstance(stacks, dict):
+        return None
+    by_id = stacks.get("byId")
+    history = stacks.get("history")
+    records: list[Any] = [stacks.get("current")]
+    if isinstance(by_id, dict):
+        records.extend(reversed(list(by_id.values())))
+    if isinstance(history, list):
+        records.extend(reversed(history))
+    for record in records:
+        stack_id = _active_stack_id_from_record(record)
+        if stack_id and stack_id not in exclude:
+            return stack_id
+    return None
+
+
+def _active_stack_id_from_record(record: Any) -> str | None:
+    """Return the record's stack id, or None when the record carries a disqualifying marker.
+
+    A record is rejected when it is not a dict, is flagged ``current: False``,
+    ``cleared: True`` or ``isSuccess: False``, has a status ending in ``_FAILED``,
+    or records a ``DeleteStack`` action.
+    """
+    if not isinstance(record, dict):
+        return None
+    status = str(record.get("stackStatus") or record.get("status") or "")
+    flagged = record.get("current") is False or record.get("cleared") is True or record.get("isSuccess") is False
+    if flagged or status.endswith("_FAILED") or record.get("action") == "DeleteStack":
+        return None
+    return _string_from_mapping(record, "stackId", "stack_id", "StackId", "id")
+
+
+def _capture_ros_stack_states(h: ScenarioHarness, stack_ids: Iterable[str], name: str) -> dict[str, dict[str, Any]]:
+    states: dict[str, dict[str, Any]] = {}  # stack id -> state dict from _get_ros_stack_state
+    for stack_id in stack_ids:
+        region_id = _region_for_stack(h, stack_id)
+        states[stack_id] = _get_ros_stack_state(stack_id=stack_id, region_id=region_id, redaction_env=h.server_env)
+    redacted = _redact_json_value(states, h.server_env)
+    _write_json(h.run_dir / f"{name}.ros-stack-states.json", redacted)  # the redacted value is written to the run dir
+    h.snapshots[f"{name}.ros-stack-states"] = redacted  # and recorded in the harness snapshots
+    return states  # returns `states`, not the `redacted` value
+
+
+def _get_ros_stack_state(
+    *,
+    stack_id: str,
+    region_id: str,
+    redaction_env: dict[str, str] | None,
+) -> dict[str, Any]:
+    try:
+        from alibabacloud_ros20190910 import models as ros_models  # lazy imports, so import errors land in the except
+
+        from iac_code.services.cloud_credentials import CloudCredentials
+        from iac_code.tools.cloud.aliyun.ros_client import RosClientFactory
+
+        credential = CloudCredentials().get_provider("aliyun")
+        effective_region = region_id or (credential.region_id if credential is not None else "")  # explicit region wins
+        client = RosClientFactory.create(credential, effective_region)
+        request = ros_models.GetStackRequest(stack_id=stack_id, region_id=effective_region)
+        response = client.get_stack(request)
+        body = response.body.to_map()
+        return {
+            "stack_id": str(body.get("StackId") or stack_id),  # falls back to the requested id
+            "stack_name": str(body.get("StackName") or ""),
+            "region_id": effective_region,
+            "status": str(body.get("Status") or ""),
+            "status_reason": str(body.get("StatusReason") or ""),
+            "not_found": False,
+        }
+    except Exception as exc:  # any failure above is turned into an error record instead of raising
+        message = _redact_sensitive_text(str(exc), redaction_env)
+        return {
+            "stack_id": stack_id,
+            "region_id": region_id,  # the requested region, not effective_region
+            "status": "",
+            "not_found": _is_ros_stack_not_found(exc),
+            "error": _compact_text(message, max_chars=1000),
+        }
+
+
+def _is_ros_stack_not_found(exc: BaseException) -> bool:
+    """Return True when the exception's ``code`` attribute or message contains a not-found marker."""
+    # Matching is a case-insensitive substring search over "<code> <message>".
+    haystack = " ".join((str(getattr(exc, "code", "") or ""), str(exc))).lower()
+    markers = (
+        "stacknotfound",
+        "notfound.stack",
+        "entitynotexist.stack",
+        "specified stack does not exist",
+        "stack could not be found",
+        "stack not found",
+    )
+    return any(marker in haystack for marker in markers)
+
+
+def _region_for_stack(h: ScenarioHarness, stack_id: str) -> str:
+    for snapshot in reversed(list(h.snapshots.values())):  # snapshots are searched last-inserted first
+        region = _region_for_stack_in_snapshot(snapshot, stack_id)
+        if region:
+            return region
+    for key in ("cleanup_resources", "observed_resources"):  # then the two ledger lists, last entry first
+        for resource in reversed(_cleanup_ledger_items(h, key)):
+            if _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId") == stack_id:
+                region = _string_from_mapping(resource, "region_id", "regionId", "RegionId")
+                if region:
+                    return region
+    return h.server_env.get("ALIBABA_CLOUD_REGION_ID", "")  # last resort: server env value, else ""
+
+
+def _region_for_stack_in_snapshot(response: Any, stack_id: str) -> str:
+    cleanup_resource = _cleanup_resource_for_stack(response, stack_id)  # first source: the cleanup resource entry
+    if cleanup_resource is not None:
+        region = _string_from_mapping(cleanup_resource, "regionId", "region_id", "RegionId")
+        if region:
+            return region
+    snapshot = _snapshot(response)
+    stacks = snapshot.get("stacks") if isinstance(snapshot, dict) else None
+    if not isinstance(stacks, dict):
+        return ""
+    by_id = stacks.get("byId")
+    if isinstance(by_id, dict):  # second source: the stacks.byId record keyed by this stack id
+        record = by_id.get(stack_id)
+        region = _string_from_mapping(record, "regionId", "region_id", "RegionId") if isinstance(record, dict) else None
+        if region:
+            return region
+    current = stacks.get("current")  # third source: stacks.current, only if it refers to this stack
+    if isinstance(current, dict) and _string_from_mapping(current, "stackId", "stack_id", "StackId") == stack_id:
+        return _string_from_mapping(current, "regionId", "region_id", "RegionId") or ""
+    return ""  # empty string means "not found in this snapshot"
+
+
+def _ros_stack_deleted(state: dict[str, Any]) -> bool:
+    """Return True when *state* is flagged not-found or its status is in ROS_STACK_DELETED_STATUSES."""
+    if not isinstance(state, dict):
+        return False
+    missing = state.get("not_found") is True
+    return missing or state.get("status") in ROS_STACK_DELETED_STATUSES
+
+
+def _ros_stack_retained(state: dict[str, Any]) -> bool:
+    """Return True when a found stack reports a non-empty status that does not start with ``DELETE_``."""
+    found = isinstance(state, dict) and state.get("not_found") is not True
+    status = state.get("status") if found else None
+    return isinstance(status, str) and status != "" and not status.startswith("DELETE_")
+
+
+def _is_ros_stack_resource(resource: dict[str, Any]) -> bool:
+    """Return True when provider is "ros" and the resource type is "stack", ignoring letter case."""
+    kind = resource.get("resource_type") or resource.get("resourceType") or ""
+    return str(resource.get("provider") or "").lower() == "ros" and str(kind).lower() == "stack"
+
+
+def _unique_strings(values: Iterable[str | None]) -> list[str]:
+    """Return the non-empty strings from *values* in first-seen order, without duplicates.
+    Non-string items (including None) are dropped.
+    """
+    ordered: dict[str, None] = {}
+    for item in values:
+        if isinstance(item, str) and item:
+            ordered.setdefault(item, None)
+    return list(ordered)
+
+
+def _string_from_mapping(mapping: Any, *keys: str) -> str | None:
+    """Return the first non-empty string stored under any of *keys*, tried in order.
+
+    Returns None when *mapping* is not a dict or no key holds a non-empty string.
+    """
+    if not isinstance(mapping, dict):
+        return None
+    return next((hit for hit in map(mapping.get, keys) if isinstance(hit, str) and hit), None)
+
+
 def _scenario_run_dir(args: argparse.Namespace, scenario: str) -> Path:
     if args.run_dir:
         return Path(args.run_dir).expanduser()
@@ -1477,20 +2520,34 @@ def _validate_scenario_execution(args: argparse.Namespace, scenario: str) -> Non
 }
 _REAL_CLOUD_SCENARIOS = {
     "fault-after-snapshot",
+    "image-ask-waiting",
+    "image-initial",
+    "image-interrupt",
+    "image-normal-handoff",
+    "image-selection-waiting",
     "scenario1",
     "normal-running",
     "ask-waiting",
     "selection-waiting",
+    "rollback-step5-cleanup",
+    "rollback-step5-cleanup-recovery",
     *_RUNNING_STEP_SCENARIOS,
     *_ROLLBACK_SCENARIOS,
     *_CANCEL_SCENARIOS,
 }
 _SCENARIOS: dict[str, Callable[[argparse.Namespace, str], int]] = {
+    "image-ask-waiting": run_image_ask_waiting,
+    "image-initial": run_image_initial,
+    "image-interrupt": run_image_interrupt,
+    "image-normal-handoff": run_image_normal_handoff,
+    "image-selection-waiting": run_image_selection_waiting,
     "scenario1": run_scenario1,
     "normal-running": run_normal_running,
     "ask-waiting": run_ask_waiting,
     "selection-waiting": run_selection_waiting,
     "fault-after-snapshot": run_fault_after_snapshot,
+    "rollback-step5-cleanup": run_rollback_step5_cleanup,
+    "rollback-step5-cleanup-recovery": run_rollback_step5_cleanup_recovery,
     **{name: run_running_step for name in _RUNNING_STEP_SCENARIOS},
     **{name: run_rollback for name in _ROLLBACK_SCENARIOS},
     **{name: run_cancel for name in _CANCEL_SCENARIOS},
diff --git a/scripts/a2a/selling_console.py b/scripts/a2a/selling_console.py
new file mode 100644
index 00000000..80805a26
--- /dev/null
+++ b/scripts/a2a/selling_console.py
@@ -0,0 +1,294 @@
+"""Local web console for A2A selling pipelines.
+
+The bundled web UI currently sends text input only; use the A2A debugger for
+image-part request coverage.
+"""
+
+from __future__ import annotations
+
+import argparse
+import hashlib
+import html
+import importlib
+import json
+import os
+import sys
+from dataclasses import dataclass
+from http.server import BaseHTTPRequestHandler, ThreadingHTTPServer
+from pathlib import Path
+from urllib.error import HTTPError, URLError
+from urllib.parse import urlparse
+
+REPO_ROOT = Path(__file__).resolve().parents[2]  # two directories above this file's own directory
+if str(REPO_ROOT) not in sys.path:
+    sys.path.insert(0, str(REPO_ROOT))  # puts REPO_ROOT on sys.path before the import below
+
+a2a_debugger = importlib.import_module("scripts.a2a.debugger")
+
+WEB_ROOT = Path(__file__).resolve().with_name("selling_console_web")  # directory next to this file
+TEMPLATE_PLACEHOLDERS = (  # tokens that render_index_html() substitutes in index.html
+    "__DEFAULTS_JSON__",
+    "__DEFAULT_SERVER_URL_ATTR__",
+    "__DEFAULT_CWD_ATTR__",
+    "__STATIC_ASSET_VERSION__",
+)
+
+
+@dataclass(frozen=True)
+class StaticAsset:
+    path: Path  # file read from disk when the asset is hashed or served
+    content_type: str  # sent as the Content-Type header by _send_static()
+
+
+STYLE_ASSET = StaticAsset(WEB_ROOT / "styles.css", "text/css; charset=utf-8")
+APP_ASSET = StaticAsset(WEB_ROOT / "app.js", "application/javascript; charset=utf-8")
+STATIC_ASSETS = (STYLE_ASSET, APP_ASSET)  # iterated by _static_asset_version() to build the version hash
+
+
+@dataclass(frozen=True)
+class SellingConsoleConfig:
+    host: str  # address passed to the HTTP server constructor
+    port: int  # port passed to the HTTP server constructor
+    default_server_url: str  # substituted into index.html as the default server URL
+    default_cwd: str  # substituted into index.html as the default cwd
+
+
+def parse_args(argv: list[str] | None = None) -> argparse.Namespace:
+    parser = argparse.ArgumentParser(description="Run a local A2A selling pipeline console.")
+    parser.add_argument("--host", default="127.0.0.1")  # loopback unless overridden
+    parser.add_argument("--port", type=int, default=41980)
+    parser.add_argument("--default-server-url", default="http://127.0.0.1:41299")
+    parser.add_argument("--default-cwd", default=os.getcwd())  # working directory at the time parse_args() runs
+    return parser.parse_args(argv)  # argv=None makes argparse read sys.argv[1:]
+
+
+def _html_attribute_value(value: str) -> str:
+    escaped = html.escape(value, quote=True)  # quote=True also escapes " and '
+    for placeholder in TEMPLATE_PLACEHOLDERS:
+        escaped = escaped.replace(placeholder, placeholder.replace("_", "&#95;"))  # literal placeholder text in the value is rewritten
+    return escaped
+
+
+def _json_for_template(value: object) -> str:
+    json_value = a2a_debugger._json_for_script(value)  # serialization is delegated to the debugger module
+    for placeholder in TEMPLATE_PLACEHOLDERS:
+        json_value = json_value.replace(placeholder, placeholder.replace("_", "\\u005f"))  # "_" becomes the JSON escape \u005f
+    return json_value
+
+
+def _static_asset_version() -> str:
+    """Return a 12-hex-character SHA-256 fingerprint of the static assets' file names and contents."""
+    hasher = hashlib.sha256()
+    for item in STATIC_ASSETS:
+        hasher.update(item.path.name.encode("utf-8") + item.path.read_bytes())
+    return hasher.hexdigest()[:12]
+
+
+def render_index_html(config: SellingConsoleConfig) -> str:
+    defaults_json = _json_for_template(  # JSON form of the defaults, with placeholder tokens neutralized
+        {
+            "serverUrl": config.default_server_url,
+            "cwd": config.default_cwd,
+        }
+    )
+    return (
+        (WEB_ROOT / "index.html")
+        .read_text(encoding="utf-8")  # the template is re-read from disk on every call
+        .replace("__DEFAULT_SERVER_URL_ATTR__", _html_attribute_value(config.default_server_url))
+        .replace("__DEFAULT_CWD_ATTR__", _html_attribute_value(config.default_cwd))
+        .replace("__DEFAULTS_JSON__", defaults_json)
+        .replace("__STATIC_ASSET_VERSION__", _static_asset_version())
+    )
+
+
+def _send_text(handler: BaseHTTPRequestHandler, status: int, body: str, content_type: str) -> None:
+    raw_body = body.encode("utf-8")
+    handler.send_response(status)
+    handler.send_header("Content-Type", content_type)
+    handler.send_header("Content-Length", str(len(raw_body)))  # length of the encoded bytes, not of the str
+    handler.end_headers()
+    handler.wfile.write(raw_body)
+
+
+def _static_asset_for_request(path: str) -> StaticAsset | None:
+    """Map a request path to its bundled static asset.
+    Only ``/styles.css`` and ``/app.js`` are known; any other path yields None."""
+    known = {"/styles.css": STYLE_ASSET, "/app.js": APP_ASSET}
+    # dict.get() returns None for every path that is not a key above.
+    return known.get(path)
+
+
+def _send_static(handler: BaseHTTPRequestHandler, path: str) -> bool:
+    asset = _static_asset_for_request(path)
+    if asset is None:
+        return False  # not a known static path; nothing was sent
+    web_root = WEB_ROOT.resolve()
+    candidate = asset.path.resolve()
+    try:
+        candidate.relative_to(web_root)  # raises ValueError when the resolved file is outside WEB_ROOT
+    except ValueError:
+        return False
+    if not candidate.is_file():
+        return False
+    _send_text(handler, 200, candidate.read_text(encoding="utf-8"), asset.content_type)
+    return True  # True means a response was written
+
+
+def _proxy_error_body(exc: BaseException) -> dict[str, object]:
+    if isinstance(exc, HTTPError):  # HTTP errors carry a status code, headers and a readable body
+        raw = exc.read()
+        data, text = a2a_debugger._decode_json_text(raw)
+        return a2a_debugger._proxy_error(
+            a2a_debugger.ProxyResult(
+                status_code=exc.code,
+                data=data,
+                text=text,
+                headers=dict(exc.headers.items()),
+                error=f"HTTP {exc.code}",
+            )
+        )
+    return a2a_debugger._proxy_error(  # every other exception: status 0, empty body, str(exc) as the error
+        a2a_debugger.ProxyResult(status_code=0, data=None, text="", headers={}, error=str(exc))
+    )
+
+
+def _write_sse_error_event(handler: BaseHTTPRequestHandler, message: str) -> None:
+    body = f"data: {json.dumps({'ok': False, 'error': message}, ensure_ascii=False)}\n\n".encode("utf-8")  # one "data:" frame
+    try:
+        handler.wfile.write(body)
+        handler.wfile.flush()
+    except OSError:  # best effort: a failed write is ignored
+        return
+
+
+def create_server(config: SellingConsoleConfig) -> ThreadingHTTPServer:
+    class SellingConsoleHTTPServer(ThreadingHTTPServer):
+        allow_reuse_address = sys.platform != "win32"  # address reuse is enabled everywhere except Windows
+
+    class SellingConsoleHandler(BaseHTTPRequestHandler):
+        def log_message(self, format: str, *args: object) -> None:
+            return None  # overrides the base handler's logging with a no-op
+
+        def do_GET(self) -> None:
+            parsed = urlparse(self.path)
+            try:
+                if parsed.path == "/":
+                    _send_text(self, 200, render_index_html(config), "text/html; charset=utf-8")
+                    return
+                if parsed.path == "/api/health":
+                    status, body = a2a_debugger._health_response(
+                        a2a_debugger._query_params(self.path).get("serverUrl", "")
+                    )
+                    a2a_debugger._send_json(self, status, body)
+                    return
+                if parsed.path == "/api/pipeline/state":
+                    status, body = a2a_debugger._pipeline_state_response(a2a_debugger._query_params(self.path))
+                    a2a_debugger._send_json(self, status, body)
+                    return
+                if parsed.path == "/api/task/get":
+                    status, body = a2a_debugger._task_get_response(a2a_debugger._query_params(self.path))
+                    a2a_debugger._send_json(self, status, body)
+                    return
+                if _send_static(self, parsed.path):
+                    return
+            except ValueError as exc:  # ValueError from the helpers is reported as 400
+                a2a_debugger._send_json(self, 400, {"ok": False, "error": str(exc)})
+                return
+            except (HTTPError, URLError, TimeoutError, OSError) as exc:  # network and OS failures are reported as 502
+                a2a_debugger._send_json(self, 502, _proxy_error_body(exc))
+                return
+            a2a_debugger._send_json(self, 404, {"ok": False, "error": "Not found"})  # no route matched
+
+        def do_POST(self) -> None:
+            parsed = urlparse(self.path)
+            try:
+                if parsed.path == "/api/message/stream":
+                    body = a2a_debugger._read_json_body(self)
+                    server_url, payload = a2a_debugger._message_stream_body(body)
+                    try:
+                        with a2a_debugger._open_sse_stream(server_url, payload) as response:
+                            headers = getattr(response, "headers", {})
+                            content_type = ""
+                            if hasattr(headers, "get"):
+                                content_type = str(headers.get("Content-Type", "")).lower()
+                            if content_type and "text/event-stream" not in content_type:  # upstream answered with a non-SSE body
+                                raw = response.read()
+                                data, _text = a2a_debugger._decode_json_text(raw)
+                                message = a2a_debugger._jsonrpc_error_message(data)
+                                if message:  # a JSON-RPC error is forwarded as a single SSE "error" event
+                                    a2a_debugger._send_sse_event(
+                                        self,
+                                        200,
+                                        {
+                                            "type": "error",
+                                            "error": message,
+                                            "statusCode": response.status,
+                                            "body": data,
+                                        },
+                                    )
+                                    return
+                                a2a_debugger._send_sse_error(self, 502, "Target server returned a non-SSE response")
+                                return
+                            self.send_response(response.status)
+                            self.send_header("Content-Type", "text/event-stream; charset=utf-8")
+                            self.end_headers()
+                            response_iter = iter(response)
+                            while True:  # relay upstream lines one at a time, flushing after each
+                                try:
+                                    line = next(response_iter)
+                                except StopIteration:
+                                    break
+                                except (TimeoutError, URLError, OSError) as exc:  # upstream read failed mid-stream
+                                    _write_sse_error_event(self, str(exc))
+                                    return
+                                try:
+                                    self.wfile.write(line)
+                                    self.wfile.flush()
+                                except OSError as exc:  # write to the client failed
+                                    if a2a_debugger._is_client_disconnect_error(exc):
+                                        return
+                                    return  # both branches return: any client write error ends the relay
+                    except HTTPError as exc:
+                        a2a_debugger._send_sse_error(self, 502, f"HTTP {exc.code}")
+                    except (TimeoutError, URLError, OSError) as exc:
+                        a2a_debugger._send_sse_error(self, 502, str(exc))
+                    return
+                if parsed.path == "/api/task/cancel":
+                    body = a2a_debugger._read_json_body(self)
+                    status, response_body = a2a_debugger._task_cancel_response(body)
+                    a2a_debugger._send_json(self, status, response_body)
+                    return
+            except ValueError as exc:  # ValueError from the helpers is reported as 400
+                a2a_debugger._send_json(self, 400, {"ok": False, "error": str(exc)})
+                return
+            except (HTTPError, URLError, TimeoutError, OSError) as exc:  # network and OS failures are reported as 502
+                a2a_debugger._send_json(self, 502, _proxy_error_body(exc))
+                return
+            a2a_debugger._send_json(self, 404, {"ok": False, "error": "Not found"})  # no route matched
+
+    return SellingConsoleHTTPServer((config.host, config.port), SellingConsoleHandler)
+
+
+def main(argv: list[str] | None = None) -> int:
+    """Start the console server and serve until interrupted with Ctrl-C; returns 0 afterwards."""
+    args = parse_args(argv)
+    config = SellingConsoleConfig(
+        host=args.host,
+        port=args.port,
+        default_server_url=args.default_server_url,
+        default_cwd=args.default_cwd,
+    )
+    server = create_server(config)
+    host, port = server.server_address
+    print(f"Selling pipeline console listening on http://{host}:{port}")
+    try:
+        server.serve_forever()
+    except KeyboardInterrupt:
+        pass  # Ctrl-C ends the serve loop; fall through to the cleanup below
+    finally:
+        server.server_close()  # shutdown() is for stopping serve_forever() from another thread, so it is not called here
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())  # main()'s return value becomes the process exit status
diff --git a/scripts/a2a/selling_console_web/README.md b/scripts/a2a/selling_console_web/README.md
new file mode 100644
index 00000000..029d2781
--- /dev/null
+++ b/scripts/a2a/selling_console_web/README.md
@@ -0,0 +1,34 @@
+# Selling Console Web
+
+Standalone static frontend for `scripts/a2a/selling_console.py`. It is used to drive the selling pipeline, inspect step progress, select candidate plans, and continue into normal chat after deployment.
+
+The web console currently sends text input only. Use `scripts/a2a/debugger.py` for A2A image-part coverage.
+
+## Run
+
+From the repository root, start the A2A server first:
+
+```bash
+PATH="$HOME/.local/bin:$PATH" IAC_CODE_MODE=pipeline \
+uv run iac-code a2a --transport http --host 127.0.0.1 --port 41299
+```
+
+Then start the web console:
+
+```bash
+PATH="$HOME/.local/bin:$PATH" \
+uv run python scripts/a2a/selling_console.py --port 41980 \
+  --default-server-url http://127.0.0.1:41299 \
+  --default-cwd "$PWD"
+```
+
+Then open `http://127.0.0.1:41980`.
+
+## Files
+
+- `index.html` renders the page shell.
+- `styles.css` contains layout, chat, plan cards, and progress visuals.
+- `app.js` handles A2A stream parsing, UI state, debug controls, and interactions.
+- `design/` keeps standalone visual explorations for progress variants.
+
+The debug panel is collapsed by default. Expand it only when checking connection settings, progress variant parameters, context IDs, or recent stream diagnostics.
diff --git a/scripts/a2a/selling_console_web/app.js b/scripts/a2a/selling_console_web/app.js
new file mode 100644
index 00000000..01105ded
--- /dev/null
+++ b/scripts/a2a/selling_console_web/app.js
@@ -0,0 +1,4327 @@
+(function () {
+  const STEP_ORDER = ["intent_parsing", "architecture_planning", "evaluate_candidates", "confirm_and_select", "deploying"];
+  const STEP_LABELS = {
+    intent_parsing: "需求理解",
+    architecture_planning: "架构规划",
+    evaluate_candidates: "方案评估",
+    confirm_and_select: "方案选择",
+    deploying: "确认部署",
+  };
+  const PROGRESS_VARIANT_ORDER = ["a", "b", "d"];
+  const PROGRESS_VARIANT_LABELS = {
+    a: "A 箭头轨道",
+    b: "B 脉冲线路",
+    d: "D 输入框融合",
+  };
+  const DEFAULT_PROGRESS_UI = {
+    variant: "b",
+    activeStepIndex: null,
+    a: {
+      sweepMs: 1800,
+    },
+    b: {
+      xPercent: 28,
+      yPercent: 49,
+      t1: 140,
+      t2: 540,
+      maxAmplitude: 9,
+      pauseTime: 510,
+    },
+    d: {
+      t1: 1800,
+      t2: 300,
+    },
+  };
+  const PROGRESS_PARAM_DEFS = {
+    a: [
+      { key: "sweepMs", label: "扫光周期", min: 800, max: 2800, step: 100, unit: "ms" },
+    ],
+    b: [
+      { key: "xPercent", label: "X", min: 6, max: 38, step: 1, unit: "%" },
+      { key: "yPercent", label: "Y", min: 20, max: 90, step: 1, unit: "%" },
+      { key: "t1", label: "T1", min: 80, max: 700, step: 20, unit: "ms" },
+      { key: "t2", label: "T2", min: 160, max: 1400, step: 20, unit: "ms" },
+      { key: "maxAmplitude", label: "最大振幅", min: 8, max: 22, step: 1, unit: "" },
+      { key: "pauseTime", label: "停顿时间", min: 120, max: 1200, step: 30, unit: "ms" },
+    ],
+    d: [
+      { key: "t1", label: "T1", min: 800, max: 3200, step: 100, unit: "ms" },
+      { key: "t2", label: "T2", min: 0, max: 1200, step: 50, unit: "ms" },
+    ],
+  };
+  const MAX_CANDIDATE_SUB_EVENTS = 96;
+  const CURRENT_STEP_EVENT_TYPES = new Set([
+    "permission_requested",
+    "text_delta",
+    "tool_call",
+    "tool_result",
+    "tool_started",
+    "tool_use",
+  ]);
+  const NORMAL_HANDOFF_TEXT = "部署流程已完成，已进入普通会话。可以继续追问资源、运维或变更需求。";
+  const CANDIDATE_SUBSTEP_LABELS = {
+    template_generating: "模板生成",
+    template_generation: "模板生成",
+    template_validating: "模板校验",
+    template_validation: "模板校验",
+    cost_estimating: "成本估算",
+    cost_estimation: "成本估算",
+    cost_estimate: "成本估算",
+    price_estimating: "价格估算",
+    quality_review: "质量复核",
+    architecture_review: "架构复核",
+    risk_review: "风险复核",
+    resource_planning: "资源规划",
+    requirement_matching: "需求匹配",
+  };
+  const CANDIDATE_STEP_IDS = new Set([
+    "candidate",
+    "candidate_generation",
+    "candidate_selection",
+    "candidate_summary",
+    "cost_estimation",
+    "evaluate_candidate",
+    "evaluate_candidates",
+    "resource_evaluation",
+  ]);
+
+  function createSteps() {
+    // Build the initial step table: one record per id in STEP_ORDER, keyed by
+    // that id. Every record starts as "pending" with its own empty events
+    // array and takes its label from STEP_LABELS.
+    const steps = {};
+    for (const stepId of STEP_ORDER) {
+      const label = STEP_LABELS[stepId];
+      steps[stepId] = { id: stepId, label, status: "pending", events: [] };
+    }
+    return steps;
+  }
+
+  function mergeProgressParams(variant, params) {
+    const defaults = DEFAULT_PROGRESS_UI[variant] || {}; // unknown variant: no keys, so the result is {}
+    const source = params && typeof params === "object" ? params : {};
+    return Object.keys(defaults).reduce((result, key) => {
+      const numericValue = Number(source[key]); // NOTE(review): Number(null) and Number("") are 0, not NaN — confirm intended
+      result[key] = Number.isFinite(numericValue) ? numericValue : defaults[key]; // non-finite falls back to the default
+      return result;
+    }, {});
+  }
+
+  function mergeProgressUi(value) {
+    const source = value && typeof value === "object" ? value : {}; // non-object input is treated as empty
+    const variant = PROGRESS_VARIANT_ORDER.includes(source.variant) ? source.variant : DEFAULT_PROGRESS_UI.variant;
+    const rawActiveStepIndex =
+      source.activeStepIndex === null || source.activeStepIndex === undefined ? null : Number(source.activeStepIndex);
+    return {
+      variant, // falls back to the default variant when the supplied one is not in PROGRESS_VARIANT_ORDER
+      activeStepIndex:
+        Number.isInteger(rawActiveStepIndex) && rawActiveStepIndex >= 0 && rawActiveStepIndex < STEP_ORDER.length
+          ? rawActiveStepIndex
+          : null, // anything that is not an integer index into STEP_ORDER becomes null
+      a: mergeProgressParams("a", source.a),
+      b: mergeProgressParams("b", source.b),
+      d: mergeProgressParams("d", source.d),
+    };
+  }
+
+  function createInitialState(defaults = {}) {
+    const stateDefaults = clonePlainData(defaults && typeof defaults === "object" ? defaults : {}); // deep copy; non-object input becomes {}
+    return {
+      defaults: stateDefaults,
+      serverUrl: stateDefaults.serverUrl || "",
+      cwd: stateDefaults.cwd || "",
+      contextId: "",
+      pipelineTaskId: "",
+      activeTaskId: "",
+      currentStepId: "",
+      lastSequence: 0,
+      status: "idle",
+      pipelineStarted: Boolean(stateDefaults.pipelineStarted),
+      normalHandoffReady: false,
+      steps: createSteps(), // every step starts as "pending"
+      candidates: [],
+      selectedCandidateIndex: null,
+      selectedPendingInputOptionId: stateDefaults.selectedPendingInputOptionId || "",
+      pendingInput: null,
+      permission: null,
+      userMessages: Array.isArray(stateDefaults.userMessages) ? clonePlainData(stateDefaults.userMessages) : [],
+      normalTurns: Array.isArray(stateDefaults.normalTurns) ? clonePlainData(stateDefaults.normalTurns) : [],
+      pendingNormalUserMessageId: stateDefaults.pendingNormalUserMessageId || "",
+      expandedStepDetails: clonePlainData(stateDefaults.expandedStepDetails || {}),
+      expandedCandidateSubpipelines: clonePlainData(stateDefaults.expandedCandidateSubpipelines || {}),
+      expandedNormalProcesses: clonePlainData(stateDefaults.expandedNormalProcesses || {}),
+      progressUi: mergeProgressUi(stateDefaults.progressUi), // validated and filled in from DEFAULT_PROGRESS_UI
+      diagnostics: { requests: [], sse: [], snapshots: [] },
+    };
+  }
+
+  function cloneStep(step) {
+    return {
+      ...step, // shallow copy of the step's own fields
+      events: Array.isArray(step.events) ? step.events.map(clonePlainData) : [], // events are deep-copied; a non-array becomes []
+    };
+  }
+
+  function cloneCandidate(candidate) {
+    return clonePlainData({ // the normalized object below is deep-copied as a whole
+      ...candidate,
+      costItems: Array.isArray(candidate.costItems) ? candidate.costItems : [], // a non-array becomes []
+      subEvents: Array.isArray(candidate.subEvents) ? candidate.subEvents : [], // a non-array becomes []
+    });
+  }
+
+  function clonePendingInput(pendingInput) {
+    if (!pendingInput) {
+      return null; // any falsy input yields null
+    }
+    const nextPendingInput = clonePlainData(pendingInput);
+    return {
+      ...nextPendingInput,
+      prompt: nextPendingInput.prompt || nextPendingInput.question || "", // falls back to "question", then ""
+      options: Array.isArray(nextPendingInput.options) ? nextPendingInput.options : [], // a non-array becomes []
+    };
+  }
+
+  function cloneDiagnostics(diagnostics) {
+    const source = diagnostics || {}; // missing diagnostics are treated as empty
+    return clonePlainData({ // the result always has requests, sse and snapshots arrays
+      requests: Array.isArray(source.requests) ? [...source.requests] : [],
+      sse: Array.isArray(source.sse) ? [...source.sse] : [],
+      snapshots: Array.isArray(source.snapshots) ? [...source.snapshots] : [],
+    });
+  }
+
+  function clonePlainData(value) {
+    // Deep copy: arrays are mapped, other objects are rebuilt from Object.keys; everything else is returned as-is.
+    if (Array.isArray(value)) {
+      return value.map((item) => clonePlainData(item));
+    }
+    if (!value || typeof value !== "object") {
+      return value;
+    }
+    const copy = {};
+    Object.keys(value).forEach((key) => { copy[key] = clonePlainData(value[key]); });
+    return copy;
+  }
+
+  function cloneState(state) {
+    if (!state) {
+      return createInitialState(); // a falsy state yields a fresh initial state
+    }
+    const steps = {};
+    const defaultSteps = createSteps();
+    STEP_ORDER.forEach((stepId) => { // only ids in STEP_ORDER are kept; missing steps come from the defaults
+      steps[stepId] = cloneStep(state.steps && state.steps[stepId] ? state.steps[stepId] : defaultSteps[stepId]);
+    });
+    return {
+      ...state, // fields not listed below are copied shallowly
+      defaults: clonePlainData(state.defaults || {}),
+      steps,
+      candidates: Array.isArray(state.candidates) ? state.candidates.map(cloneCandidate) : [],
+      selectedPendingInputOptionId: state.selectedPendingInputOptionId || "",
+      pendingInput: clonePendingInput(state.pendingInput),
+      permission: clonePlainData(state.permission),
+      currentStepId: state.currentStepId || "",
+      userMessages: Array.isArray(state.userMessages) ? state.userMessages.map(clonePlainData) : [],
+      normalTurns: Array.isArray(state.normalTurns) ? state.normalTurns.map(clonePlainData) : [],
+      pendingNormalUserMessageId: state.pendingNormalUserMessageId || "",
+      expandedStepDetails: clonePlainData(state.expandedStepDetails || {}),
+      expandedCandidateSubpipelines: clonePlainData(state.expandedCandidateSubpipelines || {}),
+      expandedNormalProcesses: clonePlainData(state.expandedNormalProcesses || {}),
+      pipelineStarted: Boolean(state.pipelineStarted),
+      progressUi: mergeProgressUi(state.progressUi), // re-validated on every clone
+      diagnostics: cloneDiagnostics(state.diagnostics),
+    };
+  }
+
+  function pipelineFromMetadata(metadata) {
+    if (!metadata || typeof metadata !== "object") {
+      return null;
+    }
+    if (metadata.pipeline) {
+      return metadata.pipeline;
+    }
+    const iacCode = metadata.iac_code || metadata.iacCode || metadata["iac-code"];
+    if (iacCode && typeof iacCode === "object") {
+      return iacCode.pipeline || iacCode.pipelineEvent || iacCode.pipelineSnapshot || null;
+    }
+    return null;
+  }
+
+  function valueOf(source, ...keys) {
+    if (!source || typeof source !== "object") {
+      return undefined;
+    }
+    for (const key of keys) {
+      if (Object.prototype.hasOwnProperty.call(source, key)) {
+        return source[key];
+      }
+    }
+    return undefined;
+  }
+
+  function eventTypeOf(source) {
+    return valueOf(source, "eventType", "event_type");
+  }
+
+  function taskIdOf(source) {
+    return valueOf(source, "deliveryTaskId", "delivery_task_id", "taskId", "task_id");
+  }
+
+  function contextIdOf(source) {
+    return valueOf(source, "deliveryContextId", "delivery_context_id", "contextId", "context_id");
+  }
+
+  function sequenceOf(source) {
+    const sequence = valueOf(source, "sequence", "lastSequence", "last_sequence");
+    const numericSequence = Number(sequence);
+    return Number.isFinite(numericSequence) ? numericSequence : null;
+  }
+
+  function pendingInputOf(source) {
+    return valueOf(source, "pendingInput", "pending_input", "input");
+  }
+
+  function normalHandoffOf(source) {
+    return valueOf(source, "normalHandoff", "normal_handoff");
+  }
+
+  function targetModeOf(source) {
+    return valueOf(source, "targetMode", "target_mode");
+  }
+
+  function updateLastSequence(state, sequence) {
+    if (typeof sequence === "number") {
+      state.lastSequence = Math.max(state.lastSequence || 0, sequence);
+    }
+  }
+
+  function extractPipelineEnvelope(payload) {
+    if (!payload || typeof payload !== "object") {
+      return null;
+    }
+    if (Array.isArray(payload)) {
+      for (const item of payload) {
+        const envelope = extractPipelineEnvelope(item);
+        if (envelope) {
+          return envelope;
+        }
+      }
+      return null;
+    }
+
+    const metadataPipeline = pipelineFromMetadata(payload.metadata);
+    if (metadataPipeline) {
+      return metadataPipeline;
+    }
+    if (payload.iac_code && payload.iac_code.pipeline) {
+      return payload.iac_code.pipeline;
+    }
+    if (payload.iacCode && payload.iacCode.pipeline) {
+      return payload.iacCode.pipeline;
+    }
+    if (payload["iac-code"] && payload["iac-code"].pipeline) {
+      return payload["iac-code"].pipeline;
+    }
+    if (payload.pipeline || payload.pipelineEvent || payload.pipelineSnapshot) {
+      return payload.pipeline || payload.pipelineEvent || payload.pipelineSnapshot;
+    }
+    if (eventTypeOf(payload) || taskIdOf(payload) || contextIdOf(payload) || payload.step) {
+      return payload;
+    }
+
+    const wrapperKeys = [
+      "result",
+      "params",
+      "task",
+      "statusUpdate",
+      "status_update",
+      "status",
+      "message",
+      "event",
+      "events",
+      "snapshot",
+    ];
+    for (const key of wrapperKeys) {
+      if (payload[key] && typeof payload[key] === "object") {
+        const envelope = extractPipelineEnvelope(payload[key]);
+        if (envelope) {
+          return envelope;
+        }
+      }
+    }
+    return null;
+  }
+
+  function normalizeStatus(status) {
+    if (status === "input_required") {
+      return "waiting_input";
+    }
+    return status || "";
+  }
+
+  function statusFromEventType(eventType, fallbackStatus) {
+    const statuses = {
+      step_started: "working",
+      step_completed: "completed",
+      step_failed: "failed",
+      input_required: "waiting_input",
+    };
+    return statuses[eventType] || normalizeStatus(fallbackStatus);
+  }
+
+  function normalizeStepId(step) {
+    const rawStepId = typeof step === "string" ? step : step && (step.id || step.name || step.stepId);
+    if (!rawStepId) {
+      return "";
+    }
+    const stepId = String(rawStepId);
+    if (CANDIDATE_STEP_IDS.has(stepId) || stepId.startsWith("candidate_") || stepId.includes("candidate")) {
+      return "evaluate_candidates";
+    }
+    if (STEP_ORDER.includes(stepId)) {
+      return stepId;
+    }
+    return stepId;
+  }
+
+  function normalizeCandidateIndexValue(candidateIndex) {
+    if (candidateIndex === null || candidateIndex === undefined || candidateIndex === "") {
+      return candidateIndex;
+    }
+    const numericIndex = Number(candidateIndex);
+    return Number.isFinite(numericIndex) ? numericIndex : candidateIndex;
+  }
+
+  // Normalizes one candidate-like record into the candidate shape used by the
+  // console state: { name, candidateIndex, summary, template,
+  // totalMonthlyCost, outputPath, costItems }.
+  //
+  // The record may spell each field in camelCase or snake_case and may nest
+  // data under `detail`, `candidate`, `cost` or `conclusions`. Each output
+  // field is the first match in a fixed precedence chain, so the ORDER of the
+  // alternatives below is significant.
+  //
+  // Returns null when `item` is not an object.
+  function candidateFromDisplayItem(item) {
+    if (!item || typeof item !== "object") {
+      return null;
+    }
+    // Without a `detail` object, `detail` aliases `item` itself, so the
+    // detail.* lookups below simply repeat the item.* lookups.
+    const detail = item.detail && typeof item.detail === "object" ? item.detail : item;
+    const nestedCandidate =
+      item.candidate && typeof item.candidate === "object"
+        ? item.candidate
+        : detail.candidate && typeof detail.candidate === "object"
+          ? detail.candidate
+          : {};
+    const cost =
+      item.cost && typeof item.cost === "object"
+        ? item.cost
+        : detail.cost && typeof detail.cost === "object"
+          ? detail.cost
+          : {};
+    const conclusions =
+      item.conclusions && typeof item.conclusions === "object"
+        ? item.conclusions
+        : detail.conclusions && typeof detail.conclusions === "object"
+          ? detail.conclusions
+          : {};
+    const templateConclusion = conclusions.template && typeof conclusions.template === "object" ? conclusions.template : {};
+    const costConclusion = conclusions.cost && typeof conclusions.cost === "object" ? conclusions.cost : {};
+    // `cost` may be a scalar total or a breakdown object; only the scalar form
+    // is allowed into the totalMonthlyCost chain.
+    const primitiveCost = (value) => (value && typeof value === "object" ? undefined : value);
+    // `??` skips only null/undefined, so an index of 0 or "" stops the chain.
+    const candidateIndex =
+      item.candidateIndex ??
+      item.candidate_index ??
+      item.optionIndex ??
+      item.option_index ??
+      item.index ??
+      item.id ??
+      (item.candidate && item.candidate.index) ??
+      detail.candidateIndex ??
+      detail.candidate_index ??
+      detail.optionIndex ??
+      detail.option_index ??
+      detail.index ??
+      detail.id ??
+      null;
+    return {
+      // `||` chain: empty strings fall through to the next alternative.
+      name:
+        item.name ||
+        item.candidateName ||
+        item.candidate_name ||
+        detail.candidateName ||
+        detail.candidate_name ||
+        nestedCandidate.candidateName ||
+        nestedCandidate.candidate_name ||
+        detail.name ||
+        nestedCandidate.name ||
+        item.title ||
+        detail.title ||
+        nestedCandidate.title ||
+        item.label ||
+        detail.label ||
+        nestedCandidate.label ||
+        item.template ||
+        detail.template ||
+        "",
+      candidateIndex: normalizeCandidateIndexValue(candidateIndex),
+      summary:
+        item.summary ||
+        item.firstVersionDescription ||
+        item.first_version_description ||
+        item.planDescription ||
+        item.plan_description ||
+        item.pros ||
+        item.topology ||
+        detail.summary ||
+        detail.firstVersionDescription ||
+        detail.first_version_description ||
+        detail.planDescription ||
+        detail.plan_description ||
+        detail.pros ||
+        detail.topology ||
+        templateConclusion.summary ||
+        templateConclusion.description ||
+        nestedCandidate.summary ||
+        nestedCandidate.firstVersionDescription ||
+        nestedCandidate.first_version_description ||
+        item.description ||
+        detail.description ||
+        nestedCandidate.description ||
+        nestedCandidate.topology ||
+        nestedCandidate.pros ||
+        "",
+      template: item.template || detail.template || "",
+      // `??` chain: a cost of 0 (or "") is kept rather than skipped.
+      totalMonthlyCost:
+        item.totalMonthlyCost ??
+        item.total_monthly_cost ??
+        item.monthlyCost ??
+        item.monthly_cost ??
+        item.monthlyEstimate ??
+        item.monthly_estimate ??
+        item.roughMonthlyEstimate ??
+        item.rough_monthly_estimate ??
+        item.estimatedMonthlyCost ??
+        item.estimated_monthly_cost ??
+        primitiveCost(item.cost) ??
+        item.price ??
+        detail.totalMonthlyCost ??
+        detail.total_monthly_cost ??
+        detail.monthlyCost ??
+        detail.monthly_cost ??
+        detail.monthlyEstimate ??
+        detail.monthly_estimate ??
+        detail.roughMonthlyEstimate ??
+        detail.rough_monthly_estimate ??
+        detail.estimatedMonthlyCost ??
+        detail.estimated_monthly_cost ??
+        primitiveCost(detail.cost) ??
+        detail.price ??
+        cost.totalMonthlyCost ??
+        cost.total_monthly_cost ??
+        cost.monthlyCost ??
+        cost.monthly_cost ??
+        cost.monthlyEstimate ??
+        cost.monthly_estimate ??
+        costConclusion.totalMonthlyCost ??
+        costConclusion.total_monthly_cost ??
+        costConclusion.monthlyEstimate ??
+        costConclusion.monthly_estimate ??
+        nestedCandidate.totalMonthlyCost ??
+        nestedCandidate.total_monthly_cost ??
+        nestedCandidate.monthlyEstimate ??
+        nestedCandidate.monthly_estimate ??
+        "",
+      outputPath:
+        item.outputPath ||
+        item.output_path ||
+        detail.outputPath ||
+        detail.output_path ||
+        templateConclusion.outputPath ||
+        templateConclusion.output_path ||
+        templateConclusion.filePath ||
+        templateConclusion.file_path ||
+        nestedCandidate.outputPath ||
+        nestedCandidate.output_path ||
+        "",
+      // First array found wins and is deep-copied; an empty array still
+      // counts as found.
+      costItems: Array.isArray(item.costItems)
+        ? clonePlainData(item.costItems)
+        : Array.isArray(detail.costItems)
+          ? clonePlainData(detail.costItems)
+          : Array.isArray(cost.costItems)
+            ? clonePlainData(cost.costItems)
+            : Array.isArray(cost.items)
+              ? clonePlainData(cost.items)
+              : Array.isArray(cost.resources)
+                ? clonePlainData(cost.resources)
+                : Array.isArray(costConclusion.costItems)
+                  ? clonePlainData(costConclusion.costItems)
+                  : Array.isArray(costConclusion.items)
+                    ? clonePlainData(costConclusion.items)
+                    : Array.isArray(costConclusion.resources)
+                      ? clonePlainData(costConclusion.resources)
+                      : [],
+    };
+  }
+
+  function candidateIndexFromSource(source) {
+    if (!source || typeof source !== "object") {
+      return null;
+    }
+    const data = source.data && typeof source.data === "object" ? source.data : {};
+    const candidate = source.candidate && typeof source.candidate === "object" ? source.candidate : {};
+    const rawIndex =
+      source.candidateIndex ??
+      source.candidate_index ??
+      source.optionIndex ??
+      source.option_index ??
+      candidate.index ??
+      candidate.id ??
+      candidate.candidateIndex ??
+      candidate.candidate_index ??
+      data.candidateIndex ??
+      data.candidate_index ??
+      data.optionIndex ??
+      data.option_index ??
+      null;
+    const normalizedIndex = normalizeCandidateIndexValue(rawIndex);
+    return normalizedIndex === "" || normalizedIndex === null || normalizedIndex === undefined ? null : normalizedIndex;
+  }
+
+  function candidateSelectionInputKind(source) {
+    if (!source || typeof source !== "object") {
+      return "";
+    }
+    return String(source.kind || source.inputKind || source.input_kind || source.type || "");
+  }
+
+  function hasCandidateSelectionOptions(source) {
+    const kind = candidateSelectionInputKind(source);
+    return (kind === "candidate_selection" || kind === "candidate_select") && Array.isArray(source.options);
+  }
+
+  function isCandidateSubPipelineEvent(envelope, stepId) {
+    const eventType = eventTypeOf(envelope || {});
+    const candidateIndex = candidateIndexFromSource(envelope);
+    if (candidateIndex === null || candidateIndex === undefined) {
+      return false;
+    }
+    if (String(eventType || "").startsWith("candidate_step")) {
+      return true;
+    }
+    if (eventType === "candidate_started" || eventType === "candidate_completed" || eventType === "candidate_failed") {
+      return true;
+    }
+    if (envelope.candidateStep || envelope.candidate_step) {
+      return true;
+    }
+    return (
+      stepId === "evaluate_candidates" &&
+      ["text_delta", "tool_result", "tool_use", "tool_call", "tool_started", "permission_requested"].includes(eventType)
+    );
+  }
+
+  function appendCandidateSubEventInPlace(state, envelope) {
+    const candidateIndex = candidateIndexFromSource(envelope);
+    if (candidateIndex === null || candidateIndex === undefined) {
+      return state;
+    }
+    upsertCandidateInPlace(state, {
+      candidateIndex,
+      name:
+        envelope &&
+        envelope.candidate &&
+        typeof envelope.candidate === "object" &&
+        (envelope.candidate.name || envelope.candidate.title || envelope.candidate.label),
+    });
+    const targetIndex = state.candidates.findIndex(
+      (candidate) => normalizeCandidateIndexValue(candidate.candidateIndex) === candidateIndex
+    );
+    if (targetIndex < 0) {
+      return state;
+    }
+    const target = cloneCandidate(state.candidates[targetIndex]);
+    target.subEvents = Array.isArray(target.subEvents) ? target.subEvents : [];
+    target.subEvents.push(clonePlainData(envelope));
+    target.subEvents = target.subEvents.slice(-MAX_CANDIDATE_SUB_EVENTS);
+    state.candidates[targetIndex] = target;
+    return state;
+  }
+
+  // Gathers every array on `source` that may hold candidate records, in a
+  // fixed order: `source.display`, `source` itself, candidate-selection
+  // options on `source` and on its pending input, `source.conclusion`, and
+  // finally the same search applied recursively to `source.data`.
+  // Non-array values are dropped from the result. Returns [] for non-objects.
+  function candidateCollectionsFromSource(source) {
+    if (!source || typeof source !== "object") {
+      return [];
+    }
+    const collections = [];
+    // Pushes every known candidate-list field of `target` (missing fields are
+    // pushed as undefined and filtered out at the end).
+    const collectFromObject = (target, options = {}) => {
+      if (!target || typeof target !== "object") {
+        return;
+      }
+      collections.push(
+        target.candidateDetails,
+        target.candidate_details,
+        target.candidates,
+        target.draftCandidates,
+        target.draft_candidates,
+        target.planCandidates,
+        target.plan_candidates,
+        target.candidateOptions,
+        target.candidate_options,
+        target.candidateSummaries,
+        target.candidate_summaries,
+        target.plans,
+        target.proposals
+      );
+      // The generic `options` field is only collected when the caller opts in.
+      if (options.includeGenericOptions) {
+        collections.push(target.options);
+      }
+    };
+    const display = source.display && typeof source.display === "object" ? source.display : null;
+    if (display) {
+      collectFromObject(display, { includeGenericOptions: true });
+    }
+    collectFromObject(source);
+    // On the source itself, `options` only counts for candidate-selection inputs.
+    if (hasCandidateSelectionOptions(source)) {
+      collections.push(source.options);
+    }
+    const pendingInput = pendingInputOf(source);
+    if (pendingInput && typeof pendingInput === "object" && hasCandidateSelectionOptions(pendingInput)) {
+      collections.push(pendingInput.options);
+    }
+    const conclusion = source.conclusion && typeof source.conclusion === "object" ? source.conclusion : null;
+    if (conclusion) {
+      collectFromObject(conclusion, { includeGenericOptions: true });
+    }
+    const data = source.data && typeof source.data === "object" ? source.data : null;
+    // The identity check stops a record whose `data` points at itself from
+    // recursing forever.
+    if (data && data !== source) {
+      collections.push(...candidateCollectionsFromSource(data));
+    }
+    return collections.filter(Array.isArray);
+  }
+
+  function numericConclusionItems(conclusion) {
+    if (!conclusion || typeof conclusion !== "object" || Array.isArray(conclusion)) {
+      return [];
+    }
+    return Object.keys(conclusion)
+      .filter((key) => /^\d+$/.test(key) && conclusion[key] && typeof conclusion[key] === "object")
+      .map((key) => ({
+        index: Number(key),
+        candidateIndex: Number(key),
+        ...conclusion[key],
+      }));
+  }
+
+  function upsertCandidatesFromSource(state, source) {
+    candidateCollectionsFromSource(source).forEach((collection) => {
+      collection.forEach((item) => {
+        upsertCandidateInPlace(state, candidateFromDisplayItem(item));
+      });
+    });
+    const upsertNumericConclusionItems = (current) => {
+      const conclusion = current && current.conclusion && typeof current.conclusion === "object" ? current.conclusion : null;
+      numericConclusionItems(conclusion).forEach((item) => {
+        upsertCandidateInPlace(state, candidateFromDisplayItem(item));
+      });
+      const data = current && current.data && typeof current.data === "object" ? current.data : null;
+      if (data && data !== current) {
+        upsertNumericConclusionItems(data);
+      }
+    };
+    upsertNumericConclusionItems(source);
+    return state;
+  }
+
+  function candidateFromEnvelope(envelope) {
+    if (!envelope || typeof envelope !== "object") {
+      return null;
+    }
+    const data = envelope.data && typeof envelope.data === "object" ? envelope.data : {};
+    const conclusion = data.conclusion && typeof data.conclusion === "object" ? data.conclusion : {};
+    const detail =
+      data.detail && typeof data.detail === "object"
+        ? data.detail
+        : data.candidate_detail && typeof data.candidate_detail === "object"
+          ? data.candidate_detail
+          : {};
+    const eventCandidate = envelope.candidate && typeof envelope.candidate === "object" ? envelope.candidate : {};
+    const dataCandidate = data.candidate && typeof data.candidate === "object" ? data.candidate : {};
+    const conclusionCandidate =
+      conclusion.candidate && typeof conclusion.candidate === "object" ? conclusion.candidate : {};
+    const conclusions = data.conclusions && typeof data.conclusions === "object" ? data.conclusions : {};
+    const templateConclusion = conclusions.template && typeof conclusions.template === "object" ? conclusions.template : {};
+    const costConclusion = conclusions.cost && typeof conclusions.cost === "object" ? conclusions.cost : {};
+    const candidateIndex = candidateIndexFromSource(envelope);
+    return candidateFromDisplayItem({
+      ...data,
+      ...conclusion,
+      ...templateConclusion,
+      detail: Object.keys(detail).length ? detail : { ...conclusion, ...templateConclusion },
+      cost: Object.keys(costConclusion).length ? costConclusion : data.cost,
+      candidate: {
+        ...eventCandidate,
+        ...dataCandidate,
+        ...conclusionCandidate,
+      },
+      candidateIndex,
+    });
+  }
+
+  function hasCandidateValue(value) {
+    if (Array.isArray(value)) {
+      return value.length > 0;
+    }
+    return value !== "" && value !== null && value !== undefined;
+  }
+
+  function mergeCandidate(existing, candidate) {
+    const result = cloneCandidate(existing || {});
+    Object.keys(candidate || {}).forEach((key) => {
+      const value = candidate[key];
+      if (hasCandidateValue(value)) {
+        result[key] = clonePlainData(value);
+      } else if (!Object.prototype.hasOwnProperty.call(result, key)) {
+        result[key] = clonePlainData(value);
+      }
+    });
+    return cloneCandidate(result);
+  }
+
+  function upsertCandidateInPlace(state, candidate) {
+    if (!candidate) {
+      return state;
+    }
+    const nextCandidate = cloneCandidate(candidate);
+    nextCandidate.candidateIndex = normalizeCandidateIndexValue(nextCandidate.candidateIndex);
+    const hasNextIndex = nextCandidate.candidateIndex !== null && nextCandidate.candidateIndex !== undefined;
+    const index = state.candidates.findIndex((existing) => {
+      if (hasNextIndex && normalizeCandidateIndexValue(existing.candidateIndex) === nextCandidate.candidateIndex) {
+        return true;
+      }
+      if (existing.name && nextCandidate.name && existing.name === nextCandidate.name) {
+        return true;
+      }
+      return false;
+    });
+    if (index >= 0) {
+      state.candidates[index] = mergeCandidate(state.candidates[index], nextCandidate);
+    } else {
+      state.candidates.push(nextCandidate);
+    }
+    return state;
+  }
+
+  function upsertCandidate(state, candidate) {
+    const nextState = cloneState(state);
+    return upsertCandidateInPlace(nextState, candidate);
+  }
+
+  function pendingInputFromSnapshot(snapshot) {
+    const pendingInput = pendingInputOf(snapshot);
+    if (!pendingInput) {
+      return null;
+    }
+    return pendingInputFromInput(pendingInput);
+  }
+
+  function pendingInputFromInput(input) {
+    if (!input || typeof input !== "object") {
+      return null;
+    }
+    const pendingInput = clonePlainData(input);
+    return {
+      ...pendingInput,
+      prompt: pendingInput.prompt || pendingInput.question || "",
+      options: Array.isArray(pendingInput.options) ? pendingInput.options : [],
+    };
+  }
+
+  // Folds a pipeline snapshot into `state` (mutating it) and returns `state`.
+  // Updates task/context ids, the last seen sequence, the overall and
+  // per-step statuses, the candidate list, the pending input and the
+  // normal-mode handoff flag. Non-object snapshots are ignored.
+  function applySnapshot(state, snapshot) {
+    if (!snapshot || typeof snapshot !== "object") {
+      return state;
+    }
+    const taskId = taskIdOf(snapshot);
+    if (taskId) {
+      state.pipelineTaskId = taskId;
+    }
+    const contextId = contextIdOf(snapshot);
+    if (contextId) {
+      state.contextId = contextId;
+    }
+    updateLastSequence(state, sequenceOf(snapshot));
+    if (snapshot.status) {
+      state.status = normalizeStatus(snapshot.status);
+      // Any status other than "idle" means the pipeline has started.
+      if (state.status && state.status !== "idle") {
+        state.pipelineStarted = true;
+      }
+    }
+
+    if (Array.isArray(snapshot.steps)) {
+      snapshot.steps.forEach((step) => {
+        const stepId = normalizeStepId(step);
+        // Steps that are not part of the known step map are skipped.
+        if (stepId && state.steps[stepId]) {
+          // Keep the current status when the snapshot step carries none.
+          const status = normalizeStatus(step.status) || state.steps[stepId].status;
+          state.steps[stepId].status = status;
+          if (status && status !== "pending") {
+            state.pipelineStarted = true;
+          }
+          // When several steps are active, the last one in the list wins.
+          if (status === "working" || status === "waiting_input") {
+            state.currentStepId = stepId;
+          }
+        }
+      });
+    }
+
+    upsertCandidatesFromSource(state, snapshot);
+
+    const pendingInput = pendingInputFromSnapshot(snapshot);
+    // An explicit pendingInput/pending_input key is authoritative, even when
+    // it clears the pending input; the generic `input` key (also read by
+    // pendingInputOf) only sets it when it yields a value.
+    if (
+      Object.prototype.hasOwnProperty.call(snapshot, "pendingInput") ||
+      Object.prototype.hasOwnProperty.call(snapshot, "pending_input")
+    ) {
+      state.pendingInput = pendingInputFromInput(pendingInputOf(snapshot));
+    } else if (pendingInput) {
+      state.pendingInput = pendingInput;
+    }
+
+    const normalHandoff = normalHandoffOf(snapshot);
+    if (
+      normalHandoff &&
+      typeof normalHandoff === "object" &&
+      normalHandoff.action === "switch_to_normal" &&
+      targetModeOf(normalHandoff) === "normal"
+    ) {
+      state.normalHandoffReady = true;
+      state.activeTaskId = "";
+    }
+    return state;
+  }
+
+  function currentStepIdFromState(state) {
+    const isActive = (stepId) => {
+      const status = stepStatusClass(normalizeStatus(state && state.steps && state.steps[stepId] && state.steps[stepId].status));
+      return status === "working" || status === "waiting_input";
+    };
+    if (state && state.currentStepId && state.steps && state.steps[state.currentStepId] && isActive(state.currentStepId)) {
+      return state.currentStepId;
+    }
+    const activeStepId = STEP_ORDER.find((stepId) => isActive(stepId));
+    return activeStepId || "";
+  }
+
+  function inferredStepIdForEvent(state, envelope, explicitStepId) {
+    if (explicitStepId) {
+      return explicitStepId;
+    }
+    if (!CURRENT_STEP_EVENT_TYPES.has(eventTypeOf(envelope))) {
+      return "";
+    }
+    return currentStepIdFromState(state);
+  }
+
+  // Folds a single pipeline event envelope into `state` (mutating it) and
+  // returns `state`. Updates ids, sequence and overall status, records the
+  // event on its step, routes candidate sub-pipeline events, upserts
+  // candidates, and maintains the pending input and normal-mode handoff
+  // flags. A falsy envelope is a no-op.
+  function applyPipelineEnvelope(state, envelope) {
+    if (!envelope) {
+      return state;
+    }
+    const eventType = eventTypeOf(envelope);
+    const taskId = taskIdOf(envelope);
+    if (taskId) {
+      state.pipelineTaskId = taskId;
+    }
+    const contextId = contextIdOf(envelope);
+    if (contextId) {
+      state.contextId = contextId;
+    }
+    updateLastSequence(state, sequenceOf(envelope));
+    if (envelope.status) {
+      state.status = normalizeStatus(envelope.status);
+    }
+
+    // Events without an explicit step may be attributed to the active step.
+    const explicitStepId = normalizeStepId(envelope.step);
+    const stepId = inferredStepIdForEvent(state, envelope, explicitStepId);
+    if (eventType === "pipeline_started" || stepId) {
+      state.pipelineStarted = true;
+    }
+    if (stepId && state.steps[stepId]) {
+      state.currentStepId = stepId;
+      // Status precedence: event type mapping, then step/envelope status,
+      // then whatever the step already had.
+      state.steps[stepId].status =
+        statusFromEventType(eventType, (envelope.step && envelope.step.status) || envelope.status) ||
+        state.steps[stepId].status;
+      state.steps[stepId].events.push(clonePlainData(envelope));
+      // A completed step has its detail panel collapsed.
+      if (eventType === "step_completed" && state.expandedStepDetails) {
+        state.expandedStepDetails[stepId] = false;
+      }
+    }
+    if (isCandidateSubPipelineEvent(envelope, stepId)) {
+      appendCandidateSubEventInPlace(state, envelope);
+    }
+
+    const data = envelope.data || {};
+    if (eventType === "candidate_completed" || eventType === "candidate_failed") {
+      upsertCandidateInPlace(state, candidateFromEnvelope(envelope));
+      const candidateIndex = candidateIndexFromSource(envelope);
+      // A finished candidate has its sub-pipeline panel collapsed.
+      if (candidateIndex !== null && candidateIndex !== undefined) {
+        state.expandedCandidateSubpipelines = state.expandedCandidateSubpipelines || {};
+        state.expandedCandidateSubpipelines[String(candidateIndex)] = false;
+      }
+    }
+    if (eventType === "candidate_detail_shown") {
+      upsertCandidateInPlace(
+        state,
+        candidateFromDisplayItem({
+          ...data,
+          candidate: envelope.candidate || data.candidate,
+          step: envelope.step || data.step,
+        })
+      );
+    }
+    upsertCandidatesFromSource(state, envelope);
+    if (eventType === "input_required") {
+      // Fall back to `data` when the envelope has no dedicated input field.
+      state.pendingInput = pendingInputFromInput(pendingInputOf(envelope) || data);
+    }
+    if (eventType === "input_received") {
+      state.pendingInput = null;
+    }
+    if (
+      eventType === "pipeline_handoff_ready" ||
+      (data.action === "switch_to_normal" && targetModeOf(data) === "normal")
+    ) {
+      state.normalHandoffReady = true;
+      state.activeTaskId = "";
+      if (envelope.status) {
+        state.status = normalizeStatus(envelope.status);
+      }
+    }
+    return state;
+  }
+
+  function isSnapshotLike(payload) {
+    if (!payload || typeof payload !== "object") {
+      return false;
+    }
+    if (eventTypeOf(payload)) {
+      return false;
+    }
+    return Boolean(
+      payload.display ||
+        Object.prototype.hasOwnProperty.call(payload, "pendingInput") ||
+        Object.prototype.hasOwnProperty.call(payload, "pending_input") ||
+        normalHandoffOf(payload) ||
+        taskIdOf(payload) ||
+        contextIdOf(payload) ||
+        sequenceOf(payload) !== null ||
+        Array.isArray(payload.steps)
+    );
+  }
+
+  function reducePipelinePayload(state, payload) {
+    const nextState = cloneState(state);
+    const hasEvents = payload && Array.isArray(payload.events);
+    applyPipelineEnvelope(nextState, hasEvents ? null : extractPipelineEnvelope(payload));
+    if (payload && payload.snapshot) {
+      applySnapshot(nextState, payload.snapshot);
+    } else if (isSnapshotLike(payload)) {
+      applySnapshot(nextState, payload);
+    }
+    if (payload && Array.isArray(payload.events)) {
+      payload.events.forEach((event) => {
+        applyPipelineEnvelope(nextState, extractPipelineEnvelope(event));
+      });
+    }
+    applyNormalChatPayload(nextState, payload);
+    return nextState;
+  }
+
+  function a2aSource(payload) {
+    if (!payload || typeof payload !== "object") {
+      return null;
+    }
+    if (Array.isArray(payload)) {
+      for (const item of payload) {
+        const source = a2aSource(item);
+        if (source) {
+          return source;
+        }
+      }
+      return null;
+    }
+    if (payload.status && typeof payload.status === "object") {
+      return payload;
+    }
+    if (payload.metadata && typeof payload.metadata === "object") {
+      return payload;
+    }
+    for (const key of ["result", "params", "event", "task"]) {
+      if (payload[key] && typeof payload[key] === "object") {
+        const source = a2aSource(payload[key]);
+        if (source) {
+          return source;
+        }
+      }
+    }
+    return null;
+  }
+
+  function a2aTaskId(source) {
+    return (
+      taskIdOf(source || {}) ||
+      valueOf(source || {}, "id") ||
+      (source && source.task && typeof source.task === "object" && (taskIdOf(source.task) || source.task.id)) ||
+      ""
+    );
+  }
+
+  function normalizeA2aState(value) {
+    if (!value) {
+      return "";
+    }
+    const normalized = String(value)
+      .trim()
+      .toLowerCase()
+      .replace(/^task_state_/, "")
+      .replace(/-/g, "_");
+    if (normalized === "input_required") {
+      return "completed";
+    }
+    if (normalized === "completed" || normalized === "failed" || normalized === "canceled" || normalized === "working") {
+      return normalized;
+    }
+    return normalized;
+  }
+
+  function partText(part) {
+    if (typeof part === "string") {
+      return part;
+    }
+    if (!part || typeof part !== "object") {
+      return "";
+    }
+    if (typeof part.text === "string") {
+      return part.text;
+    }
+    if (part.root && typeof part.root === "object") {
+      return partText(part.root);
+    }
+    if (part.data && typeof part.data === "object" && typeof part.data.text === "string") {
+      return part.data.text;
+    }
+    return "";
+  }
+
+  function contentBlockText(block) {
+    if (typeof block === "string") {
+      return block;
+    }
+    if (!block || typeof block !== "object") {
+      return "";
+    }
+    const type = String(block.type || block.kind || "").toLowerCase();
+    if (type && type !== "text" && type !== "output_text") {
+      return "";
+    }
+    if (typeof block.text === "string") {
+      return block.text;
+    }
+    if (typeof block.content === "string") {
+      return block.content;
+    }
+    return partText(block);
+  }
+
+  function messageText(message) {
+    if (typeof message === "string") {
+      return message;
+    }
+    if (!message || typeof message !== "object") {
+      return "";
+    }
+    if (typeof message.text === "string") {
+      return message.text;
+    }
+    if (Array.isArray(message.content)) {
+      return message.content.map(contentBlockText).join("");
+    }
+    const parts = Array.isArray(message.parts) ? message.parts : [];
+    return parts.map(partText).join("");
+  }
+
+  // Returns the text of the newest agent/assistant entry that has any text.
+  // History is read from `source.history`, else `source.task.history`; entries are
+  // scanned newest-first and "" is returned when nothing qualifies.
+  function agentHistoryEntryText(source) {
+    let history = [];
+    if (Array.isArray(source && source.history)) {
+      history = source.history;
+    } else if (Array.isArray(source && source.task && source.task.history)) {
+      history = source.task.history;
+    }
+    const agentRoles = ["agent", "assistant"];
+    for (const entry of history.slice().reverse()) {
+      // Roles are compared case-insensitively with any leading "role_" removed.
+      const role = String((entry && entry.role) || "").toLowerCase().replace(/^role_/, "");
+      const text = agentRoles.includes(role) ? messageText(entry) : "";
+      if (text) {
+        return text;
+      }
+    }
+    return "";
+  }
+
+  // Picks the answer text for a payload. Text from `status.message` (else
+  // `source.message`) is a live chunk to append (replace: false); otherwise the
+  // newest agent history text is used and flagged replace: true.
+  function normalAnswerFromSource(source, status) {
+    const live = messageText((status && status.message) || (source && source.message));
+    const fromHistory = live ? "" : agentHistoryEntryText(source);
+    return { text: live || fromHistory || "", replace: Boolean(fromHistory) };
+  }
+
+  // Merges a new answer chunk into the accumulated answer. Without `replace` the
+  // chunk is appended. With `replace`, when one text contains the other the longer
+  // one wins (ties go to `next`); unrelated texts are concatenated.
+  function mergeNormalAnswer(existing, next, replace) {
+    const current = existing || "";
+    if (!next) {
+      return current;
+    }
+    if (replace && !existing) {
+      return next;
+    }
+    // Containment is only checked in replace mode, where both texts are non-empty.
+    const overlaps = replace && (next.includes(existing) || existing.includes(next));
+    return overlaps ? (next.length >= existing.length ? next : existing) : `${current}${next}`;
+  }
+
+  // Locates the iac-code metadata of a payload. `source.metadata` is searched
+  // before `source.status.metadata`, each under the keys iac_code, iacCode and
+  // "iac-code"; the first truthy value wins and null means none was found.
+  function iacMetadata(source) {
+    const asObject = (value) => (value && typeof value === "object" ? value : {});
+    const bags = [asObject(source && source.metadata), asObject(source && source.status && source.status.metadata)];
+    const keys = ["iac_code", "iacCode", "iac-code"];
+    for (const bag of bags) {
+      for (const key of keys) {
+        if (bag[key]) {
+          return bag[key];
+        }
+      }
+    }
+    return null;
+  }
+
+  // Reduces a metadata value to display text and always returns a string.
+  // Objects yield the first usable field among content/text/summary/safeSummary/
+  // message/error; fields are reduced recursively (arrays are joined) so a nested
+  // object can no longer leak out and render as "[object Object]".
+  function compactValueText(value) {
+    const reduce = (current, depth) => {
+      if (typeof current === "string") {
+        return current;
+      }
+      if (typeof current === "number" || typeof current === "boolean") {
+        return String(current);
+      }
+      if (current === null || typeof current !== "object" || depth > 4) {
+        return ""; // depth cap guards against pathological or cyclic nesting
+      }
+      if (Array.isArray(current)) {
+        return current.map((item) => reduce(item, depth + 1)).join("");
+      }
+      const fields = ["content", "text", "summary", "safeSummary", "message", "error"].map((key) => current[key]);
+      return fields.filter(Boolean).map((field) => reduce(field, depth + 1)).find(Boolean) || "";
+    };
+    return reduce(value, 0);
+  }
+
+  // Describes a tool event as "<name> <status> <detail>" with empty pieces left
+  // out. Known status codes are shown with their Chinese label; the detail is the
+  // compact text of the first truthy of result, artifact, input, partialJson.
+  // Returns "" for a non-object `tool`.
+  function normalToolText(tool) {
+    if (tool === null || typeof tool !== "object") {
+      return "";
+    }
+    const statusMap = { started: "开始", input_delta: "输入中", input_complete: "输入完成", completed: "完成", failed: "失败" };
+    const pieces = [
+      tool.name || tool.toolName || "工具",
+      statusMap[tool.status] || tool.status || "",
+      compactValueText(tool.result || tool.artifact || tool.input || tool.partialJson),
+    ];
+    return pieces.filter(Boolean).join(" ");
+  }
+
+  // Translates iac-code metadata into display events, always in the order
+  // thinking, tool, permission, error. A section is used only when it is an
+  // object; thinking, tool and error are dropped when they yield no text, while
+  // permission always falls back to a default label. Returns [] for non-objects.
+  function normalEventsFromMetadata(metadata) {
+    if (metadata === null || typeof metadata !== "object") {
+      return [];
+    }
+    const isObject = (value) => Boolean(value) && typeof value === "object";
+    const { thinking, tool, permission, error } = metadata;
+    const drafts = [];
+    if (isObject(thinking)) {
+      const text = compactValueText(thinking.text || thinking);
+      drafts.push({ kind: "thinking", label: "思考", text });
+    }
+    if (isObject(tool)) {
+      drafts.push({ kind: "tool", label: "工具", text: normalToolText(tool) });
+    }
+    if (isObject(permission)) {
+      const text = permission.toolName || permission.tool_name || "权限确认";
+      drafts.push({ kind: "permission", label: "权限", text });
+    }
+    if (isObject(error)) {
+      const text = compactValueText(error.message || error.error || error);
+      drafts.push({ kind: "error", label: "异常", text });
+    }
+    // Sections that produced no text are dropped.
+    return drafts.filter((event) => event.text);
+  }
+
+  // Key of the newest user message placed "after_normal_handoff", or "" when none exists.
+  function lastNormalUserMessageId(state) {
+    const messages = Array.isArray(state && state.userMessages) ? state.userMessages : [];
+    let index = messages.length;
+    while (index-- > 0) {
+      if (userMessagePlacement(messages[index]).position === "after_normal_handoff") {
+        return userMessageKey(messages[index], index);
+      }
+    }
+    return "";
+  }
+
+  // Returns the normal-chat turn matching `taskId` (by taskId or id), creating a fresh
+  // "working" turn when absent and `shouldCreate` is set; null otherwise. Mutates `state`.
+  function normalTurnForEvent(state, taskId, shouldCreate) {
+    if (!Array.isArray(state.normalTurns)) {
+      state.normalTurns = [];
+    }
+    const turns = state.normalTurns;
+    const id = taskId || `normal-turn-${turns.length + 1}`;
+    let turn = turns.find((item) => item && (item.taskId === taskId || item.id === id));
+    if (!turn) {
+      if (!shouldCreate) {
+        return null;
+      }
+      const afterUserMessageId = state.pendingNormalUserMessageId || lastNormalUserMessageId(state);
+      turn = { id, taskId, afterUserMessageId, status: "working", answer: "", events: [] };
+      turns.push(turn);
+      state.pendingNormalUserMessageId = "";
+    }
+    if (!Array.isArray(turn.events)) {
+      turn.events = [];
+    }
+    return turn;
+  }
+
+  // Folds one post-handoff A2A payload into the normal-chat turns on `state`.
+  // Ignored when the handoff is not ready, when the payload is a typed pipeline
+  // event, or when no A2A source can be extracted. Otherwise the matching turn
+  // (created on demand) gets its answer merged, its metadata events appended
+  // (capped at the newest 80) and its status updated. Returns `state`.
+  function applyNormalChatPayload(state, payload) {
+    if (!state || !state.normalHandoffReady) {
+      return state;
+    }
+    const pipelineEnvelope = extractPipelineEnvelope(payload);
+    const isPipelineEvent = Boolean(pipelineEnvelope && eventTypeOf(pipelineEnvelope));
+    const source = isPipelineEvent ? null : a2aSource(payload);
+    if (!source) {
+      return state;
+    }
+    const status = source.status && typeof source.status === "object" ? source.status : {};
+    const stateValue = normalizeA2aState(status.state || source.state || source.status);
+    const answer = normalAnswerFromSource(source, status);
+    const events = normalEventsFromMetadata(iacMetadata(source));
+    const taskId = a2aTaskId(source);
+    const shouldCreate = Boolean(answer.text || events.length || stateValue === "working");
+    const turn = normalTurnForEvent(state, taskId, shouldCreate);
+    if (!turn) {
+      return state;
+    }
+    if (taskId) {
+      turn.taskId = taskId;
+    }
+    if (answer.text) {
+      turn.answer = mergeNormalAnswer(turn.answer, answer.text, answer.replace);
+    }
+    events.forEach((event) => turn.events.push(clonePlainData(event)));
+    turn.events = turn.events.slice(-80);
+    const passThroughStates = ["working", "failed", "canceled"];
+    if (passThroughStates.includes(stateValue)) {
+      turn.status = stateValue;
+    } else if (stateValue) {
+      // Any other non-empty state is recorded as completed.
+      turn.status = "completed";
+    }
+    return state;
+  }
+
+  // Builds the request body for a stream call. After the normal handoff the task
+  // id is blank; before it, the active task id (else the pipeline task id) is sent.
+  function buildStreamPayload(state, prompt) {
+    const { serverUrl, cwd, contextId, normalHandoffReady, activeTaskId, pipelineTaskId } =
+      state && typeof state === "object" ? state : {};
+    const taskId = normalHandoffReady ? "" : activeTaskId || pipelineTaskId || "";
+    return {
+      serverUrl: serverUrl || "", cwd: cwd || "", contextId: contextId || "", taskId, prompt: prompt || "",
+    };
+  }
+
+  // Stores the chosen index on `state`; blank input clears it, because Number() would turn null and "" into 0.
+  function selectCandidate(state, candidateIndex) {
+    const isBlank = candidateIndex === null || candidateIndex === undefined || String(candidateIndex).trim() === "";
+    const selectedCandidateIndex = !isBlank && Number.isFinite(Number(candidateIndex)) ? Number(candidateIndex) : null;
+    return Object.assign(state && typeof state === "object" ? state : createInitialState(), { selectedCandidateIndex });
+  }
+
+  // Builds the "选择方案N" prompt for the selected candidate. Returns "" when nothing is
+  // selected: null/undefined, a blank string (Number("") reads as 0) or a non-finite value.
+  function promptForSelectedCandidate(state) {
+    const selected = state ? state.selectedCandidateIndex : null;
+    if (selected === null || selected === undefined || String(selected).trim() === "") {
+      return "";
+    }
+    const numericIndex = Number(selected);
+    return Number.isFinite(numericIndex) ? `选择方案${numericIndex}` : "";
+  }
+
+  window.SellingConsoleReducers = { // publishes the reducer helpers listed below on `window`
+    STEP_ORDER,
+    STEP_LABELS,
+    createInitialState,
+    extractPipelineEnvelope,
+    normalizeStepId,
+    upsertCandidate,
+    reducePipelinePayload,
+    candidateFromDisplayItem,
+    pendingInputFromSnapshot,
+    buildStreamPayload,
+    selectCandidate,
+    promptForSelectedCandidate,
+  };
+
+  const STEP_DESCRIPTIONS = { // one descriptive sentence per pipeline step id
+    intent_parsing: "识别业务目标、地域、预算与部署约束。",
+    architecture_planning: "拆解网络、计算、存储与安全资源拓扑。",
+    evaluate_candidates: "比较规格、可用区、成本与运维复杂度。",
+    confirm_and_select: "确认推荐方案并准备转入标准部署流程。",
+    deploying: "复核资源清单、交付方式与后续部署动作。",
+  };
+  const CONCLUSION_FIELD_LABELS = { // display labels for conclusion keys; read by friendlyFieldLabel
+    architecture: "架构",
+    budget: "预算",
+    intent: "需求",
+    isInfraIntent: "基础设施需求",
+    is_infra_intent: "基础设施需求",
+    objective: "目标",
+    plan: "方案",
+    reason: "原因",
+    recommendation: "推荐",
+    region: "地域",
+    scenario: "场景",
+    selectedOption: "已选方案",
+    selectedValue: "已选项",
+    summary: "总结",
+  };
+  const STATUS_LABELS = { // default label per status; read by statusLabel
+    idle: "等待输入",
+    pending: "未开始",
+    working: "进行中",
+    completed: "已完成",
+    waiting_input: "等待输入",
+    failed: "失败",
+    error: "失败",
+  };
+  const PROGRESS_STATUS_LABELS = { // labels tried first by progressStatusLabel
+    pending: "待开始",
+    working: "思考中",
+    completed: "完成",
+    waiting_input: "待确认",
+    failed: "失败",
+    error: "失败",
+  };
+  const STEP_DETAIL_STATUS_LABELS = { // labels tried first by stepDetailStatusLabel
+    working: "思考中",
+    completed: "思考完成",
+    waiting_input: "等待确认",
+    failed: "执行失败",
+    error: "执行失败",
+  };
+  const STEP_STATUS_CLASSES = new Set(["pending", "working", "completed", "waiting_input", "failed", "error"]); // statuses accepted by stepStatusClass
+
+  const controller = { // module-level mutable holder; presumably UI state plus progress animation/timer handles — confirm against its users
+    state: null,
+    bound: false,
+    progressAnimationFrame: null,
+    progressAnimationToken: 0,
+    progressRunTimer: 0,
+    progressWaitTimer: 0,
+  };
+
+  function hasDocument() { // true when a global `document` is defined and non-null
+    return typeof document !== "undefined" && document !== null;
+  }
+
+  function canCreateElements() { // true when a document exists and exposes createElement()
+    return hasDocument() && typeof document.createElement === "function";
+  }
+
+  // Returns document.querySelector(selector), or null when there is no document
+  // or it has no querySelector function.
+  function query(selector) {
+    const usable = hasDocument() && typeof document.querySelector === "function";
+    return usable ? document.querySelector(selector) : null;
+  }
+
+  // Looks an element up by id. Uses document.getElementById when available and
+  // falls back to query(`#id`); returns null when there is no document.
+  function byId(id) {
+    if (!hasDocument()) {
+      return null;
+    }
+    const viaGetById = typeof document.getElementById === "function";
+    return viaGetById ? document.getElementById(id) : query(`#${id}`);
+  }
+
+  // Empties `element` (no-op when it is missing). Uses replaceChildren() or removeChild();
+  // textContent is always blanked last, so children cannot survive when neither exists.
+  function clearElement(element) {
+    if (!element) {
+      return;
+    }
+    if (typeof element.replaceChildren === "function") {
+      element.replaceChildren();
+      return;
+    }
+    while (element.firstChild && typeof element.removeChild === "function") {
+      element.removeChild(element.firstChild);
+    }
+    element.textContent = "";
+  }
+
+  function appendChild(parent, child) { // null-safe parent.appendChild(child); does nothing when either is missing
+    if (parent && child && typeof parent.appendChild === "function") {
+      parent.appendChild(child);
+    }
+  }
+
+  // Creates an element (SVG-namespaced for "svg"/"path" when createElementNS
+  // exists), optionally setting its class and text. Returns null without a DOM.
+  function createElement(tagName, className, text) {
+    if (!canCreateElements()) {
+      return null;
+    }
+    const isSvgTag = tagName === "svg" || tagName === "path";
+    const element =
+      isSvgTag && typeof document.createElementNS === "function"
+        ? document.createElementNS("http://www.w3.org/2000/svg", tagName)
+        : document.createElement(tagName);
+    if (className && typeof element.setAttribute === "function") {
+      element.setAttribute("class", className);
+    } else if (className) {
+      element.className = className;
+    }
+    if (text !== undefined && text !== null) {
+      element.textContent = String(text);
+    }
+    return element;
+  }
+
+  // Adds the whitespace-separated class names in `className` to `element`,
+  // keeping existing classes, dropping duplicates and preserving order. Reads
+  // the "class" attribute (else `className`) and writes back through
+  // setAttribute when available. Returns `element`.
+  function addClassName(element, className) {
+    if (!element || !className) {
+      return element;
+    }
+    const tokens = (value) => String(value || "").split(/\s+/).filter(Boolean);
+    const fromAttribute = typeof element.getAttribute === "function" && element.getAttribute("class");
+    const merged = new Set([...tokens(fromAttribute || element.className || ""), ...tokens(className)]);
+    const nextClassName = [...merged].join(" ");
+    if (typeof element.setAttribute === "function") {
+      element.setAttribute("class", nextClassName);
+    } else {
+      element.className = nextClassName;
+    }
+    return element;
+  }
+
+  function markMarkdownNode(element, kind) { // tags element with data-markdown-node=kind when both are truthy; returns element
+    if (element && kind) {
+      element.setAttribute("data-markdown-node", kind);
+    }
+    return element;
+  }
+
+  // Returns the trimmed URL when it starts with http:, https: or mailto:
+  // (case-insensitive); any other value yields "".
+  function safeMarkdownUrl(value) {
+    const url = String(value || "").trim();
+    const allowed = /^(https?:|mailto:)/i.test(url);
+    return allowed ? url : "";
+  }
+
+  // Renders inline markdown into `parent`: **bold** -> <strong>, `code` -> <code>, [label](url) -> <a>;
+  // text between tokens becomes <span>. A link gets href/target/rel only when safeMarkdownUrl accepts it.
+  function appendInlineMarkdown(parent, text) {
+    if (!parent) {
+      return;
+    }
+    const source = String(text || "");
+    const tokenPattern = /(\*\*[^*]+\*\*|`[^`]+`|\[[^\]]+\]\([^)]+\))/g;
+    let cursor = 0;
+    for (let found = tokenPattern.exec(source); found !== null; found = tokenPattern.exec(source)) {
+      const token = found[0];
+      if (found.index > cursor) {
+        appendChild(parent, createElement("span", "", source.slice(cursor, found.index)));
+      }
+      if (token.startsWith("**")) {
+        appendChild(parent, markMarkdownNode(createElement("strong", "", token.slice(2, -2)), "strong"));
+      } else if (token.startsWith("`")) {
+        appendChild(parent, markMarkdownNode(createElement("code", "", token.slice(1, -1)), "code"));
+      } else {
+        const [, label, target] = token.match(/^\[([^\]]+)\]\(([^)]+)\)$/) || [null, token, ""];
+        const link = createElement("a", "", label);
+        const href = safeMarkdownUrl(target);
+        if (link && href) {
+          [["href", href], ["target", "_blank"], ["rel", "noreferrer"]].forEach(([name, value]) => link.setAttribute(name, value));
+        }
+        appendChild(parent, markMarkdownNode(link, "a"));
+      }
+      cursor = found.index + token.length;
+    }
+    if (cursor < source.length) {
+      appendChild(parent, createElement("span", "", source.slice(cursor)));
+    }
+  }
+
+  // Splits text into lines after normalizing CR/CRLF to "\n" and moving inline "N. " / "N) " markers onto their own line.
+  function markdownLines(value) {
+    const normalized = String(value || "").replace(/\r\n?/g, "\n");
+    const withListBreaks = normalized.replace(/([^\n])\s+(\d+[.)]\s+)/g, "$1\n$2");
+    return withListBreaks.split("\n");
+  }
+
+  // Renders a small markdown subset into a <div>: blank lines separate
+  // paragraphs, runs of "- " / "* " lines become a <ul> and runs of "N. " / "N) "
+  // lines become an <ol>; inline markup is handled by appendInlineMarkdown.
+  // Returns the container, which is null when elements cannot be created.
+  // NOTE(review): <ol> is tagged with data-markdown-node but <ul> is not — confirm intended.
+  function renderMarkdownText(value, className) {
+    const container = createElement("div", className || "markdown-text");
+    if (container) {
+      container.setAttribute("data-markdown-rendered", "true");
+    }
+    const bulletPattern = /^[-*]\s+/;
+    const numberPattern = /^\d+[.)]\s+/;
+    const lines = markdownLines(value);
+    let paragraph = [];
+    const flushParagraph = () => {
+      if (paragraph.length > 0) {
+        const node = createElement("p");
+        appendInlineMarkdown(node, paragraph.join(" ").trim());
+        appendChild(container, node);
+        paragraph = [];
+      }
+    };
+    // Consumes the run of list lines starting at `start`; returns the index after it.
+    const appendList = (list, pattern, start) => {
+      let next = start;
+      while (next < lines.length && pattern.test(lines[next].trim())) {
+        const item = markMarkdownNode(createElement("li"), "li");
+        appendInlineMarkdown(item, lines[next].trim().replace(pattern, ""));
+        appendChild(list, item);
+        next += 1;
+      }
+      appendChild(container, list);
+      return next;
+    };
+    let index = 0;
+    while (index < lines.length) {
+      const trimmed = lines[index].trim();
+      if (!trimmed) {
+        flushParagraph();
+        index += 1;
+      } else if (bulletPattern.test(trimmed)) {
+        flushParagraph();
+        index = appendList(createElement("ul"), bulletPattern, index);
+      } else if (numberPattern.test(trimmed)) {
+        flushParagraph();
+        index = appendList(markMarkdownNode(createElement("ol"), "ol"), numberPattern, index);
+      } else {
+        paragraph.push(trimmed);
+        index += 1;
+      }
+    }
+    flushParagraph();
+    if (container && container.children.length === 0) {
+      appendChild(container, createElement("p", "", ""));
+    }
+    return container;
+  }
+
+  function statusLabel(status) { // STATUS_LABELS entry, else the raw status, else the "waiting for input" label
+    return STATUS_LABELS[status] || status || "等待输入";
+  }
+
+  function stepStatusClass(status) { // passes through statuses in STEP_STATUS_CLASSES; anything else becomes "pending"
+    return STEP_STATUS_CLASSES.has(status) ? status : "pending";
+  }
+
+  function progressStatusLabel(status) { // PROGRESS_STATUS_LABELS entry, falling back to statusLabel(status)
+    return PROGRESS_STATUS_LABELS[status] || statusLabel(status);
+  }
+
+  function stepDetailStatusLabel(status) { // STEP_DETAIL_STATUS_LABELS entry, falling back to statusLabel(status)
+    return STEP_DETAIL_STATUS_LABELS[status] || statusLabel(status);
+  }
+
+  // Returns the one-character badge shown for a step status, or "" when the
+  // status has no badge.
+  function stepStateIcon(status) {
+    // "error" and "failed" share the same badge.
+    const failureIcon = "!";
+    const icons = { completed: "✓", error: failureIcon, failed: failureIcon, waiting_input: "?", working: "…" };
+    const icon = icons[status];
+    // Statuses without an entry produce no badge.
+    return icon || "";
+  }
+
+  function stepIsVisible(step) { // a step is shown once it has left "pending" or has at least one event
+    const status = stepStatusClass(normalizeStatus(step && step.status) || "pending");
+    return status !== "pending" || (Array.isArray(step && step.events) && step.events.length > 0);
+  }
+
+  function stepIsOpen(status) { // true only for "working" and "waiting_input"
+    return status === "working" || status === "waiting_input";
+  }
+
+  function eventData(event) { // event.data when it is an object, otherwise {} (also for a null event)
+    return event && event.data && typeof event.data === "object" ? event.data : {};
+  }
+
+  // Returns the first usable value among `keys` of `source`, converted to a
+  // string. Falsy values other than 0 are skipped. Objects, arrays and functions
+  // are skipped too: String() would turn them into "[object Object]"-style noise
+  // and hide a later key that does hold readable text.
+  function firstTextValue(source, keys) {
+    if (!source || typeof source !== "object") {
+      return "";
+    }
+    const isText = (value) => (value === 0 || Boolean(value)) && typeof value !== "object" && typeof value !== "function";
+    const hit = Array.from(keys, (key) => source[key]).find(isText);
+    return hit === undefined ? "" : String(hit);
+  }
+
+  function friendlyFieldLabel(key) { // CONCLUSION_FIELD_LABELS entry, else the key with underscores shown as spaces
+    return CONCLUSION_FIELD_LABELS[key] || key.replace(/_/g, " ");
+  }
+
+  // Formats a conclusion field value for display. Booleans become 是/否, arrays
+  // show up to three non-empty items joined by "、", objects are summarised by
+  // conclusionText, and any other value is stringified ("" for empty values,
+  // with 0 kept as "0").
+  function friendlyValue(value) {
+    if (typeof value === "boolean") {
+      return value ? "是" : "否";
+    }
+    // Stringifies a scalar, treating every falsy value except 0 as empty.
+    const scalarText = (item) => (item === 0 || item ? String(item) : "");
+    if (Array.isArray(value)) {
+      const itemKeys = ["title", "name", "label", "summary", "description"];
+      // Object items are represented by their first title-like field.
+      const texts = value.map((item) =>
+        item && typeof item === "object" ? firstTextValue(item, itemKeys) : scalarText(item),
+      );
+      // Empty items are dropped before the list is capped at three entries.
+      return texts.filter(Boolean).slice(0, 3).join("、");
+    }
+    if (value && typeof value === "object") {
+      return conclusionText(value);
+    }
+    return scalarText(value);
+  }
+
+  // Summarises an option list as "已生成 N 个方案", followed by up to two option names when any exist; "" for no list.
+  function optionsConclusionText(options) {
+    if (!Array.isArray(options) || options.length === 0) {
+      return "";
+    }
+    const nameOf = (option) => {
+      if (option && typeof option === "object") {
+        return firstTextValue(option, ["title", "name", "label", "candidateName"]);
+      }
+      return option === 0 || option ? String(option) : "";
+    };
+    const names = options.map(nameOf).filter(Boolean).slice(0, 2);
+    const headline = `已生成 ${options.length} 个方案`;
+    return names.length > 0 ? `${headline}：${names.join("、")}` : headline;
+  }
+
+  // Produces a one-line summary of a step conclusion. Primitives are stringified
+  // (0 included; other falsy values give ""). For objects the first match wins:
+  // a direct text field, an options/candidates summary, a count of numeric-keyed
+  // items, and finally every remaining field rendered as "label：value".
+  function conclusionText(conclusion) {
+    if (conclusion !== 0 && !conclusion) {
+      return "";
+    }
+    if (typeof conclusion !== "object") {
+      return String(conclusion);
+    }
+    const directKeys = [
+      "summary", "title", "description", "text", "result",
+      "decision", "recommendation", "selectedOption", "selectedValue",
+    ];
+    const direct = firstTextValue(conclusion, directKeys);
+    if (direct) {
+      return direct;
+    }
+    const optionsText = optionsConclusionText(conclusion.options || conclusion.candidates || conclusion.candidateDetails);
+    if (optionsText) {
+      return optionsText;
+    }
+    const numericItems = numericConclusionItems(conclusion);
+    if (numericItems.length > 0) {
+      return `已完成 ${numericItems.length} 个方案评估`;
+    }
+    // Fall back to listing every field that is not an option container;
+    // fields whose formatted value is empty are left out.
+    const optionKeys = ["options", "candidates", "candidateDetails"];
+    const fieldTexts = [];
+    for (const key of Object.keys(conclusion)) {
+      const value = optionKeys.includes(key) ? "" : friendlyValue(conclusion[key]);
+      if (value) {
+        fieldTexts.push(`${friendlyFieldLabel(key)}：${value}`);
+      }
+    }
+    return fieldTexts.join("，");
+  }
+
+  // Returns the option list of a conclusion: the first truthy of options,
+  // candidates, candidateDetails when it is an array, otherwise whatever
+  // numericConclusionItems finds. Non-object conclusions give [].
+  function conclusionOptionItems(conclusion) {
+    if (conclusion === null || typeof conclusion !== "object") {
+      return [];
+    }
+    const listed = conclusion.options || conclusion.candidates || conclusion.candidateDetails;
+    return Array.isArray(listed) ? listed : numericConclusionItems(conclusion);
+  }
+
+  // Lists the displayable fields of a conclusion as { key, label, value } rows.
+  // Returns [] for non-objects and arrays, and also when the conclusion has a
+  // direct text field or a non-empty options summary (conclusionText reports
+  // those instead).
+  function conclusionFieldEntries(conclusion) {
+    if (!conclusion || typeof conclusion !== "object" || Array.isArray(conclusion)) {
+      return [];
+    }
+    // Keys that conclusionText uses as the headline text.
+    const directKeys = [
+      "summary", "title", "description",
+      "text", "result", "decision",
+      "recommendation", "selectedOption", "selectedValue",
+    ];
+    const optionList = conclusion.options || conclusion.candidates || conclusion.candidateDetails;
+    if (firstTextValue(conclusion, directKeys) || optionsConclusionText(optionList)) {
+      return [];
+    }
+    // Option containers are never listed as plain fields.
+    const containerKeys = ["options", "candidates", "candidateDetails"];
+    const entries = [];
+    // Fields whose formatted value is empty are left out.
+    Object.keys(conclusion).forEach((key) => {
+      const value = containerKeys.includes(key) ? "" : friendlyValue(conclusion[key]);
+      if (value) {
+        entries.push({ key, label: friendlyFieldLabel(key), value });
+      }
+    });
+    return entries;
+  }
+
+  // Returns { conclusion, text } from the newest event of `step` that has either, else a
+  // generic "done" text. Null entries in `step.events` are skipped rather than dereferenced.
+  function latestStepCompletion(step) {
+    for (const event of Array.isArray(step && step.events) ? step.events.slice().reverse() : []) {
+      const data = eventData(event);
+      const conclusion = data.conclusion || (event ? event.conclusion : undefined);
+      const text = conclusionText(conclusion) || firstTextValue(data, ["summary", "statusMessage", "text", "errorSummary"]);
+      if (conclusion || text) {
+        return { conclusion, text };
+      }
+    }
+    return { conclusion: null, text: "已完成本步骤。" };
+  }
+
+  function completionTextForStep(step) { // text of latestStepCompletion(step), with the generic "done" sentence as fallback
+    return latestStepCompletion(step).text || "已完成本步骤。";
+  }
+
+  // Returns the display text of a pipeline event: a summary-like data field, else
+  // the conclusion text, else a stock phrase for known event types, else the raw
+  // type. A null `event` is tolerated throughout, as the `event || {}` guard intends.
+  function eventText(event) {
+    const data = eventData(event);
+    const eventType = eventTypeOf(event || {});
+    const text =
+      firstTextValue(data, ["summary", "text", "statusMessage", "question", "prompt", "candidateName", "errorSummary"]) ||
+      conclusionText(data.conclusion || (event ? event.conclusion : undefined));
+    if (text) {
+      return text;
+    }
+    const stockPhrases = {
+      step_started: "开始思考",
+      input_required: "等待您确认或补充信息",
+      candidate_detail_shown: "生成候选方案详情",
+      permission_requested: "等待权限确认",
+    };
+    if (typeof eventType === "string" && Object.prototype.hasOwnProperty.call(stockPhrases, eventType)) {
+      return stockPhrases[eventType];
+    }
+    return eventType || "收到新事件";
+  }
+
+  // Collapses whitespace and truncates to `maxLength` UTF-16 units, the last being "…".
+  // A high surrogate left dangling by the cut is dropped so emoji are never split.
+  function compactText(value, maxLength = 180) {
+    const text = value === null || value === undefined ? "" : String(value).replace(/\s+/g, " ").trim();
+    const head = text.slice(0, maxLength - 1).replace(/[\uD800-\uDBFF]$/, "");
+    return text.length > maxLength ? `${head}…` : text;
+  }
+
+  function summarizeValue(value, maxLength = 180) { // compact one-line text for any value; "" for "", null and undefined
+    if (value === "" || value === null || value === undefined) {
+      return "";
+    }
+    if (typeof value === "string" || typeof value === "number" || typeof value === "boolean") {
+      return compactText(value, maxLength);
+    }
+    try {
+      return compactText(JSON.stringify(value), maxLength); // non-primitives are shown in their JSON form
+    } catch (_error) {
+      return compactText(value, maxLength); // the JSON attempt threw: retry with the raw value
+    }
+  }
+
+  function toolNameFromEvent(event) { // first truthy of data.toolName, data.tool_name, data.name, data.tool.name; else ""
+    const data = eventData(event);
+    return data.toolName || data.tool_name || data.name || (data.tool && data.tool.name) || "";
+  }
+
+  function objectHasKeys(value) { // true for an object with at least one own enumerable key
+    return Boolean(value && typeof value === "object" && Object.keys(value).length > 0);
+  }
+
+  // Builds a short summary for a tool event. Order of preference: a summary-like
+  // text field on the event data or its `result`; then stack/resource ids and
+  // status joined by " · "; then the JSON of a non-empty `result`; then `action`.
+  function toolSummaryFromEvent(event) {
+    const data = eventData(event);
+    const result = data.result && typeof data.result === "object" ? data.result : {};
+    const directSummary =
+      firstTextValue(data, ["safeSummary", "safe_summary", "summary", "text", "statusMessage", "message"]) ||
+      firstTextValue(result, ["safeSummary", "safe_summary", "summary", "message", "content", "text"]);
+    if (directSummary) {
+      return directSummary;
+    }
+    const pick = (camel, snake) => data[camel] || data[snake] || result[camel] || result[snake];
+    const status = data.statusMessage || data.statusText || data.status || result.status || "";
+    const parts = [
+      pick("stackId", "stack_id"), pick("stackStatus", "stack_status"),
+      pick("resourceName", "resource_name"), pick("resourceId", "resource_id"), status,
+    ]
+      .map((part) => compactText(part, 80))
+      .filter(Boolean);
+    if (parts.length > 0) {
+      return parts.join(" · ");
+    }
+    return objectHasKeys(result) ? summarizeValue(result, 120) : data.action || "";
+  }
+
+  // Classifies an event for rendering. Tool events are recognised from either
+  // `data.type` or the event type, with tool_call/tool_started counted as
+  // tool_use. Remaining events map by event type; unknown ones keep their type.
+  function stepEventKind(event) {
+    const data = eventData(event);
+    const eventType = eventTypeOf(event || {});
+    const dataType = data.type || eventType || "";
+    // Tool results take precedence over tool calls.
+    if ([dataType, eventType].includes("tool_result")) {
+      return "tool_result";
+    }
+    if (dataType === "tool_use" || ["tool_use", "tool_call", "tool_started"].includes(eventType)) {
+      return "tool_use";
+    }
+    // Event types whose rendering kind differs from (or equals) the type itself.
+    const renamed = new Map([
+      ["input_required", "input_required"],
+      ["candidate_detail_shown", "candidate_detail"],
+      ["permission_requested", "permission"],
+      ["text_delta", "text_delta"],
+    ]);
+    // An empty event type falls back to the generic "event" kind.
+    return renamed.get(eventType) || eventType || "event";
+  }
+
+  function textDeltaText(event) { // first usable of data.text, data.delta, data.content, data.summary
+    const data = eventData(event);
+    return firstTextValue(data, ["text", "delta", "content", "summary"]);
+  }
+
+  function textDeltaMergeKey(event) { // "<candidateIndex>|<subStepId>" key; compactDisplayEvents merges deltas whose keys match
+    const candidateIndex = candidateIndexFromSource(event);
+    const subStep = candidateSubStepOf(event);
+    const subStepId = subStep.id || subStep.stepId || subStep.name || subStep.label || "";
+    return `${candidateIndex === null || candidateIndex === undefined ? "" : candidateIndex}|${subStepId}`;
+  }
+
+  // Clones events, folding each run of consecutive text_delta events that share a merge key into one event with concatenated `data.text`.
+  function compactDisplayEvents(events) {
+    const result = [];
+    (Array.isArray(events) ? events : []).forEach((event) => {
+      if (stepEventKind(event) !== "text_delta") {
+        result.push(clonePlainData(event));
+        return;
+      }
+      const fragment = textDeltaText(event);
+      const previous = result[result.length - 1];
+      const extendsPrevious =
+        previous && stepEventKind(previous) === "text_delta" && textDeltaMergeKey(previous) === textDeltaMergeKey(event);
+      const target = extendsPrevious ? previous : clonePlainData(event);
+      target.data = target.data && typeof target.data === "object" ? target.data : {};
+      target.data.text = extendsPrevious ? `${textDeltaText(previous)}${fragment}` : fragment;
+      if (!extendsPrevious) {
+        result.push(target);
+      }
+    });
+    return result;
+  }
+
+  // Returns the Chinese label for an event kind; unknown kinds fall back to the
+  // kind itself with underscores turned into spaces.
+  function stepEventLabel(kind) {
+    const labels = {
+      candidate_detail: "方案详情", input_required: "等待输入", permission: "权限确认",
+      step_started: "步骤开始", text_delta: "思考片段", tool_result: "工具结果",
+      tool_use: "工具调用",
+    };
+    const known = labels[kind];
+    // Kinds without a label are shown verbatim, minus the underscores.
+    return known ? known : kind.replace(/_/g, " ");
+  }
+
+  // Chooses the headline of an event card: the tool name for tool events, the
+  // question for input requests, the candidate name for candidate details, and
+  // eventText(event) for every other kind.
+  function eventTitle(event) {
+    const data = eventData(event);
+    const kind = stepEventKind(event);
+    const detail = data.detail && typeof data.detail === "object" ? data.detail : data;
+    const titles = {
+      tool_result: () => toolNameFromEvent(event) || "工具",
+      tool_use: () => toolNameFromEvent(event) || "工具",
+      input_required: () => firstTextValue(data, ["question", "prompt", "summary"]) || "等待您确认或补充信息",
+      candidate_detail: () => firstTextValue(detail, ["candidateName", "name", "title"]) || "生成候选方案详情",
+    };
+    return Object.prototype.hasOwnProperty.call(titles, kind) ? titles[kind]() : eventText(event);
+  }
+
+  // Returns the [label, value] rows shown under an event card, by event kind:
+  // tool events list a summary and region, input requests their kind and option
+  // count, permission requests the tool and reason; other kinds have no rows.
+  function eventMetaEntries(event) {
+    const data = eventData(event);
+    switch (stepEventKind(event)) {
+      case "tool_result":
+      case "tool_use":
+        return [["摘要", toolSummaryFromEvent(event)], ["地域", data.regionId || data.region_id]];
+      case "input_required":
+        return [["类型", data.kind], ["选项", Array.isArray(data.options) ? `${data.options.length} 个` : ""]];
+      case "permission":
+        return [["工具", data.toolName || data.tool_name], ["原因", data.reason || data.safeSummary]];
+      default:
+        return [];
+    }
+  }
+
+  // Appends a <dl> of "label：value" rows to `parent`. Values are summarised first;
+  // rows with an empty summary are dropped and nothing is appended when none remain.
+  function appendKeyValueList(parent, entries, className) {
+    const rows = entries.map(([label, value]) => [label, summarizeValue(value)]).filter((row) => row[1]);
+    if (rows.length === 0) {
+      return;
+    }
+    const list = createElement("dl", className || "key-value-list");
+    for (const [label, text] of rows) {
+      const row = createElement("div");
+      appendChild(row, createElement("dt", "", `${label}：`));
+      appendChild(row, createElement("dd", "", text));
+      appendChild(list, row);
+    }
+    appendChild(parent, list);
+  }
+
+  function renderStepEvent(event) { // builds the <li> card for one step event: kind label, title and optional meta rows
+    const kind = stepEventKind(event);
+    const item = createElement("li", `step-event-card ${kind}`); // the kind doubles as a CSS class
+    if (item) {
+      item.setAttribute("data-step-event-kind", kind);
+    }
+    appendChild(item, createElement("span", "step-event-label", stepEventLabel(kind)));
+    appendChild(item, createElement("p", "step-event-title", eventTitle(event)));
+    appendKeyValueList(item, eventMetaEntries(event), "step-event-meta");
+    return item;
+  }
+
+  // Appends a collapsible <details> listing the step's compacted events to `detail`; does nothing when there are none.
+  function renderStepProcess(detail, step) {
+    const events = compactDisplayEvents(Array.isArray(step && step.events) ? step.events : []);
+    if (events.length === 0) {
+      return;
+    }
+    const process = createElement("details", "step-process");
+    if (process) {
+      process.setAttribute("data-step-process", step.id || "");
+    }
+    const head = createElement("summary", "step-process-head");
+    appendChild(head, createElement("strong", "", "思考过程"));
+    appendChild(head, createElement("span", "", `${events.length} 条事件`));
+    const eventList = createElement("ul", "step-event-list step-process-events");
+    for (const event of events) {
+      const item = renderStepEvent(event);
+      if (item) {
+        item.setAttribute("data-step-process-event", stepEventKind(event));
+      }
+      appendChild(eventList, item);
+    }
+    [head, eventList].forEach((section) => appendChild(process, section));
+    appendChild(detail, process);
+  }
+
+  // Renders the outcome of a step into `detail`. In order of preference: one
+  // card per option of the latest conclusion, else a definition list of the
+  // conclusion's fields, else a single paragraph with the completion text.
+  function renderStepResult(detail, step) {
+    const completion = latestStepCompletion(step);
+    const options = conclusionOptionItems(completion.conclusion);
+    if (options.length > 0) {
+      const list = createElement("div", "step-result-options");
+      options.forEach((option, index) => {
+        const candidate = candidateFromDisplayItem(option);
+        const candidateIndex = candidateIndexOf(candidate, index);
+        const item = createElement("article", "step-result-option");
+        if (item) {
+          item.setAttribute("data-step-result-option", String(candidateIndex));
+        }
+        const { name, summary, template, totalMonthlyCost, outputPath } = candidate;
+        // Each row is [tag, class, text, shown]; the template row is hidden when it repeats the summary or name.
+        const lines = [
+          ["strong", "", name || `方案 ${candidateIndex}`, true],
+          ["span", "", summary, Boolean(summary)],
+          ["span", "", template, Boolean(template) && template !== summary && template !== name],
+          ["span", "price", totalMonthlyCost, totalMonthlyCost !== "" && totalMonthlyCost !== null && totalMonthlyCost !== undefined],
+          ["span", "template-path", `模板：${outputPath}`, Boolean(outputPath)],
+        ];
+        lines.filter((line) => line[3]).forEach(([tag, cssClass, text]) => appendChild(item, createElement(tag, cssClass, text)));
+        appendChild(list, item);
+      });
+      appendChild(detail, list);
+      return;
+    }
+    const entries = conclusionFieldEntries(completion.conclusion);
+    if (entries.length > 0) {
+      const list = createElement("dl", "step-result-list");
+      entries.forEach(({ key, label, value }) => {
+        const row = createElement("div");
+        if (row) {
+          row.setAttribute("data-step-result-field", key);
+        }
+        appendChild(row, createElement("dt", "", `${label}：`));
+        appendChild(row, createElement("dd", "", value));
+        appendChild(list, row);
+      });
+      appendChild(detail, list);
+      return;
+    }
+    appendChild(detail, createElement("p", "step-result", completion.text || "已完成本步骤。"));
+  }
+
+  function candidateResultSummary(candidate) {
+    return (
+      (candidate && (candidate.summary || candidate.template || candidate.description || candidate.pros)) ||
+      "方案摘要已生成，可在右侧查看完整方案。"
+    );
+  }
+
+  function isTemplateLikeText(value) {
+    const text = String(value || "");
+    if (!text) {
+      return false;
+    }
+    return (
+      /ROSTemplateFormatVersion|ALIYUN::|Resources:\s|Parameters:\s|Metadata:\s/.test(text) ||
+      (text.length > 240 && /Type:\s|Properties:\s|Description:\s/.test(text))
+    );
+  }
+
+  function candidateResultSummaryDisplay(candidate) {
+    const rawSummary = candidateResultSummary(candidate);
+    const templateText = candidate && isTemplateLikeText(candidate.template) ? String(candidate.template) : "";
+    if (isTemplateLikeText(rawSummary)) {
+      return {
+        text: "模板内容已生成，悬浮查看完整模板。",
+        template: String(rawSummary),
+      };
+    }
+    const compactSummary = compactText(rawSummary, 140);
+    return {
+      text: compactSummary,
+      template: templateText,
+      title: compactSummary !== String(rawSummary || "") ? String(rawSummary || "") : "",
+    };
+  }
+
+  function attachTemplatePopover(host, templateText) {
+    if (!host || !templateText) {
+      return host;
+    }
+    addClassName(host, "template-popover-host");
+    const popover = createElement("div", "template-popover");
+    if (popover) {
+      popover.setAttribute("data-template-popover", "true");
+      popover.setAttribute("role", "tooltip");
+      popover.setAttribute("tabindex", "0");
+    }
+    appendChild(popover, createElement("div", "template-popover-title", "模板内容"));
+    appendChild(popover, createElement("pre", "", templateText));
+    appendChild(host, popover);
+    return host;
+  }
+
+  function renderCandidateProcess(process, candidate, candidateIndex) {
+    const events = compactDisplayEvents(Array.isArray(candidate && candidate.subEvents) ? candidate.subEvents : []);
+    const renderableEvents = candidateRenderableSubEvents(events);
+    if (renderableEvents.length === 0) {
+      return;
+    }
+    const details = createElement("details", "step-candidate-result-process");
+    if (details) {
+      details.setAttribute("data-step-candidate-result-process", String(candidateIndex));
+      details.open = false;
+    }
+    const head = createElement("summary", "step-process-head");
+    appendChild(head, createElement("strong", "", "思考过程"));
+    const groups = groupCandidateSubEvents(renderableEvents, { forceComplete: candidateEvaluationIsComplete() });
+    appendChild(head, createElement("span", "", `${groups.length} 个子步骤`));
+    appendChild(details, head);
+    const body = createElement("div", "step-candidate-result-process-body");
+    const substeps = createElement("div", "candidate-substeps");
+    groups.forEach((group) => {
+      appendChild(substeps, renderCandidateSubstepGroup(group));
+    });
+    appendChild(body, substeps);
+    appendChild(details, body);
+    appendChild(process, details);
+  }
+
+  function renderStepCandidateResults(detail, step) {
+    if (!step || step.id !== "evaluate_candidates") {
+      return false;
+    }
+    const state = ensureState();
+    const candidates = Array.isArray(state.candidates) ? state.candidates : [];
+    if (candidates.length === 0) {
+      return false;
+    }
+    const list = createElement("div", "step-candidate-result-list");
+    candidates.forEach((candidate, index) => {
+      const candidateIndex = candidateIndexOf(candidate, index);
+      const item = createElement("article", "step-candidate-result");
+      if (item) {
+        item.setAttribute("data-step-candidate-result", String(candidateIndex));
+      }
+      const summary = candidateResultSummaryDisplay(candidate);
+      const head = createElement("div", "step-candidate-result-head");
+      appendChild(head, createElement("strong", "", `方案 ${candidateIndex}`));
+      appendChild(head, createElement("span", "", candidate.name || `方案 ${candidateIndex}`));
+      appendChild(item, head);
+      appendChild(item, createElement("span", "step-candidate-result-label", "评估结论"));
+      const summaryNode = createElement("p", "step-candidate-result-summary", summary.text);
+      if (summaryNode) {
+        summaryNode.setAttribute("data-step-candidate-result-summary", String(candidateIndex));
+      }
+      appendChild(item, summaryNode);
+      if (candidate.template && candidate.template !== candidate.summary && !isTemplateLikeText(candidate.template)) {
+        appendChild(item, createElement("span", "step-candidate-result-template", candidate.template));
+      }
+      if (candidate.totalMonthlyCost !== "" && candidate.totalMonthlyCost !== null && candidate.totalMonthlyCost !== undefined) {
+        appendChild(item, createElement("span", "step-candidate-result-price", candidate.totalMonthlyCost));
+      }
+      renderCandidateProcess(item, candidate, candidateIndex);
+      attachTemplatePopover(item, summary.template);
+      appendChild(list, item);
+    });
+    appendChild(detail, list);
+    return true;
+  }
+
+  function candidateProgressText(event) {
+    const kind = candidateSubEventKind(event);
+    if (kind === "tool_result" || kind === "tool_use") {
+      return { label: candidateSubEventLabel(kind), title: eventTitle(event) };
+    }
+    if (String(kind || "").startsWith("candidate_step")) {
+      return { label: candidateSubStepLabel(event), title: eventTitle(event) };
+    }
+    return { label: stepEventLabel(kind), title: eventTitle(event) };
+  }
+
+  function renderStepCandidateProgress(detail) {
+    const state = ensureState();
+    const candidates = Array.isArray(state.candidates) ? state.candidates : [];
+    const rows = candidates
+      .map((candidate, index) => {
+        const events = compactDisplayEvents(Array.isArray(candidate && candidate.subEvents) ? candidate.subEvents : []);
+        return { candidate, candidateIndex: candidateIndexOf(candidate, index), event: events[events.length - 1] };
+      })
+      .filter((row) => row.event);
+    if (rows.length === 0) {
+      return false;
+    }
+    const list = createElement("div", "step-candidate-progress-list");
+    rows.forEach((row) => {
+      const item = createElement("article", "step-candidate-progress");
+      const progress = candidateProgressText(row.event);
+      const head = createElement("div", "step-candidate-progress-head");
+      if (item) {
+        item.setAttribute("data-step-candidate-progress", String(row.candidateIndex));
+      }
+      if (head) {
+        head.setAttribute("data-step-candidate-progress-head", String(row.candidateIndex));
+      }
+      appendChild(head, createElement("strong", "", `方案 ${row.candidateIndex}`));
+      appendChild(head, createElement("span", "", row.candidate.name || `方案 ${row.candidateIndex}`));
+      appendChild(item, head);
+      appendChild(item, createElement("span", "", progress.label));
+      appendChild(item, createElement("p", "", progress.title));
+      appendChild(list, item);
+    });
+    appendChild(detail, list);
+    return true;
+  }
+
+  function stepCanToggle(status) {
+    return status === "completed";
+  }
+
+  function stepDetailsExpanded(stepId, status) {
+    const state = ensureState();
+    return stepCanToggle(status) && Boolean(state.expandedStepDetails && state.expandedStepDetails[stepId]);
+  }
+
+  function toggleStepDetails(stepId) {
+    const state = ensureState();
+    state.expandedStepDetails = state.expandedStepDetails || {};
+    state.expandedStepDetails[stepId] = !Boolean(state.expandedStepDetails[stepId]);
+    renderAll();
+  }
+
+  /**
+   * Build the detail area of a step card and append it to `card`.
+   *
+   * What is rendered depends on `status`:
+   * - toggleable (completed) but not expanded: nothing at all;
+   * - open (per stepIsOpen): a status badge, then either the pending-input
+   *   card plus process (waiting_input), per-candidate progress
+   *   (evaluate_candidates), or the live event list;
+   * - completed and expanded: candidate results, or result plus process;
+   * - failed / error: a status badge, the result and the process.
+   * For any other status an empty "step-detail" element is still appended.
+   */
+  function renderStepDetails(card, step, status, expanded) {
+    // Collapsed completed steps contribute no detail element.
+    if (stepCanToggle(status) && !expanded) {
+      return;
+    }
+    const detail = createElement("div", "step-detail");
+
+    if (stepIsOpen(status)) {
+      const badge = createElement("span", "step-status", stepDetailStatusLabel(status));
+      appendChild(detail, badge);
+      if (status === "waiting_input") {
+        const state = ensureState();
+        renderPendingInputCard(detail, state);
+        renderStepProcess(detail, step);
+        // This branch attaches the detail itself and skips the event list below.
+        appendChild(card, detail);
+        return;
+      }
+      // For evaluate_candidates, per-candidate progress replaces the flat event
+      // list whenever at least one candidate has a sub-event to show.
+      const handledByCandidateSummary = step.id === "evaluate_candidates" && renderStepCandidateProgress(detail);
+      if (!handledByCandidateSummary) {
+        const events = compactDisplayEvents(Array.isArray(step.events) ? step.events : []);
+        const eventList = createElement("ul", "step-event-list");
+        if (eventList) {
+          eventList.setAttribute("data-step-event-list", step.id || "");
+        }
+        events.forEach((event) => {
+          appendChild(eventList, renderStepEvent(event));
+        });
+        // With no events yet, show the step description (or a generic text) as a placeholder.
+        if (events.length === 0) {
+          appendChild(eventList, createElement("li", "step-event-card", STEP_DESCRIPTIONS[step.id] || "正在处理当前步骤"));
+        }
+        appendChild(detail, eventList);
+        scrollElementToBottom(eventList);
+      }
+    } else if (status === "completed" && expanded) {
+      // renderStepCandidateResults returns false when it rendered nothing,
+      // in which case the generic result and process are shown instead.
+      if (!renderStepCandidateResults(detail, step)) {
+        renderStepResult(detail, step);
+        renderStepProcess(detail, step);
+      }
+    } else if (status === "failed" || status === "error") {
+      const badge = createElement("span", "step-status", stepDetailStatusLabel(status));
+      appendChild(detail, badge);
+      renderStepResult(detail, step);
+      renderStepProcess(detail, step);
+    }
+    appendChild(card, detail);
+  }
+
+  function candidateChoiceText(candidate, fallbackIndex) {
+    const candidateIndex = candidateIndexOf(candidate, fallbackIndex);
+    const name = candidate && candidate.name ? candidate.name : `方案 ${candidateIndex}`;
+    const summary = candidate && candidate.summary ? candidate.summary : "";
+    const price = presentValue(candidate && candidate.totalMonthlyCost, "");
+    return `${name}${summary}${price}`;
+  }
+
+  function pendingInputIsCandidateSelection(pendingInput) {
+    if (!pendingInput || typeof pendingInput !== "object") {
+      return false;
+    }
+    const kind = pendingInput.kind || "";
+    return kind === "candidate_selection" || kind === "candidate_select";
+  }
+
+  function candidatesForPendingSelection(state) {
+    const pendingInput = state && state.pendingInput;
+    if (!pendingInputIsCandidateSelection(pendingInput)) {
+      return [];
+    }
+    const candidates = Array.isArray(state.candidates) ? state.candidates : [];
+    if (candidates.length > 0) {
+      return candidates;
+    }
+    return Array.isArray(pendingInput.options) ? pendingInput.options.map(candidateFromDisplayItem).filter(Boolean) : [];
+  }
+
+  function renderCandidateChoiceList(parent, state) {
+    const candidates = candidatesForPendingSelection(state);
+    if (candidates.length === 0) {
+      return false;
+    }
+    const list = createElement("div", "candidate-choice-list");
+    candidates.forEach((candidate, index) => {
+      const candidateIndex = candidateIndexOf(candidate, index);
+      const isSelected = state.selectedCandidateIndex === candidateIndex;
+      const choice = createElement("button", `candidate-choice${isSelected ? " selected" : ""}`);
+      if (choice) {
+        choice.setAttribute("type", "button");
+        choice.setAttribute("data-candidate-choice", String(candidateIndex));
+        choice.setAttribute("aria-pressed", isSelected ? "true" : "false");
+        choice.addEventListener("click", () => {
+          controller.state = selectCandidate(ensureState(), candidateIndex);
+          syncComposerWithSelectedCandidate(controller.state);
+          renderAll();
+        });
+      }
+      appendChild(choice, createElement("strong", "", candidate.name || `方案 ${candidateIndex}`));
+      const summary = candidate.summary || candidate.template || "";
+      if (summary) {
+        appendChild(choice, createElement("span", "", summary));
+      }
+      if (candidate.totalMonthlyCost !== "" && candidate.totalMonthlyCost !== null && candidate.totalMonthlyCost !== undefined) {
+        appendChild(choice, createElement("span", "price", candidate.totalMonthlyCost));
+      }
+      appendChild(list, choice);
+    });
+    appendChild(parent, list);
+    return true;
+  }
+
+  function pendingInputKindLabel(kind) {
+    if (kind === "candidate_selection" || kind === "candidate_select") {
+      return "请选择方案";
+    }
+    if (kind === "ask_user_question") {
+      return "需要您确认";
+    }
+    return "需要您处理";
+  }
+
+  function pendingInputPrompt(pendingInput) {
+    return pendingInput && (pendingInput.prompt || pendingInput.question || pendingInput.freeTextPrompt || pendingInput.free_text_prompt)
+      ? pendingInput.prompt || pendingInput.question || pendingInput.freeTextPrompt || pendingInput.free_text_prompt
+      : "请补充信息后继续。";
+  }
+
+  function pendingOptionId(option, index) {
+    const rawId = option && (option.id ?? option.value ?? option.candidateIndex ?? option.candidate_index ?? index);
+    return rawId === null || rawId === undefined ? String(index) : String(rawId);
+  }
+
+  function candidateIndexFromPendingOption(option, index) {
+    if (option && typeof option === "object") {
+      const nestedCandidate = option.candidate && typeof option.candidate === "object" ? option.candidate : {};
+      const rawCandidateIndex =
+        option.candidateIndex ??
+        option.candidate_index ??
+        option.optionIndex ??
+        option.option_index ??
+        nestedCandidate.index ??
+        nestedCandidate.candidateIndex ??
+        nestedCandidate.candidate_index ??
+        null;
+      if (rawCandidateIndex !== null && rawCandidateIndex !== undefined && rawCandidateIndex !== "") {
+        const numericIndex = Number(rawCandidateIndex);
+        return Number.isFinite(numericIndex) ? numericIndex : rawCandidateIndex;
+      }
+    }
+    const optionId = pendingOptionId(option, index);
+    const numericOptionId = Number(optionId);
+    return Number.isFinite(numericOptionId) ? numericOptionId : null;
+  }
+
+  function pendingOptionLabel(option, index) {
+    if (!option || typeof option !== "object") {
+      return option === 0 || option ? String(option) : `选项 ${index + 1}`;
+    }
+    return option.label || option.title || option.name || option.candidateName || `选项 ${index + 1}`;
+  }
+
+  function pendingOptionDescription(option) {
+    if (!option || typeof option !== "object") {
+      return "";
+    }
+    return [option.description || option.summary || "", option.totalMonthlyCost || option.total_monthly_cost || option.price || ""]
+      .filter(Boolean)
+      .join("");
+  }
+
+  function syncComposerWithSelectedCandidate(state) {
+    const composer = byId("composer-input");
+    if (composer && "value" in composer) {
+      composer.value = promptForSelectedCandidate(state || ensureState());
+    }
+  }
+
+  /**
+   * Handle a click on a pending-input option, then re-render.
+   *
+   * The option id is always recorded as the selected one. For
+   * candidate-selection inputs an option that resolves to a candidate index
+   * selects that candidate and syncs the composer from it; otherwise the
+   * composer receives the option id (or its label). For all other kinds the
+   * composer always receives the option id (or its label), and a resolvable
+   * candidate index additionally selects the candidate.
+   */
+  function handlePendingInputOption(option, index) {
+    const state = ensureState();
+    const pendingInput = state.pendingInput || {};
+    const kind = pendingInput.kind || "";
+    const optionId = pendingOptionId(option, index);
+    const candidateIndex = candidateIndexFromPendingOption(option, index);
+    const composer = byId("composer-input");
+    state.selectedPendingInputOptionId = optionId;
+    if (kind === "candidate_selection" || kind === "candidate_select") {
+      if (candidateIndex !== null && candidateIndex !== undefined) {
+        controller.state = selectCandidate(state, candidateIndex);
+        // The id is written again on controller.state after selectCandidate
+        // (presumably because it may return a new state object; confirm).
+        controller.state.selectedPendingInputOptionId = optionId;
+        syncComposerWithSelectedCandidate(controller.state);
+      } else if (composer && "value" in composer) {
+        composer.value = optionId || pendingOptionLabel(option, index);
+      }
+      renderAll();
+      return;
+    }
+    if (candidateIndex !== null && candidateIndex !== undefined) {
+      controller.state = selectCandidate(state, candidateIndex);
+      controller.state.selectedPendingInputOptionId = optionId;
+    }
+    // Non-selection inputs put the option id (or its label) into the composer.
+    if (composer && "value" in composer) {
+      composer.value = optionId || pendingOptionLabel(option, index);
+    }
+    renderAll();
+  }
+
+  function renderPendingInputCard(parent, state) {
+    const pendingInput = state && state.pendingInput;
+    if (!pendingInput) {
+      return;
+    }
+    const kind = pendingInput.kind || "input";
+    const isCandidateSelection = pendingInputIsCandidateSelection(pendingInput);
+    const card = createElement("section", "pending-input-card");
+    if (card) {
+      card.setAttribute("data-pending-input-kind", kind);
+    }
+    appendChild(card, createElement("h2", "", pendingInputKindLabel(kind)));
+    appendChild(card, renderMarkdownText(pendingInputPrompt(pendingInput), "pending-input-prompt"));
+    const options = Array.isArray(pendingInput.options) ? pendingInput.options : [];
+    if (options.length > 0) {
+      const optionList = createElement("div", "pending-input-options");
+      options.forEach((option, index) => {
+        const optionId = pendingOptionId(option, index);
+        const candidateIndex = candidateIndexFromPendingOption(option, index);
+        const isSelected =
+          state.selectedPendingInputOptionId === optionId ||
+          (candidateIndex !== null && candidateIndex !== undefined && state.selectedCandidateIndex === candidateIndex);
+        const optionButton = createElement("button", `pending-input-option${isSelected ? " selected" : ""}`);
+        if (optionButton) {
+          optionButton.setAttribute("type", "button");
+          optionButton.setAttribute("data-pending-input-option", optionId);
+          optionButton.setAttribute("aria-pressed", isSelected ? "true" : "false");
+          if (candidateIndex !== null && candidateIndex !== undefined) {
+            optionButton.setAttribute("data-candidate-choice", String(candidateIndex));
+          }
+          optionButton.addEventListener("click", () => handlePendingInputOption(option, index));
+        }
+        appendChild(optionButton, createElement("strong", "", pendingOptionLabel(option, index)));
+        const description = pendingOptionDescription(option);
+        if (description) {
+          appendChild(optionButton, renderMarkdownText(description, "pending-input-option-description"));
+        }
+        appendChild(optionList, optionButton);
+      });
+      appendChild(card, optionList);
+    }
+    appendChild(parent, card);
+  }
+
+  function ensureState() {
+    if (!controller.state) {
+      const defaults =
+        window.SELLING_CONSOLE_DEFAULTS && typeof window.SELLING_CONSOLE_DEFAULTS === "object"
+          ? window.SELLING_CONSOLE_DEFAULTS
+          : {};
+      controller.state = createInitialState(defaults);
+    }
+    return controller.state;
+  }
+
+  function syncConnectionControlsFromState() {
+    const state = ensureState();
+    const serverInput = byId("server-url");
+    const cwdInput = byId("cwd");
+    if (serverInput && "value" in serverInput && !serverInput.value && state.serverUrl) {
+      serverInput.value = state.serverUrl;
+    }
+    if (cwdInput && "value" in cwdInput && !cwdInput.value && state.cwd) {
+      cwdInput.value = state.cwd;
+    }
+  }
+
+  function syncStateFromConnectionControls() {
+    const state = ensureState();
+    const serverInput = byId("server-url");
+    const cwdInput = byId("cwd");
+    if (serverInput && "value" in serverInput) {
+      state.serverUrl = String(serverInput.value || "").trim();
+    }
+    if (cwdInput && "value" in cwdInput) {
+      state.cwd = String(cwdInput.value || "").trim();
+    }
+    return state;
+  }
+
+  function renderStatus() {
+    const state = ensureState();
+    const statusPill = byId("status-pill");
+    if (statusPill) {
+      statusPill.textContent = statusLabel(state.pendingInput ? "waiting_input" : state.status);
+    }
+  }
+
+  function stepModelsForProgress(state, ui, options = {}) {
+    const steps = STEP_ORDER.map((stepId, index) => {
+      const step = state.steps && state.steps[stepId] ? state.steps[stepId] : createSteps()[stepId];
+      const status = stepStatusClass(normalizeStatus(step.status) || "pending");
+      return {
+        id: stepId,
+        index,
+        label: step.label || STEP_LABELS[stepId] || stepId,
+        status,
+      };
+    });
+    if (options.useConfiguredActiveStep && ui && Number.isInteger(ui.activeStepIndex)) {
+      return { steps, activeIndex: ui.activeStepIndex };
+    }
+    const currentIndex = steps.findIndex((step) => step.status === "working" || step.status === "waiting_input");
+    if (currentIndex >= 0) {
+      return { steps, activeIndex: currentIndex };
+    }
+    const lastCompletedIndex = steps.reduce((lastIndex, step, index) => (step.status === "completed" ? index : lastIndex), -1);
+    return { steps, activeIndex: Math.max(0, lastCompletedIndex) };
+  }
+
+  function progressVisualStatus(step, activeIndex) {
+    if (step.status === "failed" || step.status === "error") {
+      return "failed";
+    }
+    if (step.status === "completed" || step.index < activeIndex) {
+      return "done";
+    }
+    if (step.index === activeIndex) {
+      return "active";
+    }
+    return "pending";
+  }
+
+  function stepTipText(step, activeIndex) {
+    const visualStatus = progressVisualStatus(step, activeIndex);
+    if (visualStatus === "done") {
+      return `${step.label}：已完成`;
+    }
+    if (visualStatus === "active") {
+      return `${step.label}：当前步骤`;
+    }
+    if (visualStatus === "failed") {
+      return `${step.label}：处理异常`;
+    }
+    return `${step.label}：等待前序步骤`;
+  }
+
+  function applyProgressRoot(progress, variant) {
+    const className = variant === "a" ? "composer-progress chevrons" : `composer-progress progress-shell progress-variant-${variant}`;
+    progress.className = className;
+    if (typeof progress.setAttribute === "function") {
+      progress.setAttribute("class", className);
+    }
+    progress.setAttribute("data-progress-variant", variant);
+  }
+
+  function debugDrawerIsOpen() {
+    const drawer = byId("debug-drawer");
+    return Boolean(drawer && drawer.open);
+  }
+
+  function hideComposerProgress(progress, ui) {
+    clearElement(progress);
+    cancelProgressAnimation();
+    progress.hidden = true;
+    progress.className = "composer-progress";
+    if (typeof progress.setAttribute === "function") {
+      progress.setAttribute("class", "composer-progress");
+      progress.setAttribute("data-progress-variant", ui.variant);
+      progress.setAttribute("data-progress-mode", "pipeline");
+      progress.setAttribute("data-progress-visible", "false");
+    }
+  }
+
+  function renderChevronProgress(progress, models, params) {
+    applyProgressRoot(progress, "a");
+    progress.setAttribute("style", `--progress-a-sweep-ms: ${params.sweepMs}ms;`);
+    models.steps.forEach((step) => {
+      const visualStatus = progressVisualStatus(step, models.activeIndex);
+      const item = createElement("div", `step ${visualStatus === "done" ? "done" : visualStatus === "active" ? "active" : ""}`);
+      if (item) {
+        item.setAttribute("data-step-index", String(step.index));
+        item.setAttribute("data-progress-step", step.id);
+        item.setAttribute("data-status", step.status);
+        item.setAttribute("title", stepTipText(step, models.activeIndex));
+      }
+      appendChild(item, document.createTextNode ? document.createTextNode(step.label) : createElement("span", "", step.label));
+      appendChild(item, createElement("span", "tip", stepTipText(step, models.activeIndex)));
+      appendChild(progress, item);
+    });
+  }
+
+  function pathLine(startX, endX, y = 22) {
+    return startX === endX ? "" : `M ${startX} ${y} L ${endX} ${y}`;
+  }
+
+  /**
+   * Render progress variant "b": an SVG rail with path segments around the
+   * active step, a halo at the active position, one node per step and a row
+   * of labels, all wrapped in a "signal-circuit" element appended to `progress`.
+   *
+   * NOTE(review): stepPercents and stepXs each hold exactly five entries and
+   * are indexed by `models.activeIndex` and `step.index`. An index outside
+   * 0..4 reads `undefined` and ends up in the generated path/style strings.
+   * Confirm that callers never pass more than five steps or an out-of-range
+   * active index.
+   */
+  function renderSignalProgress(progress, models, params) {
+    applyProgressRoot(progress, "b");
+    const activeIndex = models.activeIndex;
+    // Horizontal position of each step: as a percentage for the HTML nodes and
+    // labels, and as an x coordinate inside the 344-wide SVG viewBox.
+    const stepPercents = [6, 28, 50, 72, 94];
+    const stepXs = [20, 96, 172, 248, 324];
+    const railStartX = stepXs[0];
+    const railEndX = stepXs[stepXs.length - 1];
+    // The segments around the active step extend to the viewBox edges (0 and
+    // 344) when there is no previous or next step.
+    const previousX = activeIndex > 0 ? stepXs[activeIndex - 1] : 0;
+    const currentX = stepXs[activeIndex];
+    const nextX = activeIndex < stepXs.length - 1 ? stepXs[activeIndex + 1] : 344;
+    const shell = createElement("div", "signal-circuit");
+    if (shell) {
+      shell.setAttribute("data-active-index", String(activeIndex));
+      shell.setAttribute("style", `--absorb-duration: ${params.pauseTime}ms;`);
+    }
+    const svg = createElement("svg", "signal-svg");
+    if (svg) {
+      svg.setAttribute("viewBox", "0 0 344 44");
+      svg.setAttribute("preserveAspectRatio", "none");
+      svg.setAttribute("aria-hidden", "true");
+      // One <path> per entry: [class name, path data]. The moving wave starts
+      // with empty path data.
+      [
+        ["signal-rail", pathLine(railStartX, railEndX)],
+        ["signal-done", activeIndex > 0 ? pathLine(railStartX, stepXs[activeIndex - 1]) : ""],
+        ["signal-active-base signal-active-in", pathLine(previousX, currentX)],
+        ["signal-active-base signal-active-out", pathLine(currentX, nextX)],
+        ["signal-moving-wave", ""],
+      ].forEach(([className, pathValue]) => {
+        const path = createElement("path", className);
+        if (path) {
+          path.setAttribute("d", pathValue);
+        }
+        appendChild(svg, path);
+      });
+    }
+    appendChild(shell, svg);
+    // Halo positioned at the active step.
+    const halo = createElement("span", "signal-absorb-halo");
+    if (halo) {
+      halo.setAttribute("aria-hidden", "true");
+      halo.setAttribute("style", `left:${stepPercents[activeIndex]}%`);
+    }
+    appendChild(shell, halo);
+    models.steps.forEach((step) => {
+      const visualStatus = progressVisualStatus(step, activeIndex);
+      // "next" marks the step immediately after the active one.
+      const nodeClass = [
+        "signal-node",
+        visualStatus === "active" ? "active" : "",
+        visualStatus === "pending" ? "pending" : "",
+        step.index === activeIndex + 1 ? "next" : "",
+      ].filter(Boolean).join(" ");
+      const node = createElement("span", nodeClass);
+      if (node) {
+        node.setAttribute("data-step-index", String(step.index));
+        node.setAttribute("data-progress-step", step.id);
+        node.setAttribute("data-status", step.status);
+        node.setAttribute("style", `left: ${stepPercents[step.index]}%`);
+        node.setAttribute("title", stepTipText(step, activeIndex));
+      }
+      appendChild(node, createElement("span", "signal-node-charge"));
+      appendChild(node, createElement("span", "signal-node-core"));
+      appendChild(shell, node);
+    });
+    // Text labels, positioned with the same percentages as the nodes.
+    const labels = createElement("div", "signal-labels");
+    models.steps.forEach((step) => {
+      const label = createElement("span", progressVisualStatus(step, activeIndex) === "active" ? "active" : "", step.label);
+      if (label) {
+        label.setAttribute("data-step-index", String(step.index));
+        label.setAttribute("style", `left: ${stepPercents[step.index]}%`);
+      }
+      appendChild(labels, label);
+    });
+    appendChild(shell, labels);
+    appendChild(progress, shell);
+  }
+
+  function renderFusionProgress(progress, models, params) {
+    applyProgressRoot(progress, "d");
+    const activeIndex = models.activeIndex;
+    const shell = createElement("div", "fusion-label");
+    if (shell) {
+      shell.setAttribute("data-active-index", String(activeIndex));
+      shell.setAttribute("style", `--fusion-sweep-duration: ${params.t1}ms;`);
+    }
+    const steps = createElement("div", "fusion-steps");
+    models.steps.forEach((step) => {
+      const visualStatus = progressVisualStatus(step, activeIndex);
+      const item = createElement("div", `fusion-step ${visualStatus === "done" ? "done" : visualStatus === "active" ? "active" : ""}`);
+      if (item) {
+        item.setAttribute("data-step-index", String(step.index));
+        item.setAttribute("data-progress-step", step.id);
+        item.setAttribute("data-status", step.status);
+        item.setAttribute("title", stepTipText(step, activeIndex));
+      }
+      appendChild(item, createElement("span", "label", step.label));
+      appendChild(item, createElement("span", "tip", stepTipText(step, activeIndex)));
+      appendChild(steps, item);
+    });
+    appendChild(shell, steps);
+    appendChild(progress, shell);
+  }
+
+  function renderNormalHandoffMessage(stepList, state) {
+    if (!stepList || !state || !state.normalHandoffReady) {
+      return false;
+    }
+    const message = createElement("article", "normal-handoff-message");
+    if (message) {
+      message.setAttribute("data-normal-handoff-message", "true");
+      message.setAttribute("role", "status");
+    }
+    appendChild(message, createElement("p", "", NORMAL_HANDOFF_TEXT));
+    appendChild(stepList, createChatMessage("system", message));
+    return true;
+  }
+
+  function createChatMessage(role, content) {
+    const messageRole = role === "user" ? "user" : "system";
+    const message = createElement("div", `chat-message ${messageRole}`);
+    if (message) {
+      message.setAttribute("data-chat-message", messageRole);
+    }
+    const avatar = createElement("span", `chat-avatar ${messageRole}`, messageRole === "user" ? "U" : "AI");
+    if (avatar) {
+      avatar.setAttribute("data-chat-avatar", messageRole);
+    }
+    const bubble = createElement("div", "chat-bubble");
+    appendChild(bubble, content);
+    appendChild(message, avatar);
+    appendChild(message, bubble);
+    return message;
+  }
+
+  function createUserMessage(text) {
+    return createChatMessage("user", createElement("p", "user-message-text", text));
+  }
+
+  function normalProcessIsExpanded(turn) {
+    const state = ensureState();
+    if (turn && turn.status === "working") {
+      return true;
+    }
+    return Boolean(state.expandedNormalProcesses && turn && state.expandedNormalProcesses[turn.id]);
+  }
+
+  function normalProcessEventLabel(kind) {
+    return {
+      thinking: "思考",
+      tool: "工具",
+      permission: "权限",
+      error: "异常",
+    }[kind] || "过程";
+  }
+
+  function renderNormalProcess(turn) {
+    const events = Array.isArray(turn && turn.events) ? turn.events : [];
+    if (!events.length) {
+      return null;
+    }
+    const details = createElement("details", "normal-process");
+    if (details) {
+      details.setAttribute("data-normal-process", turn.id);
+      details.open = normalProcessIsExpanded(turn);
+      details.addEventListener("toggle", () => {
+        if (turn.status === "working") {
+          return;
+        }
+        const state = ensureState();
+        state.expandedNormalProcesses = state.expandedNormalProcesses || {};
+        state.expandedNormalProcesses[turn.id] = Boolean(details.open);
+      });
+    }
+    const summary = createElement("summary", "normal-process-summary");
+    appendChild(summary, createElement("span", "normal-process-title", "思考过程"));
+    appendChild(summary, createElement("span", "normal-process-count", `${events.length} 条`));
+    appendChild(details, summary);
+    const list = createElement("ul", "normal-process-events");
+    events.forEach((event) => {
+      const kind = event && event.kind ? String(event.kind) : "event";
+      const item = createElement("li", `normal-process-event ${kind}`);
+      if (item) {
+        item.setAttribute("data-normal-process-event", kind);
+      }
+      appendChild(item, createElement("span", "normal-process-event-label", event.label || normalProcessEventLabel(kind)));
+      appendChild(item, createElement("p", "", event.text || ""));
+      appendChild(list, item);
+    });
+    appendChild(details, list);
+    return details;
+  }
+
+  function renderNormalTurn(stepList, turn, renderedTurnIds) {
+    if (!stepList || !turn || (renderedTurnIds && renderedTurnIds.has(turn.id))) {
+      return;
+    }
+    const content = createElement("article", `normal-turn ${turn.status || "completed"}`);
+    if (content) {
+      content.setAttribute("data-normal-turn", turn.id);
+    }
+    appendChild(content, renderNormalProcess(turn));
+    const answer = createElement(
+      "p",
+      "normal-answer",
+      turn.answer || (turn.status === "working" ? "正在整理回复..." : "")
+    );
+    if (answer) {
+      answer.setAttribute("data-normal-answer", turn.id);
+    }
+    appendChild(content, answer);
+    appendChild(stepList, createChatMessage("system", content));
+    if (renderedTurnIds) {
+      renderedTurnIds.add(turn.id);
+    }
+  }
+
+  function userMessageKey(item, index) {
+    return item && item.id ? String(item.id) : `user-message-${index}`;
+  }
+
+  function userMessagePlacement(item) {
+    const placement = item && item.placement && typeof item.placement === "object" ? item.placement : {};
+    if (placement.position === "after_normal_handoff" || placement.after === "normal_handoff") {
+      return { position: "after_normal_handoff" };
+    }
+    if (placement.afterStepId || item.afterStepId) {
+      return { position: "after_step", afterStepId: placement.afterStepId || item.afterStepId };
+    }
+    return { position: "start" };
+  }
+
+  function messageBelongsToPosition(item, position, value) {
+    const placement = userMessagePlacement(item);
+    if (position === "start") {
+      return placement.position === "start";
+    }
+    if (position === "after_normal_handoff") {
+      return placement.position === "after_normal_handoff";
+    }
+    if (position === "after_step") {
+      return placement.position === "after_step" && placement.afterStepId === value;
+    }
+    return false;
+  }
+
+  function renderUserMessages(stepList, state, position, value, renderedKeys) {
+    const messages = Array.isArray(state && state.userMessages) ? state.userMessages : [];
+    messages.forEach((item, index) => {
+      const key = userMessageKey(item, index);
+      if (renderedKeys && renderedKeys.has(key)) {
+        return;
+      }
+      if (!messageBelongsToPosition(item, position, value)) {
+        return;
+      }
+      const text = item && item.text ? String(item.text) : "";
+      if (!text) {
+        return;
+      }
+      appendChild(stepList, createUserMessage(text));
+      if (renderedKeys) {
+        renderedKeys.add(key);
+      }
+    });
+  }
+
+  function renderNormalHandoffConversation(stepList, state, renderedKeys) {
+    const messages = Array.isArray(state && state.userMessages) ? state.userMessages : [];
+    const turns = Array.isArray(state && state.normalTurns) ? state.normalTurns : [];
+    const renderedTurnIds = new Set();
+    messages.forEach((item, index) => {
+      const key = userMessageKey(item, index);
+      if (renderedKeys && renderedKeys.has(key)) {
+        return;
+      }
+      if (!messageBelongsToPosition(item, "after_normal_handoff", "")) {
+        return;
+      }
+      const text = item && item.text ? String(item.text) : "";
+      if (!text) {
+        return;
+      }
+      appendChild(stepList, createUserMessage(text));
+      if (renderedKeys) {
+        renderedKeys.add(key);
+      }
+      turns
+        .filter((turn) => turn && turn.afterUserMessageId === key)
+        .forEach((turn) => renderNormalTurn(stepList, turn, renderedTurnIds));
+    });
+    turns
+      .filter((turn) => turn && !renderedTurnIds.has(turn.id))
+      .forEach((turn) => renderNormalTurn(stepList, turn, renderedTurnIds));
+  }
+
+  function userMessagePlacementForState(state) {
+    if (state && state.normalHandoffReady) {
+      return { position: "after_normal_handoff" };
+    }
+    if (state && pendingInputIsCandidateSelection(state.pendingInput)) {
+      return { position: "after_step", afterStepId: "confirm_and_select" };
+    }
+    const steps = (state && state.steps) || {};
+    const activeStepId = STEP_ORDER.find((stepId) => {
+      const status = stepStatusClass(normalizeStatus(steps[stepId] && steps[stepId].status));
+      return status === "working" || status === "waiting_input";
+    });
+    if (state && state.pendingInput && activeStepId) {
+      return { position: "after_step", afterStepId: activeStepId };
+    }
+    return { position: "start" };
+  }
+
+  /**
+   * Rebuild the #step-list conversation from scratch.
+   *
+   * Order of output: user messages placed at "start", then one system chat row
+   * per visible step in STEP_ORDER (each followed by the user messages placed
+   * after that step), then the handoff message and its conversation when
+   * renderNormalHandoffMessage reports success. Finally the list is scrolled
+   * to the bottom if it has any children.
+   */
+  function renderSteps() {
+    const state = ensureState();
+    const stepList = byId("step-list");
+    if (!stepList || !canCreateElements()) {
+      return;
+    }
+    clearElement(stepList);
+    // Shared across all renderUserMessages calls so no message is rendered twice.
+    const renderedUserMessages = new Set();
+    renderUserMessages(stepList, state, "start", "", renderedUserMessages);
+    STEP_ORDER.forEach((stepId, index) => {
+      // Fall back to a freshly created default step when state has none for this id.
+      const step = state.steps && state.steps[stepId] ? state.steps[stepId] : createSteps()[stepId];
+      if (!stepIsVisible(step)) {
+        // Note: user messages placed after a hidden step are not rendered here.
+        return;
+      }
+      const status = stepStatusClass(normalizeStatus(step.status) || "pending");
+      const isCurrent = stepIsOpen(status);
+      const isExpanded = stepDetailsExpanded(stepId, status);
+      const card = createElement("article", `step-card ${status}${isCurrent ? " current" : ""}`);
+      const marker = createElement("span", "step-index");
+      const body = createElement("div", "step-card-body");
+      const title = createElement("h2", "", step.label || STEP_LABELS[stepId] || stepId);
+      if (card) {
+        card.setAttribute("data-step-id", stepId);
+        card.setAttribute("data-status", status);
+        if (isCurrent) {
+          card.setAttribute("aria-current", "step");
+        }
+      }
+      // The state icon is optional: stepStateIcon may return an empty value.
+      const iconText = stepStateIcon(status);
+      if (iconText) {
+        const icon = createElement("span", `step-state-icon ${status}`, iconText);
+        if (icon) {
+          icon.setAttribute("data-step-state-icon", status);
+        }
+        appendChild(marker, icon);
+      }
+      // Toggleable steps wrap the title in a button; others show the bare title.
+      if (stepCanToggle(status)) {
+        const toggle = createElement("button", "step-toggle");
+        if (toggle) {
+          toggle.setAttribute("type", "button");
+          toggle.setAttribute("data-step-toggle", stepId);
+          toggle.setAttribute("aria-expanded", isExpanded ? "true" : "false");
+          toggle.addEventListener("click", () => toggleStepDetails(stepId));
+        }
+        appendChild(toggle, title);
+        appendChild(toggle, createElement("span", `step-toggle-icon${isExpanded ? " expanded" : ""}`));
+        appendChild(body, toggle);
+      } else {
+        appendChild(body, title);
+      }
+      appendChild(card, marker);
+      appendChild(card, body);
+      renderStepDetails(card, step, status, isExpanded);
+      appendChild(stepList, createChatMessage("system", card));
+      renderUserMessages(stepList, state, "after_step", stepId, renderedUserMessages);
+    });
+    if (renderNormalHandoffMessage(stepList, state)) {
+      renderNormalHandoffConversation(stepList, state, renderedUserMessages);
+    }
+    // NOTE(review): userMessagePlacement only reports "after_step" with a truthy
+    // afterStepId, so matching against "" looks like it can never succeed. If
+    // this was meant as a catch-all for leftover messages, confirm and rework.
+    renderUserMessages(stepList, state, "after_step", "", renderedUserMessages);
+    if (stepList.children && stepList.children.length > 0) {
+      scrollElementToBottom(stepList);
+    }
+  }
+
+  function renderComposerProgress() {
+    const state = ensureState();
+    const progress = byId("composer-progress");
+    if (!progress || !canCreateElements()) {
+      return;
+    }
+    clearElement(progress);
+    const ui = mergeProgressUi(state.progressUi);
+    state.progressUi = ui;
+    const isDebugPreview = debugDrawerIsOpen();
+    if (!isDebugPreview && !state.pipelineStarted) {
+      hideComposerProgress(progress, ui);
+      return;
+    }
+    progress.hidden = false;
+    progress.setAttribute("data-progress-mode", isDebugPreview ? "debug" : "pipeline");
+    progress.setAttribute("data-progress-visible", "true");
+    const models = stepModelsForProgress(state, ui, { useConfiguredActiveStep: isDebugPreview });
+    if (ui.variant === "a") {
+      renderChevronProgress(progress, models, ui.a);
+    } else if (ui.variant === "d") {
+      renderFusionProgress(progress, models, ui.d);
+    } else {
+      renderSignalProgress(progress, models, ui.b);
+    }
+    startProgressAnimation();
+  }
+
+  function smoothstep(edge0, edge1, value) {
+    if (edge0 === edge1) {
+      return value < edge0 ? 0 : 1;
+    }
+    const t = Math.max(0, Math.min(1, (value - edge0) / (edge1 - edge0)));
+    return t * t * (3 - 2 * t);
+  }
+
+  function cancelProgressAnimation() {
+    controller.progressAnimationToken += 1;
+    if (controller.progressAnimationFrame !== null && typeof cancelAnimationFrame === "function") {
+      cancelAnimationFrame(controller.progressAnimationFrame);
+    }
+    if (typeof window !== "undefined" && window.clearTimeout) {
+      window.clearTimeout(controller.progressRunTimer);
+      window.clearTimeout(controller.progressWaitTimer);
+    }
+    controller.progressAnimationFrame = null;
+    controller.progressRunTimer = 0;
+    controller.progressWaitTimer = 0;
+  }
+
+  function startFusionProgressAnimation(progress, ui) {
+    const label = progress.querySelector ? progress.querySelector(".fusion-label") : null;
+    if (!label || typeof requestAnimationFrame !== "function") {
+      return;
+    }
+    const activeIndex = Number(label.getAttribute("data-active-index"));
+    const timing = ui.d;
+
+    const percent = (value) => `${Math.max(0, Math.min(100, value)).toFixed(2)}%`;
+    const syncBorder = () => {
+      const activeStep = label.querySelector(`.fusion-step[data-step-index="${activeIndex}"]`);
+      if (!activeStep || !label.getBoundingClientRect || !activeStep.getBoundingClientRect) {
+        return;
+      }
+      const labelRect = label.getBoundingClientRect();
+      const activeRect = activeStep.getBoundingClientRect();
+      if (!labelRect.width) {
+        return;
+      }
+      const activeStart = ((activeRect.left - labelRect.left) / labelRect.width) * 100;
+      const activeEnd = ((activeRect.right - labelRect.left) / labelRect.width) * 100;
+      const blueStart = activeIndex === 0 ? 0 : activeStart;
+      const greenEnd = activeIndex === 0 ? 0 : activeStart;
+      const blueEnd = activeIndex === STEP_ORDER.length - 1 ? 100 : activeEnd;
+      label.style.setProperty("--fusion-green-end", percent(greenEnd));
+      label.style.setProperty("--fusion-blue-start", percent(blueStart));
+      label.style.setProperty("--fusion-blue-end", percent(blueEnd));
+      label.style.setProperty("--fusion-sweep-duration", `${timing.t1}ms`);
+    };
+
+    const restartSweeps = () => {
+      window.clearTimeout(controller.progressRunTimer);
+      window.clearTimeout(controller.progressWaitTimer);
+      label.classList.remove("sweep-wait");
+      label.classList.add("sweep-reset");
+      void label.offsetWidth;
+      label.classList.remove("sweep-reset");
+      controller.progressRunTimer = window.setTimeout(() => {
+        label.classList.add("sweep-wait");
+        controller.progressWaitTimer = window.setTimeout(restartSweeps, timing.t2);
+      }, timing.t1);
+    };
+
+    requestAnimationFrame(() => {
+      syncBorder();
+      restartSweeps();
+    });
+  }
+
+  /**
+   * Start the "signal" progress animation: a pulse drawn into the
+   * .signal-moving-wave path that travels towards the active step, pauses,
+   * travels away from it, pauses again, and repeats.
+   *
+   * Phase cycle: inbound -> pause-current -> outbound -> pause-next -> inbound.
+   * Tuning values come from ui.b (xPercent, yPercent, t1, t2, maxAmplitude,
+   * pauseTime). The loop stops itself once controller.progressAnimationToken
+   * no longer matches the value captured at start. Does nothing when
+   * requestAnimationFrame or the expected elements are missing.
+   */
+  function startSignalProgressAnimation(progress, ui) {
+    if (typeof requestAnimationFrame !== "function") {
+      return;
+    }
+    const wave = progress.querySelector ? progress.querySelector(".signal-moving-wave") : null;
+    const demo = progress.querySelector ? progress.querySelector(".signal-circuit") : null;
+    if (!wave || !demo) {
+      return;
+    }
+
+    const params = ui.b;
+    // Hard-coded drawing coordinates; presumably they mirror the markup built
+    // by renderSignalProgress (five nodes, 344-unit wide view) - TODO confirm.
+    const stepXs = [20, 96, 172, 248, 324];
+    const baseY = 22;
+    const viewMinX = 0;
+    const viewMaxX = 344;
+    // Off-node start/end points used for the first step's inbound run and the
+    // last step's outbound run, which have no neighbouring node.
+    const virtualPadding = 66;
+    const virtualLeftX = stepXs[0] - virtualPadding;
+    const virtualRightX = stepXs[stepXs.length - 1] + virtualPadding;
+    const nodeClearance = 10;
+    const outboundTailClearance = 6;
+    // NOTE(review): not range-checked; a missing or out-of-range attribute makes
+    // stepXs[activeIndex] undefined and the segment coordinates NaN.
+    let activeIndex = Number(demo.getAttribute("data-active-index"));
+    let phase = "inbound";
+    let elapsed = 0;
+    let pauseLeft = 0;
+    let last = typeof performance !== "undefined" && performance.now ? performance.now() : Date.now();
+    // Phase offset advanced after every pause so consecutive pulses differ slightly.
+    let cycleSalt = 0;
+    let absorbTimer = 0;
+    // Captured once; tick() bails out when the controller's token has moved on.
+    const token = controller.progressAnimationToken;
+
+    const clampToView = (x) => Math.max(viewMinX, Math.min(viewMaxX, x));
+    // Segment travelled while approaching the active node.
+    const inboundSegment = () => {
+      const currentX = stepXs[activeIndex];
+      return {
+        from: activeIndex === 0 ? virtualLeftX : stepXs[activeIndex - 1] + nodeClearance,
+        to: currentX - nodeClearance,
+        color: "#1677ff",
+        nextPhase: "pause-current",
+      };
+    };
+    // Segment travelled while leaving the active node.
+    const outboundSegment = () => {
+      const currentX = stepXs[activeIndex];
+      return {
+        from: currentX + nodeClearance,
+        to: activeIndex === stepXs.length - 1 ? virtualRightX : stepXs[activeIndex + 1] - outboundTailClearance,
+        color: "#8f9bae",
+        nextPhase: "pause-next",
+      };
+    };
+    const currentSegment = () => (phase === "outbound" || phase === "pause-next" ? outboundSegment() : inboundSegment());
+    // Position and amplitude of the pulse `timeMs` into a segment. Three
+    // stages: grow for t1 (anchored on its right edge), travel for t2, shrink
+    // for t1 (anchored on its left edge); after that the run is done.
+    const segmentMotion = (timeMs) => {
+      const x = Math.max(0.04, Math.min(0.48, params.xPercent / 100));
+      const y = Math.max(0, Math.min(1, params.yPercent / 100));
+      const t1 = Math.max(40, params.t1);
+      const t2 = Math.max(80, params.t2);
+      if (timeMs < t1) {
+        const u = Math.max(0, Math.min(1, timeMs / t1));
+        return { anchor: "right", progress: x * u, amplitudeScale: y * smoothstep(0, 1, u), done: false };
+      }
+      if (timeMs < t1 + t2) {
+        const u = Math.max(0, Math.min(1, (timeMs - t1) / t2));
+        return { anchor: "right", progress: x + (1 - x) * u, amplitudeScale: y + (1 - y) * Math.sin(Math.PI * u), done: false };
+      }
+      if (timeMs < t1 * 2 + t2) {
+        const u = Math.max(0, Math.min(1, (timeMs - t1 - t2) / t1));
+        return { anchor: "left", progress: 1 - x + x * u, amplitudeScale: y * (1 - smoothstep(0, 1, u)), done: false };
+      }
+      return { anchor: "left", progress: 1, amplitudeScale: 0, done: true };
+    };
+    // Vertical profile of the pulse for t in [0, 1] along the packet: a lift,
+    // a drop, and two small oscillations offset by cycleSalt.
+    const pulseShape = (t) => {
+      const micro = 0.1 * Math.sin((t * 2.6 + cycleSalt) * Math.PI);
+      const lift = Math.sin(Math.PI * smoothstep(0.16, 0.38, t));
+      const drop = Math.sin(Math.PI * smoothstep(0.37, 0.62, t));
+      const settle = 0.2 * Math.sin((t - 0.62) * Math.PI * 4.5 + cycleSalt * 0.4);
+      return micro + lift - drop * 0.86 + settle * smoothstep(0.58, 0.96, t);
+    };
+    // Build the SVG path data for the current frame; "" hides the wave.
+    const movingWavePath = () => {
+      if (phase === "pause-current" || phase === "pause-next") {
+        return "";
+      }
+      const segment = currentSegment();
+      const segmentLength = segment.to - segment.from;
+      const xRatio = Math.max(0.04, Math.min(0.48, params.xPercent / 100));
+      const waveLength = segmentLength * xRatio;
+      const motion = segmentMotion(elapsed);
+      const amplitude = params.maxAmplitude * motion.amplitudeScale;
+      // Too flat to be visible: draw nothing.
+      if (amplitude < 0.2) {
+        return "";
+      }
+      const right =
+        motion.anchor === "left"
+          ? segment.from + motion.progress * segmentLength + waveLength
+          : segment.from + motion.progress * segmentLength;
+      const left = motion.anchor === "left" ? segment.from + motion.progress * segmentLength : right - waveLength;
+      // Clip the packet to the segment so it never overlaps a node.
+      const start = Math.max(segment.from, left);
+      const end = Math.min(segment.to, right);
+      if (end <= segment.from || start >= segment.to || end - start < 1) {
+        return "";
+      }
+      const points = [];
+      const samples = 54;
+      for (let i = 0; i <= samples; i += 1) {
+        const t = i / samples;
+        const x = start + t * (end - start);
+        // While the packet's left edge is still clipped, sample the shape
+        // across the visible part instead of the full packet length.
+        const packetT = left < segment.from ? t : (x - left) / waveLength;
+        // Fade both ends of the packet to zero.
+        const envelope = smoothstep(0, 0.16, packetT) * (1 - smoothstep(0.84, 1, packetT));
+        const y = baseY - pulseShape(packetT) * amplitude * envelope;
+        points.push(`${i === 0 ? "M" : "L"} ${clampToView(x).toFixed(2)} ${y.toFixed(2)}`);
+      }
+      return points.join(" ");
+    };
+    const render = () => {
+      const segment = currentSegment();
+      wave.style.stroke = segment.color;
+      wave.setAttribute("d", movingWavePath());
+    };
+    // Restart the "absorbing" CSS state for the duration of the pause.
+    const triggerAbsorbHalo = () => {
+      demo.classList.remove("absorbing");
+      window.clearTimeout(absorbTimer);
+      // Reading offsetWidth forces a reflow so re-adding the class restarts the effect.
+      void demo.offsetWidth;
+      demo.classList.add("absorbing");
+      absorbTimer = window.setTimeout(() => {
+        demo.classList.remove("absorbing");
+      }, params.pauseTime);
+    };
+    // Per-frame state machine; reschedules itself until the token changes.
+    const tick = (now) => {
+      if (token !== controller.progressAnimationToken) {
+        return;
+      }
+      // Cap the frame delta at 48 ms so a stalled frame does not skip the animation ahead.
+      const dt = Math.min(48, now - last) / 1000;
+      last = now;
+      if (phase === "pause-current" || phase === "pause-next") {
+        pauseLeft -= dt * 1000;
+        if (pauseLeft <= 0) {
+          if (phase === "pause-current") {
+            demo.classList.remove("absorbing");
+            window.clearTimeout(absorbTimer);
+          }
+          phase = phase === "pause-current" ? "outbound" : "inbound";
+          elapsed = 0;
+          cycleSalt = (cycleSalt + 0.73) % (Math.PI * 2);
+        }
+        render();
+        controller.progressAnimationFrame = requestAnimationFrame(tick);
+        return;
+      }
+      const segment = currentSegment();
+      elapsed += dt * 1000;
+      if (segmentMotion(elapsed).done) {
+        pauseLeft = params.pauseTime;
+        phase = segment.nextPhase;
+        if (phase === "pause-current") {
+          triggerAbsorbHalo();
+        }
+        elapsed = params.t1 * 2 + params.t2;
+      }
+      render();
+      controller.progressAnimationFrame = requestAnimationFrame(tick);
+    };
+
+    // Start on the next frame, using its timestamp as the time base.
+    requestAnimationFrame((now) => {
+      last = now;
+      render();
+      tick(now);
+    });
+  }
+
+  function startProgressAnimation() {
+    cancelProgressAnimation();
+    const progress = byId("composer-progress");
+    if (!progress || progress.hidden) {
+      return;
+    }
+    const ui = mergeProgressUi(ensureState().progressUi);
+    if (progress.getAttribute("data-progress-variant") === "b") {
+      startSignalProgressAnimation(progress, ui);
+    }
+    if (progress.getAttribute("data-progress-variant") === "d") {
+      startFusionProgressAnimation(progress, ui);
+    }
+  }
+
+  function costItemLabel(item) {
+    if (!item || typeof item !== "object") {
+      return "";
+    }
+    const name = item.name || item.resource || item.type || item.product || "费用项";
+    const spec = item.spec || item.instanceType || item.instance_type || item.description || "";
+    const cost = item.monthly_cost ?? item.monthlyCost ?? item.totalMonthlyCost ?? item.cost ?? "";
+    return [name, spec, cost].filter((value) => value !== "" && value !== null && value !== undefined).join(" · ");
+  }
+
+  function presentValue(value, fallback) {
+    if (value === 0 || value) {
+      return String(value);
+    }
+    return fallback;
+  }
+
+  function candidateSubStepOf(event) {
+    const data = eventData(event);
+    return (
+      (event && event.candidateStep && typeof event.candidateStep === "object" ? event.candidateStep : null) ||
+      (event && event.candidate_step && typeof event.candidate_step === "object" ? event.candidate_step : null) ||
+      (data.candidateStep && typeof data.candidateStep === "object" ? data.candidateStep : null) ||
+      (data.candidate_step && typeof data.candidate_step === "object" ? data.candidate_step : null) ||
+      {}
+    );
+  }
+
+  function candidateSubStepLabel(event) {
+    const subStep = candidateSubStepOf(event);
+    const rawLabel = subStep.label || subStep.name || subStep.title || subStep.id || "";
+    const normalizedLabel = String(rawLabel || "").trim();
+    if (CANDIDATE_SUBSTEP_LABELS[normalizedLabel]) {
+      return CANDIDATE_SUBSTEP_LABELS[normalizedLabel];
+    }
+    return normalizedLabel || "方案思考";
+  }
+
+  function candidateSubEventKind(event) {
+    const eventType = eventTypeOf(event || {});
+    return String(eventType || "").startsWith("candidate_step") ? eventType : stepEventKind(event);
+  }
+
+  function isCandidateLifecycleEvent(event) {
+    const eventType = eventTypeOf(event || {});
+    return eventType === "candidate_started" || eventType === "candidate_completed" || eventType === "candidate_failed";
+  }
+
+  function candidateRenderableSubEvents(events) {
+    return (Array.isArray(events) ? events : []).filter((event) => !isCandidateLifecycleEvent(event));
+  }
+
+  function candidateSubEventLabel(kind) {
+    const labels = {
+      candidate_step_completed: "子步骤完成",
+      candidate_step_failed: "子步骤失败",
+      candidate_step_started: "子步骤开始",
+      candidate_started: "方案开始",
+      candidate_completed: "方案完成",
+      candidate_failed: "方案异常",
+      text_delta: "思考片段",
+      tool_result: "工具结果",
+      tool_use: "工具调用",
+    };
+    return labels[kind] || stepEventLabel(kind);
+  }
+
+  function candidateSubPipelineState(candidate) {
+    const events = Array.isArray(candidate && candidate.subEvents) ? candidate.subEvents : [];
+    const latest = events[events.length - 1];
+    const eventType = eventTypeOf(latest || {});
+    const status = normalizeStatus((latest && latest.status) || candidateSubStepOf(latest).status || "");
+    if (eventType === "candidate_completed") {
+      return "completed";
+    }
+    if (eventType === "candidate_failed") {
+      return "failed";
+    }
+    if (eventType === "candidate_step_failed" || status === "failed" || status === "error") {
+      return "failed";
+    }
+    return "working";
+  }
+
+  function candidateSubPipelineStatus(candidate) {
+    const state = candidateSubPipelineState(candidate);
+    if (state === "completed") {
+      return "思考完成";
+    }
+    if (state === "failed") {
+      return "思考异常";
+    }
+    return "思考中";
+  }
+
+  function candidatePlanStatus(candidate) {
+    const events = Array.isArray(candidate && candidate.subEvents) ? candidate.subEvents : [];
+    if (events.length === 0) {
+      return null;
+    }
+    const state = candidateSubPipelineState(candidate);
+    if (state === "completed") {
+      return { state: "completed", label: "已完成" };
+    }
+    if (state === "failed") {
+      return { state: "failed", label: "异常" };
+    }
+    return { state: "working", label: "生成中" };
+  }
+
+  function candidateSubStepId(event, fallbackIndex) {
+    const subStep = candidateSubStepOf(event);
+    return String(subStep.id || subStep.stepId || subStep.name || subStep.label || `step-${fallbackIndex}`);
+  }
+
+  function candidateSubStepStatus(events, forceComplete = false) {
+    const latest = events[events.length - 1];
+    const eventType = eventTypeOf(latest || {});
+    const status = normalizeStatus((latest && latest.status) || candidateSubStepOf(latest).status || "");
+    if (eventType === "candidate_step_completed" || status === "completed" || forceComplete) {
+      return "completed";
+    }
+    if (eventType === "candidate_step_failed" || status === "failed" || status === "error") {
+      return "failed";
+    }
+    return "working";
+  }
+
+  function groupCandidateSubEvents(events, options = {}) {
+    const forceComplete = Boolean(options.forceComplete);
+    const groups = [];
+    events.forEach((event, index) => {
+      const id = candidateSubStepId(event, index);
+      let group = groups.find((item) => item.id === id);
+      if (!group) {
+        group = {
+          id,
+          label: candidateSubStepLabel(event),
+          events: [],
+        };
+        groups.push(group);
+      }
+      group.events.push(event);
+      group.label = group.label || candidateSubStepLabel(event);
+      group.status = candidateSubStepStatus(group.events, forceComplete);
+    });
+    return groups;
+  }
+
+  function candidateEvaluationIsComplete() {
+    const state = ensureState();
+    const steps = state.steps || {};
+    const evaluationStatus = stepStatusClass(normalizeStatus(steps.evaluate_candidates && steps.evaluate_candidates.status));
+    const selectionStatus = stepStatusClass(normalizeStatus(steps.confirm_and_select && steps.confirm_and_select.status));
+    const deploymentStatus = stepStatusClass(normalizeStatus(steps.deploying && steps.deploying.status));
+    return (
+      evaluationStatus === "completed" ||
+      ["working", "waiting_input", "completed"].includes(selectionStatus) ||
+      ["working", "waiting_input", "completed"].includes(deploymentStatus)
+    );
+  }
+
+  function candidateEvaluationIsWorking() {
+    const state = ensureState();
+    const steps = state.steps || {};
+    return stepStatusClass(normalizeStatus(steps.evaluate_candidates && steps.evaluate_candidates.status)) === "working";
+  }
+
+  function scrollElementToBottom(element) {
+    if (!element || typeof element.scrollTop === "undefined") {
+      return;
+    }
+    const scroll = () => {
+      element.scrollTop = element.scrollHeight || 0;
+    };
+    scroll();
+    if (typeof requestAnimationFrame === "function") {
+      requestAnimationFrame(scroll);
+    }
+  }
+
+  function renderCandidateSubstepGroup(group) {
+    const substep = createElement("details", "candidate-substep");
+    if (substep) {
+      substep.setAttribute("data-candidate-substep", group.id);
+      substep.open = group.status !== "completed";
+    }
+    const substepHead = createElement("summary", "candidate-substep-head");
+    appendChild(substepHead, createElement("strong", "", group.label));
+    appendChild(substepHead, createElement("span", "", group.status === "completed" ? "完成" : group.status === "failed" ? "异常" : "进行中"));
+    appendChild(substep, substepHead);
+    const list = createElement("ul", "candidate-subpipeline-events");
+    group.events.forEach((event) => {
+      const kind = candidateSubEventKind(event);
+      const item = createElement("li", `candidate-subpipeline-event ${kind}`);
+      if (item) {
+        item.setAttribute("data-candidate-subpipeline-event", kind);
+      }
+      appendChild(item, createElement("span", "candidate-subpipeline-label", candidateSubEventLabel(kind)));
+      appendChild(item, createElement("p", "", eventTitle(event)));
+      appendChild(list, item);
+    });
+    appendChild(substep, list);
+    return substep;
+  }
+
+  function renderCandidateSubPipeline(card, candidate, candidateIndex) {
+    const events = compactDisplayEvents(Array.isArray(candidate && candidate.subEvents) ? candidate.subEvents : []);
+    const renderableEvents = candidateRenderableSubEvents(events);
+    if (renderableEvents.length === 0) {
+      return;
+    }
+    const state = ensureState();
+    const pipelineKey = String(candidateIndex);
+    const pipelineState = candidateSubPipelineState(candidate);
+    const shouldAutoOpen = candidateEvaluationIsWorking() && pipelineState === "working";
+    const section = createElement("details", "candidate-subpipeline");
+    if (section) {
+      section.setAttribute("data-candidate-subpipeline", pipelineKey);
+      section.open = shouldAutoOpen || Boolean(state.expandedCandidateSubpipelines && state.expandedCandidateSubpipelines[pipelineKey]);
+      section.addEventListener("click", (event) => {
+        if (event && typeof event.stopPropagation === "function") {
+          event.stopPropagation();
+        }
+      });
+      section.addEventListener("toggle", () => {
+        const nextState = ensureState();
+        nextState.expandedCandidateSubpipelines = nextState.expandedCandidateSubpipelines || {};
+        nextState.expandedCandidateSubpipelines[pipelineKey] = Boolean(section.open);
+      });
+      section.addEventListener("keydown", (event) => {
+        if (event && (event.key === "Enter" || event.key === " ")) {
+          event.stopPropagation();
+        }
+      });
+    }
+    const head = createElement("summary", "candidate-subpipeline-head");
+    if (head) {
+      head.setAttribute("data-candidate-subpipeline-toggle", String(candidateIndex));
+    }
+    appendChild(head, createElement("strong", "", "思考过程"));
+    appendChild(head, createElement("span", "candidate-subpipeline-arrow"));
+    appendChild(section, head);
+    const body = createElement("div", "candidate-subpipeline-body");
+    if (body) {
+      body.setAttribute("data-candidate-subpipeline-body", pipelineKey);
+    }
+    const substeps = createElement("div", "candidate-substeps");
+    groupCandidateSubEvents(renderableEvents, { forceComplete: pipelineState === "completed" || candidateEvaluationIsComplete() }).forEach((group) => {
+      appendChild(substeps, renderCandidateSubstepGroup(group));
+    });
+    appendChild(body, substeps);
+    appendChild(section, body);
+    appendChild(card, section);
+    if (section && section.open) {
+      scrollElementToBottom(body);
+    }
+  }
+
+  function candidateIndexOf(candidate, fallbackIndex) {
+    const rawIndex = candidate && candidate.candidateIndex !== null && candidate.candidateIndex !== undefined
+      ? candidate.candidateIndex
+      : fallbackIndex;
+    const numericIndex = Number(rawIndex);
+    return Number.isFinite(numericIndex) ? numericIndex : fallbackIndex;
+  }
+
+  function renderPlans() {
+    const state = ensureState();
+    const plansGrid = byId("plans-grid");
+    if (!plansGrid || !canCreateElements()) {
+      return;
+    }
+    clearElement(plansGrid);
+    (Array.isArray(state.candidates) ? state.candidates : []).forEach((candidate, index) => {
+      const candidateIndex = candidateIndexOf(candidate, index);
+      const isSelected = state.selectedCandidateIndex === candidateIndex;
+      const isRecommended = isSelected || (state.selectedCandidateIndex === null && index === 0);
+      const cardClasses = ["plan-card", isSelected ? "selected" : "", isRecommended ? "recommended" : ""]
+        .filter(Boolean)
+        .join(" ");
+      const card = createElement("article", cardClasses);
+      const header = createElement("div", "plan-card-header");
+      const tag = createElement("span", `tag${isRecommended ? "" : " muted"}`, isSelected ? "已选" : index === 0 ? "推荐" : "备选");
+      const score = createElement("span", "score", `方案 ${candidateIndex}`);
+      const planStatus = candidatePlanStatus(candidate);
+      const title = createElement("h2", "", candidate.name || `方案 ${candidateIndex}`);
+      const summary = createElement("p", "", candidate.summary || "等待方案摘要");
+      const price = createElement("div", "price");
+      const meta = createElement("dl", "plan-meta");
+      const costItems = Array.isArray(candidate.costItems) ? candidate.costItems : [];
+      const templateHoverText = isTemplateLikeText(candidate.template) ? String(candidate.template) : "";
+
+      if (card) {
+        card.setAttribute("role", "button");
+        card.setAttribute("tabindex", "0");
+        card.setAttribute("aria-pressed", isSelected ? "true" : "false");
+        card.setAttribute("data-candidate-index", String(candidateIndex));
+        card.addEventListener("click", () => {
+          controller.state = selectCandidate(ensureState(), candidateIndex);
+          syncComposerWithSelectedCandidate(controller.state);
+          renderAll();
+        });
+        card.addEventListener("keydown", (event) => {
+          if (event.key === "Enter" || event.key === " ") {
+            event.preventDefault();
+            controller.state = selectCandidate(ensureState(), candidateIndex);
+            syncComposerWithSelectedCandidate(controller.state);
+            renderAll();
+          }
+        });
+      }
+
+      appendChild(header, tag);
+      const headerMeta = createElement("div", "plan-card-header-meta");
+      appendChild(headerMeta, score);
+      if (planStatus) {
+        const status = createElement("span", `plan-status ${planStatus.state}`, planStatus.label);
+        if (status) {
+          status.setAttribute("data-candidate-status", planStatus.state);
+        }
+        appendChild(headerMeta, status);
+      }
+      appendChild(header, headerMeta);
+      appendChild(card, header);
+      appendChild(card, title);
+      appendChild(card, summary);
+      appendChild(price, createElement("span", "price-label", "预估价格"));
+      appendChild(price, createElement("strong", "", presentValue(candidate.totalMonthlyCost, "价格待确认")));
+      appendChild(card, price);
+
+      costItems.slice(0, 4).forEach((item) => {
+        const row = createElement("div");
+        const term = createElement("dt", "", item && (item.name || item.resource || item.product) ? item.name || item.resource || item.product : "资源");
+        const detail = createElement("dd", "", costItemLabel(item));
+        appendChild(row, term);
+        appendChild(row, detail);
+        appendChild(meta, row);
+      });
+      appendChild(card, meta);
+      renderCandidateSubPipeline(card, candidate, candidateIndex);
+      attachTemplatePopover(card, templateHoverText);
+      appendChild(plansGrid, card);
+    });
+  }
+
+  function formatProgressParamValue(definition, value) {
+    const numericValue = Number(value);
+    const rendered = Number.isFinite(numericValue) && definition.step < 1 ? numericValue.toFixed(1) : String(value);
+    return `${rendered}${definition.unit || ""}`;
+  }
+
+  function setProgressVariant(variant) {
+    const state = ensureState();
+    const ui = mergeProgressUi(state.progressUi);
+    if (PROGRESS_VARIANT_ORDER.includes(variant)) {
+      ui.variant = variant;
+    }
+    state.progressUi = ui;
+    renderAll();
+  }
+
+  function setProgressParam(variant, key, value) {
+    const state = ensureState();
+    const ui = mergeProgressUi(state.progressUi);
+    if (!PROGRESS_VARIANT_ORDER.includes(variant) || !Object.prototype.hasOwnProperty.call(ui[variant], key)) {
+      return;
+    }
+    const numericValue = Number(value);
+    if (Number.isFinite(numericValue)) {
+      ui[variant][key] = numericValue;
+      state.progressUi = ui;
+      renderAll();
+    }
+  }
+
+  function setProgressStep(index) {
+    const state = ensureState();
+    const ui = mergeProgressUi(state.progressUi);
+    const numericIndex = Number(index);
+    ui.activeStepIndex = Number.isInteger(numericIndex) && numericIndex >= 0 && numericIndex < STEP_ORDER.length ? numericIndex : null;
+    state.progressUi = ui;
+    renderAll();
+  }
+
+  /**
+   * Rebuild the `#progress-debug-panel` contents: a title, the variant switch,
+   * the demo step selector, and one slider grid per progress variant.
+   *
+   * Does nothing when the panel element is missing or elements cannot be created.
+   * The merged progress UI is written back to `state.progressUi` before rendering.
+   */
+  function renderProgressDebugPanel() {
+    const panel = byId("progress-debug-panel");
+    if (!panel || !canCreateElements()) {
+      return;
+    }
+    const state = ensureState();
+    const ui = mergeProgressUi(state.progressUi);
+    state.progressUi = ui;
+    clearElement(panel);
+
+    // Panel heading.
+    const title = createElement("div", "progress-debug-title");
+    appendChild(title, createElement("strong", "", "进度条方案"));
+    appendChild(title, createElement("span", "", "用于切换视觉方案与调参，不影响 pipeline 状态"));
+    appendChild(panel, title);
+
+    // One toggle button per variant; the current variant is marked selected/pressed.
+    const variants = createElement("div", "progress-variant-switch");
+    PROGRESS_VARIANT_ORDER.forEach((variant) => {
+      const button = createElement("button", ui.variant === variant ? "selected" : "", PROGRESS_VARIANT_LABELS[variant]);
+      if (button) {
+        button.setAttribute("type", "button");
+        button.setAttribute("data-progress-variant-option", variant);
+        button.setAttribute("aria-pressed", ui.variant === variant ? "true" : "false");
+        button.addEventListener("click", () => setProgressVariant(variant));
+      }
+      appendChild(variants, button);
+    });
+    appendChild(panel, variants);
+
+    // Demo step selector: numbered buttons (1-based labels) for every entry of STEP_ORDER.
+    const activeIndex = stepModelsForProgress(state, ui, { useConfiguredActiveStep: true }).activeIndex;
+    const stepControl = createElement("div", "demo-step-control progress-demo-step-control");
+    const stepLabel = createElement("label");
+    appendChild(stepLabel, createElement("span", "", "演示 Step"));
+    appendChild(stepLabel, createElement("output", "", STEP_LABELS[STEP_ORDER[activeIndex]]));
+    appendChild(stepControl, stepLabel);
+    const stepSwitch = createElement("div", "step-switch");
+    if (stepSwitch) {
+      stepSwitch.setAttribute("aria-label", "进度条演示当前步骤");
+    }
+    STEP_ORDER.forEach((stepId, index) => {
+      const button = createElement("button", index === activeIndex ? "active" : "", String(index + 1));
+      if (button) {
+        button.setAttribute("type", "button");
+        button.setAttribute("data-progress-step-option", String(index));
+        button.setAttribute("aria-pressed", index === activeIndex ? "true" : "false");
+        button.setAttribute("title", STEP_LABELS[stepId]);
+        button.addEventListener("click", () => setProgressStep(index));
+      }
+      appendChild(stepSwitch, button);
+    });
+    appendChild(stepControl, stepSwitch);
+    appendChild(panel, stepControl);
+
+    // A slider grid is built for every variant; grids of inactive variants are hidden.
+    PROGRESS_VARIANT_ORDER.forEach((variant) => {
+      const group = createElement("div", "progress-param-grid");
+      if (group) {
+        group.setAttribute("data-progress-param-group", variant);
+        group.hidden = ui.variant !== variant;
+      }
+      PROGRESS_PARAM_DEFS[variant].forEach((definition) => {
+        const value = ui[variant][definition.key];
+        const field = createElement("label", "progress-param");
+        const head = createElement("span", "progress-param-head");
+        appendChild(head, createElement("span", "", definition.label));
+        appendChild(head, createElement("output", "", formatProgressParamValue(definition, value)));
+        const input = createElement("input");
+        if (input) {
+          input.setAttribute("type", "range");
+          input.setAttribute("min", String(definition.min));
+          input.setAttribute("max", String(definition.max));
+          input.setAttribute("step", String(definition.step));
+          input.setAttribute("data-progress-param", definition.key);
+          input.setAttribute("data-progress-param-variant", variant);
+          input.value = String(value);
+          // Each slider movement stores the new value and triggers a full re-render.
+          input.addEventListener("input", () => setProgressParam(variant, definition.key, input.value));
+        }
+        appendChild(field, head);
+        appendChild(field, input);
+        appendChild(group, field);
+      });
+      appendChild(panel, group);
+    });
+  }
+
+  function renderDebugSessionInfo(state) {
+    const container = byId("debug-session-info");
+    if (!container) {
+      return;
+    }
+    clearElement(container);
+    const fields = [
+      ["serverUrl", "Server URL", state.serverUrl || ""],
+      ["cwd", "CWD", state.cwd || ""],
+      ["contextId", "Context ID", state.contextId || "未获取"],
+      ["pipelineTaskId", "Pipeline Task", state.pipelineTaskId || "未获取"],
+      ["activeTaskId", "Active Task", state.activeTaskId || "未获取"],
+      ["lastSequence", "Last Sequence", String(state.lastSequence || 0)],
+      ["status", "Status", state.status || "idle"],
+      ["handoff", "Normal Handoff", state.normalHandoffReady ? "是" : "否"],
+      ["logs", "Logs", "默认 ~/.iac-code/logs，或 IAC_CODE_CONFIG_DIR/logs"],
+    ];
+    fields.forEach(([key, label, value]) => {
+      const row = createElement("div", "debug-session-field");
+      if (row) {
+        row.setAttribute("data-debug-session-field", key);
+      }
+      appendChild(row, createElement("span", "", label));
+      appendChild(row, createElement("code", "", value));
+      appendChild(container, row);
+    });
+  }
+
+  function renderDebug() {
+    const output = byId("debug-output") || query("#debug-drawer pre");
+    const state = ensureState();
+    renderDebugSessionInfo(state);
+    if (!output) {
+      return;
+    }
+    output.textContent = JSON.stringify(state.diagnostics || {}, null, 2);
+  }
+
+  function renderAll() {
+    renderStatus();
+    renderSteps();
+    renderComposerProgress();
+    renderPlans();
+    renderProgressDebugPanel();
+    renderDebug();
+  }
+
+  function diagnosticBucket(kind) {
+    if (kind === "sse") {
+      return "sse";
+    }
+    if (kind === "snapshot" || kind === "state") {
+      return "snapshots";
+    }
+    return "requests";
+  }
+
+  function appendDiagnostic(kind, value) {
+    const state = ensureState();
+    const diagnostics = state.diagnostics || { requests: [], sse: [], snapshots: [] };
+    const bucket = diagnosticBucket(kind);
+    const nextValue = clonePlainData({
+      at: new Date().toISOString(),
+      kind,
+      value,
+    });
+    diagnostics[bucket] = Array.isArray(diagnostics[bucket]) ? diagnostics[bucket] : [];
+    diagnostics[bucket].push(nextValue);
+    diagnostics[bucket] = diagnostics[bucket].slice(-40);
+    state.diagnostics = diagnostics;
+    renderDebug();
+  }
+
+  function showStatus(message, kind) {
+    const alert = byId("status-alert");
+    if (!alert) {
+      return;
+    }
+    if (!message) {
+      alert.hidden = true;
+      alert.textContent = "";
+      alert.removeAttribute("data-kind");
+      return;
+    }
+    alert.hidden = false;
+    alert.textContent = message;
+    alert.setAttribute("data-kind", kind || "info");
+  }
+
+  function ensureFetchAvailable() {
+    if (typeof fetch === "function") {
+      return true;
+    }
+    appendDiagnostic("error", { error: "fetch is not available" });
+    showStatus("当前环境不支持 fetch，无法连接 A2A 服务。", "error");
+    return false;
+  }
+
+  function queryString(params) {
+    if (typeof URLSearchParams === "function") {
+      const search = new URLSearchParams();
+      Object.keys(params).forEach((key) => {
+        search.set(key, params[key] === undefined || params[key] === null ? "" : String(params[key]));
+      });
+      return search.toString();
+    }
+    return Object.keys(params)
+      .map((key) => `${encodeURIComponent(key)}=${encodeURIComponent(params[key] || "")}`)
+      .join("&");
+  }
+
+  async function readJsonResponse(response) {
+    const text = await response.text();
+    if (!text) {
+      return null;
+    }
+    try {
+      return JSON.parse(text);
+    } catch (error) {
+      return { ok: false, error: String(error), text };
+    }
+  }
+
+  function errorMessage(error) {
+    return error && error.message ? error.message : String(error);
+  }
+
+  function activeTaskIdFromPayload(payload) {
+    const envelope = extractPipelineEnvelope(payload);
+    const envelopeTaskId = taskIdOf(envelope || {});
+    if (envelopeTaskId) {
+      return envelopeTaskId;
+    }
+    if (payload && payload.result && typeof payload.result === "object") {
+      return payload.result.taskId || payload.result.task_id || payload.result.id || "";
+    }
+    if (payload && payload.task && typeof payload.task === "object") {
+      return payload.task.taskId || payload.task.task_id || payload.task.id || "";
+    }
+    return taskIdOf(payload || {}) || "";
+  }
+
+  function isWaitingForInputPayload(payload, state) {
+    const envelope = extractPipelineEnvelope(payload);
+    return (
+      Boolean(state && state.pendingInput) ||
+      (state && state.status === "waiting_input") ||
+      eventTypeOf(envelope || {}) === "input_required" ||
+      normalizeStatus((envelope && envelope.status) || "") === "waiting_input"
+    );
+  }
+
+  function waitForNextPaint() {
+    return new Promise((resolve) => {
+      if (typeof requestAnimationFrame === "function") {
+        requestAnimationFrame(() => resolve());
+        return;
+      }
+      if (typeof window !== "undefined" && typeof window.setTimeout === "function") {
+        window.setTimeout(resolve, 16);
+        return;
+      }
+      if (typeof setTimeout === "function") {
+        setTimeout(resolve, 0);
+        return;
+      }
+      resolve();
+    });
+  }
+
+  function reduceControllerPayload(payload) {
+    const currentState = ensureState();
+    const nextState = reducePipelinePayload(currentState, payload);
+    const activeTaskId = activeTaskIdFromPayload(payload);
+    if (!nextState.normalHandoffReady && activeTaskId) {
+      nextState.activeTaskId = activeTaskId;
+    }
+    controller.state = nextState;
+    renderAll();
+    return nextState;
+  }
+
+  function handleSseBlock(block) {
+    const dataLines = String(block || "")
+      .split("\n")
+      .filter((line) => line.startsWith("data:"))
+      .map((line) => line.slice(5).trimStart());
+    if (dataLines.length === 0) {
+      return false;
+    }
+    const data = dataLines.join("\n").trim();
+    if (!data || data === "[DONE]") {
+      return false;
+    }
+    let payload;
+    try {
+      payload = JSON.parse(data);
+    } catch (error) {
+      appendDiagnostic("sse", { error: String(error), data });
+      showStatus("收到无法解析的 SSE 数据，详情见调试信息。", "error");
+      return false;
+    }
+    appendDiagnostic("sse", payload);
+    if (payload && payload.ok === false) {
+      throw new Error(payload.error || payload.message || "SSE stream reported an error");
+    }
+    const nextState = reduceControllerPayload(payload);
+    return isWaitingForInputPayload(payload, nextState);
+  }
+
+  async function consumeSseResponse(response) {
+    if (!response.ok) {
+      const errorText = typeof response.text === "function" ? await response.text() : "";
+      throw new Error(`HTTP ${response.status}: ${errorText}`);
+    }
+    if (!response.body || typeof response.body.getReader !== "function") {
+      const text = typeof response.text === "function" ? await response.text() : "";
+      const blocks = text
+        .replace(/\r\n/g, "\n")
+        .split("\n\n")
+        .filter((block) => block.trim());
+      for (const block of blocks) {
+        const shouldStop = handleSseBlock(block);
+        await waitForNextPaint();
+        if (shouldStop) {
+          break;
+        }
+      }
+      return;
+    }
+
+    const reader = response.body.getReader();
+    const decoder = new TextDecoder();
+    let buffer = "";
+    let shouldStop = false;
+    while (!shouldStop) {
+      const { value, done } = await reader.read();
+      if (done) {
+        buffer += decoder.decode();
+        break;
+      }
+      buffer += decoder.decode(value, { stream: true }).replace(/\r\n/g, "\n");
+      let boundary = buffer.indexOf("\n\n");
+      while (boundary >= 0) {
+        const block = buffer.slice(0, boundary);
+        buffer = buffer.slice(boundary + 2);
+        shouldStop = handleSseBlock(block);
+        await waitForNextPaint();
+        if (shouldStop) {
+          break;
+        }
+        boundary = buffer.indexOf("\n\n");
+      }
+    }
+    if (!shouldStop && buffer.trim()) {
+      handleSseBlock(buffer);
+      await waitForNextPaint();
+    }
+    if (shouldStop && typeof reader.cancel === "function") {
+      await reader.cancel();
+    }
+  }
+
+  /**
+   * Send the composer text (or the selected candidate's prompt) to
+   * `/api/message/stream` and consume the resulting SSE stream.
+   *
+   * The user message is appended to `state.userMessages` and rendered before
+   * the request is issued. Failures are recorded as diagnostics and shown in
+   * the status banner; nothing is thrown to the caller.
+   *
+   * @returns {Promise<void>}
+   */
+  async function sendComposerMessage() {
+    if (!ensureFetchAvailable()) {
+      return;
+    }
+    const state = syncStateFromConnectionControls();
+    const composer = byId("composer-input");
+    const typedPrompt = composer && "value" in composer ? String(composer.value || "").trim() : "";
+    // An empty composer falls back to the prompt derived from the selected candidate.
+    const prompt = typedPrompt || promptForSelectedCandidate(state);
+    if (!prompt) {
+      showStatus("请输入需求，或先选择一个方案。", "error");
+      return;
+    }
+    state.userMessages = Array.isArray(state.userMessages) ? state.userMessages : [];
+    const userMessageId = `user-${Date.now()}-${state.userMessages.length}`;
+    state.userMessages.push({
+      id: userMessageId,
+      text: prompt,
+      placement: userMessagePlacementForState(state),
+    });
+    if (state.normalHandoffReady) {
+      state.pendingNormalUserMessageId = userMessageId;
+    }
+    // The composer is only cleared when the user actually typed something.
+    if (composer && "value" in composer && typedPrompt) {
+      composer.value = "";
+    }
+    renderAll();
+    const payload = buildStreamPayload(state, prompt);
+    appendDiagnostic("request", { method: "POST", path: "/api/message/stream", payload });
+    showStatus("正在发送消息并接收 pipeline 事件...", "info");
+    try {
+      const response = await fetch("/api/message/stream", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify(payload),
+      });
+      await consumeSseResponse(response);
+      // Re-read state: the stream handlers replace controller state while it is consumed.
+      showStatus(ensureState().pendingInput ? "请选择或补充输入后继续。" : "消息已发送，状态已更新。", "info");
+    } catch (error) {
+      const message = errorMessage(error);
+      appendDiagnostic("error", { action: "send", error: message });
+      showStatus(`消息发送失败：${message}`, "error");
+    }
+  }
+
+  async function healthCheck() {
+    if (!ensureFetchAvailable()) {
+      return;
+    }
+    const state = syncStateFromConnectionControls();
+    const path = `/api/health?${queryString({ serverUrl: state.serverUrl })}`;
+    appendDiagnostic("request", { method: "GET", path });
+    try {
+      const response = await fetch(path);
+      const body = await readJsonResponse(response);
+      appendDiagnostic("request", { method: "GET", path, status: response.status, body });
+      showStatus(response.ok ? "连接检查完成。" : `连接检查失败：HTTP ${response.status}`, response.ok ? "info" : "error");
+    } catch (error) {
+      const message = errorMessage(error);
+      appendDiagnostic("error", { action: "health", error: message });
+      showStatus(`连接检查失败：${message}`, "error");
+    }
+  }
+
+  async function fetchState() {
+    if (!ensureFetchAvailable()) {
+      return;
+    }
+    const state = syncStateFromConnectionControls();
+    const taskId = state.activeTaskId || state.pipelineTaskId || "";
+    const path = `/api/pipeline/state?${queryString({
+      serverUrl: state.serverUrl,
+      contextId: state.contextId || "",
+      taskId,
+      afterSequence: state.lastSequence || 0,
+    })}`;
+    appendDiagnostic("request", { method: "GET", path });
+    try {
+      const response = await fetch(path);
+      const body = await readJsonResponse(response);
+      appendDiagnostic("state", { status: response.status, body });
+      if (body) {
+        reduceControllerPayload(body);
+      }
+      showStatus(response.ok ? "状态已同步。" : `同步状态失败：HTTP ${response.status}`, response.ok ? "info" : "error");
+    } catch (error) {
+      const message = errorMessage(error);
+      appendDiagnostic("error", { action: "fetchState", error: message });
+      showStatus(`同步状态失败：${message}`, "error");
+    }
+  }
+
+  async function cancelTask() {
+    if (!ensureFetchAvailable()) {
+      return;
+    }
+    const state = syncStateFromConnectionControls();
+    const payload = {
+      serverUrl: state.serverUrl || "",
+      contextId: state.contextId || "",
+      taskId: state.activeTaskId || state.pipelineTaskId || "",
+    };
+    appendDiagnostic("request", { method: "POST", path: "/api/task/cancel", payload });
+    try {
+      const response = await fetch("/api/task/cancel", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify(payload),
+      });
+      const body = await readJsonResponse(response);
+      appendDiagnostic("request", { method: "POST", path: "/api/task/cancel", status: response.status, body });
+      showStatus(response.ok ? "取消请求已发送。" : `取消任务失败：HTTP ${response.status}`, response.ok ? "info" : "error");
+    } catch (error) {
+      const message = errorMessage(error);
+      appendDiagnostic("error", { action: "cancel", error: message });
+      showStatus(`取消任务失败：${message}`, "error");
+    }
+  }
+
+  function bindEvents() {
+    if (controller.bound) {
+      return;
+    }
+    const serverInput = byId("server-url");
+    const cwdInput = byId("cwd");
+    const sendButton = byId("send-button");
+    const composer = byId("composer-input");
+    const healthButton = byId("health-button");
+    const fetchStateButton = byId("fetch-state-button");
+    const cancelButton = byId("cancel-button");
+    const debugDrawer = byId("debug-drawer");
+    const addListener = (element, eventName, handler) => {
+      if (element && typeof element.addEventListener === "function") {
+        element.addEventListener(eventName, handler);
+      }
+    };
+
+    addListener(serverInput, "input", syncStateFromConnectionControls);
+    addListener(cwdInput, "input", syncStateFromConnectionControls);
+    addListener(sendButton, "click", sendComposerMessage);
+    addListener(healthButton, "click", healthCheck);
+    addListener(fetchStateButton, "click", fetchState);
+    addListener(cancelButton, "click", cancelTask);
+    addListener(debugDrawer, "toggle", renderAll);
+    addListener(composer, "keydown", (event) => {
+      if ((event.key === "Enter" && !event.shiftKey) || (event.key === "Enter" && (event.metaKey || event.ctrlKey))) {
+        event.preventDefault();
+        sendComposerMessage();
+      }
+    });
+    controller.bound = Boolean(
+      serverInput || cwdInput || sendButton || composer || healthButton || fetchStateButton || cancelButton || debugDrawer
+    );
+  }
+
+  function loadDemoCandidates() {
+    let state = ensureState();
+    state = upsertCandidate(state, {
+      name: "ECS 经典网络方案",
+      candidateIndex: 0,
+      summary: "使用 VPC、ECS 与弹性公网 IP 搭建轻量 Web 服务，保留后续扩容空间。",
+      totalMonthlyCost: "¥33.89/月",
+      costItems: [
+        { name: "ECS", spec: "1vCPU/1GiB", monthly_cost: "¥33.89/月" },
+        { name: "EIP", spec: "按量公网带宽", monthly_cost: "按实际流量" },
+      ],
+    });
+    state = upsertCandidate(state, {
+      name: "轻量应用服务器一体化方案",
+      candidateIndex: 1,
+      summary: "面向演示、测试与低流量站点，预置应用环境并降低运维复杂度。",
+      totalMonthlyCost: "¥0/月",
+      costItems: [
+        { name: "轻量应用服务器", spec: "试用规格", monthly_cost: "¥0/月" },
+        { name: "基础监控", spec: "默认启用", monthly_cost: "¥0/月" },
+      ],
+    });
+    state.steps.intent_parsing.status = "completed";
+    state.steps.architecture_planning.status = "completed";
+    state.steps.evaluate_candidates.status = "completed";
+    state.steps.confirm_and_select.status = "waiting_input";
+    state.status = "waiting_input";
+    state.pipelineStarted = true;
+    state.pendingInput = {
+      kind: "candidate_selection",
+      prompt: "请选择推荐方案",
+      options: [
+        { id: "0", label: "ECS 经典网络方案" },
+        { id: "1", label: "轻量应用服务器一体化方案" },
+      ],
+    };
+    controller.state = state;
+    renderAll();
+    return state;
+  }
+
+  function init() {
+    ensureState();
+    syncConnectionControlsFromState();
+    syncStateFromConnectionControls();
+    bindEvents();
+    renderAll();
+    return controller.state;
+  }
+
+  window.SellingConsoleController = {
+    init,
+    renderSteps,
+    renderPlans,
+    sendComposerMessage,
+    healthCheck,
+    fetchState,
+    cancelTask,
+    appendDiagnostic,
+    renderDebug,
+  };
+  window.SellingConsoleDebug = {
+    loadDemoCandidates,
+    state: () => ensureState(),
+    render: renderAll,
+  };
+
+  if (hasDocument()) {
+    if (document.readyState === "loading" && typeof document.addEventListener === "function") {
+      document.addEventListener("DOMContentLoaded", init, { once: true });
+    } else {
+      init();
+    }
+  }
+})();
diff --git a/scripts/a2a/selling_console_web/design/selling-pipeline-progress-options.html b/scripts/a2a/selling_console_web/design/selling-pipeline-progress-options.html
new file mode 100644
index 00000000..78f5d72e
--- /dev/null
+++ b/scripts/a2a/selling_console_web/design/selling-pipeline-progress-options.html
@@ -0,0 +1,1655 @@
+<!DOCTYPE html>
+<html lang="zh-CN">
+<head>
+  <meta charset="UTF-8">
+  <meta name="viewport" content="width=device-width, initial-scale=1.0">
+  <title>进度控件方案 v61 B 标签对齐</title>
+  <style>
+    * { box-sizing: border-box; }
+    :root {
+      --ink: #1f2937;
+      --muted: #667085;
+      --line: #d9e2ef;
+      --blue: #1677ff;
+      --cyan: #40d9ff;
+      --green: #13a36f;
+      --orange: #ff6a00;
+    }
+    body {
+      margin: 0;
+      background: #f5f7fb;
+      color: var(--ink);
+      font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", "PingFang SC", sans-serif;
+    }
+    .page {
+      max-width: 888px;
+      margin: 0 auto;
+      padding: 20px 18px 36px;
+    }
+    .intro {
+      display: flex;
+      align-items: flex-end;
+      justify-content: space-between;
+      gap: 24px;
+      margin-bottom: 14px;
+    }
+    h1 {
+      margin: 0;
+      font-size: 16px;
+      line-height: 1.35;
+      letter-spacing: 0;
+    }
+    .subtitle {
+      margin: 6px 0 0;
+      color: var(--muted);
+      font-size: 11px;
+      line-height: 1.6;
+    }
+    .hint {
+      color: #667085;
+      font-size: 10px;
+      white-space: nowrap;
+    }
+    .grid {
+      display: grid;
+      grid-template-columns: repeat(2, minmax(0, 1fr));
+      gap: 14px;
+    }
+    .option {
+      min-width: 0;
+      padding: 12px;
+      border: 1px solid #cfd9e8;
+      border-radius: 8px;
+      background: #fff;
+      box-shadow: 0 1px 2px rgba(15, 23, 42, .045);
+      cursor: pointer;
+    }
+    .option:hover {
+      border-color: #9fc7ff;
+      box-shadow: 0 2px 6px rgba(22, 119, 255, .08);
+    }
+    .option[data-choice="b2"] {
+      display: none;
+    }
+    .head {
+      display: flex;
+      align-items: center;
+      justify-content: space-between;
+      gap: 10px;
+      margin-bottom: 8px;
+    }
+    .title {
+      font-size: 11px;
+      font-weight: 720;
+    }
+    .meta {
+      color: #667085;
+      font-size: 9px;
+      white-space: nowrap;
+    }
+    .composer {
+      width: min(100%, 360px);
+      margin: 0 auto;
+      padding: 9px;
+      border: 1px solid #cbd8e8;
+      border-radius: 8px;
+      background: #fff;
+    }
+    .input {
+      height: 82px;
+      margin-top: 8px;
+      padding: 11px;
+      border: 1px solid #bfccdc;
+      border-radius: 8px;
+      color: #687386;
+      font-size: 11px;
+      line-height: 1.5;
+    }
+    .actions {
+      display: flex;
+      align-items: center;
+      justify-content: space-between;
+      gap: 8px;
+      margin-top: 8px;
+    }
+    .ghosts { display: flex; gap: 6px; }
+    .ghost,
+    .send {
+      height: 28px;
+      border-radius: 7px;
+      font-size: 10px;
+      font-weight: 650;
+    }
+    .ghost {
+      min-width: 56px;
+      border: 1px solid #c4d0df;
+      background: #fff;
+      color: #344054;
+    }
+    .send {
+      width: 54px;
+      border: 0;
+      background: var(--orange);
+      color: #fff;
+    }
+    .tip {
+      position: absolute;
+      z-index: 50;
+      left: 50%;
+      top: calc(100% + 8px);
+      width: max-content;
+      max-width: 196px;
+      transform: translateX(-50%) translateY(-3px);
+      padding: 8px 10px;
+      border-radius: 8px;
+      background: #111827;
+      color: #f8fafc;
+      font-size: 10px;
+      font-weight: 500;
+      line-height: 1.45;
+      white-space: normal;
+      opacity: 0;
+      pointer-events: none;
+      transition: opacity .15s ease, transform .15s ease;
+      box-shadow: 0 12px 28px rgba(15, 23, 42, .22);
+    }
+    .step:hover .tip,
+    .node:hover .tip,
+    .fusion-step:hover .tip {
+      opacity: 1;
+      transform: translateX(-50%) translateY(0);
+    }
+    .chevrons {
+      display: grid;
+      grid-template-columns: repeat(5, minmax(0, 1fr));
+      height: 26px;
+      isolation: isolate;
+    }
+    .chevrons .step {
+      position: relative;
+      display: flex;
+      align-items: center;
+      justify-content: center;
+      min-width: 0;
+      margin-left: -6px;
+      padding: 0 8px 0 12px;
+      clip-path: polygon(0 0, calc(100% - 8px) 0, 100% 50%, calc(100% - 8px) 100%, 0 100%, 8px 50%);
+      background: #edf2f7;
+      color: #405066;
+      font-size: 9px;
+      font-weight: 700;
+      white-space: nowrap;
+    }
+    .chevrons .step:first-child {
+      margin-left: 0;
+      border-radius: 7px 0 0 7px;
+      clip-path: polygon(0 0, calc(100% - 8px) 0, 100% 50%, calc(100% - 8px) 100%, 0 100%);
+    }
+    .chevrons .step:last-child { border-radius: 0 7px 7px 0; }
+    .chevrons .done { background: #e9f7f1; color: #14704d; }
+    .chevrons .active {
+      z-index: 2;
+      background: linear-gradient(90deg, #1677ff, #28a4ff);
+      color: #fff;
+      box-shadow: 0 4px 11px rgba(22, 119, 255, .2);
+    }
+    .chevrons .active::after {
+      content: "";
+      position: absolute;
+      inset: 0;
+      background: linear-gradient(110deg, transparent 0%, transparent 38%, rgba(255,255,255,.5) 50%, transparent 62%, transparent 100%);
+      animation: sweep 1.8s linear infinite;
+    }
+    .circuit {
+      position: relative;
+      height: 42px;
+      padding: 0 7px;
+      border: 1px solid #cfd9e8;
+      border-radius: 8px;
+      background: linear-gradient(180deg, #fbfdff, #f7faff);
+      overflow: hidden;
+    }
+    .track {
+      position: absolute;
+      left: 31px;
+      right: 31px;
+      top: 19px;
+      height: 2px;
+      border-radius: 999px;
+      background:
+        linear-gradient(90deg,
+          var(--green) 0%,
+          var(--green) 49%,
+          transparent 49%,
+          transparent 89%,
+          #d7e1ee 89%,
+          #d7e1ee 100%);
+    }
+    .quiet-segment {
+      position: absolute;
+      left: 49%;
+      right: 11%;
+      top: 18px;
+      height: 4px;
+      border-radius: 999px;
+      background: linear-gradient(90deg, rgba(22,119,255,.2), rgba(22,119,255,.1), rgba(22,119,255,0));
+    }
+    .pulse-soft .quiet-segment,
+    .pulse-dense .quiet-segment {
+      display: none;
+    }
+    .pulse-soft .quiet-segment {
+      background: linear-gradient(90deg, rgba(22,119,255,.22), rgba(64,217,255,.16), rgba(22,119,255,0));
+      animation: pulseBaseSoft 2.6s ease-in-out infinite;
+    }
+    .pulse-dense .quiet-segment {
+      background:
+        repeating-linear-gradient(90deg, rgba(22,119,255,.05) 0 5px, rgba(64,217,255,.18) 5px 7px, rgba(22,119,255,.05) 7px 13px),
+        linear-gradient(90deg, rgba(22,119,255,.14), rgba(22,119,255,0));
+      animation: pulseBaseDense 1.45s linear infinite;
+    }
+    .electric {
+      position: absolute;
+      left: 49%;
+      right: 10%;
+      top: 0;
+      height: 20px;
+      pointer-events: none;
+      overflow: visible;
+    }
+    .pulse-soft .electric::before,
+    .pulse-soft .electric::after,
+    .pulse-dense .electric::before,
+    .pulse-dense .electric::after {
+      content: none;
+      position: absolute;
+      pointer-events: none;
+      border-radius: 999px;
+    }
+    .pulse-soft .electric::before {
+      left: 4%;
+      top: 11px;
+      width: 34%;
+      height: 7px;
+      z-index: 1;
+      background: linear-gradient(90deg, transparent, rgba(64,217,255,.62), rgba(255,255,255,.78), rgba(22,119,255,.34), transparent);
+      filter: none;
+      animation: pulsePacketSoft 2.6s cubic-bezier(.37, 0, .18, 1) infinite;
+    }
+    .pulse-soft .electric::after {
+      display: none;
+      left: 38%;
+      top: 5px;
+      width: 25px;
+      height: 16px;
+      z-index: 0;
+      background: radial-gradient(ellipse at center, rgba(64,217,255,.18), rgba(64,217,255,0) 70%);
+      animation: pulseHaloSoft 2.6s cubic-bezier(.37, 0, .18, 1) infinite;
+    }
+    .pulse-dense .electric::before {
+      left: 0;
+      top: 10px;
+      width: 72%;
+      height: 8px;
+      z-index: 1;
+      background:
+        repeating-linear-gradient(90deg, transparent 0 4px, rgba(244,253,255,.96) 4px 6px, rgba(64,217,255,.72) 6px 8px, transparent 8px 11px);
+      -webkit-mask-image: linear-gradient(90deg, transparent, #000 12%, #000 76%, transparent);
+      mask-image: linear-gradient(90deg, transparent, #000 12%, #000 76%, transparent);
+      filter: none;
+      animation: pulsePacketDense 1.55s cubic-bezier(.35, 0, .14, 1) infinite;
+    }
+    .pulse-dense .electric::after {
+      display: none;
+      left: 28%;
+      top: 4px;
+      width: 48%;
+      height: 16px;
+      z-index: 0;
+      background:
+        radial-gradient(ellipse at 32% 72%, rgba(64,217,255,.4), rgba(64,217,255,0) 38%),
+        radial-gradient(ellipse at 58% 66%, rgba(22,119,255,.34), rgba(22,119,255,0) 42%),
+        radial-gradient(ellipse at 78% 70%, rgba(244,253,255,.28), rgba(244,253,255,0) 34%);
+      animation: pulseHaloDense 1.55s steps(3, end) infinite;
+    }
+    .electric svg {
+      width: 100%;
+      height: 100%;
+      overflow: visible;
+      position: relative;
+      z-index: 2;
+    }
+    .electric .glow {
+      display: none;
+      fill: none;
+      stroke-linecap: round;
+      stroke-linejoin: round;
+      opacity: .18;
+      filter: none;
+    }
+    .electric .bolt,
+    .electric .spark {
+      fill: none;
+      stroke-linecap: round;
+      stroke-linejoin: round;
+      vector-effect: non-scaling-stroke;
+      shape-rendering: geometricPrecision;
+      animation: boltGlide 2.35s cubic-bezier(.42, 0, .18, 1) infinite;
+    }
+    .electric .bolt {
+      stroke-dasharray: 28 132;
+      stroke-width: 2.2px;
+    }
+    .electric .spark {
+      stroke-dasharray: 9 122;
+      stroke-width: 1.1px;
+      animation-duration: 2.05s;
+      opacity: 1;
+    }
+    .electric .peak {
+      opacity: 0;
+      transform-origin: 68% 100%;
+      animation: peakFlash 2.35s cubic-bezier(.42, 0, .18, 1) infinite;
+    }
+    .dense .bolt {
+      stroke-dasharray: 9 42;
+      stroke-width: 2.25px;
+    }
+    .dense .spark {
+      stroke-dasharray: 5 30;
+      stroke-width: 1px;
+      opacity: .96;
+    }
+    .dense .peak {
+      animation-name: densePeakFlash;
+    }
+    .dense .dense-extra {
+      display: none;
+      stroke-dasharray: 6 28;
+      opacity: .9;
+      animation-duration: 1.55s;
+    }
+    .blue-pulse .track {
+      top: 17px;
+      height: 6px;
+      background:
+        linear-gradient(90deg,
+          var(--green) 0%,
+          var(--green) 49%,
+          var(--blue) 49%,
+          #2aa3ff 88%,
+          #d7e1ee 88%,
+          #d7e1ee 100%);
+    }
+    .blue-pulse .electric {
+      left: 49%;
+      right: 11%;
+      top: 6px;
+      height: 26px;
+      overflow: hidden;
+    }
+    .blue-pulse .electric svg {
+      display: none;
+    }
+    .blue-pulse .electric::before,
+    .blue-pulse .electric::after {
+      content: "";
+      position: absolute;
+      left: 0;
+      top: 0;
+      bottom: 0;
+      height: auto;
+      width: 58px;
+      z-index: 3;
+      pointer-events: none;
+      border-radius: 0;
+      background: linear-gradient(105deg,
+        transparent 0%,
+        transparent 20%,
+        rgba(255,255,255,.22) 30%,
+        rgba(255,255,255,.98) 48%,
+        rgba(255,255,255,.44) 64%,
+        transparent 78%,
+        transparent 100%);
+      animation: blueLineSweep 2.25s cubic-bezier(.42, 0, .2, 1) infinite;
+    }
+    .blue-pulse .electric::after {
+      display: none;
+    }
+    .blue-pulse-dense .electric::before {
+      width: 40px;
+      animation-duration: 1.55s;
+    }
+    .blue-pulse-dense .electric::after {
+      display: block;
+      width: 32px;
+      opacity: .72;
+      animation: blueLineSweep 1.55s cubic-bezier(.42, 0, .2, 1) infinite;
+      animation-delay: .38s;
+    }
+    .pulse-wave .track {
+      top: 18px;
+      height: 3px;
+      background:
+        linear-gradient(90deg,
+          var(--green) 0%,
+          var(--green) 49%,
+          transparent 49%,
+          transparent 88%,
+          #d7e1ee 88%,
+          #d7e1ee 100%);
+    }
+    .pulse-wave .electric {
+      left: 54%;
+      right: 18%;
+      top: 0;
+      height: 17px;
+      overflow: visible;
+    }
+    .pulse-wave .electric::before,
+    .pulse-wave .electric::after {
+      content: none;
+    }
+    .pulse-wave .electric svg {
+      display: block;
+      width: 100%;
+      height: 100%;
+      overflow: visible;
+    }
+    .pulse-wave .wave-base,
+    .pulse-wave .wave-sweep,
+    .pulse-wave .wave-sweep-2 {
+      fill: none;
+      stroke-linecap: round;
+      stroke-linejoin: round;
+      vector-effect: non-scaling-stroke;
+      shape-rendering: geometricPrecision;
+    }
+    .pulse-wave .wave-base {
+      stroke: #1677ff;
+      stroke-width: 1.65px;
+    }
+    .pulse-wave .wave-sweep,
+    .pulse-wave .wave-sweep-2 {
+      stroke-width: 3.4px;
+      stroke-dasharray: 30 210;
+      stroke-dashoffset: 170;
+      opacity: .94;
+      animation: waveSheen 2.15s cubic-bezier(.42, 0, .2, 1) infinite;
+    }
+    .pulse-wave-dense .wave-base {
+      stroke-width: 1.55px;
+    }
+    .pulse-wave-dense .wave-sweep,
+    .pulse-wave-dense .wave-sweep-2 {
+      stroke-width: 3.2px;
+      stroke-dasharray: 24 190;
+      animation-duration: 1.6s;
+    }
+    .pulse-wave .wave-sweep-2 {
+      display: none;
+    }
+    .pulse-wave-dense .wave-sweep-2 {
+      display: block;
+      opacity: .62;
+      animation-delay: .38s;
+    }
+    .nodes {
+      position: relative;
+      display: grid;
+      grid-template-columns: repeat(5, minmax(0, 1fr));
+      height: 100%;
+      align-items: start;
+    }
+    .node {
+      position: relative;
+      min-width: 0;
+      padding-top: 25px;
+      color: #42526a;
+      font-size: 9px;
+      font-weight: 650;
+      text-align: center;
+      white-space: nowrap;
+    }
+    .node::before {
+      content: "";
+      position: absolute;
+      left: 50%;
+      top: 19px;
+      width: 7px;
+      height: 7px;
+      transform: translate(-50%, -50%);
+      border: 2px solid #7cc8a6;
+      border-radius: 999px;
+      background: #fff;
+      box-shadow: 0 0 0 3px #fff;
+    }
+    .node.active {
+      color: #0b62cf;
+      font-weight: 760;
+    }
+    .node.next::before { border-color: #b9c5d4; }
+    .node.active::before {
+      border-color: var(--blue);
+      box-shadow: 0 0 0 3px #fff, 0 0 0 6px rgba(22,119,255,.12), 0 0 11px rgba(22,119,255,.5);
+      animation: nodePulse 2.35s ease-out infinite;
+    }
+    .signal-circuit { /* Fixed-height card for the B1 signal demo; position: relative makes it the containing block for the absolutely positioned .signal-svg, .signal-node, .signal-absorb-halo and .signal-labels. */
+      position: relative;
+      height: 62px;
+      padding: 4px 8px 0;
+      border: 1px solid #cfd9e8;
+      border-radius: 8px;
+      background: linear-gradient(180deg, #fbfdff, #f8fbff);
+      overflow: hidden; /* Clips anything drawn outside the card, including the absorb glow. */
+      --absorb-duration: 510ms; /* Duration shared by the four `.absorbing` animations. 510ms equals the initial value of the pauseTime range input - presumably the script keeps them in sync; confirm. */
+    }
+    .signal-svg {
+      position: absolute;
+      inset: 0 8px auto 8px;
+      width: calc(100% - 16px);
+      height: 44px;
+      overflow: visible;
+    }
+    .signal-active-base,
+    .signal-moving-wave,
+    .signal-rail,
+    .signal-done {
+      fill: none;
+      stroke-linecap: round;
+      stroke-linejoin: round;
+      vector-effect: non-scaling-stroke;
+    }
+    .signal-rail {
+      stroke: #d5dfec;
+      stroke-width: 2px;
+    }
+    .signal-done {
+      stroke: var(--green);
+      stroke-width: 2px;
+    }
+    .signal-active-base {
+      stroke-width: 1.35px;
+    }
+    .signal-active-in {
+      stroke: rgba(22, 119, 255, .46);
+    }
+    .signal-active-out {
+      stroke: rgba(143, 155, 174, .6);
+    }
+    .signal-moving-wave {
+      stroke: var(--blue);
+      stroke-width: 1.2px;
+      opacity: .98;
+    }
+    .signal-node {
+      position: absolute;
+      top: 22px;
+      width: 12px;
+      height: 12px;
+      border: 2px solid #7cc8a6;
+      border-radius: 50%;
+      background: #fff;
+      transform: translate(-50%, -50%);
+      z-index: 2;
+    }
+    .signal-node.active {
+      width: 15px;
+      height: 15px;
+      border-color: var(--blue);
+      box-shadow: 0 0 0 3px #fff;
+      overflow: hidden;
+    }
+    .signal-absorb-halo {
+      position: absolute;
+      left: 72%;
+      top: 22px;
+      width: 20px;
+      height: 20px;
+      transform: translate(-50%, -50%);
+      pointer-events: none;
+      z-index: 1;
+    }
+    .signal-absorb-halo::before {
+      content: "";
+      position: absolute;
+      inset: 0;
+      border-radius: 999px;
+      opacity: 0;
+      transform: scale(.78);
+      transform-origin: center;
+      background: radial-gradient(circle, rgba(64, 217, 255, .34) 0 34%, rgba(22, 119, 255, .16) 52%, rgba(22, 119, 255, 0) 76%);
+      filter: blur(.3px);
+    }
+    .signal-node-core {
+      position: absolute;
+      inset: 1.5px;
+      border-radius: 999px;
+      background: radial-gradient(circle at 50% 48%, rgba(255, 255, 255, 1) 0 12%, rgba(110, 230, 255, .98) 30%, rgba(22, 119, 255, .92) 68%, rgba(22, 119, 255, .16) 100%);
+      opacity: 0;
+      transform: scale(.08);
+      transform-origin: center;
+      box-shadow: inset 0 0 3px rgba(255, 255, 255, .7), 0 0 10px rgba(22, 119, 255, .56);
+    }
+    .signal-node-charge {
+      position: absolute;
+      inset: 1.5px;
+      border-radius: 999px;
+      opacity: 0;
+      transform: scale(.76) rotate(-90deg);
+      transform-origin: center;
+      background:
+        conic-gradient(from 210deg,
+          rgba(22, 119, 255, 0) 0deg,
+          rgba(22, 119, 255, .22) 42deg,
+          rgba(64, 217, 255, .95) 86deg,
+          rgba(255, 255, 255, .98) 126deg,
+          rgba(22, 119, 255, .92) 178deg,
+          rgba(22, 119, 255, .16) 232deg,
+          rgba(22, 119, 255, 0) 300deg,
+          rgba(22, 119, 255, 0) 360deg);
+      box-shadow: inset 0 0 5px rgba(255, 255, 255, .45), 0 0 7px rgba(22, 119, 255, .44);
+      filter: saturate(1.08);
+    }
+    .signal-circuit.absorbing .signal-absorb-halo::before {
+      animation: signalAbsorbGlow var(--absorb-duration) ease-out both;
+    }
+    .signal-circuit.absorbing .signal-node.active .signal-node-charge {
+      animation: signalNodeChargeRing var(--absorb-duration) cubic-bezier(.18, .78, .24, 1) both;
+    }
+    .signal-circuit.absorbing .signal-node.active .signal-node-core {
+      animation: signalNodeInnerAbsorb var(--absorb-duration) ease-out both;
+    }
+    .signal-circuit.absorbing .signal-node.active {
+      animation: signalAbsorbCore var(--absorb-duration) ease-out both;
+    }
+    .signal-node.next {
+      border-color: #b9c5d4;
+    }
+    .signal-node.pending {
+      border-color: #b9c5d4;
+    }
+    .signal-labels {
+      position: absolute;
+      left: 0;
+      right: 0;
+      top: 38px;
+      color: #42526a;
+      font-size: 9px;
+      font-weight: 650;
+      text-align: center;
+      white-space: nowrap;
+    }
+    .signal-labels span {
+      position: absolute;
+      top: 0;
+      transform: translateX(-50%);
+    }
+    .signal-labels .active {
+      color: var(--blue);
+      font-weight: 760;
+    }
+    .param-panel {
+      display: grid;
+      grid-template-columns: repeat(2, minmax(0, 1fr));
+      gap: 7px 10px;
+      margin-top: 12px;
+      padding: 8px;
+      padding-top: 10px;
+      border-top: 2px solid rgba(22, 119, 255, .78);
+      border-right: 1px solid #e0e7f2;
+      border-bottom: 1px solid #e0e7f2;
+      border-left: 1px solid #e0e7f2;
+      border-radius: 8px;
+      background: #fbfdff;
+    }
+    .param {
+      min-width: 0;
+    }
+    .param-wide {
+      grid-column: 1 / -1;
+    }
+    .step-switch {
+      display: grid;
+      grid-template-columns: repeat(5, minmax(0, 1fr));
+      gap: 5px;
+      margin-top: 6px;
+    }
+    .step-switch button {
+      height: 22px;
+      border: 1px solid #cbd8e8;
+      border-radius: 6px;
+      background: #fff;
+      color: #475569;
+      font-size: 9px;
+      font-weight: 720;
+      cursor: pointer;
+    }
+    .step-switch button.active {
+      border-color: rgba(22, 119, 255, .72);
+      background: rgba(22, 119, 255, .1);
+      color: var(--blue);
+    }
+    .demo-step-control {
+      margin-top: 12px;
+      padding: 7px 8px;
+      padding-top: 10px;
+      border-top: 2px solid rgba(22, 119, 255, .78);
+      border-right: 1px solid #e0e7f2;
+      border-bottom: 1px solid #e0e7f2;
+      border-left: 1px solid #e0e7f2;
+      border-radius: 8px;
+      background: #fbfdff;
+    }
+    .demo-step-control label {
+      display: flex;
+      justify-content: space-between;
+      gap: 6px;
+      color: #475569;
+      font-size: 9px;
+      font-weight: 650;
+      line-height: 1.2;
+    }
+    .demo-step-control output {
+      color: var(--blue);
+      font-weight: 760;
+    }
+    .timing-grid {
+      display: grid;
+      grid-template-columns: repeat(2, minmax(0, 1fr));
+      gap: 8px 10px;
+      margin-top: 9px;
+      padding-top: 8px;
+      border-top: 1px solid rgba(203,216,232,.82);
+    }
+    .param label {
+      display: flex;
+      justify-content: space-between;
+      gap: 6px;
+      color: #475569;
+      font-size: 9px;
+      font-weight: 650;
+      line-height: 1.2;
+    }
+    .param output {
+      color: var(--blue);
+      font-variant-numeric: tabular-nums;
+    }
+    .param input {
+      width: 100%;
+      margin: 5px 0 0;
+      accent-color: var(--blue);
+    }
+    .fusion-label { /* D1 step strip whose 1px border is itself the progress indicator (green / blue / grey segments). */
+      --fusion-green-end: 69.6%; /* Where the green border segment stops. */
+      --fusion-blue-start: 69.6%; /* Where the blue border segment starts. */
+      --fusion-blue-end: 83.2%; /* Where blue stops and the grey remainder begins. */
+      --fusion-sweep-duration: 1800ms; /* Duration of the ::before and .fusion-step.active::after sweep animations. 1800ms equals the initial value of the D1 "T1" range input - presumably updated by the script; confirm. */
+      position: relative;
+      display: grid;
+      grid-template-columns: 1fr;
+      align-items: center;
+      min-height: 36px;
+      padding: 5px 10px;
+      border: 1px solid transparent; /* Transparent so the border-box background layer below shows through as the border colour. */
+      border-radius: 8px;
+      background: /* Two layers: white clipped to the padding box on top, the progress gradient clipped to the border box underneath, so the gradient is only visible in the border ring. */
+        linear-gradient(#fff, #fff) padding-box,
+        linear-gradient(
+          90deg,
+          #13a36f 0 var(--fusion-green-end),
+          #1677ff var(--fusion-blue-start) var(--fusion-blue-end),
+          #dce5f2 var(--fusion-blue-end) 100%
+        ) border-box;
+      box-shadow: inset 0 1px 0 rgba(22,119,255,.06);
+    }
+    .fusion-label::before { /* 2px highlight strip laid over the top border of .fusion-label; a white glint sweeps along it once per animation run. */
+      content: "";
+      position: absolute;
+      left: 0;
+      right: 0;
+      top: -1px; /* Offsets past the padding edge so the strip starts at the outer edge of the 1px border. */
+      height: 2px;
+      border-radius: 999px;
+      background:
+        linear-gradient(
+          90deg,
+          transparent 0%,
+          rgba(255,255,255,0) 30%,
+          rgba(125,185,255,.34) 42%,
+          rgba(255,255,255,.96) 50%,
+          rgba(125,185,255,.32) 58%,
+          rgba(255,255,255,0) 70%,
+          transparent 100%
+        );
+      background-position: -39.29% 0; /* With a 44%-wide layer, -39.29% x (100% - 44%) = -22%, which puts the glint centre on the left edge (the keyframes' start position). */
+      background-repeat: no-repeat;
+      background-size: 44% 100%;
+      filter: drop-shadow(0 0 2px rgba(22,119,255,.3));
+      pointer-events: none;
+      animation: fusionBorderSweepSync var(--fusion-sweep-duration) linear; /* Shorthand no longer says `infinite`: the longhand below already forced a single run, so the computed style is unchanged. */
+      animation-iteration-count: 1;
+      animation-fill-mode: both; /* Holds the first keyframe before the run and the last keyframe after it. */
+    }
+    .fusion-label.sweep-reset::before, /* State classes below are not present in the static markup - presumably toggled by the page script; confirm. */
+    .fusion-label.sweep-reset .fusion-step.active::after {
+      animation: none !important; /* sweep-reset: cancel both sweep animations... */
+    }
+    .fusion-label.sweep-reset::before {
+      background-position: -39.29% 0; /* ...and pin the border glint at the start position of fusionBorderSweepSync. */
+      opacity: .96;
+    }
+    .fusion-label.sweep-reset .fusion-step.active::after {
+      background-position: 95.45% 0, 0 0; /* Same for the bar glint: the start position of fusionBarSweepSync. */
+    }
+    .fusion-label.sweep-wait::before { /* sweep-wait: animations cancelled and the border glint hidden. */
+      animation: none !important;
+      opacity: 0;
+    }
+    .fusion-label.sweep-wait .fusion-step.active::after {
+      animation: none !important;
+      background: var(--blue); /* Replaces the glint + blue layers with plain blue while waiting. */
+    }
+    .fusion-steps {
+      display: grid;
+      grid-template-columns: repeat(5, minmax(0, 1fr));
+      gap: 4px;
+      min-width: 0;
+    }
+    .fusion-step {
+      position: relative;
+      min-width: 0;
+      padding-top: 1px;
+      color: #536175;
+      font-size: 9px;
+      font-weight: 650;
+      text-align: center;
+      white-space: nowrap;
+    }
+    .fusion-step .label {
+      display: block;
+      overflow: hidden;
+      text-overflow: ellipsis;
+      white-space: nowrap;
+    }
+    .fusion-step::after {
+      content: "";
+      display: block;
+      height: 5px;
+      margin-top: 4px;
+      border-radius: 999px;
+      background: #e8edf5;
+    }
+    .fusion-step.done { color: #14704d; }
+    .fusion-step.done::after { background: #97d8ba; }
+    .fusion-step.active {
+      color: #0b62cf;
+      font-weight: 760;
+    }
+    .fusion-step.active::after { /* Progress bar under the active step: solid blue with a slanted white glint that sweeps across once per animation run. */
+      background:
+        linear-gradient(100deg, transparent 0 32%, rgba(255,255,255,.7) 44%, rgba(255,255,255,.9) 50%, rgba(255,255,255,.4) 57%, transparent 68%),
+        var(--blue);
+      background-size: 210% 100%, 100% 100%; /* Glint layer is 2.1x the bar width so it can slide fully across. */
+      background-position: 95.45% 0, 0 0; /* 95.45% x (100% - 210%) = -105%, which puts the glint centre on the bar's left edge (the keyframes' start position). */
+      background-repeat: no-repeat, no-repeat;
+      box-shadow: 0 0 0 2px rgba(22,119,255,.1);
+      animation: fusionBarSweepSync var(--fusion-sweep-duration) linear; /* Shorthand no longer says `infinite`: the longhand below already forced a single run, so the computed style is unchanged. */
+      animation-iteration-count: 1;
+      animation-fill-mode: both; /* Holds the first keyframe before the run and the last keyframe after it. */
+    }
+    @keyframes sweep {
+      from { transform: translateX(-100%); }
+      to { transform: translateX(100%); }
+    }
+    @keyframes fusionBarSweepSync { /* Slides the 210%-wide glint layer of .fusion-step.active::after so its centre travels from the bar's left edge to its right edge; the second layer (solid blue) stays put. */
+      from { background-position: 95.45% 0, 0 0; } /* Offset = 95.45% x (100% - 210%) = -105%; layer centre (105%) lands at 0%. */
+      to { background-position: 4.55% 0, 0 0; } /* Offset = 4.55% x (100% - 210%) = -5%; layer centre lands at 100%. */
+    }
+    @keyframes boltGlide {
+      from { stroke-dashoffset: 132; opacity: .38; }
+      50% { opacity: 1; }
+      to { stroke-dashoffset: -132; opacity: .38; }
+    }
+    @keyframes peakFlash {
+      0%, 34%, 100% { opacity: 0; transform: scaleY(.35); }
+      49% { opacity: .95; transform: scaleY(1.16); }
+      58% { opacity: .45; transform: scaleY(.8); }
+    }
+    @keyframes densePeakFlash {
+      0%, 32%, 100% { opacity: 0; transform: scaleY(.35); }
+      46% { opacity: 1; transform: scaleY(1.28); }
+      52% { opacity: .55; transform: scaleY(.9); }
+      60% { opacity: .35; transform: scaleY(.72); }
+    }
+    @keyframes nodePulse {
+      0%, 34% { box-shadow: 0 0 0 3px #fff, 0 0 0 4px rgba(22,119,255,.16), 0 0 8px rgba(22,119,255,.22); }
+      50% { box-shadow: 0 0 0 3px #fff, 0 0 0 8px rgba(22,119,255,.24), 0 0 14px rgba(22,119,255,.56); }
+      100% { box-shadow: 0 0 0 3px #fff, 0 0 0 10px rgba(22,119,255,0), 0 0 9px rgba(22,119,255,.1); }
+    }
+    @keyframes signalAbsorbGlow {
+      0% { opacity: 0; transform: scale(.72); }
+      22% { opacity: .42; transform: scale(1); }
+      100% { opacity: 0; transform: scale(1.9); }
+    }
+    @keyframes signalNodeInnerAbsorb {
+      0% { opacity: 0; transform: scale(.06); }
+      22% { opacity: .98; transform: scale(1.02); }
+      58% { opacity: .86; transform: scale(.9); }
+      100% { opacity: 0; transform: scale(.28); }
+    }
+    @keyframes signalNodeChargeRing {
+      0% { opacity: 0; transform: scale(.72) rotate(-120deg); }
+      18% { opacity: .96; transform: scale(1) rotate(-20deg); }
+      58% { opacity: .82; transform: scale(1.02) rotate(140deg); }
+      100% { opacity: 0; transform: scale(.74) rotate(255deg); }
+    }
+    @keyframes signalAbsorbCore {
+      0% { box-shadow: 0 0 0 3px #fff; }
+      30% { box-shadow: 0 0 0 3px #fff, 0 0 0 5px rgba(22,119,255,.2), 0 0 14px rgba(22,119,255,.56); }
+      100% { box-shadow: 0 0 0 3px #fff; }
+    }
+    @keyframes pulseBaseSoft {
+      0%, 100% { opacity: .45; transform: scaleX(.92); }
+      48% { opacity: .95; transform: scaleX(1); }
+    }
+    @keyframes pulseBaseDense {
+      from { background-position: 0 0, 0 0; opacity: .55; }
+      50% { opacity: .95; }
+      to { background-position: 26px 0, 0 0; opacity: .55; }
+    }
+    @keyframes pulsePacketSoft {
+      0% { opacity: 0; transform: translateX(-14%) scaleX(.72); }
+      20% { opacity: .86; transform: translateX(6%) scaleX(.94); }
+      56% { opacity: 1; transform: translateX(44%) scaleX(1.24); }
+      82% { opacity: .72; transform: translateX(76%) scaleX(.88); }
+      100% { opacity: 0; transform: translateX(96%) scaleX(.58); }
+    }
+    @keyframes pulseHaloSoft {
+      0%, 18%, 100% { opacity: 0; transform: translateX(-12%) scale(.72); }
+      48% { opacity: .82; transform: translateX(18%) scale(1.16); }
+      72% { opacity: .36; transform: translateX(44%) scale(.92); }
+    }
+    @keyframes pulsePacketDense {
+      0% { opacity: 0; transform: translateX(-12%) scaleX(.8); }
+      16% { opacity: .9; transform: translateX(4%) scaleX(1); }
+      48% { opacity: 1; transform: translateX(28%) scaleX(1.18); }
+      76% { opacity: .92; transform: translateX(54%) scaleX(.96); }
+      100% { opacity: 0; transform: translateX(74%) scaleX(.72); }
+    }
+    @keyframes pulseHaloDense {
+      0%, 100% { opacity: .16; transform: translateX(-4%) scale(.92); }
+      34% { opacity: .72; transform: translateX(10%) scale(1.1); }
+      66% { opacity: .38; transform: translateX(24%) scale(.98); }
+    }
+    @keyframes blueLineSweep {
+      0% { opacity: 0; transform: translateX(-48px); }
+      14% { opacity: .95; }
+      68% { opacity: 1; }
+      100% { opacity: 0; transform: translateX(128px); }
+    }
+    @keyframes waveSheen {
+      0% { opacity: 0; stroke-dashoffset: 178; }
+      16% { opacity: .92; }
+      72% { opacity: .98; }
+      100% { opacity: 0; stroke-dashoffset: -70; }
+    }
+    @keyframes fusionBorderSweepSync { /* Slides the 44%-wide glint layer of .fusion-label::before so its centre travels from the strip's left edge to its right edge at constant opacity. */
+      0% { background-position: -39.29% 0; opacity: .96; } /* Offset = -39.29% x (100% - 44%) = -22%; layer centre (22%) lands at 0%. */
+      100% { background-position: 139.29% 0; opacity: .96; } /* Offset = 139.29% x (100% - 44%) = 78%; layer centre lands at 100%. */
+    }
+    @media (max-width: 980px) { /* Viewports up to 980px wide: two option cards per row, header hint hidden. */
+      .grid { grid-template-columns: repeat(2, minmax(0, 1fr)); }
+      .hint { display: none; }
+    }
+    @media (max-width: 760px) { /* Viewports up to 760px wide: single column, page width capped at 460px. */
+      .grid { grid-template-columns: 1fr; }
+      .page { max-width: 460px; }
+    }
+  </style>
+</head>
+<body>
+  <main class="page">
+    <div class="intro"> <!-- Page header: version title, one-line change summary, and a side hint. -->
+      <div>
+        <h1>v61：B 标签对齐版</h1>
+        <p class="subtitle">B1 下方 Step 标题改为跟随节点同一组位置对齐，并移除无信息价值的底部说明文字；D 保持 v60。</p>
+      </div>
+      <div class="hint">B2 已移除</div> <!-- NOTE(review): the hint reads "B2 removed", but the grid below still contains an <article data-choice="b2"> card - confirm whether that card is hidden elsewhere or the hint is stale. -->
+    </div>
+
+    <section class="grid">
+      <article class="option" data-choice="a" onclick="toggleSelect(this)">
+        <div class="head">
+          <div class="title">A. 箭头轨道 基准版</div>
+          <div class="meta">保留对照</div>
+        </div>
+        <div class="composer">
+          <div class="chevrons" data-demo-steps="a">
+            <div class="step done" data-step-index="0">需求理解<span class="tip">已完成：识别业务场景、规模和预算。</span></div>
+            <div class="step done" data-step-index="1">架构规划<span class="tip">已完成：拆分网络、计算、访问入口。</span></div>
+            <div class="step done" data-step-index="2">方案评估<span class="tip">已完成：比较成本、复杂度和扩展性。</span></div>
+            <div class="step active" data-step-index="3">方案选择<span class="tip">进行中：正在生成方案卡片并等待确认。</span></div>
+            <div class="step" data-step-index="4">确认部署<span class="tip">未开始：选定方案后进入部署确认。</span></div>
+          </div>
+          <div class="input">请描述业务场景、访问规模、预算范围或已有资源约束</div>
+          <div class="actions">
+            <div class="ghosts"><button class="ghost">附件</button><button class="ghost">深度思考</button></div>
+            <button class="send">发送</button>
+          </div>
+          <div class="demo-step-control"> <!-- Demo-only control: picks which of the five steps option A shows as active. NOTE(review): clicks here bubble to the enclosing <article onclick="toggleSelect(this)"> unless the script stops them - confirm. -->
+            <label>演示 Step <output data-output="aActiveStep">方案选择</output></label>
+            <div class="step-switch" role="group" data-demo-target="a" aria-label="A 方案演示当前步骤"> <!-- role="group" added so the aria-label is attached to a role that supports naming. -->
+              <button type="button" data-step-index="0">1</button>
+              <button type="button" data-step-index="1">2</button>
+              <button type="button" data-step-index="2">3</button>
+              <button class="active" type="button" data-step-index="3">4</button>
+              <button type="button" data-step-index="4">5</button>
+            </div>
+          </div>
+        </div>
+      </article>
+
+      <article class="option" data-choice="b1" onclick="toggleSelect(this)">
+        <div class="head">
+          <div class="title">B1. 虚拟端点补齐</div>
+          <div class="meta">可调参数</div>
+        </div>
+        <div class="composer">
+          <div class="signal-circuit" id="signal-demo">
+            <svg class="signal-svg" viewBox="0 0 344 44" preserveAspectRatio="none" aria-hidden="true">
+              <path class="signal-rail" d="M 20 22 L 324 22"/>
+              <path id="signal-done" class="signal-done" d="M 20 22 L 172 22"/>
+              <path id="signal-active-in" class="signal-active-base signal-active-in" d="M 172 22 L 248 22"/>
+              <path id="signal-active-out" class="signal-active-base signal-active-out" d="M 248 22 L 324 22"/>
+              <path id="signal-wave" class="signal-moving-wave" d=""/>
+            </svg>
+            <span class="signal-absorb-halo" aria-hidden="true"></span>
+            <span class="signal-node" data-step-index="0" style="left:6%"><span class="signal-node-charge"></span><span class="signal-node-core"></span></span>
+            <span class="signal-node" data-step-index="1" style="left:28%"><span class="signal-node-charge"></span><span class="signal-node-core"></span></span>
+            <span class="signal-node" data-step-index="2" style="left:50%"><span class="signal-node-charge"></span><span class="signal-node-core"></span></span>
+            <span class="signal-node active" data-step-index="3" style="left:72%"><span class="signal-node-charge"></span><span class="signal-node-core"></span></span>
+            <span class="signal-node pending next" data-step-index="4" style="left:94%"><span class="signal-node-charge"></span><span class="signal-node-core"></span></span>
+            <div class="signal-labels">
+              <span data-step-index="0" style="left:6%">需求理解</span>
+              <span data-step-index="1" style="left:28%">架构规划</span>
+              <span data-step-index="2" style="left:50%">方案评估</span>
+              <span class="active" data-step-index="3" style="left:72%">方案选择</span>
+              <span data-step-index="4" style="left:94%">确认部署</span>
+            </div>
+          </div>
+          <div class="input">请描述业务场景、访问规模、预算范围或已有资源约束</div>
+          <div class="actions">
+            <div class="ghosts"><button class="ghost">附件</button><button class="ghost">深度思考</button></div>
+            <button class="send">发送</button>
+          </div>
+          <div class="param-panel" id="signal-controls"> <!-- Demo-only tuning panel for the B1 signal animation: active step plus six range parameters. Each <label> wraps only its <output>, so every range input carries an aria-label matching the visible caption. NOTE(review): clicks here bubble to the enclosing <article onclick="toggleSelect(this)"> unless the script stops them - confirm. -->
+            <div class="param param-wide">
+              <label>演示 Step <output data-output="activeStep">方案选择</output></label>
+              <div class="step-switch" id="signal-step-switch" role="group" data-demo-target="b" aria-label="B 方案演示当前步骤"> <!-- role="group" added so the aria-label is attached to a role that supports naming. -->
+                <button type="button" data-step-index="0">1</button>
+                <button type="button" data-step-index="1">2</button>
+                <button type="button" data-step-index="2">3</button>
+                <button class="active" type="button" data-step-index="3">4</button>
+                <button type="button" data-step-index="4">5</button>
+              </div>
+            </div>
+            <div class="param">
+              <label>X <output data-output="xPercent">28%</output></label>
+              <input data-param="xPercent" type="range" min="6" max="38" value="28" step="1" aria-label="X">
+            </div>
+            <div class="param">
+              <label>Y <output data-output="yPercent">49%</output></label>
+              <input data-param="yPercent" type="range" min="20" max="90" value="49" step="1" aria-label="Y">
+            </div>
+            <div class="param">
+              <label>T1 <output data-output="t1">140ms</output></label>
+              <input data-param="t1" type="range" min="80" max="700" value="140" step="20" aria-label="T1">
+            </div>
+            <div class="param">
+              <label>T2 <output data-output="t2">540ms</output></label>
+              <input data-param="t2" type="range" min="160" max="1400" value="540" step="20" aria-label="T2">
+            </div>
+            <div class="param">
+              <label>最大振幅 <output data-output="maxAmplitude">9</output></label>
+              <input data-param="maxAmplitude" type="range" min="8" max="22" value="9" step="1" aria-label="最大振幅">
+            </div>
+            <div class="param">
+              <label>停顿时间 <output data-output="pauseTime">510ms</output></label>
+              <input data-param="pauseTime" type="range" min="120" max="1200" value="510" step="30" aria-label="停顿时间">
+            </div>
+          </div>
+        </div>
+      </article>
+
+      <article class="option" data-choice="b2" onclick="toggleSelect(this)">
+        <div class="head">
+          <div class="title">B2. 蓝色脉冲波形 双扫光</div>
+          <div class="meta">紧凑双峰</div>
+        </div>
+        <div class="composer">
+          <div class="circuit dense pulse-dense blue-pulse blue-pulse-dense pulse-wave pulse-wave-dense">
+            <div class="track"></div>
+            <div class="quiet-segment"></div>
+            <div class="electric">
+              <svg viewBox="0 0 220 18" preserveAspectRatio="none" aria-hidden="true">
+                <defs>
+                  <linearGradient id="wave-sheen-dense" x1="0%" x2="100%" y1="0%" y2="0%">
+                    <stop offset="0%" stop-color="#1677ff" stop-opacity="0"/>
+                    <stop offset="30%" stop-color="#ffffff" stop-opacity=".1"/>
+                    <stop offset="48%" stop-color="#ffffff" stop-opacity="1"/>
+                    <stop offset="66%" stop-color="#ffffff" stop-opacity=".24"/>
+                    <stop offset="100%" stop-color="#ffffff" stop-opacity="0"/>
+                  </linearGradient>
+                </defs>
+                <polyline class="wave-base" points="0,11 22,11 32,9 42,11 60,11 70,8 80,11 99,11 108,3 118,11 136,11 145,6.5 155,11 174,11 184,8.8 194,11 220,11"/>
+                <polyline class="wave-sweep" points="0,11 22,11 32,9 42,11 60,11 70,8 80,11 99,11 108,3 118,11 136,11 145,6.5 155,11 174,11 184,8.8 194,11 220,11" stroke="url(#wave-sheen-dense)"/>
+                <polyline class="wave-sweep-2" points="0,11 22,11 32,9 42,11 60,11 70,8 80,11 99,11 108,3 118,11 136,11 145,6.5 155,11 174,11 184,8.8 194,11 220,11" stroke="url(#wave-sheen-dense)"/>
+              </svg>
+            </div>
+            <div class="nodes">
+              <div class="node">需求理解<span class="tip">已完成：需求已归纳。</span></div>
+              <div class="node">架构规划<span class="tip">已完成：资源关系已确定。</span></div>
+              <div class="node">方案评估<span class="tip">蓝色线路从上一步进入当前步骤。</span></div>
+              <div class="node active">方案选择<span class="tip">两道白色扫光形成更强脉冲感。</span></div>
+              <div class="node next">确认部署<span class="tip">进入下一步前逐步收束。</span></div>
+            </div>
+          </div>
+          <div class="input">请描述业务场景、访问规模、预算范围或已有资源约束</div>
+          <div class="actions">
+            <div class="ghosts"><button class="ghost">附件</button><button class="ghost">深度思考</button></div>
+            <button class="send">发送</button>
+          </div>
+        </div>
+      </article>
+
+      <article class="option" data-choice="d1" onclick="toggleSelect(this)">
+        <div class="head">
+          <div class="title">D1. 输入框融合 带标签</div>
+          <div class="meta">保留</div>
+        </div>
+        <div class="composer">
+          <div class="fusion-label">
+            <div class="fusion-steps">
+              <div class="fusion-step done" data-step-index="0"><span class="label">需求理解</span><span class="tip">已完成：需求已归纳。</span></div>
+              <div class="fusion-step done" data-step-index="1"><span class="label">架构规划</span><span class="tip">已完成：资源关系已确定。</span></div>
+              <div class="fusion-step done" data-step-index="2"><span class="label">方案评估</span><span class="tip">已完成：已比较候选方案。</span></div>
+              <div class="fusion-step active" data-step-index="3"><span class="label">方案选择</span><span class="tip">进行中：正在生成方案。</span></div>
+              <div class="fusion-step" data-step-index="4"><span class="label">确认部署</span><span class="tip">未开始：等待方案选择。</span></div>
+            </div>
+          </div>
+          <div class="input">请描述业务场景、访问规模、预算范围或已有资源约束</div>
+          <div class="actions">
+            <div class="ghosts"><button class="ghost">附件</button><button class="ghost">深度思考</button></div>
+            <button class="send">发送</button>
+          </div>
+          <div class="demo-step-control">
+            <label>演示 Step <output data-output="dActiveStep">方案选择</output></label>
+            <div class="step-switch" data-demo-target="d" aria-label="D 方案演示当前步骤">
+              <button type="button" data-step-index="0">1</button>
+              <button type="button" data-step-index="1">2</button>
+              <button type="button" data-step-index="2">3</button>
+              <button class="active" type="button" data-step-index="3">4</button>
+              <button type="button" data-step-index="4">5</button>
+            </div>
+            <div class="timing-grid" id="fusion-controls">
+              <div class="param">
+                <label>T1 <output data-fusion-output="t1">1800ms</output></label>
+                <input data-fusion-param="t1" type="range" min="800" max="3200" value="1800" step="100">
+              </div>
+              <div class="param">
+                <label>T2 <output data-fusion-output="t2">300ms</output></label>
+                <input data-fusion-param="t2" type="range" min="0" max="1200" value="300" step="50">
+              </div>
+            </div>
+          </div>
+        </div>
+      </article>
+    </section>
+  </main>
+  <script>
+    (() => {
+      const stepNames = ["需求理解", "架构规划", "方案评估", "方案选择", "确认部署"]; // display name per step index; written into the demo step <output> elements
+      const stepStatus = ["理解需求中", "规划架构中", "评估方案中", "生成方案中", "确认部署中"]; // status text per step index; updateTips embeds it in the active step's tooltip
+      const completedTips = [ // tooltip text per step index, used for steps before the active one
+        "已完成：识别业务场景、规模和预算。",
+        "已完成：拆分网络、计算、访问入口。",
+        "已完成：比较成本、复杂度和扩展性。",
+        "已完成：方案卡片已生成并确认。",
+        "已完成：部署确认已完成。",
+      ];
+      const pendingTips = [ // tooltip text per step index, used for steps after the active one
+        "未开始：等待需求输入。",
+        "未开始：等待需求理解。",
+        "未开始：等待架构规划。",
+        "未开始：等待方案评估。",
+        "未开始：等待方案选择。",
+      ];
+
+      function setSwitchState(target, activeIndex) {
+        document.querySelectorAll(`.step-switch[data-demo-target="${target}"] [data-step-index]`).forEach((button) => {
+          button.classList.toggle("active", Number(button.dataset.stepIndex) === activeIndex);
+        });
+      }
+
+      function updateTips(step, index, activeIndex) {
+        const tip = step.querySelector(".tip");
+        if (!tip) return;
+        if (index < activeIndex) {
+          tip.textContent = completedTips[index];
+        } else if (index === activeIndex) {
+          tip.textContent = `进行中：${stepStatus[index]}。`;
+        } else {
+          tip.textContent = pendingTips[index];
+        }
+      }
+
+      function setArrowStep(activeIndex) {
+        document.querySelectorAll('[data-demo-steps="a"] .step[data-step-index]').forEach((step) => {
+          const index = Number(step.dataset.stepIndex);
+          step.classList.toggle("done", index < activeIndex);
+          step.classList.toggle("active", index === activeIndex);
+          updateTips(step, index, activeIndex);
+        });
+        document.querySelector('[data-output="aActiveStep"]').textContent = stepNames[activeIndex];
+        setSwitchState("a", activeIndex);
+      }
+
+      let fusionActiveIndex = 3; // step index last applied by setFusionStep; reused by the resize handler
+      const fusionTiming = { t1: 1800, t2: 300 }; // milliseconds; overwritten from the range inputs by syncFusionTiming
+      let fusionRunTimer = 0; // timeout id of the t1 delay scheduled in restartFusionSweeps
+      let fusionWaitTimer = 0; // timeout id of the t2 delay scheduled in restartFusionSweeps
+
+      function percent(value) {
+        return `${Math.max(0, Math.min(100, value)).toFixed(2)}%`;
+      }
+
+      function syncFusionBorder(activeIndex) {
+        const label = document.querySelector('[data-choice="d1"] .fusion-label');
+        const activeStep = label?.querySelector(`.fusion-step[data-step-index="${activeIndex}"]`);
+        if (!label || !activeStep) return;
+
+        const labelRect = label.getBoundingClientRect();
+        const activeRect = activeStep.getBoundingClientRect();
+        if (!labelRect.width) return;
+
+        const activeStart = ((activeRect.left - labelRect.left) / labelRect.width) * 100;
+        const activeEnd = ((activeRect.right - labelRect.left) / labelRect.width) * 100;
+        const blueStart = activeIndex === 0 ? 0 : activeStart;
+        const greenEnd = activeIndex === 0 ? 0 : activeStart;
+        const blueEnd = activeIndex === stepNames.length - 1 ? 100 : activeEnd;
+
+        label.style.setProperty("--fusion-green-end", percent(greenEnd));
+        label.style.setProperty("--fusion-blue-start", percent(blueStart));
+        label.style.setProperty("--fusion-blue-end", percent(blueEnd));
+      }
+
+      function syncFusionTiming() {
+        const controls = document.getElementById("fusion-controls");
+        const label = document.querySelector('[data-choice="d1"] .fusion-label');
+        if (!controls || !label) return;
+        controls.querySelectorAll("input[data-fusion-param]").forEach((input) => {
+          fusionTiming[input.dataset.fusionParam] = Number(input.value);
+          const output = controls.querySelector(`[data-fusion-output="${input.dataset.fusionParam}"]`);
+          if (output) output.textContent = `${input.value}ms`;
+        });
+        label.style.setProperty("--fusion-sweep-duration", `${fusionTiming.t1}ms`);
+      }
+
+      function restartFusionSweeps() { // Restart the D1 sweep cycle: run for t1 ms, hold "sweep-wait" for t2 ms, then start over.
+        const label = document.querySelector('[data-choice="d1"] .fusion-label');
+        if (!label) return;
+        window.clearTimeout(fusionRunTimer); // cancel any cycle that is already scheduled
+        window.clearTimeout(fusionWaitTimer);
+        syncFusionTiming(); // pick up the current slider values before scheduling
+        label.classList.remove("sweep-wait");
+        label.classList.add("sweep-reset");
+        void label.offsetWidth; // layout read between add and remove; presumably forces a reflow so the CSS animation restarts (confirm against the stylesheet)
+        label.classList.remove("sweep-reset");
+        fusionRunTimer = window.setTimeout(() => {
+          label.classList.add("sweep-wait");
+          fusionWaitTimer = window.setTimeout(() => restartFusionSweeps(), fusionTiming.t2); // loop again once the wait has elapsed
+        }, fusionTiming.t1);
+      }
+
+      function setFusionStep(activeIndex) {
+        fusionActiveIndex = activeIndex;
+        document.querySelectorAll(".fusion-step[data-step-index]").forEach((step) => {
+          const index = Number(step.dataset.stepIndex);
+          step.classList.toggle("done", index < activeIndex);
+          step.classList.toggle("active", index === activeIndex);
+          updateTips(step, index, activeIndex);
+        });
+        document.querySelector('[data-output="dActiveStep"]').textContent = stepNames[activeIndex];
+        setSwitchState("d", activeIndex);
+        requestAnimationFrame(() => {
+          syncFusionBorder(activeIndex);
+          restartFusionSweeps();
+        });
+      }
+
+      function setOptionStep(target, index) {
+        const activeIndex = Math.max(0, Math.min(stepNames.length - 1, Number(index)));
+        if (Number.isNaN(activeIndex)) return;
+        if (target === "a") setArrowStep(activeIndex);
+        if (target === "d") setFusionStep(activeIndex);
+      }
+
+      document.querySelectorAll('.step-switch[data-demo-target="a"], .step-switch[data-demo-target="d"]').forEach((switcher) => { // one delegated click handler per demo switch
+        switcher.addEventListener("click", (event) => {
+          const button = event.target.closest("[data-step-index]");
+          if (!button) return; // click did not land on a step button
+          setOptionStep(switcher.dataset.demoTarget, button.dataset.stepIndex);
+        });
+      });
+
+      window.setOptionStep = setOptionStep; // published on window so the step can also be set from outside this closure
+      window.addEventListener("resize", () => syncFusionBorder(fusionActiveIndex)); // the border stops come from measured rects, so remeasure on resize
+      document.getElementById("fusion-controls")?.addEventListener("input", () => restartFusionSweeps()); // slider changes restart the sweep with the new timings
+      setArrowStep(3); // initial state: step index 3 active in both demos
+      setFusionStep(3);
+    })();
+
+    (() => {
+      const wave = document.getElementById("signal-wave"); // element whose stroke and d attribute render() updates
+      const demo = document.getElementById("signal-demo"); // receives the "absorbing" class and the --absorb-duration property
+      const controls = document.getElementById("signal-controls"); // container of the parameter inputs and their readouts
+      const donePath = document.getElementById("signal-done");
+      const activeInPath = document.getElementById("signal-active-in");
+      const activeOutPath = document.getElementById("signal-active-out");
+      const absorbHalo = document.querySelector(".signal-absorb-halo"); // optional; guarded where it is used
+      const signalNodes = [...document.querySelectorAll(".signal-node[data-step-index]")];
+      const signalLabels = [...document.querySelectorAll(".signal-labels [data-step-index]")];
+      const stepButtons = [...document.querySelectorAll("#signal-step-switch [data-step-index]")];
+      const activeStepOutput = controls?.querySelector('[data-output="activeStep"]'); // optional; guarded where it is used
+      if (!wave || !demo || !controls || !donePath || !activeInPath || !activeOutPath) return; // skip the whole demo when a required element is absent
+
+      const params = { // animation settings; readParams overwrites them from the control inputs
+        xPercent: 28,
+        yPercent: 49,
+        t1: 140,
+        t2: 540,
+        maxAmplitude: 9,
+        pauseTime: 510,
+      };
+      const stepNames = ["需求理解", "架构规划", "方案评估", "方案选择", "确认部署"];
+      const stepPercents = [6, 28, 50, 72, 94]; // per-step CSS left offset (percent) applied to the absorb halo
+      const stepXs = [20, 96, 172, 248, 324]; // per-step x coordinate used when building path data
+      const baseY = 22; // y coordinate of the flat rail line in the path data
+      const viewMinX = 0; // lower bound used by clampToView
+      const viewMaxX = 344; // upper bound used by clampToView
+      const railStartX = stepXs[0];
+      const railEndX = stepXs[stepXs.length - 1];
+      const virtualPadding = 66; // run-in/run-out distance beyond the first/last node for the edge segments
+      const virtualLeftX = railStartX - virtualPadding;
+      const virtualRightX = railEndX + virtualPadding;
+      const nodeClearance = 10; // gap kept between a segment end and the node it touches
+      const outboundTailClearance = 6; // gap kept before the next node at the end of an outbound segment
+      let activeIndex = 3; // currently active step index
+      let phase = "inbound"; // one of "inbound", "pause-current", "outbound", "pause-next"
+      let elapsed = 0; // milliseconds spent in the current moving phase
+      let pauseLeft = 0; // milliseconds remaining in the current pause phase
+      let last = performance.now(); // timestamp of the previous animation frame
+      let cycleSalt = 0; // phase offset fed into pulseShape; advanced on every phase change
+      let absorbTimer = 0; // timeout id that removes the "absorbing" class
+
+      function readParams() {
+        controls.querySelectorAll("input[data-param]").forEach((input) => {
+          params[input.dataset.param] = Number(input.value);
+          const output = controls.querySelector(`[data-output="${input.dataset.param}"]`);
+          if (output) {
+            if (input.dataset.param === "xPercent" || input.dataset.param === "yPercent") {
+              output.textContent = `${input.value}%`;
+            } else if (input.dataset.param === "t1" || input.dataset.param === "t2" || input.dataset.param === "pauseTime") {
+              output.textContent = `${input.value}ms`;
+            } else {
+              output.textContent = input.value;
+            }
+          }
+        });
+        if (params.xPercent >= 48) params.xPercent = 48;
+        if (params.yPercent > 100) params.yPercent = 100;
+        if (demo) demo.style.setProperty("--absorb-duration", `${params.pauseTime}ms`);
+      }
+
+      function smoothstep(edge0, edge1, value) {
+        const x = Math.max(0, Math.min(1, (value - edge0) / (edge1 - edge0)));
+        return x * x * (3 - 2 * x);
+      }
+
+      function lerp(start, end, progress) {
+        return start + (end - start) * progress;
+      }
+
+      function clampToView(x) {
+        return Math.max(viewMinX, Math.min(viewMaxX, x));
+      }
+
+      function linePath(from, to) {
+        const start = clampToView(from);
+        const end = clampToView(to);
+        if (end - start < 1) return "";
+        return `M ${start} ${baseY} L ${end} ${baseY}`;
+      }
+
+      function inboundSegment() {
+        const currentX = stepXs[activeIndex];
+        return {
+          from: activeIndex === 0 ? virtualLeftX : stepXs[activeIndex - 1] + nodeClearance,
+          to: currentX - nodeClearance,
+          color: "#1677ff",
+          nextPhase: "pause-current",
+        };
+      }
+
+      function outboundSegment() {
+        const currentX = stepXs[activeIndex];
+        return {
+          from: currentX + nodeClearance,
+          to: activeIndex === stepXs.length - 1 ? virtualRightX : stepXs[activeIndex + 1] - outboundTailClearance,
+          color: "#8f9bae",
+          nextPhase: "pause-next",
+        };
+      }
+
+      function currentSegment() {
+        return (phase === "outbound" || phase === "pause-next") ? outboundSegment() : inboundSegment();
+      }
+
+      function renderStaticState() { // Redraw everything that depends only on activeIndex: rail paths, halo position, node/label/button classes, step name.
+        const currentX = stepXs[activeIndex];
+        const previousBaseX = activeIndex === 0 ? viewMinX : stepXs[activeIndex - 1]; // first step: the inbound line starts at the view edge
+        const nextBaseX = activeIndex === stepXs.length - 1 ? viewMaxX : stepXs[activeIndex + 1]; // last step: the outbound line ends at the view edge
+
+        donePath.setAttribute("d", activeIndex > 0 ? `M ${railStartX} ${baseY} L ${stepXs[activeIndex - 1]} ${baseY}` : ""); // rail from the first node up to the previous node
+        activeInPath.setAttribute("d", linePath(previousBaseX, currentX));
+        activeOutPath.setAttribute("d", linePath(currentX, nextBaseX));
+
+        if (absorbHalo) absorbHalo.style.left = `${stepPercents[activeIndex]}%`;
+        signalNodes.forEach((node) => {
+          const index = Number(node.dataset.stepIndex);
+          node.classList.toggle("active", index === activeIndex);
+          node.classList.toggle("pending", index > activeIndex);
+          node.classList.toggle("next", index === activeIndex + 1); // the next node is both "pending" and "next"
+        });
+        signalLabels.forEach((label) => {
+          label.classList.toggle("active", Number(label.dataset.stepIndex) === activeIndex);
+        });
+        stepButtons.forEach((button) => {
+          button.classList.toggle("active", Number(button.dataset.stepIndex) === activeIndex);
+        });
+        if (activeStepOutput) activeStepOutput.textContent = stepNames[activeIndex];
+      }
+
+      function progressEase(value) { // Ease value with smoothstep over the fixed edges 0 and 1.
+        return smoothstep(0, 1, value);
+      }
+
+      function segmentMotion(timeMs) {
+        const x = Math.max(0.04, Math.min(0.48, params.xPercent / 100));
+        const y = Math.max(0, Math.min(1, params.yPercent / 100));
+        const t1 = Math.max(40, params.t1);
+        const t2 = Math.max(80, params.t2);
+        const middleLength = Math.max(0.04, 1 - 2 * x);
+
+        if (timeMs < t1) {
+          const u = Math.max(0, Math.min(1, timeMs / t1));
+          return {
+            anchor: "right",
+            progress: x * u,
+            amplitudeScale: y * progressEase(u),
+            done: false,
+          };
+        }
+
+        if (timeMs < t1 + t2) {
+          const u = Math.max(0, Math.min(1, (timeMs - t1) / t2));
+          return {
+            anchor: "right",
+            progress: x + (1 - x) * u,
+            amplitudeScale: y + (1 - y) * Math.sin(Math.PI * u),
+            done: false,
+          };
+        }
+
+        if (timeMs < t1 * 2 + t2) {
+          const u = Math.max(0, Math.min(1, (timeMs - t1 - t2) / t1));
+          return {
+            anchor: "left",
+            progress: 1 - x + x * u,
+            amplitudeScale: y * (1 - progressEase(u)),
+            done: false,
+          };
+        }
+
+        return {
+          anchor: "left",
+          progress: 1,
+          amplitudeScale: 0,
+          done: true,
+        };
+      }
+
+      function pulseShape(t) { // Unscaled pulse height at packet position t: small ripple + lift - drop + late settle.
+        const micro = 0.1 * Math.sin((t * 2.6 + cycleSalt) * Math.PI); // low-amplitude ripple, shifted by cycleSalt
+        const lift = Math.sin(Math.PI * smoothstep(0.16, 0.38, t)); // hump that is non-zero only for t between 0.16 and 0.38
+        const drop = Math.sin(Math.PI * smoothstep(0.37, 0.62, t)); // hump that is non-zero only for t between 0.37 and 0.62; subtracted below
+        const settle = 0.2 * Math.sin((t - 0.62) * Math.PI * 4.5 + cycleSalt * 0.4); // oscillation that is faded in by the smoothstep factor below
+        return micro + lift - drop * 0.86 + settle * smoothstep(0.58, 0.96, t);
+      }
+
+      function makeMovingWavePath() { // Build the path data for the moving packet in the current segment; "" when nothing should be drawn.
+        if (phase === "pause-current" || phase === "pause-next") return ""; // nothing moves during either pause phase
+
+        const segment = currentSegment();
+        const segmentLength = segment.to - segment.from;
+        const xRatio = Math.max(0.04, Math.min(0.48, params.xPercent / 100)); // same clamp that segmentMotion applies
+        const waveLength = segmentLength * xRatio; // packet width
+        const motion = segmentMotion(elapsed);
+        const amplitude = params.maxAmplitude * motion.amplitudeScale;
+        if (amplitude < 0.2) return ""; // too flat to be worth drawing
+        const right = motion.anchor === "left" // "left" anchor: progress places the packet's left edge; otherwise it places the right edge
+          ? segment.from + motion.progress * segmentLength + waveLength
+          : segment.from + motion.progress * segmentLength;
+        const left = motion.anchor === "left"
+          ? segment.from + motion.progress * segmentLength
+          : right - waveLength;
+        const start = Math.max(segment.from, left); // clip the packet to the segment
+        const end = Math.min(segment.to, right);
+        if (end <= segment.from || start >= segment.to || end - start < 1) return "";
+
+        const points = [];
+        const samples = 54; // the loop below emits samples + 1 points
+        for (let i = 0; i <= samples; i += 1) {
+          const t = i / samples;
+          const x = start + t * (end - start);
+          const packetT = left < segment.from ? t : (x - left) / waveLength; // while the left edge is still before the segment start, the visible part maps onto 0..1 itself
+          const envelope = smoothstep(0, 0.16, packetT) * (1 - smoothstep(0.84, 1, packetT)); // fades to zero over the first and last 16% of the packet
+          const y = baseY - pulseShape(packetT) * amplitude * envelope; // positive pulse values give a smaller y
+          points.push(`${i === 0 ? "M" : "L"} ${x.toFixed(2)} ${y.toFixed(2)}`);
+        }
+        return points.join(" ");
+      }
+
+      function render() { // Repaint the moving wave: stroke colour from the current segment, geometry from makeMovingWavePath.
+        wave.style.stroke = currentSegment().color;
+        wave.setAttribute("d", makeMovingWavePath());
+      }
+
+      function triggerAbsorbHalo() { // Re-apply the "absorbing" class on the demo and schedule its removal after pauseTime ms.
+        if (!demo) return;
+        demo.classList.remove("absorbing");
+        window.clearTimeout(absorbTimer); // drop the removal scheduled by an earlier trigger
+        void demo.offsetWidth; // layout read between remove and add; presumably forces a reflow so the CSS animation restarts (confirm against the stylesheet)
+        demo.classList.add("absorbing");
+        absorbTimer = window.setTimeout(() => {
+          demo.classList.remove("absorbing");
+        }, params.pauseTime);
+      }
+
+      function setActiveIndex(index) {
+        const nextIndex = Math.max(0, Math.min(stepXs.length - 1, Number(index)));
+        if (Number.isNaN(nextIndex)) return;
+        activeIndex = nextIndex;
+        phase = "inbound";
+        elapsed = 0;
+        pauseLeft = 0;
+        cycleSalt = (cycleSalt + 0.37) % (Math.PI * 2);
+        demo.classList.remove("absorbing");
+        window.clearTimeout(absorbTimer);
+        renderStaticState();
+        render();
+      }
+
+      function tick(now) { // Per-frame driver: advance the pause or moving phase, repaint, and schedule the next frame.
+        const dt = Math.min(48, now - last) / 1000; // frame delta in seconds, capped at 48 ms
+        last = now;
+
+        if (phase === "pause-current" || phase === "pause-next") {
+          pauseLeft -= dt * 1000; // count the pause down in milliseconds
+          if (pauseLeft <= 0) {
+            if (phase === "pause-current" && demo) {
+              demo.classList.remove("absorbing");
+              window.clearTimeout(absorbTimer);
+            }
+            phase = phase === "pause-current" ? "outbound" : "inbound"; // pause-current -> outbound, pause-next -> inbound
+            elapsed = 0;
+            cycleSalt = (cycleSalt + 0.73) % (Math.PI * 2);
+          }
+          render();
+          requestAnimationFrame(tick);
+          return;
+        }
+
+        const segment = currentSegment(); // read before phase changes below so nextPhase belongs to the segment that just ran
+        elapsed += dt * 1000;
+        if (segmentMotion(elapsed).done) {
+          pauseLeft = params.pauseTime;
+          phase = segment.nextPhase;
+          if (phase === "pause-current") triggerAbsorbHalo(); // the halo is triggered only on arrival at the active node
+          elapsed = params.t1 * 2 + params.t2;
+        }
+        render();
+        requestAnimationFrame(tick);
+      }
+
+      controls.addEventListener("input", () => { // any parameter input change is applied immediately
+        readParams();
+        render();
+      });
+      controls.addEventListener("click", (event) => {
+        const button = event.target.closest("#signal-step-switch [data-step-index]"); // only clicks on step-switch buttons change the step
+        if (button) setActiveIndex(button.dataset.stepIndex);
+      });
+      window.setSignalActiveIndex = setActiveIndex; // published on window so the step can also be set from outside this closure
+      readParams();
+      renderStaticState();
+      requestAnimationFrame((now) => { // start the loop on the first frame
+        last = now; // reset the frame clock so the first delta is zero
+        render();
+        tick(now);
+      });
+    })();
+  </script>
+</body>
+</html>
diff --git a/scripts/a2a/selling_console_web/index.html b/scripts/a2a/selling_console_web/index.html
new file mode 100644
index 00000000..63148bfa
--- /dev/null
+++ b/scripts/a2a/selling_console_web/index.html
@@ -0,0 +1,167 @@
+<!doctype html>
+<html lang="zh-CN">
+<head>
+  <meta charset="utf-8">
+  <meta name="viewport" content="width=device-width, initial-scale=1">
+  <title>阿里云售卖 Pipeline Console</title>
+  <link rel="stylesheet" href="/styles.css?v=__STATIC_ASSET_VERSION__">
+</head>
+<body>
+  <header class="topbar">
+    <button class="icon-button" type="button" aria-label="打开菜单">☰</button>
+    <div class="brand">
+      <strong>阿里云</strong>
+      <span>售卖 Pipeline Console</span>
+    </div>
+    <nav class="topbar-nav" aria-label="主导航">
+      <a href="#">工作台</a>
+      <a href="#">资源</a>
+      <button class="nav-pill" type="button">华东 1（杭州）</button>
+    </nav>
+    <label class="topbar-search">
+      <span>搜索</span>
+      <input type="search" placeholder="搜索产品、资源、文档">
+    </label>
+    <div class="topbar-links">
+      <a href="#">文档</a>
+      <a href="#">费用</a>
+      <a href="#">备案</a>
+      <a href="#">工单</a>
+    </div>
+    <div class="user-summary">
+      <span>企业账号</span>
+      <span class="avatar" aria-hidden="true">U</span>
+    </div>
+  </header>
+
+  <main class="console-shell">
+    <section id="workflow-panel" class="workflow-panel" aria-labelledby="workflow-title">
+      <div class="panel-heading">
+        <div>
+          <p class="eyebrow">AI 购买助手</p>
+          <h1 id="workflow-title">售卖 Pipeline</h1>
+        </div>
+        <span id="status-pill" class="status-pill">等待输入</span>
+      </div>
+      <div id="status-alert" class="status-alert" role="status" hidden></div>
+
+      <div id="step-list" class="step-list" aria-label="Pipeline 实时步骤"></div>
+
+      <div class="composer" aria-label="售卖需求输入">
+        <div id="composer-progress" class="composer-progress" aria-label="Pipeline 总进度"></div>
+        <div class="composer-box">
+          <textarea
+            id="composer-input"
+            rows="2"
+            placeholder="继续补充您的需求，比如降低成本、提升可用性或约束地域"
+          ></textarea>
+          <div class="composer-toolbar">
+            <div class="composer-tools">
+              <button id="deep-think-button" class="secondary-button compact-button" type="button">深度思考</button>
+            </div>
+            <div class="composer-actions">
+              <button class="secondary-button icon-only-button" type="button" aria-label="附件" title="附件">
+                <span class="attachment-icon" aria-hidden="true"></span>
+              </button>
+              <span class="composer-divider" aria-hidden="true"></span>
+              <button id="send-button" class="primary-button send-icon-button" type="button" aria-label="发送" title="发送">
+                <span class="send-icon" aria-hidden="true"></span>
+              </button>
+            </div>
+          </div>
+        </div>
+        <p class="ai-disclaimer">内容由 AI 生成，方案与价格仅供参考</p>
+      </div>
+    </section>
+
+    <section class="plan-area" aria-labelledby="plans-title">
+      <div class="plan-header">
+        <div class="plan-title-block">
+          <p class="eyebrow">方案预览</p>
+          <h1 id="plans-title">您的购买方案</h1>
+        </div>
+      </div>
+
+      <div id="plans-grid" class="plans-grid" aria-live="polite">
+        <article class="plan-card recommended">
+          <div class="plan-card-header">
+            <span class="tag">推荐</span>
+            <span class="score">匹配度 92%</span>
+          </div>
+          <h2>轻量 Web 应用方案</h2>
+          <p>适合中小规模业务上线，包含 VPC、ECS、SLB 与基础监控。</p>
+          <div class="price">¥ 238.00 / 月</div>
+          <dl class="plan-meta">
+            <div>
+              <dt>地域</dt>
+              <dd>华东 1（杭州）</dd>
+            </div>
+            <div>
+              <dt>弹性</dt>
+              <dd>支持后续扩容</dd>
+            </div>
+          </dl>
+        </article>
+        <article class="plan-card">
+          <div class="plan-card-header">
+            <span class="tag muted">备选</span>
+            <span class="score">匹配度 86%</span>
+          </div>
+          <h2>高可用标准方案</h2>
+          <p>面向生产流量，加入多可用区部署、日志服务与云安全中心。</p>
+          <div class="price">¥ 486.00 / 月</div>
+          <dl class="plan-meta">
+            <div>
+              <dt>地域</dt>
+              <dd>华东 1（杭州）</dd>
+            </div>
+            <div>
+              <dt>容灾</dt>
+              <dd>跨可用区</dd>
+            </div>
+          </dl>
+        </article>
+      </div>
+
+      <details id="debug-drawer" class="debug-drawer">
+        <summary>调试面板</summary>
+        <div class="debug-panel">
+          <div class="connection-controls" aria-label="连接控制">
+            <label>
+              <span>Server URL</span>
+              <input id="server-url" type="url" value="__DEFAULT_SERVER_URL_ATTR__">
+            </label>
+            <label>
+              <span>CWD</span>
+              <input id="cwd" type="text" value="__DEFAULT_CWD_ATTR__">
+            </label>
+            <div class="connection-actions">
+              <button id="health-button" class="secondary-button" type="button">连接检查</button>
+              <button id="fetch-state-button" class="secondary-button" type="button">同步状态</button>
+              <button id="cancel-button" class="secondary-button danger-button" type="button">取消任务</button>
+            </div>
+          </div>
+          <div id="debug-session-info" class="debug-session-info" aria-label="调试上下文"></div>
+          <div id="progress-debug-panel" class="progress-debug-panel" aria-label="进度条视觉调试"></div>
+          <details class="debug-output-block">
+            <summary>Pipeline Diagnostics</summary>
+            <pre id="debug-output">等待 pipeline 事件...</pre>
+          </details>
+        </div>
+      </details>
+    </section>
+
+    <aside class="utility-rail" aria-label="快捷工具">
+      <button type="button" title="帮助" aria-label="帮助">?</button>
+      <button type="button" title="刷新" aria-label="刷新">↻</button>
+      <button type="button" title="反馈" aria-label="反馈">!</button>
+      <button type="button" title="设置" aria-label="设置">⚙</button>
+    </aside>
+  </main>
+
+  <script>
+    window.SELLING_CONSOLE_DEFAULTS = __DEFAULTS_JSON__;
+  </script>
+  <script src="/app.js?v=__STATIC_ASSET_VERSION__"></script>
+</body>
+</html>
diff --git a/scripts/a2a/selling_console_web/styles.css b/scripts/a2a/selling_console_web/styles.css
new file mode 100644
index 00000000..e4198e90
--- /dev/null
+++ b/scripts/a2a/selling_console_web/styles.css
@@ -0,0 +1,2371 @@
+:root {
+  color-scheme: light;
+  --aliyun-orange: #ff6a00;
+  --aliyun-blue: #1677ff;
+  --ink: #1f2937;
+  --muted: #667085;
+  --subtle: #98a2b3;
+  --line: #d8e3f0;
+  --line-strong: #b8c7d9;
+  --surface: #f4f7fb;
+  --surface-blue: #f2f8ff;
+  --white: #ffffff;
+  --success: #0f9f6e;
+  --blue: var(--aliyun-blue);
+  --green: #13a36f;
+  --shadow: 0 8px 22px rgba(31, 41, 55, 0.08);
+}
+
+* {
+  box-sizing: border-box;
+}
+
+html {
+  height: 100%;
+  overflow-x: hidden;
+}
+
+body {
+  min-height: 100%;
+  margin: 0;
+  background: var(--surface);
+  color: var(--ink);
+  font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", "PingFang SC", "Microsoft YaHei", sans-serif;
+  font-size: 14px;
+  letter-spacing: 0;
+  overflow-x: hidden;
+}
+
+button,
+input,
+textarea {
+  font: inherit;
+}
+
+button {
+  cursor: pointer;
+}
+
+button:focus-visible,
+input:focus-visible,
+textarea:focus-visible,
+summary:focus-visible {
+  outline: 2px solid var(--aliyun-blue);
+  outline-offset: 2px;
+}
+
+a {
+  color: inherit;
+  text-decoration: none;
+}
+
+.topbar {
+  position: sticky;
+  top: 0;
+  z-index: 10;
+  display: flex;
+  align-items: center;
+  gap: 18px;
+  height: 64px;
+  max-width: 100vw;
+  padding: 0 24px;
+  border-bottom: 1px solid var(--line);
+  background: var(--white);
+  box-shadow: 0 1px 2px rgba(31, 41, 55, 0.04);
+}
+
+.icon-button {
+  width: 36px;
+  height: 36px;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: var(--white);
+  color: var(--ink);
+}
+
+.brand {
+  display: flex;
+  align-items: baseline;
+  gap: 10px;
+  min-width: 200px;
+  white-space: nowrap;
+}
+
+.brand strong {
+  color: var(--aliyun-orange);
+  font-size: 22px;
+  font-weight: 700;
+}
+
+.brand span {
+  color: var(--muted);
+  font-weight: 600;
+}
+
+.topbar-nav,
+.topbar-links,
+.user-summary {
+  display: flex;
+  align-items: center;
+  gap: 14px;
+  white-space: nowrap;
+}
+
+.topbar-nav a,
+.topbar-links a {
+  color: var(--muted);
+}
+
+.topbar-nav a:hover,
+.topbar-links a:hover {
+  color: var(--aliyun-blue);
+}
+
+.nav-pill {
+  height: 32px;
+  border: 1px solid #bed7f5;
+  border-radius: 16px;
+  background: var(--surface-blue);
+  color: #1155a3;
+  padding: 0 14px;
+}
+
+.topbar-search {
+  display: flex;
+  align-items: center;
+  gap: 10px;
+  flex: 1;
+  min-width: 0;
+  max-width: 520px;
+  height: 38px;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: #fbfdff;
+  padding: 0 12px;
+  color: var(--subtle);
+}
+
+.topbar-search input {
+  width: 100%;
+  border: 0;
+  outline: 0;
+  background: transparent;
+  color: var(--ink);
+}
+
+.topbar-search:focus-within {
+  border-color: var(--aliyun-blue);
+  box-shadow: 0 0 0 3px rgba(22, 119, 255, 0.12);
+}
+
+.user-summary {
+  margin-left: auto;
+  color: var(--muted);
+}
+
+.avatar {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 34px;
+  height: 34px;
+  border-radius: 50%;
+  background: #edf4ff;
+  color: var(--aliyun-blue);
+  font-weight: 700;
+}
+
+.console-shell {
+  display: grid;
+  grid-template-columns: minmax(280px, 400px) minmax(0, 1fr) 56px;
+  gap: 16px;
+  width: 100%;
+  max-width: 100vw;
+  height: calc(100vh - 64px);
+  padding: 16px;
+  overflow-x: hidden;
+}
+
+.utility-rail {
+  display: flex;
+  flex-direction: column;
+  align-items: center;
+  gap: 12px;
+}
+
+.workflow-panel,
+.plan-area {
+  min-width: 0;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: var(--white);
+  box-shadow: var(--shadow);
+}
+
+.workflow-panel {
+  display: flex;
+  flex-direction: column;
+  height: calc(100vh - 96px);
+  min-height: 0;
+  overflow: hidden;
+}
+
+.panel-heading {
+  display: none;
+}
+
+.plan-header {
+  display: flex;
+  align-items: flex-start; /* overridden to stretch by the second .plan-header rule below */
+  justify-content: space-between;
+  gap: 18px;
+  border-bottom: 1px solid var(--line);
+  padding: 20px 22px; /* overridden to 18px 20px by the second .plan-header rule below */
+}
+
+.plan-header { /* same selector as the rule above; on conflicts these declarations win by source order */
+  flex-direction: column;
+  align-items: stretch;
+  padding: 18px 20px;
+}
+
+.eyebrow {
+  margin: 0 0 6px;
+  color: var(--aliyun-blue);
+  font-size: 12px;
+  font-weight: 700;
+}
+
+h1,
+h2,
+p {
+  margin-top: 0;
+}
+
+.panel-heading h1,
+.plan-header h1 {
+  margin-bottom: 0;
+  font-size: 22px;
+  line-height: 1.25;
+}
+
+.status-pill {
+  border: 1px solid #b7dfd0;
+  border-radius: 16px;
+  background: #eefaf5;
+  color: var(--success);
+  padding: 6px 12px;
+  font-weight: 700;
+}
+
+.status-alert {
+  display: none;
+  margin: 14px 20px 0;
+  border: 1px solid #9ec9fb;
+  border-radius: 8px;
+  background: var(--surface-blue);
+  color: #1155a3;
+  padding: 10px 12px;
+}
+
+.plan-card,
+.debug-output,
+.debug-drawer pre,
+.status-alert,
+.normal-handoff-message,
+.normal-turn,
+.normal-process,
+.step-card,
+.chat-bubble,
+.user-message-text,
+.connection-controls input {
+  overflow-wrap: anywhere;
+}
+
+.step-list {
+  display: grid;
+  align-content: start;
+  align-items: start;
+  flex: 1 1 auto;
+  gap: 5px;
+  min-height: 0;
+  overflow-y: auto;
+  padding: 8px 14px;
+}
+
+.chat-message {
+  display: flex;
+  align-items: flex-start;
+  gap: 7px;
+  min-width: 0;
+}
+
+.chat-message.system {
+  justify-content: flex-start;
+}
+
+.chat-message.user {
+  justify-content: flex-end;
+}
+
+.chat-message.user .chat-bubble {
+  order: 1;
+  max-width: 82%;
+}
+
+.chat-message.user .chat-avatar {
+  order: 2;
+}
+
+.chat-bubble {
+  min-width: 0;
+  max-width: 100%;
+}
+
+.chat-message.system .chat-bubble {
+  flex: 1 1 auto;
+}
+
+.chat-avatar { /* fixed 24px circular badge that centers its own content */
+  flex: 0 0 auto;
+  width: 24px;
+  height: 24px;
+  border-radius: 999px;
+  display: inline-flex;
+  justify-content: center;
+  align-items: center;
+  font-weight: 800;
+  font-size: 11px;
+  letter-spacing: 0;
+}
+
+.chat-avatar.system {
+  background: linear-gradient(135deg, #ff6a00 0%, #1677ff 100%);
+  color: var(--white);
+}
+
+.chat-avatar.user {
+  border: 1px solid #cfe0f7;
+  background: #edf4ff;
+  color: var(--aliyun-blue);
+}
+
+.chat-message.system .step-card,
+.chat-message.system .normal-handoff-message {
+  width: 100%;
+}
+
+.user-message-text {
+  margin: 0;
+  border: 1px solid #cfe0f7;
+  border-radius: 8px;
+  background: #edf4ff;
+  color: var(--ink);
+  padding: 6px 9px;
+  font-size: 12px;
+  line-height: 1.45;
+}
+
+.step-card {
+  display: grid;
+  grid-template-columns: 24px 1fr;
+  gap: 6px;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: #fbfdff;
+  padding: 7px 8px;
+}
+
+.step-card.current {
+  border-color: #9ec9fb;
+  background: var(--surface-blue);
+}
+
+.step-card.completed { /* completed steps: vertically centered content, slightly tighter padding */
+  align-items: center;
+  background: #fbfffd;
+  grid-template-columns: 24px 1fr; /* same value as the base .step-card rule */
+  gap: 6px; /* same value as the base .step-card rule */
+  padding: 6px 8px;
+}
+
+.step-card.failed,
+.step-card.error {
+  border-color: #f5b5ad;
+  background: #fff7f5;
+}
+
+.step-index {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 22px;
+  height: 22px;
+  border-radius: 50%;
+  background: var(--white);
+  color: var(--aliyun-blue);
+  font-size: 11px;
+  font-weight: 800;
+}
+
+.step-card.completed .step-index {
+  width: 22px;
+  height: 22px;
+}
+
+.step-state-icon {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 16px;
+  height: 16px;
+  border-radius: 999px;
+  color: var(--white);
+  font-size: 9px;
+  line-height: 1;
+}
+
+.step-state-icon.completed {
+  background: var(--success);
+}
+
+.step-state-icon.working {
+  background: var(--aliyun-blue);
+}
+
+.step-state-icon.waiting_input {
+  background: var(--aliyun-orange);
+}
+
+.step-state-icon.failed,
+.step-state-icon.error {
+  background: #d92d20;
+}
+
+.step-card h2 {
+  margin-bottom: 0;
+  font-size: 13px;
+  font-weight: 750;
+  line-height: 1.28;
+}
+
+.step-card-body {
+  min-width: 0;
+}
+
+.step-toggle {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 8px;
+  width: 100%;
+  border: 0;
+  background: transparent;
+  color: inherit;
+  padding: 0;
+  text-align: left;
+}
+
+.step-toggle-icon {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 18px;
+  height: 18px;
+  border-radius: 999px;
+  color: var(--subtle);
+}
+
+.step-toggle-icon::before { /* chevron built from the right and bottom borders of a 6px box */
+  content: "";
+  width: 6px;
+  height: 6px;
+  border-right: 1.5px solid currentColor;
+  border-bottom: 1.5px solid currentColor;
+  transform: rotate(45deg) translate(-1px, -1px); /* 45deg turns the bordered corner into a downward-pointing "v" */
+}
+
+.step-toggle-icon.expanded::before {
+  transform: rotate(225deg) translate(-1px, -1px); /* a further half turn: the chevron points up */
+}
+
+.step-detail {
+  display: grid;
+  gap: 6px;
+  grid-column: 2;
+  min-width: 0;
+}
+
+.step-status {
+  color: var(--muted);
+  font-size: 11px;
+  font-weight: 700;
+}
+
+.step-event-list {
+  display: grid;
+  gap: 5px;
+  max-height: 180px;
+  overflow-y: auto;
+  margin: 0;
+  padding: 0;
+  padding-right: 4px;
+  list-style: none;
+}
+
+.step-waiting-prompt {
+  margin: 0;
+  color: var(--ink);
+  font-size: 12px;
+  line-height: 1.45;
+}
+
+.step-event-card,
+.step-result,
+.step-result-list {
+  margin-bottom: 0;
+  color: var(--muted);
+  line-height: 1.5;
+}
+
+.step-event-card {
+  border-left: 2px solid #9ec9fb;
+  border-radius: 6px;
+  background: rgba(255, 255, 255, 0.72);
+  padding-left: 8px;
+}
+
+.step-event-card.tool_result,
+.step-event-card.tool_use {
+  border-left-color: var(--aliyun-blue);
+  background: rgba(22, 119, 255, 0.06);
+}
+
+.step-event-card.input_required {
+  border-left-color: var(--aliyun-orange);
+  background: rgba(255, 106, 0, 0.06);
+}
+
+.step-event-card.text_delta .step-event-title::after { /* 1px caret appended after the title of text_delta event cards */
+  content: "";
+  display: inline-block;
+  width: 1px;
+  height: 1em;
+  margin-left: 2px;
+  background: currentColor; /* caret takes the title's text color */
+  transform: translateY(2px);
+  animation: typingCaret 0.9s steps(1, end) infinite; /* stepped timing gives a hard on/off blink rather than a fade */
+}
+
+.step-event-label {
+  display: inline-flex;
+  margin-bottom: 3px;
+  color: var(--aliyun-blue);
+  font-size: 11px;
+  font-weight: 800;
+}
+
+.step-event-title {
+  margin-bottom: 4px;
+  color: var(--ink);
+  font-size: 12px;
+  font-weight: 700;
+  line-height: 1.45;
+}
+
+.step-event-meta,
+.step-result-list {
+  display: grid;
+  gap: 4px;
+  margin: 0;
+}
+
+.step-event-meta div,
+.step-result-list div {
+  display: grid;
+  grid-template-columns: auto minmax(0, 1fr);
+  gap: 4px;
+  min-width: 0;
+}
+
+.step-event-meta dt,
+.step-result-list dt {
+  color: var(--subtle);
+  font-weight: 700;
+}
+
+.step-event-meta dd,
+.step-result-list dd {
+  margin: 0;
+  color: var(--ink);
+  overflow-wrap: anywhere;
+}
+
+.step-candidate-progress-list {
+  display: grid;
+  gap: 6px;
+  margin: 0;
+}
+
+.step-candidate-progress {
+  display: grid;
+  gap: 3px;
+  border-left: 2px solid #9ec9fb;
+  border-radius: 6px;
+  background: rgba(255, 255, 255, 0.74);
+  padding: 8px 9px;
+}
+
+.step-candidate-progress-head {
+  display: flex;
+  align-items: baseline;
+  gap: 6px;
+  min-width: 0;
+}
+
+.step-candidate-progress strong {
+  color: var(--ink);
+  font-size: 12px;
+  white-space: nowrap;
+}
+
+.step-candidate-progress span {
+  color: var(--muted);
+  font-size: 12px;
+  min-width: 0;
+}
+
+.step-candidate-progress-head span {
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+
+.step-candidate-progress p {
+  margin: 0;
+  color: var(--ink);
+  font-size: 12px;
+  line-height: 1.45;
+  overflow-wrap: anywhere;
+}
+
+.step-result-options {
+  display: grid;
+  gap: 8px;
+}
+
+.step-result-option {
+  display: grid;
+  gap: 4px;
+  border: 1px solid #dbe6f5;
+  border-radius: 8px;
+  background: rgba(255, 255, 255, 0.72);
+  padding: 9px 10px;
+}
+
+.step-result-option strong {
+  color: var(--ink);
+  font-size: 12px;
+}
+
+.step-result-option span {
+  color: var(--muted);
+  font-size: 12px;
+}
+
+.step-result-option .price {
+  color: var(--aliyun-orange);
+  font-weight: 800;
+}
+
+.step-process {
+  display: grid;
+  gap: 6px;
+  border-top: 1px solid #edf2f7;
+  padding-top: 8px;
+}
+
+.step-process-head {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 8px;
+  color: var(--muted);
+  cursor: pointer;
+  font-size: 12px;
+  list-style: none;
+}
+
+.step-process-head::-webkit-details-marker {
+  display: none;
+}
+
+.step-process-head strong {
+  color: var(--aliyun-blue);
+  font-size: 12px;
+}
+
+.step-process-events {
+  margin-top: 6px;
+}
+
+.step-candidate-result-list {
+  display: grid;
+  gap: 8px;
+}
+
+.step-candidate-result {
+  display: grid;
+  gap: 6px;
+  border: 1px solid #dbe6f5;
+  border-radius: 8px;
+  background: rgba(255, 255, 255, 0.72);
+  padding: 8px 9px;
+}
+
+.step-candidate-result-head {
+  display: flex;
+  align-items: baseline;
+  gap: 8px;
+  min-width: 0;
+}
+
+.step-candidate-result-head strong {
+  color: var(--aliyun-blue);
+  font-size: 12px;
+  white-space: nowrap;
+}
+
+.step-candidate-result-head span {
+  min-width: 0;
+  color: var(--ink);
+  font-size: 12px;
+  font-weight: 800;
+}
+
+.step-candidate-result-summary {
+  margin: 0;
+  color: var(--muted);
+  font-size: 12px;
+  line-height: 1.45;
+}
+
+.step-candidate-result-label {
+  color: var(--aliyun-blue);
+  font-size: 11px;
+  font-weight: 800;
+}
+
+.step-candidate-result-template {
+  color: var(--subtle);
+  font-size: 12px;
+  line-height: 1.45;
+}
+
+.step-candidate-result-price {
+  color: var(--aliyun-orange);
+  font-size: 12px;
+  font-weight: 800;
+}
+
+.step-candidate-result-process {
+  display: grid;
+  gap: 6px;
+  border-top: 1px solid #edf2f7;
+  padding-top: 6px;
+}
+
+.step-candidate-result-process-body {
+  max-height: 180px;
+  overflow-y: auto;
+  padding-right: 4px;
+}
+
+.candidate-choice-list {
+  display: grid;
+  gap: 10px;
+}
+
+.pending-input-card {
+  display: grid;
+  gap: 10px;
+  border: 1px solid #ffd0a8;
+  border-radius: 8px;
+  background: #fffaf5;
+  padding: 12px;
+}
+
+.pending-input-card h2 {
+  margin: 0;
+  color: var(--aliyun-orange);
+  font-size: 13px;
+}
+
+.pending-input-prompt {
+  margin: 0;
+  color: var(--ink);
+  line-height: 1.55;
+}
+
+.pending-input-prompt p,
+.pending-input-option-description p {
+  margin: 0;
+}
+
+.pending-input-prompt ul,
+.pending-input-prompt ol,
+.pending-input-option-description ul,
+.pending-input-option-description ol {
+  display: grid;
+  gap: 2px;
+  margin: 4px 0 0;
+  padding-left: 18px;
+}
+
+.pending-input-prompt a,
+.pending-input-option-description a {
+  color: var(--aliyun-blue);
+  text-decoration: none;
+}
+
+.pending-input-prompt a:hover,
+.pending-input-option-description a:hover {
+  text-decoration: underline;
+}
+
+.pending-input-options {
+  display: grid;
+  gap: 8px;
+}
+
+.pending-input-option {
+  display: grid;
+  gap: 4px;
+  width: 100%;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: var(--white);
+  color: var(--ink);
+  padding: 10px 12px;
+  text-align: left;
+  line-height: 1.45;
+}
+
+.pending-input-option:hover,
+.pending-input-option.selected {
+  border-color: #9ec9fb;
+  background: var(--surface-blue);
+}
+
+.pending-input-option span {
+  color: var(--muted);
+  font-size: 12px;
+}
+
+.pending-input-option-description {
+  color: var(--muted);
+  font-size: 12px;
+}
+
+.template-popover-host {
+  position: relative;
+}
+
+.template-popover { /* dark overlay panel pinned 12px inside the left/right/bottom edges of its positioned ancestor */
+  position: absolute;
+  right: 12px;
+  bottom: 12px;
+  left: 12px;
+  z-index: 30;
+  display: grid;
+  gap: 8px;
+  max-height: 260px;
+  overflow-y: auto; /* content taller than 260px scrolls inside the popover */
+  pointer-events: auto;
+  visibility: hidden; /* resting state: hidden, fully transparent, nudged 4px down */
+  border: 1px solid #c7d7eb;
+  border-radius: 8px;
+  background: rgba(15, 23, 42, 0.96);
+  box-shadow: 0 14px 36px rgba(15, 23, 42, 0.22);
+  color: var(--white);
+  opacity: 0;
+  padding: 10px 12px;
+  transform: translateY(4px);
+  transition: opacity 140ms ease, transform 140ms ease, visibility 0ms linear 140ms; /* on hide, visibility flips only after the 140ms fade-out */
+  transition-delay: 0ms, 0ms, 140ms; /* repeats the delays already given in the shorthand above */
+}
+
+.template-popover-host:hover .template-popover,
+.template-popover-host:focus-within .template-popover,
+.template-popover:hover {
+  visibility: visible;
+  opacity: 1;
+  transform: translateY(0);
+  transition-delay: 500ms, 500ms, 500ms; /* the reveal starts 500ms after hover/focus begins */
+}
+
+.template-popover-title {
+  color: #dbeafe;
+  font-size: 12px;
+  font-weight: 800;
+}
+
+.template-popover pre {
+  margin: 0;
+  color: #f8fafc;
+  font-size: 11px;
+  line-height: 1.5;
+  overflow-wrap: anywhere;
+  white-space: pre-wrap;
+}
+
+.candidate-choice {
+  width: 100%;
+  min-width: 0;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: var(--white);
+  color: var(--ink);
+  padding: 12px 14px;
+  text-align: left;
+  line-height: 1.55;
+  overflow-wrap: anywhere;
+}
+
+.candidate-choice:hover,
+.candidate-choice.selected {
+  border-color: #9ec9fb;
+  background: var(--surface-blue);
+}
+
+.candidate-subpipeline {
+  display: grid;
+  gap: 8px;
+  margin-top: 12px;
+  border-top: 1px solid #edf2f7;
+  padding-top: 12px;
+}
+
+.candidate-subpipeline-head {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 10px;
+  color: var(--muted);
+  cursor: pointer;
+  font-size: 12px;
+  list-style: none;
+}
+
+.candidate-subpipeline-head::-webkit-details-marker {
+  display: none;
+}
+
+.candidate-subpipeline-head strong {
+  color: var(--aliyun-blue);
+  font-size: 12px;
+}
+
+.candidate-subpipeline-arrow {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 18px;
+  height: 18px;
+  border: 1px solid #c7d7eb;
+  border-radius: 999px;
+  color: var(--subtle);
+  flex: 0 0 auto;
+}
+
+.candidate-subpipeline-arrow::before {
+  content: "";
+  width: 5px;
+  height: 5px;
+  border-right: 1.5px solid currentColor;
+  border-bottom: 1.5px solid currentColor;
+  transform: rotate(45deg) translate(-1px, -1px);
+}
+
+.candidate-subpipeline[open] .candidate-subpipeline-arrow::before {
+  transform: rotate(225deg) translate(-1px, -1px);
+}
+
+.candidate-subpipeline-body {
+  max-height: 180px;
+  overflow-y: auto;
+  padding-right: 4px;
+}
+
+.candidate-substeps {
+  display: grid;
+  gap: 6px;
+}
+
+.candidate-substep {
+  display: grid;
+  gap: 6px;
+  border-radius: 7px;
+  background: rgba(255, 255, 255, 0.62);
+  padding: 7px 8px;
+}
+
+.candidate-substep-head {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 8px;
+  color: var(--muted);
+  cursor: pointer;
+  font-size: 12px;
+  list-style: none;
+}
+
+.candidate-substep-head::-webkit-details-marker {
+  display: none;
+}
+
+.candidate-substep-head strong {
+  color: var(--ink);
+  font-size: 12px;
+}
+
+.candidate-subpipeline-events {
+  display: grid;
+  gap: 6px;
+  margin: 0;
+  padding: 0;
+  list-style: none;
+}
+
+.candidate-subpipeline-event {
+  display: grid;
+  grid-template-columns: auto minmax(0, 1fr);
+  gap: 8px;
+  align-items: start;
+  border-left: 2px solid #9ec9fb;
+  padding-left: 8px;
+  color: var(--muted);
+  font-size: 12px;
+}
+
+.candidate-subpipeline-event p {
+  margin: 0;
+  color: var(--ink);
+  overflow-wrap: anywhere;
+}
+
+.candidate-subpipeline-label {
+  color: var(--subtle);
+  font-weight: 700;
+  white-space: nowrap;
+}
+
+.composer {
+  flex: 0 0 auto;
+  margin-top: auto;
+  padding: 6px 14px 10px;
+}
+
+.normal-handoff-message {
+  display: grid;
+  gap: 4px;
+  border: 1px solid #b7ead4;
+  border-radius: 8px;
+  background: #f2fbf7;
+  color: #12734d;
+  padding: 9px 10px;
+  font-size: 12px;
+  line-height: 1.45;
+}
+
+.normal-handoff-message strong {
+  font-weight: 800;
+}
+
+.normal-handoff-message p {
+  margin: 0;
+  color: #12734d;
+  font-size: 12px;
+  line-height: 1.45;
+}
+
+.normal-turn {
+  display: grid;
+  gap: 6px;
+  width: 100%;
+  border: 1px solid #cfe0f7;
+  border-radius: 8px;
+  background: #fbfdff;
+  padding: 8px 10px;
+  font-size: 12px;
+  line-height: 1.45;
+}
+
+.normal-turn.working {
+  border-color: #9ec9fb;
+  background: var(--surface-blue);
+}
+
+.normal-turn.failed,
+.normal-turn.error {
+  border-color: #f5b5ad;
+  background: #fff7f5;
+}
+
+.normal-process {
+  border: 0;
+  border-bottom: 1px solid #e3ebf6;
+  padding-bottom: 5px;
+}
+
+.normal-process-summary {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 8px;
+  color: var(--aliyun-blue);
+  font-size: 12px;
+  font-weight: 750;
+  line-height: 1.3;
+  list-style: none;
+  cursor: pointer;
+}
+
+.normal-process-summary::-webkit-details-marker {
+  display: none;
+}
+
+.normal-process-summary::after {
+  content: "⌄";
+  color: var(--subtle);
+  font-size: 12px;
+  transition: transform 0.16s ease;
+}
+
+.normal-process[open] .normal-process-summary::after {
+  transform: rotate(180deg);
+}
+
+.normal-process-count {
+  margin-left: auto;
+  color: var(--muted);
+  font-size: 11px;
+  font-weight: 650;
+}
+
+.normal-process-events {
+  display: grid;
+  gap: 5px;
+  max-height: 180px;
+  margin: 6px 0 0;
+  padding: 0;
+  overflow-y: auto;
+  list-style: none;
+}
+
+.normal-process-event {
+  display: grid;
+  grid-template-columns: auto minmax(0, 1fr);
+  gap: 7px;
+  align-items: start;
+  border-left: 2px solid #9ec9fb;
+  padding-left: 7px;
+  color: var(--muted);
+}
+
+.normal-process-event-label {
+  color: var(--subtle);
+  font-weight: 750;
+  white-space: nowrap;
+}
+
+.normal-process-event p {
+  margin: 0;
+  color: var(--ink);
+}
+
+.normal-answer {
+  margin: 0;
+  color: var(--ink);
+  font-size: 12px;
+  line-height: 1.5;
+}
+
+.composer-progress {
+  margin-bottom: 8px;
+  min-width: 0;
+}
+
+.composer-progress[hidden] {
+  display: none !important; /* must beat .composer-progress.chevrons { display: grid }: same specificity, declared later */
+}
+
+.composer-progress:not([hidden]) { /* visible progress bar: positioned box with a divider underneath */
+  position: relative;
+  margin-bottom: 8px; /* same value as the base .composer-progress rule */
+  border-bottom: 1px solid var(--line);
+  padding-bottom: 8px;
+}
+
+.progress-shell {
+  display: block;
+}
+
+.composer-progress .tip { /* hover tooltip; revealed by the :hover rules on .step / .signal-node / .fusion-step */
+  position: absolute;
+  z-index: 50; /* NOTE(review): .chevrons .step sets clip-path and .signal-circuit / .signal-node.active set overflow: hidden; a tip nested inside them may be clipped — confirm in the browser */
+  left: 50%;
+  top: calc(100% + 8px); /* 8px below the bottom edge of its containing block */
+  width: max-content;
+  max-width: 196px;
+  transform: translateX(-50%) translateY(-3px); /* centered horizontally; starts 3px high and settles to 0 on hover */
+  padding: 8px 10px;
+  border-radius: 8px;
+  background: #111827;
+  color: #f8fafc;
+  font-size: 10px;
+  font-weight: 500;
+  line-height: 1.45;
+  white-space: normal; /* lets the text wrap even where the host sets nowrap */
+  opacity: 0;
+  pointer-events: none; /* the tip itself never captures the pointer */
+  transition: opacity 0.15s ease, transform 0.15s ease;
+  box-shadow: 0 12px 28px rgba(15, 23, 42, 0.22);
+}
+
+.composer-progress .step:hover .tip,
+.composer-progress .signal-node:hover .tip,
+.composer-progress .fusion-step:hover .tip {
+  opacity: 1;
+  transform: translateX(-50%) translateY(0);
+}
+
+.composer-progress.chevrons {
+  display: grid;
+  grid-template-columns: repeat(5, minmax(0, 1fr));
+  height: 32px;
+  isolation: isolate;
+}
+
+.chevrons .step {
+  position: relative;
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  min-width: 0;
+  margin-left: -6px;
+  padding: 0 10px 0 14px;
+  clip-path: polygon(0 0, calc(100% - 8px) 0, 100% 50%, calc(100% - 8px) 100%, 0 100%, 8px 50%);
+  background: #edf2f7;
+  color: #405066;
+  font-size: 10px;
+  font-weight: 700;
+  line-height: 1.2;
+  white-space: nowrap;
+}
+
+.chevrons .step:first-child {
+  margin-left: 0;
+  border-radius: 7px 0 0 7px;
+  clip-path: polygon(0 0, calc(100% - 8px) 0, 100% 50%, calc(100% - 8px) 100%, 0 100%);
+}
+
+.chevrons .step:last-child {
+  border-radius: 0 7px 7px 0;
+}
+
+.chevrons .done {
+  background: #e9f7f1;
+  color: #14704d;
+}
+
+.chevrons .active {
+  z-index: 2;
+  background: linear-gradient(90deg, #1677ff, #28a4ff);
+  color: #fff;
+  box-shadow: 0 4px 11px rgba(22, 119, 255, 0.2);
+}
+
+.chevrons .active::after {
+  content: "";
+  position: absolute;
+  inset: 0;
+  background: linear-gradient(
+    110deg,
+    transparent 0%,
+    transparent 38%,
+    rgba(255, 255, 255, 0.5) 50%,
+    transparent 62%,
+    transparent 100%
+  );
+  animation: sweep var(--progress-a-sweep-ms, 1800ms) linear infinite;
+}
+
+.signal-circuit {
+  position: relative;
+  height: 50px;
+  padding: 2px 8px 0;
+  overflow: hidden;
+  --absorb-duration: 510ms;
+}
+
+.signal-svg {
+  position: absolute;
+  inset: 0 8px auto 8px;
+  width: calc(100% - 16px);
+  height: 36px;
+  overflow: visible;
+}
+
+.signal-active-base,
+.signal-moving-wave,
+.signal-rail,
+.signal-done {
+  fill: none;
+  stroke-linecap: round;
+  stroke-linejoin: round;
+  vector-effect: non-scaling-stroke;
+}
+
+.signal-rail {
+  stroke: #d5dfec;
+  stroke-width: 2px;
+}
+
+.signal-done {
+  stroke: var(--green);
+  stroke-width: 2px;
+}
+
+.signal-active-base {
+  stroke-width: 1.35px;
+}
+
+.signal-active-in {
+  stroke: rgba(22, 119, 255, 0.46);
+}
+
+.signal-active-out {
+  stroke: rgba(143, 155, 174, 0.6);
+}
+
+.signal-moving-wave {
+  stroke: var(--blue);
+  stroke-width: 1.2px;
+  opacity: 0.98;
+}
+
+.signal-node {
+  position: absolute;
+  top: 18px;
+  width: 12px;
+  height: 12px;
+  border: 2px solid #7cc8a6;
+  border-radius: 50%;
+  background: #fff;
+  transform: translate(-50%, -50%);
+  z-index: 2;
+}
+
+.signal-node.active {
+  width: 15px;
+  height: 15px;
+  border-color: var(--blue);
+  box-shadow: 0 0 0 3px #fff;
+  overflow: hidden;
+}
+
+.signal-absorb-halo {
+  position: absolute;
+  top: 18px;
+  width: 20px;
+  height: 20px;
+  transform: translate(-50%, -50%);
+  pointer-events: none;
+  z-index: 1;
+}
+
+.signal-absorb-halo::before {
+  content: "";
+  position: absolute;
+  inset: 0;
+  border-radius: 999px;
+  opacity: 0;
+  transform: scale(0.78);
+  transform-origin: center;
+  background: radial-gradient(circle, rgba(64, 217, 255, 0.34) 0 34%, rgba(22, 119, 255, 0.16) 52%, rgba(22, 119, 255, 0) 76%);
+  filter: blur(0.3px);
+}
+
+.signal-node-core {
+  position: absolute;
+  inset: 1.5px;
+  border-radius: 999px;
+  background: radial-gradient(
+    circle at 50% 48%,
+    rgba(255, 255, 255, 1) 0 12%,
+    rgba(110, 230, 255, 0.98) 30%,
+    rgba(22, 119, 255, 0.92) 68%,
+    rgba(22, 119, 255, 0.16) 100%
+  );
+  opacity: 0;
+  transform: scale(0.08);
+  transform-origin: center;
+  box-shadow: inset 0 0 3px rgba(255, 255, 255, 0.7), 0 0 10px rgba(22, 119, 255, 0.56);
+}
+
+.signal-node-charge {
+  position: absolute;
+  inset: 1.5px;
+  border-radius: 999px;
+  opacity: 0;
+  transform: scale(0.76) rotate(-90deg);
+  transform-origin: center;
+  background:
+    conic-gradient(
+      from 210deg,
+      rgba(22, 119, 255, 0) 0deg,
+      rgba(22, 119, 255, 0.22) 42deg,
+      rgba(64, 217, 255, 0.95) 86deg,
+      rgba(255, 255, 255, 0.98) 126deg,
+      rgba(22, 119, 255, 0.92) 178deg,
+      rgba(22, 119, 255, 0.16) 232deg,
+      rgba(22, 119, 255, 0) 300deg,
+      rgba(22, 119, 255, 0) 360deg
+    );
+  box-shadow: inset 0 0 5px rgba(255, 255, 255, 0.45), 0 0 7px rgba(22, 119, 255, 0.44);
+  filter: saturate(1.08);
+}
+
+.signal-circuit.absorbing .signal-absorb-halo::before {
+  animation: signalAbsorbGlow var(--absorb-duration) ease-out both;
+}
+
+.signal-circuit.absorbing .signal-node.active .signal-node-charge {
+  animation: signalNodeChargeRing var(--absorb-duration) cubic-bezier(0.18, 0.78, 0.24, 1) both;
+}
+
+.signal-circuit.absorbing .signal-node.active .signal-node-core {
+  animation: signalNodeInnerAbsorb var(--absorb-duration) ease-out both;
+}
+
+.signal-circuit.absorbing .signal-node.active {
+  animation: signalAbsorbCore var(--absorb-duration) ease-out both;
+}
+
+.signal-node.next,
+.signal-node.pending {
+  border-color: #b9c5d4;
+}
+
+.signal-labels {
+  position: absolute;
+  left: 0;
+  right: 0;
+  top: 32px;
+  color: #42526a;
+  font-size: 9px;
+  font-weight: 650;
+  text-align: center;
+  white-space: nowrap;
+}
+
+.signal-labels span {
+  position: absolute;
+  top: 0;
+  transform: translateX(-50%);
+}
+
+.signal-labels .active {
+  color: var(--blue);
+  font-weight: 760;
+}
+
+.fusion-label {
+  --fusion-green-end: 69.6%;
+  --fusion-blue-start: 69.6%;
+  --fusion-blue-end: 83.2%;
+  --fusion-sweep-duration: 1800ms;
+  position: relative;
+  display: grid;
+  grid-template-columns: 1fr;
+  align-items: center;
+  min-height: 36px;
+  padding: 5px 10px;
+  border: 1px solid transparent;
+  border-radius: 8px;
+  background:
+    linear-gradient(#fff, #fff) padding-box,
+    linear-gradient(
+      90deg,
+      #13a36f 0 var(--fusion-green-end),
+      #1677ff var(--fusion-blue-start) var(--fusion-blue-end),
+      #dce5f2 var(--fusion-blue-end) 100%
+    ) border-box;
+  box-shadow: inset 0 1px 0 rgba(22, 119, 255, 0.06);
+}
+
+.fusion-label::before { /* 2px highlight strip laid over the top edge of the label */
+  content: "";
+  position: absolute;
+  left: 0;
+  right: 0;
+  top: -1px;
+  height: 2px;
+  border-radius: 999px;
+  background:
+    linear-gradient(
+      90deg,
+      transparent 0%,
+      rgba(255, 255, 255, 0) 30%,
+      rgba(125, 185, 255, 0.34) 42%,
+      rgba(255, 255, 255, 0.96) 50%,
+      rgba(125, 185, 255, 0.32) 58%,
+      rgba(255, 255, 255, 0) 70%,
+      transparent 100%
+    );
+  background-position: -39.29% 0;
+  background-repeat: no-repeat;
+  background-size: 44% 100%;
+  filter: drop-shadow(0 0 2px rgba(22, 119, 255, 0.3));
+  pointer-events: none;
+  /* Single pass with fill-mode both. The former `infinite` in this shorthand was */
+  /* always overridden by the iteration-count longhand that followed it. */
+  animation: fusionBorderSweepSync var(--fusion-sweep-duration) linear 1 both;
+}
+
+.fusion-label.sweep-reset::before,
+.fusion-label.sweep-reset .fusion-step.active::after {
+  animation: none !important;
+}
+
+.fusion-label.sweep-reset::before {
+  background-position: -39.29% 0;
+  opacity: 0.96;
+}
+
+.fusion-label.sweep-reset .fusion-step.active::after {
+  background-position: 95.45% 0, 0 0;
+}
+
+.fusion-label.sweep-wait::before {
+  animation: none !important;
+  opacity: 0;
+}
+
+.fusion-label.sweep-wait .fusion-step.active::after {
+  animation: none !important;
+  background: var(--blue);
+}
+
+.fusion-steps {
+  display: grid;
+  grid-template-columns: repeat(5, minmax(0, 1fr));
+  gap: 4px;
+  min-width: 0;
+}
+
+.fusion-step {
+  position: relative;
+  min-width: 0;
+  padding-top: 1px;
+  color: #536175;
+  font-size: 9px;
+  font-weight: 650;
+  text-align: center;
+  white-space: nowrap;
+}
+
+.fusion-step .label {
+  display: block;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+
+.fusion-step::after {
+  content: "";
+  display: block;
+  height: 5px;
+  margin-top: 4px;
+  border-radius: 999px;
+  background: #e8edf5;
+}
+
+.fusion-step.done {
+  color: #14704d;
+}
+
+.fusion-step.done::after {
+  background: #97d8ba;
+}
+
+.fusion-step.active {
+  color: #0b62cf;
+  font-weight: 760;
+}
+
+.fusion-step.active::after { /* active bar: solid fill with a moving white glint layered on top */
+  background:
+    linear-gradient(100deg, transparent 0 32%, rgba(255, 255, 255, 0.7) 44%, rgba(255, 255, 255, 0.9) 50%, rgba(255, 255, 255, 0.4) 57%, transparent 68%),
+    var(--blue);
+  background-size: 210% 100%, 100% 100%;
+  background-position: 95.45% 0, 0 0;
+  background-repeat: no-repeat, no-repeat;
+  box-shadow: 0 0 0 2px rgba(22, 119, 255, 0.1);
+  /* Single pass with fill-mode both. The former `infinite` in this shorthand was */
+  /* always overridden by the iteration-count longhand that followed it. */
+  animation: fusionBarSweepSync var(--fusion-sweep-duration) linear 1 both;
+}
+
+@keyframes sweep { /* slides the element from one full width left of its box to one full width right */
+  0% { transform: translateX(-100%); }
+  100% { transform: translateX(100%); }
+}
+
+/* Caret blink: fully opaque through 49% of the cycle, */
+/* fully transparent from 50% to the end. */
+@keyframes typingCaret {
+  0%, 49% { opacity: 1; }
+  50%, 100% { opacity: 0; }
+}
+
+@keyframes fusionBarSweepSync { /* moves only the first (glint) background layer; the second layer stays at 0 0 */
+  0% { background-position: 95.45% 0, 0 0; }
+  100% { background-position: 4.55% 0, 0 0; }
+}
+
+@keyframes signalAbsorbGlow {
+  0% { opacity: 0; transform: scale(0.72); }
+  22% { opacity: 0.42; transform: scale(1); }
+  100% { opacity: 0; transform: scale(1.9); }
+}
+
+@keyframes signalNodeInnerAbsorb {
+  0% { opacity: 0; transform: scale(0.06); }
+  22% { opacity: 0.98; transform: scale(1.02); }
+  58% { opacity: 0.86; transform: scale(0.9); }
+  100% { opacity: 0; transform: scale(0.28); }
+}
+
+@keyframes signalNodeChargeRing {
+  0% { opacity: 0; transform: scale(0.72) rotate(-120deg); }
+  18% { opacity: 0.96; transform: scale(1) rotate(-20deg); }
+  58% { opacity: 0.82; transform: scale(1.02) rotate(140deg); }
+  100% { opacity: 0; transform: scale(0.74) rotate(255deg); }
+}
+
+@keyframes signalAbsorbCore {
+  0% { box-shadow: 0 0 0 3px #fff; }
+  30% { box-shadow: 0 0 0 3px #fff, 0 0 0 5px rgba(22, 119, 255, 0.2), 0 0 14px rgba(22, 119, 255, 0.56); }
+  100% { box-shadow: 0 0 0 3px #fff; }
+}
+
+@keyframes fusionBorderSweepSync { /* shifts the highlight's background-position across the strip at constant opacity */
+  from { opacity: 0.96; background-position: -39.29% 0; }
+  to { opacity: 0.96; background-position: 139.29% 0; }
+}
+
+#composer-input { /* borderless, transparent, non-resizable text field */
+  width: 100%;
+  min-height: 40px;
+  resize: none;
+  border: 0;
+  border-radius: 0;
+  outline: 0; /* NOTE(review): removes the native focus outline; presumably .composer-box:focus-within supplies the visible focus ring — confirm in the markup */
+  background: transparent;
+  color: var(--ink);
+  padding: 0;
+  line-height: 1.45;
+}
+
+#composer-input:focus {
+  box-shadow: none; /* no focus shadow on the field itself */
+}
+
+.composer-box {
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: #fbfdff;
+  padding: 10px 10px 9px;
+}
+
+.composer-box:focus-within {
+  border-color: var(--aliyun-blue);
+  box-shadow: 0 0 0 3px rgba(22, 119, 255, 0.1);
+}
+
+.composer-toolbar {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 10px;
+  margin-top: 8px;
+}
+
+.composer-tools,
+.composer-actions {
+  display: flex;
+  align-items: center;
+  gap: 10px;
+}
+
+.primary-button,
+.secondary-button {
+  min-height: 36px;
+  border-radius: 8px;
+  padding: 0 16px;
+  font-weight: 700;
+}
+
+.primary-button {
+  border: 1px solid var(--aliyun-orange);
+  background: var(--aliyun-orange);
+  color: var(--white);
+}
+
+.secondary-button {
+  border: 1px solid var(--line);
+  background: var(--white);
+  color: var(--ink);
+}
+
+.secondary-button:hover {
+  border-color: #9ec9fb;
+  color: var(--aliyun-blue);
+}
+
+.composer .compact-button {
+  min-height: 32px;
+  padding: 0 12px;
+  border-radius: 6px;
+  font-size: 13px;
+}
+
+/* Square, chrome-less 32px button that centers a single icon child. */
+/* Previously split across two adjacent .icon-only-button rules with no */
+/* conflicting declarations; merged here with identical computed values. */
+.icon-only-button {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 32px;
+  height: 32px;
+  min-height: 32px;
+  border: 0;
+  background: transparent;
+  color: var(--ink);
+  padding: 0;
+}
+
+.send-icon-button {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 36px;
+  height: 36px;
+  min-height: 36px;
+  border-radius: 8px;
+  padding: 0;
+}
+
+.composer-divider {
+  width: 1px;
+  height: 24px;
+  background: var(--line);
+}
+
+.attachment-icon {
+  position: relative;
+  width: 15px;
+  height: 20px;
+  transform: rotate(42deg);
+}
+
+.attachment-icon::before,
+.attachment-icon::after {
+  content: "";
+  position: absolute;
+  border: 2px solid currentColor;
+  border-bottom: 0;
+  border-radius: 999px 999px 0 0;
+}
+
+.attachment-icon::before {
+  inset: 1px 2px 6px;
+}
+
+.attachment-icon::after {
+  inset: 5px 5px 8px;
+}
+
+.send-icon {
+  position: relative;
+  width: 15px;
+  height: 15px;
+}
+
+.send-icon::before {
+  content: "";
+  position: absolute;
+  inset: 2px 1px 1px 2px;
+  border-top: 3px solid var(--white);
+  border-right: 3px solid var(--white);
+  transform: rotate(45deg);
+}
+
+.send-icon::after {
+  content: "";
+  position: absolute;
+  left: 2px;
+  top: 7px;
+  width: 12px;
+  height: 3px;
+  border-radius: 999px;
+  background: var(--white);
+  transform: rotate(-25deg);
+}
+
+.ai-disclaimer {
+  margin: 8px 0 0;
+  color: var(--subtle);
+  font-size: 12px;
+}
+
+.plan-area {
+  display: flex;
+  flex-direction: column;
+  min-height: calc(100vh - 96px);
+}
+
+.connection-controls {
+  display: grid;
+  grid-template-columns: minmax(0, 1fr) minmax(0, 1fr);
+  align-items: start;
+  gap: 10px;
+  width: 100%;
+}
+
+.connection-controls label {
+  display: grid;
+  gap: 6px;
+  color: var(--muted);
+  font-size: 12px;
+}
+
+.connection-controls input {
+  width: 100%;
+  height: 36px;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  outline: 0;
+  padding: 0 10px;
+  color: var(--ink);
+}
+
+.connection-controls input:focus-visible {
+  border-color: var(--aliyun-blue);
+  box-shadow: 0 0 0 3px rgba(22, 119, 255, 0.12);
+}
+
+.connection-actions {
+  display: flex;
+  flex-wrap: wrap;
+  grid-column: 1 / -1;
+  justify-content: flex-end;
+  gap: 10px;
+}
+
+.danger-button {
+  color: #b42318;
+}
+
+.plans-grid {
+  display: grid;
+  align-items: start;
+  grid-template-columns: repeat(2, minmax(0, 1fr));
+  gap: 12px;
+  min-width: 0;
+  padding: 16px;
+}
+
+.plan-card {
+  display: flex;
+  flex-direction: column;
+  min-width: 0;
+  min-height: 248px;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: var(--white);
+  padding: 16px;
+}
+
+.plan-card.recommended {
+  border-color: #9ec9fb;
+}
+
+.plan-card.selected {
+  border-color: var(--aliyun-blue);
+  background: var(--surface-blue);
+  box-shadow: 0 0 0 2px rgba(22, 119, 255, 0.14);
+}
+
+.plan-card-header {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  gap: 12px;
+  margin-bottom: 14px;
+}
+
+.plan-card-header-meta {
+  display: flex;
+  align-items: center;
+  justify-content: flex-end;
+  gap: 8px;
+  min-width: 0;
+}
+
+.tag {
+  border-radius: 14px;
+  background: #fff3eb;
+  color: var(--aliyun-orange);
+  padding: 4px 10px;
+  font-size: 12px;
+  font-weight: 700;
+}
+
+.tag.muted {
+  background: #eef2f6;
+  color: var(--muted);
+}
+
+.score {
+  color: var(--success);
+  font-size: 12px;
+  font-weight: 700;
+}
+
+.plan-status {
+  border-radius: 999px;
+  padding: 3px 8px;
+  font-size: 11px;
+  font-weight: 700;
+  white-space: nowrap;
+}
+
+.plan-status.working {
+  background: #eaf3ff;
+  color: var(--aliyun-blue);
+}
+
+.plan-status.completed {
+  background: #e9f8f1;
+  color: var(--success);
+}
+
+.plan-status.failed {
+  background: #fff1f0;
+  color: #b42318;
+}
+
+.plan-card h2 {
+  margin-bottom: 10px;
+  font-size: 18px;
+}
+
+.plan-card p {
+  margin-bottom: 18px;
+  color: var(--muted);
+  line-height: 1.6;
+}
+
+.price {
+  display: grid;
+  gap: 4px;
+  margin-top: auto;
+  color: var(--aliyun-orange);
+}
+
+.price-label {
+  color: var(--muted-light);
+  font-size: 12px;
+  font-weight: 700;
+}
+
+.price strong {
+  color: var(--aliyun-orange);
+  font-size: 24px;
+  font-weight: 800;
+}
+
+.plan-meta {
+  display: grid;
+  grid-template-columns: repeat(2, 1fr);
+  gap: 10px;
+  margin: 16px 0 0;
+}
+
+.plan-meta div {
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: #fbfdff;
+  padding: 10px;
+}
+
+.plan-meta dt {
+  color: var(--subtle);
+  font-size: 12px;
+}
+
+.plan-meta dd {
+  margin: 4px 0 0;
+  color: var(--ink);
+  font-weight: 700;
+}
+
+.debug-drawer {
+  margin: auto 16px 16px;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: #fbfdff;
+}
+
+.debug-drawer summary {
+  padding: 12px 14px;
+  color: var(--muted);
+  font-weight: 700;
+}
+
+.debug-panel {
+  display: grid;
+  gap: 14px;
+  border-top: 1px solid var(--line);
+  padding: 14px;
+}
+
+.debug-session-info {
+  display: grid;
+  grid-template-columns: repeat(3, minmax(0, 1fr));
+  gap: 8px;
+  border: 1px solid #e0e7f2;
+  border-radius: 8px;
+  background: var(--white);
+  padding: 10px;
+}
+
+.debug-session-field {
+  display: grid;
+  gap: 3px;
+  min-width: 0;
+}
+
+.debug-session-field span {
+  color: var(--subtle);
+  font-size: 10px;
+  font-weight: 700;
+}
+
+.debug-session-field code {
+  overflow: hidden;
+  color: var(--ink);
+  font-family: inherit;
+  font-size: 11px;
+  font-weight: 700;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+
+.progress-debug-panel {
+  display: grid;
+  gap: 12px;
+}
+
+.progress-debug-title {
+  display: flex;
+  align-items: baseline;
+  justify-content: space-between;
+  gap: 12px;
+}
+
+.progress-debug-title strong {
+  font-size: 13px;
+}
+
+.progress-debug-title span {
+  color: var(--subtle);
+  font-size: 12px;
+}
+
+.progress-variant-switch {
+  display: grid;
+  grid-template-columns: repeat(3, minmax(0, 1fr));
+  gap: 8px;
+}
+
+.progress-variant-switch button {
+  min-width: 0;
+  min-height: 32px;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: var(--white);
+  color: var(--muted);
+  font-size: 12px;
+  font-weight: 700;
+}
+
+.progress-variant-switch button.selected {
+  border-color: #8fc2ff;
+  background: var(--surface-blue);
+  color: var(--aliyun-blue);
+}
+
+.progress-param-grid {
+  display: grid;
+  grid-template-columns: repeat(2, minmax(0, 1fr));
+  gap: 10px 12px;
+}
+
+.progress-param-grid[hidden] {
+  display: none;
+}
+
+.progress-param {
+  display: grid;
+  gap: 6px;
+  min-width: 0;
+}
+
+.progress-param-head {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 8px;
+  color: #46566b;
+  font-size: 12px;
+  font-weight: 700;
+}
+
+.progress-param output {
+  color: var(--aliyun-blue);
+  font-variant-numeric: tabular-nums;
+}
+
+.progress-param input[type="range"] {
+  width: 100%;
+  accent-color: var(--aliyun-blue);
+}
+
+.step-switch {
+  display: grid;
+  grid-template-columns: repeat(5, minmax(0, 1fr));
+  gap: 5px;
+  margin-top: 6px;
+}
+
+.step-switch button {
+  height: 22px;
+  border: 1px solid #cbd8e8;
+  border-radius: 6px;
+  background: #fff;
+  color: #475569;
+  font-size: 9px;
+  font-weight: 720;
+  cursor: pointer;
+}
+
+.step-switch button.active {
+  border-color: rgba(22, 119, 255, 0.72);
+  background: rgba(22, 119, 255, 0.1);
+  color: var(--blue); /* NOTE(review): other rules in this sheet use --aliyun-blue; confirm --blue is defined */
+}
+
+.progress-demo-step-control {
+  margin-top: 0;
+  padding: 7px 8px;
+  padding-top: 10px;
+  border-top: 2px solid rgba(22, 119, 255, 0.78);
+  border-right: 1px solid #e0e7f2;
+  border-bottom: 1px solid #e0e7f2;
+  border-left: 1px solid #e0e7f2;
+  border-radius: 8px;
+  background: #fbfdff;
+}
+
+.progress-demo-step-control label {
+  display: flex;
+  justify-content: space-between;
+  gap: 6px;
+  color: #475569;
+  font-size: 12px;
+  font-weight: 650;
+  line-height: 1.2;
+}
+
+.progress-demo-step-control output {
+  color: var(--blue); /* NOTE(review): other rules in this sheet use --aliyun-blue; confirm --blue is defined */
+  font-weight: 760;
+}
+
+.debug-output-block {
+  display: grid;
+  gap: 8px;
+}
+
+.debug-output-block summary {
+  cursor: pointer;
+  color: var(--muted);
+  font-size: 12px;
+  font-weight: 700;
+  line-height: 1.35;
+}
+
+.debug-drawer pre {
+  margin: 0;
+  border: 1px solid var(--line);
+  border-radius: 8px;
+  background: var(--white);
+  color: var(--muted);
+  overflow: auto;
+  padding: 14px;
+}
+
+.utility-rail {
+  padding-top: 8px;
+}
+
+.utility-rail button {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 42px;
+  height: 42px;
+  border: 1px solid var(--line);
+  border-radius: 50%;
+  background: var(--white);
+  color: var(--muted);
+  box-shadow: 0 4px 12px rgba(31, 41, 55, 0.06);
+}
+
+.utility-rail button:hover {
+  border-color: #9ec9fb;
+  color: var(--aliyun-blue);
+}
+
+@media (max-width: 1180px) {
+  .topbar-links {
+    display: none;
+  }
+
+  .console-shell {
+    grid-template-columns: minmax(240px, 347px) minmax(0, 1fr);
+  }
+
+  .utility-rail {
+    display: none;
+  }
+}
+
+@media (max-width: 980px) {
+  .topbar {
+    flex-wrap: wrap;
+    height: auto;
+    min-height: 64px;
+    padding: 12px 16px;
+  }
+
+  .brand {
+    min-width: 170px;
+  }
+
+  .topbar-search {
+    order: 10;
+    width: 100%;
+    max-width: none;
+  }
+
+  .topbar-nav {
+    display: none;
+  }
+
+  .console-shell {
+    grid-template-columns: 1fr;
+    height: auto;
+    min-height: calc(100vh - 64px);
+    padding: 12px;
+  }
+
+  .workflow-panel,
+  .plan-area {
+    height: auto;
+    min-height: auto;
+  }
+
+  .panel-heading,
+  .plan-header {
+    flex-direction: column;
+  }
+
+  .connection-controls,
+  .plans-grid {
+    grid-template-columns: 1fr;
+  }
+
+  .composer-progress {
+    grid-template-columns: repeat(5, minmax(48px, 1fr));
+    overflow-x: auto;
+  }
+
+  .connection-actions {
+    justify-content: stretch;
+  }
+
+  .connection-actions .secondary-button {
+    flex: 1 1 140px;
+  }
+}
+
+@media (max-width: 560px) {
+  .topbar {
+    gap: 10px;
+  }
+
+  .user-summary {
+    width: 100%;
+    justify-content: space-between;
+  }
+
+  .composer-toolbar,
+  .composer-actions {
+    align-items: stretch; /* NOTE(review): overridden by the later rule with the same selectors in this media query */
+    flex-direction: column; /* likewise overridden (row wins), so this rule currently has no effect */
+  }
+
+  .primary-button,
+  .secondary-button {
+    width: 100%;
+  }
+
+  .composer-toolbar,
+  .composer-actions {
+    align-items: center;
+    flex-direction: row;
+  }
+
+  .composer .secondary-button {
+    width: auto;
+  }
+
+  .composer .send-icon-button {
+    width: 36px;
+  }
+
+  .composer .icon-only-button {
+    width: 32px;
+  }
+
+  .plan-meta {
+    grid-template-columns: 1fr;
+  }
+}
diff --git a/scripts/repl/e2e/README.md b/scripts/repl/e2e/README.md
new file mode 100644
index 00000000..439e5481
--- /dev/null
+++ b/scripts/repl/e2e/README.md
@@ -0,0 +1,19 @@
+# REPL Pipeline E2E Runner
+
+This directory contains real terminal end-to-end helpers for pipeline behavior. The runner drives the REPL through a real PTY and is POSIX-only because it uses `pexpect`.
+
+Run from the repository root:
+
+```bash
+uv run python scripts/repl/e2e/run_pipeline_scenarios.py --help
+```
+
+By default, run artifacts are written under the system temporary directory, in:
+
+```text
+iac-code-repl-e2e-runs/<scenario>/<timestamp>-<pid>-<id>/
+```
+
+Use `--run-dir` to choose a fixed collection directory for local debugging or CI smoke artifacts.
+
+The runner is for manual or smoke validation only. It calls the developer's configured LLM provider and may call real Alibaba Cloud tools when `--allow-real-cloud` is enabled. Automated unit tests must not depend on real LLMs or real cloud credentials, so pytest coverage for this directory is limited to pure helpers and argument behavior.
diff --git a/scripts/repl/e2e/README.zh-CN.md b/scripts/repl/e2e/README.zh-CN.md
new file mode 100644
index 00000000..16378b75
--- /dev/null
+++ b/scripts/repl/e2e/README.zh-CN.md
@@ -0,0 +1,150 @@
+# REPL Pipeline E2E
+
+本目录包含通过真实交互式终端回归 pipeline 功能的脚本。它和
+`scripts/a2a/e2e/run_recovery_scenarios.py` 目标相同，都是回归 pipeline；区别是这里走真实
+REPL / PTY 入口，而 A2A runner 走 JSON-RPC / SSE 入口。
+
+## 重要说明
+
+- 默认使用当前用户真实 `~/.iac-code` 配置。
+- 会调用真实 LLM provider。
+- 带 `--allow-real-cloud` 的 pipeline 场景可能调用真实阿里云工具和凭证。
+- 不属于普通 `make test`，也不会在 pytest 中执行真实场景。
+- 该 runner 通过 `pexpect` 使用真实 PTY，仅支持 POSIX 环境；Windows 会提前报错，不作为本脚本支持目标。
+
+## 快速开始
+
+```bash
+PATH="$HOME/.local/bin:$PATH" \
+uv run python scripts/repl/e2e/run_pipeline_scenarios.py \
+  --allow-real-cloud \
+  --scenario scenario1
+```
+
+指定 provider/model 但不写入 `settings.yml`：
+
+```bash
+PATH="$HOME/.local/bin:$PATH" \
+uv run python scripts/repl/e2e/run_pipeline_scenarios.py \
+  --allow-real-cloud \
+  --provider dashscope \
+  --model qwen3.6-plus \
+  --scenario scenario1
+```
+
+## 场景
+
+| 场景 | 覆盖 |
+| --- | --- |
+| `scenario1` | 通过 REPL 完成 VSwitch pipeline、候选方案选择、handoff normal chat |
+| `ask-waiting` | 通过 REPL 回复澄清问题后继续 pipeline，并完成 VSwitch 创建 |
+| `ask-waiting-resume` | ask user question 等待时杀进程，重启后重放问题并继续 |
+| `image-initial` | 首轮用户输入通过 bracketed paste 粘贴静态 `initial.png` 图片，随后选择候选并完成 VSwitch 创建 |
+| `image-ask-waiting-resume` | ask user question 等待时杀进程，`--continue` 恢复后通过静态图片回答澄清问题并继续 |
+| `image-selection-waiting-resume` | 首轮图片启动 pipeline，candidate selection 等待时杀进程，重启后恢复选择 UI 并继续 |
+| `image-normal-handoff` | pipeline handoff 到 normal chat 后，通过静态图片追问“你刚才创建了什么” |
+| `image-interrupt` | evaluate candidates 阶段发送 Esc 后，通过静态图片输入回退到安全组的 interrupt 指令 |
+| `selection-waiting-resume` | candidate selection 等待时杀进程，重启后恢复选择 UI 并继续 |
+| `selection-invalid-then-valid` | candidate selection 中先发送无效选择，再发送有效选择并完成 |
+| `evaluate-resume` | evaluate candidates 阶段杀进程，重启后重放中断点，发送 `continue` 后继续到选择并完成 |
+| `rollback-step2` | architecture planning 中发送 Esc 和回退指令，验证 streaming interrupt 路径 |
+| `rollback-step3` | pipeline 中发送 Esc 和回退指令，验证 REPL hard interrupt 路径 |
+| `rollback-step4-selection` | candidate selection 中发送 Esc 和回退指令，验证 selection tabs interrupt 路径 |
+| `rollback-step5-cleanup` | deploying 创建真实 ROS stack 后回退，验证旧 stack 被 cleanup 删除、新 stack 保留 |
+| `rollback-step5-cleanup-recovery` | cleanup 删除中杀进程，`--continue` 恢复后验证 cleanup 重新触发并完成 |
+
+## 验收标准
+
+脚本的通过条件不是“进程退出 0”或“某个 regex 被等到”本身，而是 `summary.json` 里的所有
+`checks` 都为 `true`。其中 `acceptance:` 前缀的检查项来自 PTY transcript，是回归验收标准：
+
+- 通用：必须捕获到 PTY transcript，且 transcript 中不能出现 traceback、pexpect EOF/TIMEOUT、权限拒绝等终端错误。
+- `scenario1`：必须展示 candidate selection，完成 pipeline，并在 PTY transcript 中出现 VSwitch 证据（例如 `VSwitchId`、`vsw-...` 或交换机 ID）；进入 normal chat 后，`你刚才创建了什么` 的回答必须提到 VSwitch/交换机，不能只验证“有输出”。
+- `ask-waiting`：必须展示真实 `Ask user question`，回答澄清问题后如果进入 candidate selection，必须继续选择候选并完成 pipeline；最终 PTY transcript 必须出现 VSwitch 证据。
+- `ask-waiting-resume`：必须在 `--continue` 后重放 `Ask user question`；回答后如果进入 candidate selection，必须继续选择候选并完成 pipeline；最终 PTY transcript 必须出现 VSwitch 证据。
+- `image-initial`：必须记录 `initial` 静态图片 fixture 的 paste 事件；图片输入必须启动 pipeline、展示 candidate selection、完成 pipeline，并出现 VSwitch 证据。
+- `image-ask-waiting-resume`：必须在 `--continue` 后重放 `Ask user question`；恢复后的回答必须通过 `ask-first-answer` 静态图片 fixture 输入；如果模型继续追问，runner 会再用 `ask-second-answer` 静态图片回答；最终必须继续到 candidate selection 或 pipeline completed，并出现 VSwitch 证据。
+- `image-selection-waiting-resume`：必须记录 `initial` 静态图片 fixture 的 paste 事件；candidate selection 必须在 `--continue` 后重放；随后通过真实候选 UI 数字键选择并完成 pipeline，最终出现 VSwitch 证据。
+- `image-normal-handoff`：必须完成 pipeline handoff normal chat；normal follow-up 必须通过 `normal-followup` 静态图片 fixture 输入，且回答必须提到 VSwitch/交换机。
+- `image-interrupt`：必须先到达 `Evaluate candidates (3/5)`；发送 Esc 进入 interrupt 输入后，必须通过 `rollback-interrupt` 静态图片 fixture 输入；图片 interrupt 之后必须看到新的 pipeline 进展，回退后的输出必须指向安全组目标且不能指向 VSwitch。
+- `selection-waiting-resume`：必须在 `--continue` 后重放 candidate selection，最终完成 pipeline，并出现 VSwitch 证据。
+- `selection-invalid-then-valid`：必须记录无效选择输入，然后记录有效选择输入，最终完成 pipeline，并出现 VSwitch 证据。
+- `evaluate-resume`：必须先到达 `Evaluate candidates (3/5)`，使用 `--continue` 恢复并重放该步骤；恢复后的普通 REPL prompt ready 后发送 `continue`，随后必须继续到 candidate selection 或 pipeline completed；最终 PTY transcript 必须出现 VSwitch 证据。
+- `rollback-step2`：必须先到达 `Architecture planning (2/5)`；发送回退指令之后必须看到新的 pipeline 进展；回退后的输出必须指向安全组目标，且不能把用户输入 echo 里的“安全组”当作通过证据。
+- `rollback-step3`：必须先到达 `Evaluate candidates (3/5)`；step3 的 parallel tabs 中断输入不要求 transcript 出现普通 `✎` prompt；发送回退指令之后必须看到新的 pipeline 进展（例如新的 `Intent parsing (1/5)`），不能用用户输入 echo 里的“回退”当作通过证据；回退后的输出必须指向安全组目标，且不能指向 VSwitch。
+- `rollback-step4-selection`：必须先到达 `Confirm and select (4/5)`；selection tabs 中断输入同样不要求 transcript 出现普通 `✎` prompt；发送回退指令之后必须看到新的 pipeline 进展；回退后的输出必须指向安全组目标，且不能指向 VSwitch。
+- `rollback-step5-cleanup`：必须到达 deploying 并观察到第一次 CreateStack；回退后 `cleanup.yaml` 必须把第一次 stack 记录为 cleanup target；第二次部署必须创建不同 stack；normal chat 前置 cleanup 必须完成；ROS GetStack 必须确认第一次 stack 已删除，第二次 stack 仍保留。
+- `rollback-step5-cleanup-recovery`：在 `rollback-step5-cleanup` 的基础上，cleanup 开始后必须杀掉 REPL 子进程，随后用 `--continue` 恢复；恢复后必须重新触发 cleanup 并完成；ROS GetStack 同样必须确认旧 stack 删除、新 stack 保留。
+
+会创建资源的非 cleanup 场景还必须在当前 REPL session 的 `pipeline/cleanup.yaml` 中观察到 ROS
+`CreateStack` 资源，且 StackName 必须是 runner 为当前场景注入的 `iac-e2e-*` test-owned 名称；
+teardown 前会通过 ROS GetStack 确认这些 stack 仍存在。场景结束后，runner 会自动删除这些
+observed stack；删除前会再次校验云端 StackName 必须等于 ledger 记录的 test-owned StackName，
+避免误删非本轮测试资源。
+
+`rollback-step3` 和 `rollback-step4-selection` 会在发送 Esc 后等待第二个 raw-input ready 控制序列，再输入回退指令；这对应 tabs UI 切入中断文本输入行之后的真实 PTY 状态。
+
+`rollback-step5-cleanup*` 的通过条件不只看 PTY 文本，还会读取同一个 REPL session 下的
+`pipeline/cleanup.yaml`，并在最后写出 `acceptance-after-cleanup.ros-stack-states.json` 作为真实 ROS
+状态快照。这样可以避免“终端看起来清理了，但 ledger 或云端状态不对”的假阳性。
+
+pipeline completed 的匹配必须是终态证据，例如 `Pipeline completed`、`CREATE_COMPLETE`、`部署成功` 或
+`Stack ID`；候选方案里的 `Completed` 或“参数选择完成”不能作为通过证据。
+
+## 图片场景输入方式
+
+REPL image 场景复用 `scripts/a2a/e2e/fixtures/text-images/` 下的静态 PNG fixture，避免每次运行时重新
+生成图片。runner 不依赖系统剪贴板，而是通过 PTY 发送 bracketed paste 序列：
+
+```text
+ESC [ 200 ~ <absolute image path> ESC [ 201 ~
+```
+
+REPL 会把这个路径交给普通模式相同的 bracketed-paste 处理逻辑，解析图片文件、持久化到 image cache，
+并在 prompt 中插入 `[Image #N]`。因此这些场景验证的是真实 REPL 图片入口，而不是测试脚本直接构造
+`ImageBlock`。
+
+## 产物
+
+默认写入系统临时目录下的 `iac-code-repl-e2e-runs/<scenario>/<timestamp>-<pid>-<id>/`：
+
+- `summary.json`：场景结果、检查点、耗时、失败原因。
+- `events.jsonl`：spawn/send/expect/terminate 等黑盒终端事件。
+- `child.env.json`：子进程环境摘要，敏感值会被脱敏。
+- `transcript.raw.log`：脱敏后的原始终端 transcript。
+- `transcript.normalized.log`：去 ANSI/control 字符后的 transcript，便于 diff 和排查。
+- `acceptance-after-cleanup.ros-stack-states.json`：cleanup 场景的 ROS GetStack 快照，敏感值会被脱敏。
+
+使用固定目录便于 CI 或本地脚本收集：
+
+```bash
+PATH="$HOME/.local/bin:$PATH" \
+uv run python scripts/repl/e2e/run_pipeline_scenarios.py \
+  --allow-real-cloud \
+  --scenario selection-waiting-resume \
+  --run-dir "$(python - <<'PY'
+import tempfile
+from pathlib import Path
+print(Path(tempfile.gettempdir()) / 'iac-code-repl-e2e-selection')
+PY
+)"
+```
+
+## 常用参数
+
+- `--scenario` 可重复传入；默认只跑 `scenario1`。
+- `--cwd` 指定 REPL 子进程工作目录；默认使用 run dir 下的 `workspace/`。
+- `--timeout` 控制普通终端等待。
+- `--stream-timeout` 控制 LLM/pipeline 长等待。
+- `--selection-prompt` 指定候选方案选择输入；默认发送 `1` 选择第一个候选；传空字符串时直接回车确认。
+- `--evaluate-resume-continue-prompt` 指定 `evaluate-resume` 在 `--continue` 重放后用于继续 running sidecar 的输入；默认 `continue`。
+- `--cleanup-continue-prompt` 指定 `rollback-step5-cleanup-recovery` 在 `--continue` 恢复后用于继续 cleanup 的输入；默认只允许删除待清理列表中的 stack，避免误删其他资源。
+- `--permission-prompt-response` 指定工具权限确认菜单的输入；默认 `pageup-enter`（发送 PageUp+Enter，选择第一项 `Yes, allow once`）。
+- `--skip-final-teardown` 调试时跳过测试创建 stack 的最终删除；日常回归不要开启。
+- `--leave-running` 调试时保留子进程，不自动 terminate。
+
+## 与 pytest 的关系
+
+`tests/repl_e2e/test_run_pipeline_scenarios.py` 只覆盖脚本的纯 helper、参数校验、脱敏、dispatch
+流程，不会启动真实 REPL，也不会调用真实 LLM 或云账号。真实回归必须显式运行本目录脚本，并带上
+`--allow-real-cloud`。
diff --git a/scripts/repl/e2e/run_pipeline_scenarios.py b/scripts/repl/e2e/run_pipeline_scenarios.py
new file mode 100644
index 00000000..b1a59b98
--- /dev/null
+++ b/scripts/repl/e2e/run_pipeline_scenarios.py
@@ -0,0 +1,2672 @@
+#!/usr/bin/env python3
+"""Run real interactive REPL pipeline E2E scenarios.
+
+This runner intentionally drives the public terminal interface through a PTY.
+It uses the user's real configuration by default and must not be imported by
+ordinary package code.
+"""
+
+from __future__ import annotations
+
+import argparse
+import asyncio
+import ipaddress
+import json
+import os
+import re
+import shlex
+import signal
+import tempfile
+import time
+import uuid
+from collections.abc import Callable, Iterable
+from dataclasses import asdict, dataclass, field
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Any
+
+try:
+    import pexpect
+except ImportError:  # pragma: no cover - exercised manually when dependency missing
+    pexpect = None  # type: ignore[assignment]
+
+try:
+    import yaml
+except ImportError:  # pragma: no cover - PyYAML is part of the project runtime
+    yaml = None  # type: ignore[assignment]
+
+
+RUN_LOG_ROOT_NAME = "iac-code-repl-e2e-runs"  # default --run-root is <system temp dir>/<this name>
+PTY_SEND_CHUNK_SIZE = 512  # text longer than this many characters is sent to the PTY in slices
+PTY_SEND_CHUNK_DELAY_SECONDS = 0.01  # pause after each slice in _sendline_to_child
+TEXT_IMAGE_FIXTURE_ROOT = Path(__file__).resolve().parents[2] / "a2a" / "e2e" / "fixtures" / "text-images"
+TEXT_IMAGE_FIXTURE_FILENAMES = {  # fixture key -> PNG file name
+    "initial": "initial.png",
+    "selection": "selection.png",
+    "normal-followup": "normal-followup.png",
+    "ask-first-answer": "ask-first-answer.png",
+    "ask-second-answer": "ask-second-answer.png",
+    "rollback-interrupt": "rollback-interrupt.png",
+}
+DEFAULT_INITIAL_PROMPT = "选择一个已有vpc，创建一个vswitch"
+DEFAULT_SELECTION_PROMPT = "1"  # default of --selection-prompt
+DEFAULT_ASK_PROMPT = "我有个产品要上线"
+DEFAULT_ASK_ANSWER = "我要创建云网络资源；本次只选择已有 VPC 创建一个 VSwitch，不部署 ECS、EIP、SLB 或 Nginx。"
+DEFAULT_NORMAL_FOLLOWUP_PROMPT = "你刚才创建了什么"
+DEFAULT_ROLLBACK_PROMPT = "回退到 intent_parsing，选择一个已有vpc，创建一个安全组"
+DEFAULT_INVALID_SELECTION_PROMPT = "9"  # default of --invalid-selection-prompt
+DEFAULT_EVALUATE_RESUME_CONTINUE_PROMPT = "continue"
+DEFAULT_CLEANUP_CONTINUE_PROMPT = (
+    "只执行上面的回滚清理：仅删除待清理列表中的 stack id，完成后停止，不要删除或检查其他 stack。"
+)
+DEFAULT_PERMISSION_PROMPT_RESPONSE = "pageup-enter"  # translated by _permission_prompt_response_sequence
+
+PIPELINE_STARTED_PATTERNS = (r"Pipeline", r"pipeline", r"intent_parsing", r"意图")
+CANDIDATE_SELECTION_PATTERNS = (  # step heading followed by an (n/m) counter, English or Chinese
+    r"(?i)Confirm and select\s*\(\d+/\d+\)",
+    r"(?i)confirm[ _-]+and[ _-]+select\s*\(\d+/\d+\)",
+    r"确认并选择\s*\(\d+/\d+\)",
+    r"候选选择\s*\(\d+/\d+\)",
+)
+CANDIDATE_EVALUATION_PATTERNS = (r"(?i)Evaluate candidates\s*\(\d+/\d+\)", r"evaluate_candidates")
+ARCHITECTURE_PLANNING_PATTERNS = (r"(?i)Architecture planning\s*\(\d+/\d+\)", r"architecture_planning")
+ASK_PATTERNS = (r"Ask user question", r"请.*输入", r"请.*补充", r"请描述", r"需要.*信息", r"澄清", r"问题")
+PIPELINE_COMPLETED_PATTERNS = (
+    r"(?i)Pipeline completed",
+    r"CREATE_COMPLETE",
+    r"部署成功",
+    r"Stack ID",
+    r"(?i)handoff",  # NOTE(review): README names only terminal evidence for "completed"; confirm handoff/交接 qualify
+    r"交接",
+)
+PIPELINE_FULLY_COMPLETED_PATTERNS = (r"(?i)Pipeline completed\.\s+Normal chat is now active\.",)
+POST_ROLLBACK_PROGRESS_PATTERNS = (
+    r"●\s*Intent parsing\s*\(1/5\)",
+    r"●\s*Architecture planning\s*\(2/5\)",
+    r"Step Intent parsing completed",
+)
+DEPLOYING_STEP_PATTERNS = (r"●\s*Deploying\s*\(5/5\)", r"CreateStack", r"开始部署")
+CREATE_STACK_STARTED_PATTERNS = (r"ROS Stack\(CreateStack", r"CreateStack")  # 2nd already matches all the 1st does
+FIRST_STACK_CREATED_PATTERNS = (r"CREATE_COMPLETE", r"Stack ID", r"StackId", r"stack_id")
+CLEANUP_STARTED_PATTERNS = (
+    r"检测到\s*\d+\s*个回滚残留资源",
+    r"开始清理流程",
+    r"回滚清理\s*\[删除中\]",
+    r"DeleteStack",
+)
+CLEANUP_RESUME_SUMMARY_PATTERNS = (r"回滚清理恢复", r"回滚清理")  # 2nd already matches all the 1st does
+CLEANUP_COMPLETED_PATTERNS = (r"DELETE_COMPLETE", r"回滚清理\s*\[完成\]", r"清理.*完成")
+CLEANUP_DEPLOYMENT_FAILURE_PATTERNS = (
+    r"\bCREATE_FAILED\b",
+    r"RouteConflict",
+    r"StackExists",
+    r"InvalidCidrBlock",
+)
+ROS_STACK_DELETED_STATUSES = {"DELETE_COMPLETE"}
+REPL_PROMPT_PATTERNS = (r"❯",)
+REPL_INPUT_READY_PATTERNS = (r"\x1b\[>4;2m",)  # matches the literal escape sequence ESC [ > 4 ; 2 m
+INTERRUPT_INPUT_PATTERNS = (r"✎", r"interrupt", r"输入", r"Judging")
+CANDIDATE_SELECTION_READY_PATTERNS = (
+    r"Press number keys to select a candidate",
+    r"Enter to confirm",
+    r"按数字键.*候选",
+)
+PERMISSION_PROMPT_PATTERNS = (
+    r"Yes, allow once",
+    r"允许一次",
+)
+TERMINAL_ERROR_PATTERNS = (  # presumably what the README's "no terminal errors in the transcript" check scans for
+    r"Traceback \(most recent call last\)",
+    r"pexpect\.(?:TIMEOUT|EOF)",
+    r"rejected_in_prompt",
+    r"Permission.*reject",
+    r"权限.*拒绝",
+)
+VSWITCH_EVIDENCE_PATTERNS = (
+    r"ALIYUN::ECS::VSwitch",
+    r"VSwitchId",
+    r"vsw-[A-Za-z0-9]+",
+    r"交换机\s*ID",
+)
+VSWITCH_MENTION_PATTERNS = (
+    r"(?i)VSwitch",
+    r"交换机",
+    r"vsw-[A-Za-z0-9]+",
+)
+SECURITY_GROUP_EVIDENCE_PATTERNS = (
+    r"ALIYUN::ECS::SecurityGroup",
+    r"SecurityGroupId",
+    r"sg-[A-Za-z0-9]+",
+    r"安全组\s*ID",
+)
+SECURITY_GROUP_MENTION_PATTERNS = (
+    r"(?i)SecurityGroup",
+    r"安全组",
+    r"sg-[A-Za-z0-9]+",
+)
+POSITIVE_VSWITCH_TARGET_PATTERNS = (
+    r"ALIYUN::ECS::VSwitch",
+    r"VSwitchId",
+    r"vsw-[A-Za-z0-9]+",
+    r"(?:创建|新建|目标资源|资源类型|部署).*?(?:VSwitch|交换机)",
+)
+NEGATED_VSWITCH_TARGET_LINE_PATTERNS = (  # without (?s), "." stops at newlines, so each match stays on one line
+    r"(?i)(?:不|不要|禁止|避免|无需|不再|不能|不得|forbid|forbidden).*?(?:VSwitch|交换机)",
+    r"(?i)(?:VSwitch|交换机).*?(?:forbid|forbidden|不创建|禁止|不要|无需)",
+    r"(?i)(?:no|without).*?(?:VSwitch|switch)",
+    r"(?i)(?:VSwitch|switch).*?(?:no|without)",
+    r"(?i)(?:从|由|将需求从|把需求从).*?(?:创建|新建).*?(?:VSwitch|交换机).*?(?:改为|变更为|切换为|转为).*?(?:SecurityGroup|安全组)",
+    r"(?i)from.*?(?:create|creating).*?(?:VSwitch|switch).*?to.*?(?:SecurityGroup|security group)",
+    r'(?i)"product"\s*:\s*"VSwitch".*?"action"\s*:\s*"forbid"',
+)
+NEGATED_VSWITCH_TARGET_SPAN_PATTERNS = (  # (?s) plus bounded .{0,N} gaps: these may match across line breaks
+    r"(?is)(?:从|由|将需求从|把需求从).{0,80}(?:创建|新建).{0,80}(?:VSwitch|交换机).{0,160}(?:改为|变更为|切换为|转为).{0,80}(?:SecurityGroup|安全组)",
+    r"(?is)from.{0,80}(?:create|creating).{0,80}(?:VSwitch|switch).{0,160}to.{0,80}(?:SecurityGroup|security group)",
+)
+ARCHITECTURE_PLANNING_HEADING_PATTERNS = (r"●\s*Architecture planning\s*\(2/5\)",)
+EVALUATE_CANDIDATES_HEADING_PATTERNS = (r"●\s*Evaluate candidates\s*\(3/5\)",)
+ASK_USER_QUESTION_HEADING_PATTERNS = (r"●\s*Ask user question",)
+
+STACK_CREATING_SCENARIOS = frozenset(  # scenario names; no rollback-* or image-interrupt entries are listed
+    {
+        "scenario1",
+        "ask-waiting",
+        "ask-waiting-resume",
+        "image-initial",
+        "image-ask-waiting-resume",
+        "image-selection-waiting-resume",
+        "image-normal-handoff",
+        "selection-waiting-resume",
+        "selection-invalid-then-valid",
+        "evaluate-resume",
+    }
+)
+
+
+@dataclass
+class ScenarioRunResult:  # Outcome record for a single scenario run.
+    scenario: str
+    run_dir: str
+    passed: bool
+    checks: dict[str, bool]  # check name -> whether it passed
+    elapsed_seconds: float
+    abort_reason: str = ""  # empty by default
+    notes: list[str] = field(default_factory=list)  # fresh list per instance
+
+
+@dataclass(frozen=True)
+class CleanupNetworkTarget:  # Immutable network parameters; field names mirror the --cleanup-* CLI options.
+    vpc_id: str
+    vpc_cidr: str
+    zone_id: str
+    vswitch_cidr: str  # NOTE(review): presumably the first stack's CIDR (cf. --cleanup-vswitch-cidr help); confirm
+    rollback_vswitch_cidr: str  # presumably the post-rollback stack's CIDR (cf. --cleanup-rollback-vswitch-cidr)
+
+def parse_args(argv: list[str] | None = None) -> argparse.Namespace:  # argv=None lets argparse read sys.argv[1:]
+    parser = argparse.ArgumentParser(description="Run interactive REPL pipeline E2E scenarios.")
+    parser.add_argument(
+        "--scenario",
+        action="append",
+        choices=sorted(_SCENARIOS),  # _SCENARIOS is defined elsewhere in this module
+        help="Scenario to run. Can be repeated. Defaults to scenario1.",
+    )
+    parser.add_argument("--allow-real-cloud", action="store_true")
+    parser.add_argument("--cwd", default="", help="Child process cwd. Defaults to <run-dir>/workspace.")
+    parser.add_argument("--run-root", default=str(Path(tempfile.gettempdir()) / RUN_LOG_ROOT_NAME))
+    parser.add_argument("--run-dir", default="", help="Explicit run dir. Only valid with one scenario.")
+    parser.add_argument("--python", default="uv run python")  # tokenized later by _split_python_command
+    parser.add_argument("--provider", default="")
+    parser.add_argument("--model", default="")
+    parser.add_argument("--api-base", default="")
+    parser.add_argument("--timeout", type=float, default=45.0)  # passed to pexpect.spawn in ReplPty.spawn
+    parser.add_argument("--stream-timeout", type=float, default=1800.0)
+    parser.add_argument("--terminal-width", type=int, default=140)
+    parser.add_argument("--terminal-height", type=int, default=40)
+    parser.add_argument("--candidate-selection-ready-timeout", type=float, default=30.0)
+    parser.add_argument("--leave-running", action="store_true")
+    parser.add_argument(
+        "--skip-final-teardown",
+        action="store_true",
+        help="Do not delete test-owned ROS stacks after scenario acceptance checks.",
+    )
+    parser.add_argument("--final-teardown-timeout", type=float, default=900.0)
+    parser.add_argument("--cleanup-vpc-id", default="", help="Existing VPC ID to use for cleanup E2E scenarios.")
+    parser.add_argument("--cleanup-vpc-cidr", default="", help="CIDR of --cleanup-vpc-id, used only in prompts.")
+    parser.add_argument("--cleanup-zone-id", default="", help="Zone ID to use for cleanup E2E scenarios.")
+    parser.add_argument(
+        "--cleanup-vswitch-cidr",
+        default="",
+        help="Free VSwitch CIDR to use for the first stack in cleanup E2E scenarios.",
+    )
+    parser.add_argument(
+        "--cleanup-rollback-vswitch-cidr",
+        default="",
+        help="Different free VSwitch CIDR to use for the post-rollback stack in cleanup E2E scenarios.",
+    )
+    parser.add_argument("--initial-prompt", default=DEFAULT_INITIAL_PROMPT)
+    parser.add_argument("--selection-prompt", default=DEFAULT_SELECTION_PROMPT)
+    parser.add_argument(
+        "--permission-prompt-response",
+        default=DEFAULT_PERMISSION_PROMPT_RESPONSE,
+        help="Permission prompt response: pageup-enter, up-enter, enter, or literal text.",
+    )
+    parser.add_argument("--ask-prompt", default=DEFAULT_ASK_PROMPT)
+    parser.add_argument("--ask-answer", default=DEFAULT_ASK_ANSWER)
+    parser.add_argument("--normal-followup-prompt", default=DEFAULT_NORMAL_FOLLOWUP_PROMPT)
+    parser.add_argument("--rollback-prompt", default=DEFAULT_ROLLBACK_PROMPT)
+    parser.add_argument("--invalid-selection-prompt", default=DEFAULT_INVALID_SELECTION_PROMPT)
+    parser.add_argument("--evaluate-resume-continue-prompt", default=DEFAULT_EVALUATE_RESUME_CONTINUE_PROMPT)
+    parser.add_argument("--cleanup-continue-prompt", default=DEFAULT_CLEANUP_CONTINUE_PROMPT)
+    return parser.parse_args(argv)
+
+
+def _selected_scenarios(args: argparse.Namespace) -> list[str]:
+    return args.scenario if args.scenario else ["scenario1"]  # no --scenario given -> run only scenario1
+
+
+def _validate_scenario_execution(args: argparse.Namespace, scenario: str) -> None:
+    if scenario in _REAL_CLOUD_SCENARIOS and not args.allow_real_cloud:  # opt-in guard; set is defined elsewhere
+        raise SystemExit("refusing to run real REPL pipeline scenario without --allow-real-cloud: " + scenario)
+
+
+def _split_python_command(value: str) -> list[str]:
+    argv = shlex.split(value, posix=(os.name != "nt"))  # POSIX quoting rules everywhere except Windows
+    if argv:
+        return argv
+    raise ValueError("--python must not be empty")  # empty or whitespace-only launcher string
+
+
+def _build_child_env(args: argparse.Namespace) -> dict[str, str]:
+    """Copy this process's environment, force UTF-8 and pipeline mode, then apply CLI overrides."""
+    env = {**os.environ, "PYTHONUTF8": "1", "IAC_CODE_MODE": "pipeline"}
+    overrides = {
+        "IAC_CODE_PROVIDER": args.provider,
+        "IAC_CODE_MODEL": args.model,
+        "IAC_CODE_BASE_URL": args.api_base,
+    }
+    # Empty overrides are skipped, so values already exported in the parent environment survive.
+    env.update({name: value for name, value in overrides.items() if value})
+    return env
+
+
+def _redact_sensitive_text(text: str, env: dict[str, str] | None) -> str:
+    """Return *text* with secret-like values from *env* and common credential patterns masked."""
+    markers = ("KEY", "TOKEN", "SECRET", "PASSWORD", "CREDENTIAL")
+    secrets = {v for k, v in (env or {}).items() if v and len(v) >= 6 and any(m in k.upper() for m in markers)}
+    redacted = text
+    # Longest first: a secret that contains a shorter one is masked whole instead of leaking its tail.
+    for value in sorted(secrets, key=lambda item: (-len(item), item)):
+        redacted = redacted.replace(value, "<redacted>")
+    redacted = re.sub(r"(?i)(api[_ -]?key\s*[:=]\s*)[^\s,'\"}]+", r"\1<redacted>", redacted)
+    redacted = re.sub(r"(?i)(authorization\s*[:=]\s*)[^\s,'\"}]+", r"\1<redacted>", redacted)
+    redacted = re.sub(r"(?<![A-Za-z0-9_-])sk-[A-Za-z0-9_-]{8,}", "sk-<redacted>", redacted)
+    return redacted
+
+
+_ANSI_PATTERN = re.compile(r"\x1b\[[0-?]*[ -/]*[@-~]")  # ESC [ <params> <intermediates> <final byte>
+
+
+def _normalize_transcript(text: str) -> str:
+    """Strip _ANSI_PATTERN matches and backspaces, unify newlines to LF, and right-trim each line."""
+    cleaned = _ANSI_PATTERN.sub("", text).replace("\r\n", "\n").replace("\r", "\n").replace("\b", "")
+    # splitlines() followed by join also drops any final newline.
+    return "\n".join(row.rstrip() for row in cleaned.splitlines())
+
+
+def _compact_text(text: str, *, max_chars: int = 800) -> str:
+    """Collapse every whitespace run to one space and cap the result at *max_chars* characters."""
+    squeezed = " ".join(text.split())
+    # Over-long text keeps its first max_chars - 3 characters and gains a "..." suffix.
+    return squeezed if len(squeezed) <= max_chars else squeezed[: max_chars - 3] + "..."
+
+
+def _permission_prompt_response_sequence(value: str) -> str:
+    """Translate a --permission-prompt-response choice into the key sequence sent to the child."""
+    named_keys = {
+        "pageup-enter": "\x1b[5~\r",  # PageUp, then Enter
+        "up-enter": "\x1b[A\r",  # cursor Up, then Enter
+        "enter": "\r",
+    }
+    return named_keys.get(value, f"{value}\r" if value else "\r")  # other text is typed literally plus Enter
+
+
+def _sendline_to_child(child: Any, text: str, *, capture: Callable[[str], None] | None = None) -> None:
+    """Send *text* plus a newline; text over PTY_SEND_CHUNK_SIZE goes out in paced, drained slices."""
+    if len(text) > PTY_SEND_CHUNK_SIZE:
+        for start in range(0, len(text), PTY_SEND_CHUNK_SIZE):
+            child.send(text[start : start + PTY_SEND_CHUNK_SIZE])
+            _drain_child_output(child, capture=capture)
+            time.sleep(PTY_SEND_CHUNK_DELAY_SECONDS)
+        _drain_child_output(child, capture=capture)
+        text = ""  # payload already written; only the line terminator remains to be sent
+    child.sendline(text)
+
+
+def _drain_child_output(child: Any, *, capture: Callable[[str], None] | None = None) -> None:
+    """Read whatever output *child* has available right now, passing each chunk to *capture*."""
+    read_now = getattr(child, "read_nonblocking", None)
+    if not callable(read_now):
+        return  # object exposes no non-blocking reader; nothing to drain
+    while True:
+        try:
+            chunk = read_now(size=4096, timeout=0)
+        except Exception:
+            # Best effort: pexpect.TIMEOUT and every other read failure alike just end the drain.
+            return
+        if not chunk:
+            return
+        if capture is not None:
+            capture(str(chunk))
+
+
+def _new_run_dir(root: Path) -> Path:
+    stamp = datetime.now(timezone.utc).strftime("%Y%m%dT%H%M%SZ")  # UTC, one-second resolution
+    return root / f"{stamp}-{os.getpid()}-{uuid.uuid4().hex[:8]}"  # <timestamp>-<pid>-<8 hex chars>
+
+
+def _write_json(path: Path, value: Any) -> None:  # indented UTF-8 JSON + newline; non-JSON values go through str()
+    path.parent.mkdir(parents=True, exist_ok=True)  # runs before serialization, so the directory exists even on error
+    path.write_text(json.dumps(value, ensure_ascii=False, indent=2, default=str) + "\n", encoding="utf-8")
+
+
+def _append_jsonl(path: Path, value: Any) -> None:  # append *value* as one compact JSON line
+    path.parent.mkdir(parents=True, exist_ok=True)
+    with path.open("a", encoding="utf-8") as handle:  # append mode: earlier lines are kept
+        handle.write(json.dumps(value, ensure_ascii=False, default=str) + "\n")
+
+
+def _redacted_env_summary(env: dict[str, str]) -> dict[str, str]:  # allow-listed subset of *env*, values redacted
+    keys = ["HOME", "IAC_CODE_CONFIG_DIR", "IAC_CODE_MODE", "IAC_CODE_PROVIDER", "IAC_CODE_MODEL", "IAC_CODE_BASE_URL"]
+    return {key: _redact_sensitive_text(env[key], env) for key in keys if key in env}  # absent keys are omitted
+
+
+def _scenario_run_dir(args: argparse.Namespace, scenario: str) -> Path:
+    if args.run_dir:  # explicit --run-dir wins and is returned unchanged for every scenario name
+        return Path(args.run_dir).expanduser().resolve()
+    return _new_run_dir(Path(args.run_root).expanduser().resolve() / scenario)  # <run-root>/<scenario>/<unique name>
+
+
+class ReplPty:
+    def __init__(self, *, args: argparse.Namespace, run_dir: Path, cwd: Path, env: dict[str, str]) -> None:
+        if os.name == "nt":
+            raise SystemExit("real PTY REPL E2E is POSIX-only")
+        if pexpect is None:  # the optional import at module top failed
+            raise RuntimeError("pexpect is required. Install dependencies with: uv sync --all-extras")
+        self.args = args
+        self.run_dir = run_dir
+        self.cwd = cwd
+        self.env = env
+        self.events: list[dict[str, Any]] = []  # one dict appended per spawn/send/paste call, in call order
+        self.raw_chunks: list[str] = []  # text pieces that the transcript property joins
+        self.child: Any | None = None  # set by spawn()
+        self._live_transcript = False  # flipped to True by spawn()
+
+    @property
+    def transcript(self) -> str:  # all captured text so far; re-joined from raw_chunks on every access
+        return "".join(self.raw_chunks)
+
+    def spawn(self, *, extra_args: list[str] | None = None) -> None:  # start the REPL child via pexpect.spawn
+        command = [
+            *_split_python_command(self.args.python),
+            "-m",
+            "iac_code.cli.main",
+            "--permission-mode",
+            "bypass_permissions",
+            *(extra_args or []),  # caller-supplied CLI flags are appended last
+        ]
+        self.events.append({"type": "spawn", "command": command, "cwd": str(self.cwd), "at": _utc_now()})
+        self.child = pexpect.spawn(
+            command[0],
+            command[1:],
+            cwd=str(self.cwd),
+            env=self.env,
+            encoding="utf-8",
+            codec_errors="replace",  # undecodable bytes are replaced instead of raising
+            timeout=self.args.timeout,
+            dimensions=(self.args.terminal_height, self.args.terminal_width),  # pexpect expects (rows, cols)
+        )
+        self.child.logfile_read = _TranscriptCapture(self)  # _TranscriptCapture is defined elsewhere in this file
+        self._live_transcript = True
+
+    def sendline(self, text: str) -> None:
+        transcript_offset = len(self.transcript)
+        _sendline_to_child(self._require_child(), text, capture=self._capture_child_output_force)
+        self.events.append(
+            {
+                "type": "sendline",
+                "text": _redact_sensitive_text(text, self.env),
+                "transcript_offset": transcript_offset,
+                "at": _utc_now(),
+            }
+        )
+
+    def send(self, text: str, *, label: str = "send") -> None:
+        transcript_offset = len(self.transcript)
+        self._require_child().send(text)
+        self.events.append(
+            {
+                "type": label,
+                "text": _redact_sensitive_text(text, self.env),
+                "transcript_offset": transcript_offset,
+                "at": _utc_now(),
+            }
+        )
+
+    def paste_image_fixture(self, image_key: str) -> Path:
+        path = _text_image_fixture_path(image_key)
+        transcript_offset = len(self.transcript)
+        child = self._require_child()
+        child.send(f"\x1b[200~{path}\x1b[201~")
+        _drain_child_output(child, capture=self._capture_child_output_force)
+        self.events.append(
+            {
+                "type": "paste-image-fixture",
+                "image_key": image_key,
+                "path": _redact_sensitive_text(str(path), self.env),
+                "transcript_offset": transcript_offset,
+                "at": _utc_now(),
+            }
+        )
+        return path
+
+    def expect_any(self, patterns: tuple[str, ...], *, description: str, timeout: float) -> str:
+        child = self._require_child()
+        deadline = time.monotonic() + timeout
+        all_patterns = list(patterns) + list(PERMISSION_PROMPT_PATTERNS)
+        try:
+            while True:
+                remaining = deadline - time.monotonic()
+                if remaining <= 0:
+                    raise TimeoutError(f"timed out waiting for {description}")
+                index = child.expect(all_patterns, timeout=remaining)
+                self._capture_child_output(f"{child.before}{child.after}")
+                if index < len(patterns):
+                    matched = patterns[index]
+                    self.events.append(
+                        {
+                            "type": "expect",
+                            "description": description,
+                            "pattern": matched,
+                            "passed": True,
+                            "at": _utc_now(),
+                        }
+                    )
+                    return matched
+                matched = PERMISSION_PROMPT_PATTERNS[index - len(patterns)]
+                self.events.append(
+                    {
+                        "type": "permission_prompt",
+                        "description": description,
+                        "pattern": matched,
+                        "at": _utc_now(),
+                    }
+                )
+                self.send(
+                    _permission_prompt_response_sequence(self.args.permission_prompt_response),
+                    label="permission-prompt-response",
+                )
+        except Exception as exc:
+            self._capture_child_output(str(getattr(child, "before", "") or ""))
+            tail = _compact_text(_normalize_transcript(self.transcript)[-2000:])
+            self.events.append(
+                {
+                    "type": "expect",
+                    "description": description,
+                    "patterns": list(patterns),
+                    "passed": False,
+                    "error": str(exc),
+                    "tail": _redact_sensitive_text(tail, self.env),
+                    "at": _utc_now(),
+                }
+            )
+            raise
+
+    def expect_optional(self, patterns: tuple[str, ...], *, description: str, timeout: float) -> bool:
+        child = self._require_child()
+        try:
+            index = child.expect(list(patterns), timeout=timeout)
+            matched = patterns[index]
+            self.events.append(
+                {
+                    "type": "expect",
+                    "description": description,
+                    "pattern": matched,
+                    "passed": True,
+                    "optional": True,
+                    "at": _utc_now(),
+                }
+            )
+            return True
+        except Exception as exc:
+            if pexpect is None or not isinstance(exc, pexpect.TIMEOUT):
+                tail = _compact_text(_normalize_transcript(self.transcript)[-2000:])
+                self.events.append(
+                    {
+                        "type": "expect",
+                        "description": description,
+                        "patterns": list(patterns),
+                        "passed": False,
+                        "optional": True,
+                        "error": str(exc),
+                        "tail": _redact_sensitive_text(tail, self.env),
+                        "at": _utc_now(),
+                    }
+                )
+                raise
+            tail = _compact_text(_normalize_transcript(self.transcript)[-2000:])
+            self.events.append(
+                {
+                    "type": "expect",
+                    "description": description,
+                    "patterns": list(patterns),
+                    "passed": False,
+                    "optional": True,
+                    "tail": _redact_sensitive_text(tail, self.env),
+                    "at": _utc_now(),
+                }
+            )
+            return False
+
+    def terminate(self, *, force: bool = False) -> None:
+        child = self.child
+        if child is None:
+            return
+        try:
+            if force:
+                child.kill(signal.SIGKILL)
+            else:
+                child.terminate(force=True)
+        finally:
+            self._capture_child_output(str(getattr(child, "before", "") or ""))
+            self.events.append({"type": "terminate", "force": force, "at": _utc_now()})
+
+    def _capture_child_output(self, text: str) -> None:
+        if text and not self._live_transcript:
+            self.raw_chunks.append(text)
+
+    def _capture_child_output_force(self, text: str) -> None:
+        if text:
+            self.raw_chunks.append(text)
+
+    def _require_child(self) -> Any:
+        if self.child is None:
+            raise RuntimeError("REPL child has not been spawned")
+        return self.child
+
+
+class _TranscriptCapture:
+    """Minimal file-like sink that appends written text to a ``ReplPty``'s ``raw_chunks``."""
+
+    def __init__(self, pty: ReplPty) -> None:
+        self._pty = pty
+
+    def write(self, text: str) -> None:
+        """Record ``text``; empty writes are ignored."""
+        if not text:
+            return
+        self._pty.raw_chunks.append(text)
+
+    def flush(self) -> None:
+        """Do nothing; chunks are stored as soon as they are written."""
+
+
+def _utc_now() -> str:
+    """Return the current UTC time in ISO-8601 form with a ``Z`` suffix instead of ``+00:00``."""
+    stamp = datetime.now(timezone.utc).isoformat()
+    return stamp.replace("+00:00", "Z")
+
+
+def _redact_json_value(value: Any, env: dict[str, str]) -> Any:
+    """Recursively redact sensitive content from a JSON-like value.
+
+    Strings are passed through ``_redact_sensitive_text``. Lists, tuples and
+    dicts are walked recursively. A dict entry whose key contains a
+    credential-style marker (case-insensitive) has its whole value replaced
+    with ``"<redacted>"``. Dict keys are converted to ``str``; any other value
+    is returned unchanged.
+    """
+    if isinstance(value, str):
+        return _redact_sensitive_text(value, env)
+    if isinstance(value, list):
+        return [_redact_json_value(item, env) for item in value]
+    if isinstance(value, tuple):
+        # json.dumps serialises tuples exactly like lists, so their contents
+        # must be redacted too or secrets nested in a tuple reach the artifacts.
+        return tuple(_redact_json_value(item, env) for item in value)
+    if isinstance(value, dict):
+        sensitive_markers = ("KEY", "TOKEN", "SECRET", "PASSWORD", "CREDENTIAL", "AUTHORIZATION")
+        redacted: dict[str, Any] = {}
+        for key, item in value.items():
+            key_text = str(key)
+            upper = key_text.upper()
+            if any(marker in upper for marker in sensitive_markers):
+                redacted[key_text] = "<redacted>"
+            else:
+                redacted[key_text] = _redact_json_value(item, env)
+        return redacted
+    return value
+
+
+def _write_run_artifacts(
+    *,
+    run_dir: Path,
+    env: dict[str, str],
+    raw_transcript: str,
+    events: list[dict[str, Any]],
+    result: ScenarioRunResult,
+) -> None:
+    """Write the redacted artifacts of one scenario run into ``run_dir``.
+
+    Files written: ``transcript.raw.log``, ``transcript.normalized.log``,
+    ``child.env.json``, ``events.jsonl`` (one redacted event per line) and
+    ``summary.json`` (the redacted ``result`` dataclass).
+    """
+    run_dir.mkdir(parents=True, exist_ok=True)
+
+    # Redact before normalising so neither transcript file can contain secrets.
+    safe_raw = _redact_sensitive_text(raw_transcript, env)
+    safe_normalized = _normalize_transcript(safe_raw)
+    for filename, content in (
+        ("transcript.raw.log", safe_raw),
+        ("transcript.normalized.log", safe_normalized),
+    ):
+        (run_dir / filename).write_text(content, encoding="utf-8")
+
+    _write_json(run_dir / "child.env.json", _redacted_env_summary(env))
+
+    events_path = run_dir / "events.jsonl"
+    with events_path.open("w", encoding="utf-8") as sink:
+        for event in events:
+            safe_event = _redact_json_value(event, env)
+            sink.write(json.dumps(safe_event, ensure_ascii=False, default=str) + "\n")
+
+    _write_json(run_dir / "summary.json", _redact_json_value(asdict(result), env))
+
+
+def main(argv: list[str] | None = None) -> int:
+    """Run the selected scenarios and return 0 only if every one of them returned 0.
+
+    All scenarios are validated before the first one runs. ``--run-dir`` is
+    rejected with ``SystemExit`` unless exactly one scenario is selected.
+    """
+    args = parse_args(argv)
+    selected = _selected_scenarios(args)
+    if args.run_dir and len(selected) != 1:
+        raise SystemExit("--run-dir can only be used with a single --scenario")
+
+    for name in selected:
+        _validate_scenario_execution(args, name)
+
+    exit_codes = []
+    for name in selected:
+        exit_codes.append(_SCENARIOS[name](args, name))
+    return 1 if any(code != 0 for code in exit_codes) else 0
+
+
+def _run_with_pty(
+    args: argparse.Namespace,
+    scenario: str,
+    callback: Callable[[ReplPty, dict[str, bool]], None],
+) -> int:
+    """Run one scenario against a freshly spawned REPL and return 0 on pass, 1 on failure.
+
+    The REPL is spawned in ``args.cwd`` (or ``<run_dir>/workspace``), then
+    ``callback`` drives it and fills ``checks``. Acceptance checks and
+    real-cloud teardown follow. Whatever happens, the ``finally`` block
+    retries any acceptance/teardown step that did not run, terminates the
+    child unless ``args.leave_running`` is set, writes the run artifacts and
+    prints the result.
+    """
+    started = time.monotonic()
+    run_dir = _scenario_run_dir(args, scenario)
+    workspace_dir = Path(args.cwd).expanduser().resolve() if args.cwd else run_dir / "workspace"
+    workspace_dir.mkdir(parents=True, exist_ok=True)
+    env = _build_child_env(args)
+    pty = ReplPty(args=args, run_dir=run_dir, cwd=workspace_dir, env=env)
+    checks: dict[str, bool] = {}
+    notes: list[str] = []
+    abort_reason = ""
+    passed = False
+    # Track which post-run steps completed so the finally block runs each at most once more.
+    acceptance_applied = False
+    teardown_applied = False
+
+    try:
+        pty.spawn()
+        callback(pty, checks)
+        _apply_acceptance_checks(scenario, args, pty, checks)
+        acceptance_applied = True
+        _teardown_real_cloud_scenario_resources(args=args, scenario=scenario, pty=pty, checks=checks, notes=notes)
+        teardown_applied = True
+        # With no recorded checks, the run passes as long as nothing raised.
+        passed = all(checks.values()) if checks else True
+    except BaseException as exc:
+        # NOTE(review): BaseException also covers KeyboardInterrupt/SystemExit, which are recorded
+        # here and not re-raised — confirm this is intended so teardown always runs.
+        abort_reason = f"{type(exc).__name__}: {exc}"
+        notes.append(abort_reason)
+        passed = False
+    finally:
+        if not acceptance_applied:
+            try:
+                _apply_acceptance_checks(scenario, args, pty, checks)
+                acceptance_applied = True
+            except BaseException as exc:
+                notes.append(f"acceptance check failed: {type(exc).__name__}: {exc}")
+        # Teardown is only retried once acceptance checks have been applied.
+        if acceptance_applied and not teardown_applied:
+            try:
+                _teardown_real_cloud_scenario_resources(
+                    args=args,
+                    scenario=scenario,
+                    pty=pty,
+                    checks=checks,
+                    notes=notes,
+                )
+                teardown_applied = True
+                if passed:
+                    passed = all(checks.values()) if checks else True
+            except BaseException as exc:
+                notes.append(f"final teardown failed: {type(exc).__name__}: {exc}")
+                if passed:
+                    passed = False
+        if not args.leave_running:
+            try:
+                pty.terminate()
+            except BaseException as exc:
+                notes.append(f"terminal child termination failed: {type(exc).__name__}: {exc}")
+                if passed:
+                    passed = False
+        result = ScenarioRunResult(
+            scenario=scenario,
+            run_dir=str(run_dir),
+            passed=passed,
+            checks=checks,
+            elapsed_seconds=round(time.monotonic() - started, 3),
+            abort_reason=abort_reason,
+            notes=notes,
+        )
+        _write_run_artifacts(run_dir=run_dir, env=env, raw_transcript=pty.transcript, events=pty.events, result=result)
+        _print_result(result)
+
+    return 0 if passed else 1
+
+
+def _print_result(result: ScenarioRunResult) -> None:
+    """Print a human-readable summary of one scenario run to stdout.
+
+    The abort reason and each note are compacted to at most 1000 characters.
+    """
+    print(f"\nREPL pipeline scenario: {result.scenario}")
+    print(f"run_dir: {result.run_dir}")
+
+    if result.abort_reason:
+        reason = _compact_text(result.abort_reason, max_chars=1000)
+        print(f"abort_reason: {reason}")
+
+    if result.notes:
+        print("\nnotes:")
+        for note in result.notes:
+            shortened = _compact_text(note, max_chars=1000)
+            print(f"  - {shortened}")
+
+    print("\nchecks:")
+    for name, ok in result.checks.items():
+        label = "OK" if ok else "FAIL"
+        print(f"  {label} {name}")
+
+    verdict = "PASS" if result.passed else "FAIL"
+    print(f"\nRESULT: {verdict}")
+
+
+def _has_any_pattern(text: str, patterns: tuple[str, ...]) -> bool:
+    """Return True if at least one regex in ``patterns`` matches somewhere in ``text``."""
+    for pattern in patterns:
+        if re.search(pattern, text):
+            return True
+    return False
+
+
+def _count_pattern(text: str, patterns: tuple[str, ...]) -> int:
+    """Return the total number of non-overlapping matches in ``text`` summed over ``patterns``."""
+    total = 0
+    for pattern in patterns:
+        total += len(re.findall(pattern, text))
+    return total
+
+
+def _resume_spawns(events: list[dict[str, Any]]) -> list[dict[str, Any]]:
+    """Return the ``spawn`` events whose command line contains ``--continue``."""
+    resumed: list[dict[str, Any]] = []
+    for event in events:
+        if event.get("type") != "spawn":
+            continue
+        argv = [str(item) for item in event.get("command", [])]
+        if "--continue" in argv:
+            resumed.append(event)
+    return resumed
+
+
+def _event_index(events: list[dict[str, Any]], event_type: str) -> int | None:
+    """Return the index of the first event whose ``type`` equals ``event_type``, or None."""
+    positions = (position for position, event in enumerate(events) if event.get("type") == event_type)
+    return next(positions, None)
+
+
+def _event_before(events: list[dict[str, Any]], before_type: str, after_type: str) -> bool:
+    """Return True when the first ``before_type`` event precedes the first ``after_type`` event.
+
+    Both event types must be present; otherwise the result is False.
+    """
+    first_position = _event_index(events, before_type)
+    if first_position is None:
+        return False
+    second_position = _event_index(events, after_type)
+    return second_position is not None and first_position < second_position
+
+
+def _has_sendline_event(events: list[dict[str, Any]], text: str) -> bool:
+    """Return True if a ``sendline`` event with exactly this recorded ``text`` exists."""
+    for event in events:
+        if event.get("type") == "sendline" and event.get("text") == text:
+            return True
+    return False
+
+
+def _has_image_fixture_event(events: list[dict[str, Any]], image_key: str) -> bool:
+    """Return True if a ``paste-image-fixture`` event was recorded for ``image_key``."""
+    for event in events:
+        if event.get("type") == "paste-image-fixture" and event.get("image_key") == image_key:
+            return True
+    return False
+
+
+def _has_vswitch_business_evidence(transcript: str) -> bool:
+    """Return True when ``transcript`` shows evidence of a VSwitch deployment.
+
+    Either one of ``VSWITCH_EVIDENCE_PATTERNS`` matches, or the transcript
+    contains both a VSwitch mention and a deployment-result marker.
+    """
+    if _has_any_pattern(transcript, VSWITCH_EVIDENCE_PATTERNS):
+        return True
+    if re.search(r"(?i)VSwitch|交换机", transcript) is None:
+        return False
+    return re.search(r"Stack ID|Stack 名称|CREATE_COMPLETE|部署成功", transcript) is not None
+
+
+def _has_vswitch_answer_evidence(text: str) -> bool:
+    """Return True if ``text`` matches any of ``VSWITCH_MENTION_PATTERNS``."""
+    mentioned = _has_any_pattern(text, VSWITCH_MENTION_PATTERNS)
+    return mentioned
+
+
+def _has_security_group_target_evidence(text: str) -> bool:
+    """Return True if ``text`` matches any security-group evidence or mention pattern."""
+    combined_patterns = SECURITY_GROUP_EVIDENCE_PATTERNS + SECURITY_GROUP_MENTION_PATTERNS
+    return _has_any_pattern(text, combined_patterns)
+
+
+def _has_positive_vswitch_target_evidence(text: str) -> bool:
+    """Return True if ``text`` still targets a VSwitch once negated mentions are removed.
+
+    Spans matching ``NEGATED_VSWITCH_TARGET_SPAN_PATTERNS`` are deleted first,
+    then whole lines matching ``NEGATED_VSWITCH_TARGET_LINE_PATTERNS`` are
+    dropped; the remainder is tested against ``POSITIVE_VSWITCH_TARGET_PATTERNS``.
+    """
+    stripped = text
+    for span_pattern in NEGATED_VSWITCH_TARGET_SPAN_PATTERNS:
+        stripped = re.sub(span_pattern, "", stripped)
+
+    kept_lines: list[str] = []
+    for line in stripped.splitlines():
+        if _has_any_pattern(line, NEGATED_VSWITCH_TARGET_LINE_PATTERNS):
+            continue
+        kept_lines.append(line)
+
+    return _has_any_pattern("\n".join(kept_lines), POSITIVE_VSWITCH_TARGET_PATTERNS)
+
+
+def _last_event_suffix(
+    transcript: str,
+    events: list[dict[str, Any]],
+    *,
+    event_type: str,
+    text: str | None = None,
+) -> str:
+    """Return the part of ``transcript`` that follows the last matching event.
+
+    An event matches when its ``type`` equals ``event_type`` and, if ``text``
+    is given, its ``text`` equals it. Events without a non-negative integer
+    ``transcript_offset`` are ignored. Returns ``""`` when nothing matches.
+    """
+    # Scanning backwards makes the first usable hit the last one in recording order.
+    for event in reversed(events):
+        if event.get("type") != event_type:
+            continue
+        if text is not None and event.get("text") != text:
+            continue
+        start = event.get("transcript_offset")
+        if isinstance(start, int) and start >= 0:
+            return transcript[start:]
+    return ""
+
+
+def _suffix_after_sendline_text(
+    transcript: str,
+    events: list[dict[str, Any]],
+    text: str,
+) -> str:
+    """Return the normalized transcript that follows the last ``sendline`` of ``text``.
+
+    If the normalized input text appears in that suffix, only what comes
+    after its first occurrence is returned.
+    """
+    raw_suffix = _last_event_suffix(transcript, events, event_type="sendline", text=text)
+    suffix = _normalize_transcript(raw_suffix)
+    needle = _normalize_transcript(text)
+    if not needle:
+        return suffix
+    _, found, remainder = suffix.partition(needle)
+    return remainder if found else suffix
+
+
+def _suffix_after_image_fixture(
+    transcript: str,
+    events: list[dict[str, Any]],
+    image_key: str,
+) -> str:
+    """Return the normalized transcript following the last paste of fixture ``image_key``.
+
+    Events without a non-negative integer ``transcript_offset`` are ignored;
+    ``""`` is returned when no usable event exists.
+    """
+    for event in reversed(events):
+        if event.get("type") != "paste-image-fixture":
+            continue
+        if event.get("image_key") != image_key:
+            continue
+        start = event.get("transcript_offset")
+        if isinstance(start, int) and start >= 0:
+            return _normalize_transcript(transcript[start:])
+    return ""
+
+
+def _add_acceptance_check(checks: dict[str, bool], name: str, passed: bool) -> None:
+    """Store ``passed`` (coerced to bool) in ``checks`` under the key ``"acceptance: <name>"``."""
+    key = f"acceptance: {name}"
+    checks[key] = True if passed else False
+
+
+def _cleanup_stack_name(run_dir: Path, label: str) -> str:
+    """Build the stack name ``iac-e2e-<run suffix>-<label slug>``, capped at 128 characters.
+
+    The run suffix is the text after the last ``-`` in the run directory name
+    (at most 12 characters); the slug is the lower-cased label with every
+    non-alphanumeric character replaced by ``-``. Empty parts fall back to ``stack``.
+    """
+    run_suffix = Path(run_dir).name.rpartition("-")[2] or "stack"
+    slug_chars = [ch if ch.isalnum() else "-" for ch in label.lower()]
+    slug = "".join(slug_chars).strip("-") or "stack"
+    full_name = f"iac-e2e-{run_suffix[:12]}-{slug}"
+    return full_name[:128]
+
+
+def _scenario_stack_name(run_dir: Path, scenario: str) -> str:
+    """Build the stack name ``iac-e2e-<run suffix>-<scenario slug>``, capped at 128 characters.
+
+    The run suffix is the text after the last ``-`` in the run directory name
+    (at most 12 characters, fallback ``stack``); the slug is the lower-cased
+    scenario with non-alphanumeric characters replaced by ``-`` (fallback ``scenario``).
+    """
+    run_suffix = Path(run_dir).name.rpartition("-")[2] or "stack"
+    slug_chars = [ch if ch.isalnum() else "-" for ch in scenario.lower()]
+    slug = "".join(slug_chars).strip("-") or "scenario"
+    full_name = f"iac-e2e-{run_suffix[:12]}-{slug}"
+    return full_name[:128]
+
+
+def _stack_name_constraint(run_dir: Path, scenario: str) -> str:
+    """Return the prompt sentence that pins CreateStack's StackName to this scenario's stack name."""
+    required_name = _scenario_stack_name(run_dir, scenario)
+    constraint = f"本次 CreateStack 的 params.StackName 必须精确等于 `{required_name}`，禁止使用默认或自动生成 StackName。"
+    return constraint
+
+
+def _stack_creating_prompt(text: str, run_dir: Path, scenario: str) -> str:
+    """Return ``text`` followed by a full stop and the stack-name constraint for ``scenario``."""
+    constraint = _stack_name_constraint(run_dir, scenario)
+    return f"{text}。{constraint}"
+
+
+def _text_image_fixture_path(image_key: str) -> Path:
+    """Return the resolved path of the text-image fixture registered under ``image_key``.
+
+    Raises:
+        KeyError: when ``image_key`` has no registered filename.
+        FileNotFoundError: when the resolved path is not an existing file.
+    """
+    filename = TEXT_IMAGE_FIXTURE_FILENAMES.get(image_key)
+    if not filename:
+        raise KeyError(f"unknown text image fixture: {image_key}")
+    fixture = (TEXT_IMAGE_FIXTURE_ROOT / filename).resolve()
+    if fixture.is_file():
+        return fixture
+    raise FileNotFoundError(f"text image fixture not found: {fixture}")
+
+
+def _submit_image_fixture(pty: ReplPty, image_key: str, *, caption: str = "") -> None:
+    """Paste the fixture for ``image_key`` and submit it.
+
+    With a ``caption`` the caption is sent as a line; without one a bare
+    carriage return is sent, recorded under the ``submit-image`` label.
+    """
+    pty.paste_image_fixture(image_key)
+    if not caption:
+        pty.send("\r", label="submit-image")
+        return
+    pty.sendline(caption)
+
+
+def _cleanup_network_target_from_args(args: argparse.Namespace) -> CleanupNetworkTarget | None:
+    """Build a ``CleanupNetworkTarget`` from the ``cleanup_*`` arguments, or return None.
+
+    The VPC id, zone id, VSwitch CIDR and rollback VSwitch CIDR must all be
+    set; the VPC CIDR is passed through as given.
+    """
+    if (
+        not args.cleanup_vpc_id
+        or not args.cleanup_zone_id
+        or not args.cleanup_vswitch_cidr
+        or not args.cleanup_rollback_vswitch_cidr
+    ):
+        return None
+    target = CleanupNetworkTarget(
+        vpc_id=args.cleanup_vpc_id,
+        vpc_cidr=args.cleanup_vpc_cidr,
+        zone_id=args.cleanup_zone_id,
+        vswitch_cidr=args.cleanup_vswitch_cidr,
+        rollback_vswitch_cidr=args.cleanup_rollback_vswitch_cidr,
+    )
+    return target
+
+
+def _cleanup_network_prompt_fragment(args: argparse.Namespace, *, rollback: bool) -> str:
+    """Return the prompt text that constrains which network the cleanup scenario may use.
+
+    Without a fully specified target in ``args`` a generic instruction is
+    returned. Otherwise the text pins the VPC and zone, and either describes
+    the first VSwitch deployment or, when ``rollback`` is true, the
+    security-group-only redeployment.
+    """
+    target = _cleanup_network_target_from_args(args)
+    if target is None:
+        return (
+            "必须先读取所选 VPC 的 CIDR，并选择属于该 VPC CIDR 的未占用 VSwitch CIDR；"
+            "第一次和回退后的第二次部署必须使用两个不同的合法未占用 VSwitch CIDR。"
+        )
+
+    # The VPC CIDR is optional; it is mentioned only when known.
+    if target.vpc_cidr:
+        cidr_note = f"（CIDR `{target.vpc_cidr}`）"
+    else:
+        cidr_note = ""
+
+    if not rollback:
+        return (
+            f"固定使用已有 VPC `{target.vpc_id}`{cidr_note}、可用区 `{target.zone_id}`、"
+            f"首个 VSwitch CIDR `{target.vswitch_cidr}`；首次 CreateStack 模板参数必须显式设置 "
+            f"VpcId=`{target.vpc_id}`、ZoneId=`{target.zone_id}`、CidrBlock=`{target.vswitch_cidr}`。"
+            "禁止使用模板默认 CidrBlock。"
+        )
+
+    return (
+        f"固定使用已有 VPC `{target.vpc_id}`{cidr_note}、可用区 `{target.zone_id}`；"
+        f"本次重新部署只创建安全组，CreateStack 模板参数必须显式设置 VpcId=`{target.vpc_id}`。"
+        "禁止创建 VSwitch，禁止在第二个栈中使用 CidrBlock 或模板默认 CidrBlock。"
+    )
+
+
+def _cleanup_pipeline_prompt(args: argparse.Namespace, run_dir: Path) -> str:
+    """Return the initial cleanup-scenario prompt with the first stack name and network constraints."""
+    first_stack_name = _cleanup_stack_name(run_dir, "first")
+    network_fragment = _cleanup_network_prompt_fragment(args, rollback=False)
+    pieces = [
+        f"{args.initial_prompt}。第一次 CreateStack 的 params.StackName 必须精确等于 `{first_stack_name}`，",
+        "禁止使用模板名、候选方案名或 vswitch-in-existing-vpc，也不能复用已有资源栈。",
+        f"{network_fragment}",
+    ]
+    return "".join(pieces)
+
+
+def _cleanup_rollback_prompt(args: argparse.Namespace, run_dir: Path) -> str:
+    """Return the rollback prompt with the second stack name and security-group-only constraints."""
+    second_stack_name = _cleanup_stack_name(run_dir, "second")
+    network_fragment = _cleanup_network_prompt_fragment(args, rollback=True)
+    pieces = [
+        f"{args.rollback_prompt}。重新部署时 CreateStack 的 params.StackName 必须精确等于 `{second_stack_name}`，",
+        "禁止使用模板名、候选方案名或 vswitch-in-existing-vpc，也不能复用已有资源栈。",
+        "本次回退后的新方案只创建安全组，不创建 VSwitch。",
+        f"{network_fragment}",
+    ]
+    return "".join(pieces)
+
+
+async def _call_aliyun_api_async(product: str, action: str, params: dict[str, Any]) -> dict[str, Any]:
+    """Invoke one Aliyun API action through the project's ``AliyunApi`` tool.
+
+    Returns the decoded JSON body when it is a dict, otherwise ``{}``.
+
+    Raises:
+        RuntimeError: when the tool reports an error; the message is the
+            tool output compacted to 1000 characters.
+    """
+    # Imported lazily so the module can be loaded without these project packages.
+    from iac_code.tools.base import ToolContext
+    from iac_code.tools.cloud.aliyun.aliyun_api import AliyunApi
+
+    request = {"product": product, "action": action, "params": params}
+    result = await AliyunApi().execute(tool_input=request, context=ToolContext())
+    if result.is_error:
+        raise RuntimeError(_compact_text(result.content, max_chars=1000))
+    payload = json.loads(result.content)
+    if isinstance(payload, dict):
+        return payload
+    return {}
+
+
+def _call_aliyun_api(product: str, action: str, params: dict[str, Any]) -> dict[str, Any]:
+    """Synchronous wrapper that runs ``_call_aliyun_api_async`` with ``asyncio.run``."""
+    pending_call = _call_aliyun_api_async(product, action, params)
+    return asyncio.run(pending_call)
+
+
+def _nested_api_items(data: dict[str, Any], outer_key: str, inner_key: str) -> list[dict[str, Any]]:
+    """Extract the list of dict items stored under ``data[outer_key]``.
+
+    When the outer value is a dict, the list is read from ``inner_key`` or its
+    lower-cased form; otherwise the outer value itself is used. Non-dict
+    entries are dropped, and anything that is not a list yields ``[]``.
+    """
+    outer = data.get(outer_key)
+    if isinstance(outer, dict):
+        candidates = outer.get(inner_key) or outer.get(inner_key.lower()) or []
+    else:
+        candidates = outer or []
+    if not isinstance(candidates, list):
+        return []
+    return [entry for entry in candidates if isinstance(entry, dict)]
+
+
+def _find_available_vswitch_cidrs(vpc_cidr: str, used_cidrs: Iterable[str], *, count: int) -> list[str]:
+    """Pick up to ``count`` unused IPv4 VSwitch CIDRs inside ``vpc_cidr``.
+
+    Candidates are /24 blocks (or the whole VPC when it is /24 or smaller),
+    tried from the highest address downwards. A candidate is skipped when it
+    overlaps any parseable IPv4 entry of ``used_cidrs``; unparseable and
+    non-IPv4 entries are ignored.
+
+    Returns:
+        The chosen CIDRs, highest first. Fewer than ``count`` entries (possibly
+        none) are returned when not enough free blocks exist. ``[]`` is
+        returned when ``count`` is not positive or ``vpc_cidr`` is not a
+        valid IPv4 network.
+    """
+    if count <= 0:
+        return []
+    try:
+        vpc_network = ipaddress.ip_network(vpc_cidr, strict=False)
+    except ValueError:
+        return []
+    if not isinstance(vpc_network, ipaddress.IPv4Network):
+        return []
+
+    used_networks: list[ipaddress.IPv4Network] = []
+    for cidr in used_cidrs:
+        try:
+            network = ipaddress.ip_network(cidr, strict=False)
+        except ValueError:
+            continue
+        if isinstance(network, ipaddress.IPv4Network):
+            used_networks.append(network)
+
+    prefixlen = max(24, vpc_network.prefixlen)
+    if prefixlen == vpc_network.prefixlen:
+        # The VPC is too small to split: it is the only possible candidate.
+        if any(vpc_network.overlaps(used) for used in used_networks):
+            return []
+        return [str(vpc_network)]
+
+    # Walk the candidate blocks from the top of the VPC range downwards without
+    # materialising every subnet (a /8 VPC contains 65536 /24 blocks).
+    block_size = 1 << (32 - prefixlen)
+    base_address = int(vpc_network.network_address)
+    last_index = (1 << (prefixlen - vpc_network.prefixlen)) - 1
+    available: list[str] = []
+    for index in range(last_index, -1, -1):
+        subnet = ipaddress.IPv4Network((base_address + index * block_size, prefixlen))
+        if any(subnet.overlaps(used) for used in used_networks):
+            continue
+        available.append(str(subnet))
+        if len(available) >= count:
+            break
+    return available
+
+
+def _find_available_vswitch_cidr(vpc_cidr: str, used_cidrs: Iterable[str]) -> str | None:
+    """Return one unused VSwitch CIDR inside ``vpc_cidr``, or None when none is free."""
+    for cidr in _find_available_vswitch_cidrs(vpc_cidr, used_cidrs, count=1):
+        return cidr
+    return None
+
+
+def _discover_cleanup_network_target() -> CleanupNetworkTarget:
+    """Find an existing VPC that can host the cleanup scenario's two VSwitch CIDRs.
+
+    The first ``Available`` VPC that already has a VSwitch with a zone id and
+    offers at least two free VSwitch CIDRs is used; its first listed zone
+    becomes the target zone.
+
+    Raises:
+        RuntimeError: when no listed VPC qualifies.
+    """
+    vpc_listing = _call_aliyun_api("vpc", "DescribeVpcs", {"PageSize": 50})
+    for vpc in _nested_api_items(vpc_listing, "Vpcs", "Vpc"):
+        vpc_id = str(vpc.get("VpcId") or "")
+        vpc_cidr = str(vpc.get("CidrBlock") or "")
+        if not (vpc_id and vpc_cidr and str(vpc.get("Status") or "") == "Available"):
+            continue
+
+        vswitch_listing = _call_aliyun_api("vpc", "DescribeVSwitches", {"VpcId": vpc_id, "PageSize": 50})
+        zone_ids: list[str] = []
+        used_cidrs: list[str] = []
+        for vswitch in _nested_api_items(vswitch_listing, "VSwitches", "VSwitch"):
+            zone = str(vswitch.get("ZoneId") or "")
+            if zone:
+                zone_ids.append(zone)
+            cidr = str(vswitch.get("CidrBlock") or "")
+            if cidr:
+                used_cidrs.append(cidr)
+
+        free_cidrs = _find_available_vswitch_cidrs(vpc_cidr, used_cidrs, count=2)
+        if not zone_ids or len(free_cidrs) < 2:
+            continue
+        return CleanupNetworkTarget(
+            vpc_id=vpc_id,
+            vpc_cidr=vpc_cidr,
+            zone_id=zone_ids[0],
+            vswitch_cidr=free_cidrs[0],
+            rollback_vswitch_cidr=free_cidrs[1],
+        )
+
+    raise RuntimeError("No available existing VPC with a free VSwitch CIDR was found for cleanup E2E.")
+
+
+def _ensure_cleanup_network_target(args: argparse.Namespace, run_dir: Path) -> CleanupNetworkTarget:
+    """Return the cleanup network target, discovering one when ``args`` does not define it.
+
+    A discovered target is written back onto the ``cleanup_*`` attributes of
+    ``args``. In both cases the target is saved to
+    ``<run_dir>/cleanup-network-target.json``.
+    """
+    target = _cleanup_network_target_from_args(args)
+    if target is None:
+        target = _discover_cleanup_network_target()
+        for field_name in ("vpc_id", "vpc_cidr", "zone_id", "vswitch_cidr", "rollback_vswitch_cidr"):
+            setattr(args, f"cleanup_{field_name}", getattr(target, field_name))
+    target_file = Path(run_dir) / "cleanup-network-target.json"
+    _write_json(target_file, asdict(target))
+    return target
+
+
+def _session_id_from_transcript(transcript: str) -> str | None:
+    """Extract a session id (hex digits and dashes, at least 8 characters) from ``transcript``.
+
+    The patterns are tried in order — ``Session:``, ``session_id`` and
+    ``session`` — and the first one that matches wins. Returns None when
+    none of them matches.
+    """
+    patterns = (
+        r"\bSession:\s*([0-9a-fA-F][0-9a-fA-F-]{7,})",
+        r"\bsession_id[\"'\s:=]+([0-9a-fA-F][0-9a-fA-F-]{7,})",
+        r"\bsession[\"'\s:=]+([0-9a-fA-F][0-9a-fA-F-]{7,})",
+    )
+    attempts = (re.search(pattern, transcript) for pattern in patterns)
+    return next((hit.group(1) for hit in attempts if hit), None)
+
+
+def _cleanup_ledger_path(pty: Any) -> Path | None:
+    """Locate the ``cleanup.yaml`` ledger that belongs to ``pty``'s session.
+
+    Resolution order:
+      1. ``pty.cleanup_ledger_path`` when set.
+      2. ``<session dir>/pipeline/cleanup.yaml`` for the session id taken from
+         ``pty.session_id`` or parsed from ``pty.transcript``.
+      3. The most recently modified ``*/pipeline/cleanup.yaml`` under the
+         project directory of ``pty.cwd``.
+
+    Returns None when ``pty`` has no ``cwd``, when nothing is found, or when
+    the session-storage lookup raises.
+    """
+    override = getattr(pty, "cleanup_ledger_path", None)
+    if override:
+        return Path(override)
+
+    cwd = str(getattr(pty, "cwd", "") or "")
+    if not cwd:
+        return None
+
+    session_id = str(getattr(pty, "session_id", "") or "")
+    if not session_id:
+        session_id = _session_id_from_transcript(str(getattr(pty, "transcript", "") or ""))
+
+    try:
+        from iac_code.services.session_storage import SessionStorage
+
+        storage = SessionStorage()
+        if session_id:
+            return Path(storage.session_dir(cwd, session_id)) / "pipeline" / "cleanup.yaml"
+
+        project_dir_for = getattr(storage, "_project_dir_for", None)
+        if not callable(project_dir_for):
+            return None
+        ledgers = Path(project_dir_for(cwd)).glob("*/pipeline/cleanup.yaml")
+        # max() keeps the first of equally new files, like a stable descending sort would.
+        return max(
+            ledgers,
+            key=lambda path: path.stat().st_mtime if path.exists() else 0,
+            default=None,
+        )
+    except Exception:
+        return None
+
+
+def _cleanup_ledger_data(pty: Any) -> dict[str, Any]:
+    """Return the cleanup ledger for ``pty`` as a dict.
+
+    An inline ``pty.cleanup_ledger`` dict takes precedence. Otherwise the
+    ledger file is parsed with ``yaml.safe_load``. ``{}`` is returned when the
+    file or the yaml module is missing, when reading or parsing fails, or
+    when the document is not a mapping.
+    """
+    inline = getattr(pty, "cleanup_ledger", None)
+    if isinstance(inline, dict):
+        return inline
+
+    ledger_path = _cleanup_ledger_path(pty)
+    if ledger_path is None or yaml is None or not ledger_path.exists():
+        return {}
+    try:
+        parsed = yaml.safe_load(ledger_path.read_text(encoding="utf-8"))
+    except Exception:
+        # Best effort: read errors, decode errors and YAML errors all mean "no ledger yet".
+        return {}
+    if isinstance(parsed, dict):
+        return parsed
+    return {}
+
+
+def _cleanup_ledger_items(pty: Any, key: str) -> list[dict[str, Any]]:
+    """Return the dict entries of the ledger list stored under ``key`` (``[]`` if it is not a list)."""
+    entries = _cleanup_ledger_data(pty).get(key)
+    if not isinstance(entries, list):
+        return []
+    return [entry for entry in entries if isinstance(entry, dict)]
+
+
+def _is_ros_stack_resource(resource: dict[str, Any]) -> bool:
+    """Return True when ``resource`` has provider ``ros`` and resource type ``stack`` (case-insensitive)."""
+    provider = str(resource.get("provider") or "")
+    if provider.lower() != "ros":
+        return False
+    kind = str(resource.get("resource_type") or resource.get("resourceType") or "")
+    return kind.lower() == "stack"
+
+
+def _string_from_mapping(mapping: Any, *keys: str) -> str | None:
+    """Return the first non-empty string found in ``mapping`` under ``keys``, tried in order.
+
+    Returns None when ``mapping`` is not a dict or no key holds a non-empty string.
+    """
+    if not isinstance(mapping, dict):
+        return None
+    looked_up = (mapping.get(key) for key in keys)
+    return next((value for value in looked_up if isinstance(value, str) and value), None)
+
+
+def _unique_strings(values: Iterable[str | None]) -> list[str]:
+    """Return the non-empty strings of ``values`` without duplicates, in first-seen order."""
+    kept = (value for value in values if isinstance(value, str) and value)
+    # dict keys are unique and keep insertion order, which gives an ordered de-duplication.
+    return list(dict.fromkeys(kept))
+
+
+def _latest_observed_stack_id(pty: Any, *, exclude: set[str]) -> str | None:
+    """Return the id of the most recently observed ROS stack creation not in ``exclude``.
+
+    Observed resources are scanned newest first. Entries with an action
+    other than ``CreateStack`` are skipped; entries without an action are accepted.
+    """
+    for resource in reversed(_cleanup_ledger_items(pty, "observed_resources")):
+        if not _is_ros_stack_resource(resource):
+            continue
+        action = str(resource.get("observed_action") or resource.get("observedAction") or resource.get("action") or "")
+        if action not in ("", "CreateStack"):
+            continue
+        candidate = _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+        if candidate and candidate not in exclude:
+            return candidate
+    return None
+
+
+def _is_create_stack_observation(resource: dict[str, Any]) -> bool:
+    """Return True when the observed action is ``CreateStack`` or no action is recorded."""
+    recorded = resource.get("observed_action") or resource.get("observedAction") or resource.get("action") or ""
+    return str(recorded) in ("", "CreateStack")
+
+
+def _observed_create_stack_resources(pty: Any) -> list[dict[str, Any]]:
+    """Return the observed ROS stack creations, keeping the first entry for each stack id."""
+    first_by_id: dict[str, dict[str, Any]] = {}
+    for resource in _cleanup_ledger_items(pty, "observed_resources"):
+        if not (_is_ros_stack_resource(resource) and _is_create_stack_observation(resource)):
+            continue
+        stack_id = _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+        if stack_id and stack_id not in first_by_id:
+            first_by_id[stack_id] = resource
+    # dict insertion order matches the order in which ids were first seen.
+    return list(first_by_id.values())
+
+
+def _observed_create_stack_ids(pty: Any) -> list[str]:
+    """Return the distinct stack ids of the observed ROS stack creations, in ledger order."""
+    stack_ids = [
+        _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+        for resource in _observed_create_stack_resources(pty)
+    ]
+    return _unique_strings(stack_ids)
+
+
+def _observed_create_stack_names(pty: Any) -> list[str]:
+    """Return the distinct stack names of the observed ROS stack creations, in ledger order."""
+    stack_names = [
+        _string_from_mapping(resource, "resource_name", "resourceName", "stack_name", "stackName")
+        for resource in _observed_create_stack_resources(pty)
+    ]
+    return _unique_strings(stack_names)
+
+
+def _wait_for_latest_observed_stack_id(pty: Any, *, exclude: set[str], timeout: float) -> str:
+    """Poll the cleanup ledger every 0.5 s until an observed stack id outside ``exclude`` appears.
+
+    Raises:
+        TimeoutError: when ``timeout`` seconds pass without such a stack id.
+    """
+    give_up_at = time.monotonic() + timeout
+    while True:
+        if time.monotonic() >= give_up_at:
+            raise TimeoutError("Timed out waiting for rollback cleanup ledger to observe a ROS stack")
+        found = _latest_observed_stack_id(pty, exclude=exclude)
+        if found:
+            return found
+        time.sleep(0.5)
+
+
+def _cleanup_target_stack_ids(pty: Any, *, exclude: set[str]) -> list[str]:
+    """Return the distinct ROS stack ids the ledger marks for cleanup, skipping ``exclude``.
+
+    Entries that explicitly set ``cleanup_required``/``cleanupRequired`` to
+    ``False`` are left out.
+    """
+    collected: list[str] = []
+    for resource in _cleanup_ledger_items(pty, "cleanup_resources"):
+        if not _is_ros_stack_resource(resource):
+            continue
+        opted_out = resource.get("cleanup_required") is False or resource.get("cleanupRequired") is False
+        if opted_out:
+            continue
+        stack_id = _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+        if not stack_id or stack_id in exclude:
+            continue
+        collected.append(stack_id)
+    return _unique_strings(collected)
+
+
+def _wait_for_cleanup_target_stack_ids(pty: Any, *, exclude: set[str], timeout: float) -> list[str]:
+    """Poll the cleanup ledger every 0.5 s until it lists at least one cleanup target stack.
+
+    Raises:
+        TimeoutError: when ``timeout`` seconds pass without any target stack.
+    """
+    give_up_at = time.monotonic() + timeout
+    while True:
+        if time.monotonic() >= give_up_at:
+            raise TimeoutError("Timed out waiting for rollback cleanup ledger to record target stacks")
+        targets = _cleanup_target_stack_ids(pty, exclude=exclude)
+        if targets:
+            return targets
+        time.sleep(0.5)
+
+
+def _cleanup_resource_for_stack(pty: Any, stack_id: str | None) -> dict[str, Any] | None:
+    """Return the first `cleanup_resources` ledger entry whose id equals `stack_id`.
+
+    Returns `None` when `stack_id` is empty or no entry matches.
+    """
+    if not stack_id:
+        return None
+    id_keys = ("resource_id", "resourceId", "stack_id", "stackId")
+    return next(
+        (
+            entry
+            for entry in _cleanup_ledger_items(pty, "cleanup_resources")
+            if _string_from_mapping(entry, *id_keys) == stack_id
+        ),
+        None,
+    )
+
+
+def _cleanup_resource_completed(resource: dict[str, Any] | None) -> bool:
+    """Tell whether a cleanup ledger entry reports a finished stack deletion.
+
+    The cleanup status is the first truthy value among `cleanupStatus`,
+    `cleanup_status` and `status`; the stack status is the first truthy value
+    among `stackStatus`, `progressStatus` and `progress_status`. The entry
+    counts as completed only when they equal `"completed"` and
+    `"DELETE_COMPLETE"` respectively. Non-dict input is never completed.
+    """
+    if not isinstance(resource, dict):
+        return False
+
+    def _first_truthy(*keys: str) -> Any:
+        for key in keys:
+            value = resource.get(key)
+            if value:
+                return value
+        return None
+
+    if _first_truthy("cleanupStatus", "cleanup_status", "status") != "completed":
+        return False
+    return _first_truthy("stackStatus", "progressStatus", "progress_status") == "DELETE_COMPLETE"
+
+
+def _wait_for_cleanup_resource_status(pty: Any, stack_id: str, statuses: set[str], *, timeout: float) -> None:
+    """Poll the cleanup ledger until the entry for `stack_id` reaches a wanted status.
+
+    The status is the first truthy value among the entry's `cleanup_status`,
+    `cleanupStatus` and `status` keys, converted to `str`; a missing or
+    non-dict entry counts as the empty status.
+
+    Args:
+        pty: Session object forwarded to `_cleanup_resource_for_stack`.
+        stack_id: Stack whose ledger entry is inspected.
+        statuses: Status values that end the wait.
+        timeout: Maximum number of seconds to keep polling.
+
+    Raises:
+        TimeoutError: If none of `statuses` was seen before the deadline.
+    """
+    deadline = time.monotonic() + timeout
+    while True:
+        # Poll before looking at the clock so a zero/negative timeout still
+        # checks once, and so the last check happens at (not before) the deadline.
+        resource = _cleanup_resource_for_stack(pty, stack_id)
+        status = ""
+        if isinstance(resource, dict):
+            status = str(
+                resource.get("cleanup_status") or resource.get("cleanupStatus") or resource.get("status") or ""
+            )
+        if status in statuses:
+            return
+        remaining = deadline - time.monotonic()
+        if remaining <= 0:
+            break
+        # Never sleep past the deadline.
+        time.sleep(min(0.5, remaining))
+    raise TimeoutError(f"Timed out waiting for cleanup ledger status {sorted(statuses)} on {stack_id}")
+
+
+def _cleanup_history_has_event(pty: Any, stack_id: str | None, event_types: set[str]) -> bool:
+    """Tell whether the ledger `history` holds a wanted event for `stack_id`.
+
+    An item matches when its event type (first truthy of `type`, `event_type`,
+    `eventType`, as `str`) is in `event_types` and its stack id equals
+    `stack_id`. The id is read from the nested `resource` value first and from
+    the item itself as a fallback. An empty `stack_id` never matches.
+    """
+    if not stack_id:
+        return False
+    id_keys = ("resource_id", "resourceId", "stack_id", "stackId")
+
+    def _matches(entry: Any) -> bool:
+        kind = str(entry.get("type") or entry.get("event_type") or entry.get("eventType") or "")
+        if kind not in event_types:
+            return False
+        found_id = _string_from_mapping(entry.get("resource"), *id_keys) or _string_from_mapping(entry, *id_keys)
+        return found_id == stack_id
+
+    return any(_matches(entry) for entry in _cleanup_ledger_items(pty, "history"))
+
+
+def _capture_ros_stack_states(pty: Any, stack_ids: Iterable[str], name: str) -> dict[str, dict[str, Any]]:
+    """Collect ROS state snapshots for `stack_ids` and persist them as JSON.
+
+    Snapshots already present in `pty.ros_stack_states` (dict values only, keys
+    converted to `str`) are reused; every other id is queried through
+    `_get_ros_stack_state`. When `pty.run_dir` is not `None`, the redacted
+    result is written to `<run_dir>/<name>.ros-stack-states.json`.
+
+    Returns:
+        Mapping of stack id to its state snapshot (unredacted).
+    """
+    cached = getattr(pty, "ros_stack_states", None)
+    states: dict[str, dict[str, Any]] = (
+        {str(key): value for key, value in cached.items() if isinstance(value, dict)}
+        if isinstance(cached, dict)
+        else {}
+    )
+    env = getattr(pty, "env", {})
+
+    # Decide what to query up front, before `states` starts growing.
+    pending = [wanted for wanted in _unique_strings(stack_ids) if wanted not in states]
+    for wanted in pending:
+        states[wanted] = _get_ros_stack_state(
+            stack_id=wanted,
+            region_id=_region_for_stack(pty, wanted),
+            redaction_env=env,
+        )
+
+    run_dir = getattr(pty, "run_dir", None)
+    if run_dir is None:
+        return states
+
+    target = Path(run_dir) / f"{name}.ros-stack-states.json"
+    _write_json(target, _redact_json_value(states, env if isinstance(env, dict) else {}))
+    return states
+
+
+def _fresh_ros_stack_state(pty: Any, stack_id: str) -> dict[str, Any]:
+    """Query the state of `stack_id` via `_get_ros_stack_state` without any caching.
+
+    The region comes from `_region_for_stack` and `pty.env` is used for
+    redaction of error text.
+    """
+    region = _region_for_stack(pty, stack_id)
+    env = getattr(pty, "env", {})
+    return _get_ros_stack_state(stack_id=stack_id, region_id=region, redaction_env=env)
+
+
+def _get_ros_stack_state(
+    *,
+    stack_id: str,
+    region_id: str,
+    redaction_env: dict[str, str] | None,
+) -> dict[str, Any]:
+    """Query ROS for one stack and return a small status snapshot.
+
+    This function does not raise for ordinary failures: any `Exception` from
+    the imports, credential lookup, client creation or the `get_stack` call is
+    converted into an error snapshot.
+
+    Args:
+        stack_id: Id of the stack to look up.
+        region_id: Region to query; when empty, the region of the "aliyun"
+            credential is used if a credential is available.
+        redaction_env: Passed to `_redact_sensitive_text` when recording an
+            error message.
+
+    Returns:
+        On success: `stack_id`, `stack_name`, `region_id`, `status`,
+        `status_reason` and `not_found=False`.
+        On failure: `stack_id`, the `region_id` argument as given, an empty
+        `status`, `not_found` as decided by `_is_ros_stack_not_found`, and
+        `error` holding the redacted message compacted to at most 1000 chars.
+    """
+    try:
+        # Imported lazily inside the try so an import failure is also reported
+        # through the error snapshot below instead of propagating.
+        from alibabacloud_ros20190910 import models as ros_models
+
+        from iac_code.services.cloud_credentials import CloudCredentials
+        from iac_code.tools.cloud.aliyun.ros_client import RosClientFactory
+
+        credential = CloudCredentials().get_provider("aliyun")
+        # An explicit region wins; otherwise fall back to the credential's region.
+        effective_region = region_id or (credential.region_id if credential is not None else "")
+        client = RosClientFactory.create(credential, effective_region)
+        request = ros_models.GetStackRequest(stack_id=stack_id, region_id=effective_region)
+        response = client.get_stack(request)
+        body = response.body.to_map()
+        return {
+            "stack_id": str(body.get("StackId") or stack_id),
+            "stack_name": str(body.get("StackName") or ""),
+            "region_id": effective_region,
+            "status": str(body.get("Status") or ""),
+            "status_reason": str(body.get("StatusReason") or ""),
+            "not_found": False,
+        }
+    except Exception as exc:
+        message = _redact_sensitive_text(str(exc), redaction_env)
+        # NOTE(review): this snapshot has no `stack_name`/`status_reason` keys and
+        # reports the caller's `region_id`, not the effective region.
+        return {
+            "stack_id": stack_id,
+            "region_id": region_id,
+            "status": "",
+            "not_found": _is_ros_stack_not_found(exc),
+            "error": _compact_text(message, max_chars=1000),
+        }
+
+
+def _delete_ros_stack(
+    *,
+    stack_id: str,
+    region_id: str,
+    redaction_env: dict[str, str] | None,
+) -> None:
+    """Issue a ROS `delete_stack` request for `stack_id`.
+
+    The function returns once the request has been sent; it does not poll for
+    the stack to disappear.
+
+    Args:
+        stack_id: Id of the stack to delete.
+        region_id: Region to use; when empty, the region of the "aliyun"
+            credential is used if a credential is available.
+        redaction_env: Passed to `_redact_sensitive_text` when building the
+            error message.
+
+    Raises:
+        RuntimeError: For any failure that `_is_ros_stack_not_found` does not
+            classify as "not found". The message is redacted and compacted to
+            at most 1000 chars; the original exception is chained as the cause.
+    """
+    try:
+        # Imported lazily inside the try so an import failure is wrapped in the
+        # same redacted RuntimeError as any other failure.
+        from alibabacloud_ros20190910 import models as ros_models
+
+        from iac_code.services.cloud_credentials import CloudCredentials
+        from iac_code.tools.cloud.aliyun.ros_client import RosClientFactory
+
+        credential = CloudCredentials().get_provider("aliyun")
+        # An explicit region wins; otherwise fall back to the credential's region.
+        effective_region = region_id or (credential.region_id if credential is not None else "")
+        client = RosClientFactory.create(credential, effective_region)
+        request = ros_models.DeleteStackRequest(stack_id=stack_id, region_id=effective_region)
+        client.delete_stack(request)
+    except Exception as exc:
+        # A stack that no longer exists is treated as already deleted.
+        if _is_ros_stack_not_found(exc):
+            return
+        message = _redact_sensitive_text(str(exc), redaction_env)
+        raise RuntimeError(_compact_text(message, max_chars=1000)) from exc
+
+
+def _wait_for_ros_stack_deleted(
+    *,
+    pty: Any,
+    stack_id: str,
+    timeout: float,
+) -> dict[str, Any]:
+    """Poll ROS until `stack_id` is reported as deleted.
+
+    Args:
+        pty: Session object forwarded to `_fresh_ros_stack_state`.
+        stack_id: Id of the stack being deleted.
+        timeout: Maximum number of seconds to keep polling.
+
+    Returns:
+        The first state snapshot for which `_ros_stack_deleted` is true.
+
+    Raises:
+        TimeoutError: If the stack was still not deleted at the deadline; the
+            message carries the last observed status.
+    """
+    deadline = time.monotonic() + timeout
+    last_state: dict[str, Any] = {}
+    while True:
+        # Query before looking at the clock so a zero/negative timeout still
+        # checks once and the timeout message reports a real status.
+        last_state = _fresh_ros_stack_state(pty, stack_id)
+        if _ros_stack_deleted(last_state):
+            return last_state
+        remaining = deadline - time.monotonic()
+        if remaining <= 0:
+            break
+        # Never sleep past the deadline; the final query lands on it.
+        time.sleep(min(5, remaining))
+    status = last_state.get("status") or "<unknown>"
+    raise TimeoutError(f"Timed out waiting for ROS stack deletion: {stack_id} ({status})")
+
+
+def _is_ros_stack_not_found(exc: BaseException) -> bool:
+    """Tell whether `exc` looks like a "stack does not exist" error.
+
+    The exception's optional `code` attribute and its string form are joined
+    with a space, lower-cased, and searched for a fixed set of marker
+    substrings.
+    """
+    code_text = str(getattr(exc, "code", "") or "")
+    haystack = " ".join((code_text, str(exc))).lower()
+    for marker in (
+        "stacknotfound",
+        "notfound.stack",
+        "entitynotexist.stack",
+        "specified stack does not exist",
+        "stack could not be found",
+        "stack not found",
+    ):
+        if marker in haystack:
+            return True
+    return False
+
+
+def _region_for_stack(pty: Any, stack_id: str) -> str:
+    """Resolve the region recorded for `stack_id`.
+
+    The `cleanup_resources` ledger section is searched before
+    `observed_resources`, each from its last entry backwards; the first
+    matching entry with a non-empty region wins. Without such an entry the
+    `ALIBABA_CLOUD_REGION_ID` value of `pty.env` is returned, or `""` when
+    `pty.env` is not a dict or lacks the key.
+    """
+    id_keys = ("resource_id", "resourceId", "stack_id", "stackId")
+    for section in ("cleanup_resources", "observed_resources"):
+        matching = (
+            entry
+            for entry in reversed(_cleanup_ledger_items(pty, section))
+            if _string_from_mapping(entry, *id_keys) == stack_id
+        )
+        for entry in matching:
+            found_region = _string_from_mapping(entry, "region_id", "regionId", "RegionId")
+            if found_region:
+                return found_region
+
+    env = getattr(pty, "env", {})
+    if not isinstance(env, dict):
+        return ""
+    return env.get("ALIBABA_CLOUD_REGION_ID", "")
+
+
+def _ros_stack_deleted(state: dict[str, Any]) -> bool:
+    """Tell whether a state snapshot describes a deleted stack.
+
+    A snapshot counts as deleted when `not_found` is exactly `True` or its
+    `status` is a member of `ROS_STACK_DELETED_STATUSES`. Non-dict input is
+    never deleted.
+    """
+    if not isinstance(state, dict):
+        return False
+    return state.get("not_found") is True or state.get("status") in ROS_STACK_DELETED_STATUSES
+
+
+def _ros_stack_retained(state: dict[str, Any]) -> bool:
+    """Tell whether a state snapshot describes a stack that still exists.
+
+    True only for a dict snapshot whose `not_found` is not `True` and whose
+    `status` is a non-empty string that does not start with `DELETE_`.
+    """
+    if not isinstance(state, dict):
+        return False
+    if state.get("not_found") is True:
+        return False
+    status = state.get("status")
+    if not isinstance(status, str) or not status:
+        return False
+    return not status.startswith("DELETE_")
+
+
+def _ros_stack_states_for_acceptance(pty: Any, stack_ids: Iterable[str], name: str) -> dict[str, dict[str, Any]]:
+    """Capture ROS state snapshots for acceptance checks.
+
+    Passes `stack_ids` through `_unique_strings` and delegates to
+    `_capture_ros_stack_states` with the given snapshot `name`.
+    """
+    wanted_ids = _unique_strings(stack_ids)
+    return _capture_ros_stack_states(pty, wanted_ids, name)
+
+
+def _apply_cleanup_acceptance_checks(
+    *,
+    scenario: str,
+    transcript: str,
+    events: list[dict[str, Any]],
+    pty: Any,
+    checks: dict[str, bool],
+) -> None:
+    """Register the acceptance checks of the rollback-cleanup scenarios.
+
+    Every result is recorded through `_add_acceptance_check`. The checks
+    compare the two stack ids stored on `pty` (`cleanup_first_stack_id`,
+    `cleanup_second_stack_id`) against the cleanup ledger and against ROS state
+    snapshots captured under the name "acceptance-after-cleanup".
+
+    Args:
+        scenario: Scenario name; "rollback-step5-cleanup-recovery" adds the
+            kill/resume checks at the end.
+        transcript: Transcript text searched for deployment failure patterns.
+        events: Recorded events; only read by the recovery-specific checks.
+        pty: Session object carrying the stack ids, ledger and `run_dir`.
+        checks: Mapping that receives the check results.
+    """
+    first_stack_id = str(getattr(pty, "cleanup_first_stack_id", "") or "")
+    second_stack_id = str(getattr(pty, "cleanup_second_stack_id", "") or "")
+    # Ids of every ROS stack resource in the ledger's `observed_resources` section.
+    observed_stack_ids = {
+        stack_id
+        for stack_id in (
+            _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+            for resource in _cleanup_ledger_items(pty, "observed_resources")
+            if _is_ros_stack_resource(resource)
+        )
+        if stack_id
+    }
+    # Cleanup targets, with the second stack left out when its id is known.
+    cleanup_stack_ids = _cleanup_target_stack_ids(pty, exclude={stack_id for stack_id in [second_stack_id] if stack_id})
+    run_dir = Path(getattr(pty, "run_dir", ""))
+    expected_first_stack_name = _cleanup_stack_name(run_dir, "first")
+    expected_second_stack_name = _cleanup_stack_name(run_dir, "second")
+
+    # --- Ledger-based checks ---
+    _add_acceptance_check(
+        checks,
+        "first rollback stack observed",
+        bool(first_stack_id) and first_stack_id in observed_stack_ids,
+    )
+    _add_acceptance_check(
+        checks,
+        "rollback cleanup ledger includes first stack",
+        bool(first_stack_id) and first_stack_id in cleanup_stack_ids,
+    )
+    _add_acceptance_check(checks, "rollback cleanup target stacks observed", bool(cleanup_stack_ids))
+    _add_acceptance_check(
+        checks,
+        "second stack created after rollback",
+        bool(second_stack_id) and second_stack_id != first_stack_id and second_stack_id in observed_stack_ids,
+    )
+    _add_acceptance_check(
+        checks,
+        "first rollback stack name matches test stack",
+        bool(first_stack_id) and _observed_cleanup_stack_name(pty, first_stack_id) == expected_first_stack_name,
+    )
+    _add_acceptance_check(
+        checks,
+        "second stack name matches test stack",
+        bool(second_stack_id) and _observed_cleanup_stack_name(pty, second_stack_id) == expected_second_stack_name,
+    )
+    _add_acceptance_check(
+        checks,
+        "cleanup snapshot does not target second stack",
+        bool(second_stack_id) and _cleanup_resource_for_stack(pty, second_stack_id) is None,
+    )
+    _add_acceptance_check(
+        checks,
+        "rollback cleanup completed",
+        bool(cleanup_stack_ids)
+        and all(
+            _cleanup_resource_completed(_cleanup_resource_for_stack(pty, stack_id)) for stack_id in cleanup_stack_ids
+        ),
+    )
+    _add_acceptance_check(
+        checks,
+        "no ROS create failure in cleanup transcript",
+        not _has_any_pattern(transcript, CLEANUP_DEPLOYMENT_FAILURE_PATTERNS),
+    )
+
+    # --- Checks against ROS state snapshots ---
+    # NOTE(review): only the cleanup targets and the second stack are requested
+    # here, so the first stack has a snapshot only if it is one of the cleanup
+    # targets or already cached in `pty.ros_stack_states`; otherwise the
+    # "ROS first rollback stack deleted" check sees `{}` and fails.
+    ros_states = _ros_stack_states_for_acceptance(
+        pty,
+        [*cleanup_stack_ids, second_stack_id],
+        "acceptance-after-cleanup",
+    )
+    _add_acceptance_check(
+        checks,
+        "ROS first rollback stack deleted",
+        bool(first_stack_id) and _ros_stack_deleted(ros_states.get(first_stack_id, {})),
+    )
+    _add_acceptance_check(
+        checks,
+        "ROS rollback cleanup stacks deleted",
+        bool(cleanup_stack_ids)
+        and all(_ros_stack_deleted(ros_states.get(stack_id, {})) for stack_id in cleanup_stack_ids),
+    )
+    _add_acceptance_check(
+        checks,
+        "ROS second stack retained",
+        bool(second_stack_id) and _ros_stack_retained(ros_states.get(second_stack_id, {})),
+    )
+
+    # --- Extra checks for the kill-and-resume variant ---
+    if scenario == "rollback-step5-cleanup-recovery":
+        _add_acceptance_check(
+            checks,
+            "cleanup process was killed",
+            any(event.get("type") == "terminate" and event.get("force") is True for event in events),
+        )
+        _add_acceptance_check(checks, "cleanup resume used --continue", bool(_resume_spawns(events)))
+        _add_acceptance_check(
+            checks,
+            "cleanup retriggered after restart",
+            bool(_resume_spawns(events))
+            and _cleanup_history_has_event(
+                pty,
+                first_stack_id,
+                {"cleanup_started", "cleanup_progress", "cleanup_completed"},
+            ),
+        )
+
+
+def _owned_cleanup_stack_names(run_dir: Path) -> set[str]:
+    """Return the set of `_cleanup_stack_name` results for the "first" and "second" stacks of `run_dir`."""
+    return {_cleanup_stack_name(run_dir, slot) for slot in ("first", "second")}
+
+
+def _observed_cleanup_stack_ids(pty: Any) -> list[str]:
+    """Return every stack id the cleanup scenario knows about.
+
+    The two ids stored on `pty` (`cleanup_first_stack_id`,
+    `cleanup_second_stack_id`) come first, followed by the ids of all ROS stack
+    resources in the ledger's `observed_resources` section; the combined list
+    is passed through `_unique_strings`.
+    """
+    tracked = [
+        str(getattr(pty, attribute, "") or "")
+        for attribute in ("cleanup_first_stack_id", "cleanup_second_stack_id")
+    ]
+    from_ledger = [
+        _string_from_mapping(entry, "resource_id", "resourceId", "stack_id", "stackId")
+        for entry in _cleanup_ledger_items(pty, "observed_resources")
+        if _is_ros_stack_resource(entry)
+    ]
+    return _unique_strings(tracked + from_ledger)
+
+
+def _observed_cleanup_stack_name(pty: Any, stack_id: str) -> str:
+    """Return the stack name recorded for `stack_id` in `observed_resources`.
+
+    The section is scanned from its last entry backwards; the name of the first
+    ROS stack resource whose id equals `stack_id` is returned, even if that
+    name is empty. Without a match the result is `""`.
+    """
+    id_keys = ("resource_id", "resourceId", "stack_id", "stackId")
+    name_keys = ("resource_name", "resourceName", "stack_name", "stackName")
+    for entry in reversed(_cleanup_ledger_items(pty, "observed_resources")):
+        if _is_ros_stack_resource(entry) and _string_from_mapping(entry, *id_keys) == stack_id:
+            return _string_from_mapping(entry, *name_keys)
+    return ""
+
+
+def _apply_stack_creating_acceptance_checks(scenario: str, pty: Any, checks: dict[str, bool]) -> None:
+    """Register the checks shared by scenarios listed in `STACK_CREATING_SCENARIOS`.
+
+    Records, through `_add_acceptance_check`, that a created stack was observed
+    in the cleanup ledger, that the expected scenario stack name is among the
+    observed names, and that at least one observed stack is still retained in
+    ROS. ROS is only queried (snapshot name "acceptance-before-teardown") when
+    at least one stack id was observed. Other scenarios are left untouched.
+    """
+    if scenario not in STACK_CREATING_SCENARIOS:
+        return
+
+    stack_ids = _observed_create_stack_ids(pty)
+    run_dir = Path(getattr(pty, "run_dir", ""))
+    expected_stack_name = _scenario_stack_name(run_dir, scenario)
+    stack_names = _observed_create_stack_names(pty)
+    has_stacks = bool(stack_ids)
+
+    _add_acceptance_check(checks, "ROS stack observed in cleanup ledger", has_stacks)
+
+    name_is_owned = has_stacks and expected_stack_name in stack_names
+    _add_acceptance_check(checks, "ROS stack name is test-owned", name_is_owned)
+
+    if stack_ids:
+        ros_states = _ros_stack_states_for_acceptance(pty, stack_ids, "acceptance-before-teardown")
+    else:
+        ros_states = {}
+    any_retained = has_stacks and any(_ros_stack_retained(ros_states.get(found, {})) for found in stack_ids)
+    _add_acceptance_check(checks, "ROS created stack retained before teardown", any_retained)
+
+
+def _teardown_cleanup_scenario_resources(
+    *,
+    args: argparse.Namespace,
+    scenario: str,
+    pty: Any,
+    checks: dict[str, bool],
+    notes: list[str],
+) -> None:
+    """Delete the ROS stacks left behind by a rollback-cleanup scenario.
+
+    Does nothing for other scenarios. With `args.skip_final_teardown` set, only
+    a note is recorded. Otherwise every id from `_observed_cleanup_stack_ids`
+    is checked against ROS; stacks that are not already deleted are removed,
+    but only if the name ROS reports is one of the scenario's own stack names.
+
+    Args:
+        args: Parsed CLI options; reads `skip_final_teardown` and
+            `final_teardown_timeout`.
+        scenario: Scenario name.
+        pty: Session object carrying the ledger, `run_dir` and `env`.
+        checks: Receives the teardown result under a "teardown: ..." key.
+        notes: Receives one note per failure and a summary of deleted stacks.
+    """
+    if scenario not in {"rollback-step5-cleanup", "rollback-step5-cleanup-recovery"}:
+        return
+    if args.skip_final_teardown:
+        notes.append("final teardown skipped by --skip-final-teardown")
+        return
+
+    run_dir = Path(getattr(pty, "run_dir", ""))
+    owned_stack_names = _owned_cleanup_stack_names(run_dir)
+    stack_ids = _observed_cleanup_stack_ids(pty)
+    if not stack_ids:
+        checks["teardown: no cleanup scenario stacks leaked"] = True
+        return
+
+    deletion_failures: list[str] = []
+    deleted_stack_ids: list[str] = []
+    for stack_id in stack_ids:
+        state = _fresh_ros_stack_state(pty, stack_id)
+        # Already gone: nothing to delete and not a failure.
+        if _ros_stack_deleted(state):
+            continue
+
+        # Ownership guard: never delete a stack whose live name is not one of
+        # this run's names. A failed state query yields an empty name and is
+        # therefore reported as a failure as well.
+        stack_name = str(state.get("stack_name") or "")
+        if stack_name not in owned_stack_names:
+            deletion_failures.append(
+                f"{stack_id} has unexpected stack name {stack_name or '<unknown>'}; "
+                f"expected one of {sorted(owned_stack_names)}"
+            )
+            continue
+
+        try:
+            _delete_ros_stack(
+                stack_id=stack_id,
+                region_id=str(state.get("region_id") or _region_for_stack(pty, stack_id)),
+                redaction_env=getattr(pty, "env", {}),
+            )
+            final_state = _wait_for_ros_stack_deleted(pty=pty, stack_id=stack_id, timeout=args.final_teardown_timeout)
+            if _ros_stack_deleted(final_state):
+                deleted_stack_ids.append(stack_id)
+            else:
+                deletion_failures.append(f"{stack_id} final status is {final_state.get('status') or '<unknown>'}")
+        except Exception as exc:
+            # Record the failure (including a wait timeout) and keep going so
+            # the remaining stacks still get a teardown attempt.
+            deletion_failures.append(f"{stack_id}: {type(exc).__name__}: {exc}")
+
+    for failure in deletion_failures:
+        notes.append(f"final teardown failed: {_compact_text(failure, max_chars=1000)}")
+
+    checks["teardown: cleanup scenario owned ROS stacks deleted"] = not deletion_failures
+    if deleted_stack_ids:
+        notes.append(f"final teardown deleted ROS stacks: {', '.join(deleted_stack_ids)}")
+
+
+def _teardown_real_cloud_scenario_resources(
+    *,
+    args: argparse.Namespace,
+    scenario: str,
+    pty: Any,
+    checks: dict[str, bool],
+    notes: list[str],
+) -> None:
+    """Delete the ROS stacks a real-cloud scenario created.
+
+    The two rollback-cleanup scenarios are delegated to
+    `_teardown_cleanup_scenario_resources`. For every other scenario, with
+    `args.skip_final_teardown` set only a note is recorded; otherwise each
+    resource from `_observed_create_stack_resources` is deleted, provided both
+    the name recorded in the ledger and the name ROS reports equal the expected
+    scenario stack name.
+
+    Args:
+        args: Parsed CLI options; reads `skip_final_teardown` and
+            `final_teardown_timeout`.
+        scenario: Scenario name.
+        pty: Session object carrying the ledger, `run_dir` and `env`.
+        checks: Receives the teardown result under a "teardown: ..." key.
+        notes: Receives one note per failure and a summary of deleted stacks.
+    """
+    if scenario in {"rollback-step5-cleanup", "rollback-step5-cleanup-recovery"}:
+        _teardown_cleanup_scenario_resources(args=args, scenario=scenario, pty=pty, checks=checks, notes=notes)
+        return
+    if args.skip_final_teardown:
+        notes.append("final teardown skipped by --skip-final-teardown")
+        return
+
+    resources = _observed_create_stack_resources(pty)
+    if not resources:
+        checks["teardown: no observed ROS stacks leaked"] = True
+        return
+
+    deletion_failures: list[str] = []
+    deleted_stack_ids: list[str] = []
+    expected_scenario_stack_name = _scenario_stack_name(Path(getattr(pty, "run_dir", "")), scenario)
+    for resource in resources:
+        stack_id = _string_from_mapping(resource, "resource_id", "resourceId", "stack_id", "stackId")
+        if not stack_id:
+            continue
+        # Despite its name, this is the stack name *recorded in the ledger*.
+        expected_stack_name = _string_from_mapping(resource, "resource_name", "resourceName", "stack_name", "stackName")
+        # First guard: the ledger name must be this scenario's stack name. This
+        # runs before the ROS query, so a mismatch is reported even when the
+        # stack is already deleted.
+        if expected_stack_name != expected_scenario_stack_name:
+            deletion_failures.append(
+                f"{stack_id} has unexpected test-owned stack name {expected_stack_name or '<unknown>'}; "
+                f"expected {expected_scenario_stack_name}"
+            )
+            continue
+        state = _fresh_ros_stack_state(pty, stack_id)
+        # Already gone: nothing to delete and not a failure.
+        if _ros_stack_deleted(state):
+            continue
+
+        actual_stack_name = str(state.get("stack_name") or "")
+        # NOTE(review): after the first guard this branch can only trigger when
+        # the expected scenario stack name is itself empty - confirm whether
+        # the check was meant to run before that guard.
+        if not expected_stack_name:
+            deletion_failures.append(f"{stack_id} has no observed stack name in cleanup ledger")
+            continue
+        # Second guard: the name ROS reports must match the ledger name.
+        if actual_stack_name != expected_stack_name:
+            deletion_failures.append(
+                f"{stack_id} has unexpected stack name {actual_stack_name or '<unknown>'}; "
+                f"expected observed name {expected_stack_name}"
+            )
+            continue
+
+        try:
+            _delete_ros_stack(
+                stack_id=stack_id,
+                region_id=str(state.get("region_id") or _region_for_stack(pty, stack_id)),
+                redaction_env=getattr(pty, "env", {}),
+            )
+            final_state = _wait_for_ros_stack_deleted(pty=pty, stack_id=stack_id, timeout=args.final_teardown_timeout)
+            if _ros_stack_deleted(final_state):
+                deleted_stack_ids.append(stack_id)
+            else:
+                deletion_failures.append(f"{stack_id} final status is {final_state.get('status') or '<unknown>'}")
+        except Exception as exc:
+            # Record the failure (including a wait timeout) and keep going so
+            # the remaining stacks still get a teardown attempt.
+            deletion_failures.append(f"{stack_id}: {type(exc).__name__}: {exc}")
+
+    for failure in deletion_failures:
+        notes.append(f"final teardown failed: {_compact_text(failure, max_chars=1000)}")
+
+    checks["teardown: observed ROS stacks deleted"] = not deletion_failures
+    if deleted_stack_ids:
+        notes.append(f"final teardown deleted ROS stacks: {', '.join(deleted_stack_ids)}")
+
+
+def _apply_acceptance_checks(
+    scenario: str,
+    args: argparse.Namespace,
+    pty: Any,
+    checks: dict[str, bool],
+) -> None:
+    raw_transcript = str(getattr(pty, "transcript", ""))
+    transcript = _normalize_transcript(raw_transcript)
+    events = list(getattr(pty, "events", []))
+    _add_acceptance_check(checks, "PTY transcript captured", bool(transcript.strip()))
+    _add_acceptance_check(
+        checks,
+        "no terminal error in PTY transcript",
+        not _has_any_pattern(transcript, TERMINAL_ERROR_PATTERNS),
+    )
+
+    if scenario == "scenario1":
+        normal_answer = _suffix_after_sendline_text(raw_transcript, events, args.normal_followup_prompt)
+        _add_acceptance_check(
+            checks,
+            "candidate selection was shown",
+            _has_any_pattern(transcript, CANDIDATE_SELECTION_PATTERNS),
+        )
+        _add_acceptance_check(checks, "pipeline completed", _has_any_pattern(transcript, PIPELINE_COMPLETED_PATTERNS))
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+        _add_acceptance_check(
+            checks,
+            "normal follow-up answered created VSwitch",
+            _has_vswitch_answer_evidence(normal_answer),
+        )
+    elif scenario == "image-initial":
+        _add_acceptance_check(checks, "initial image fixture was pasted", _has_image_fixture_event(events, "initial"))
+        _add_acceptance_check(
+            checks,
+            "candidate selection was shown",
+            _has_any_pattern(transcript, CANDIDATE_SELECTION_PATTERNS),
+        )
+        _add_acceptance_check(checks, "pipeline completed", _has_any_pattern(transcript, PIPELINE_COMPLETED_PATTERNS))
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario == "image-ask-waiting-resume":
+        after_answer = _suffix_after_image_fixture(raw_transcript, events, "ask-first-answer")
+        _add_acceptance_check(
+            checks,
+            "ask user question was replayed after resume",
+            _count_pattern(transcript, ASK_USER_QUESTION_HEADING_PATTERNS) >= 2,
+        )
+        _add_acceptance_check(checks, "resume used --continue", bool(_resume_spawns(events)))
+        _add_acceptance_check(
+            checks,
+            "ask answer image fixture was pasted",
+            _has_image_fixture_event(events, "ask-first-answer"),
+        )
+        _add_acceptance_check(
+            checks,
+            "ask image answer advanced pipeline after resume",
+            _has_any_pattern(after_answer or transcript, CANDIDATE_SELECTION_PATTERNS + PIPELINE_COMPLETED_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario == "image-selection-waiting-resume":
+        _add_acceptance_check(checks, "initial image fixture was pasted", _has_image_fixture_event(events, "initial"))
+        _add_acceptance_check(
+            checks,
+            "candidate selection was replayed after resume",
+            _count_pattern(transcript, CANDIDATE_SELECTION_PATTERNS) >= 2,
+        )
+        _add_acceptance_check(checks, "resume used --continue", bool(_resume_spawns(events)))
+        _add_acceptance_check(
+            checks,
+            "pipeline completed after resume",
+            _has_any_pattern(transcript, PIPELINE_COMPLETED_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario == "image-normal-handoff":
+        normal_answer = _suffix_after_image_fixture(raw_transcript, events, "normal-followup")
+        _add_acceptance_check(
+            checks,
+            "candidate selection was shown",
+            _has_any_pattern(transcript, CANDIDATE_SELECTION_PATTERNS),
+        )
+        _add_acceptance_check(checks, "pipeline completed", _has_any_pattern(transcript, PIPELINE_COMPLETED_PATTERNS))
+        _add_acceptance_check(
+            checks,
+            "normal follow-up image fixture was pasted",
+            _has_image_fixture_event(events, "normal-followup"),
+        )
+        _add_acceptance_check(
+            checks,
+            "normal image follow-up answered created VSwitch",
+            _has_vswitch_answer_evidence(normal_answer),
+        )
+    elif scenario == "image-interrupt":
+        after_rollback = _suffix_after_image_fixture(raw_transcript, events, "rollback-interrupt")
+        _add_acceptance_check(
+            checks,
+            "rollback image fixture was pasted",
+            _has_image_fixture_event(events, "rollback-interrupt"),
+        )
+        _add_acceptance_check(
+            checks,
+            "rollback reached evaluate_candidates step",
+            _has_any_pattern(transcript, EVALUATE_CANDIDATES_HEADING_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "rollback image produced post-interrupt pipeline progress",
+            _has_any_pattern(after_rollback, POST_ROLLBACK_PROGRESS_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is security group",
+            _has_security_group_target_evidence(after_rollback),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is not VSwitch",
+            not _has_positive_vswitch_target_evidence(after_rollback),
+        )
+    elif scenario == "ask-waiting":
+        after_answer = _normalize_transcript(
+            _last_event_suffix(raw_transcript, events, event_type="sendline", text=args.ask_answer)
+        )
+        _add_acceptance_check(checks, "ask user question was shown", "Ask user question" in transcript)
+        _add_acceptance_check(
+            checks,
+            "ask answer advanced pipeline",
+            _has_any_pattern(after_answer or transcript, CANDIDATE_SELECTION_PATTERNS + PIPELINE_COMPLETED_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario == "selection-waiting-resume":
+        continue_spawns = _resume_spawns(events)
+        _add_acceptance_check(
+            checks,
+            "candidate selection was replayed after resume",
+            _count_pattern(transcript, CANDIDATE_SELECTION_PATTERNS) >= 2,
+        )
+        _add_acceptance_check(checks, "resume used --continue", bool(continue_spawns))
+        _add_acceptance_check(
+            checks,
+            "pipeline completed after resume",
+            _has_any_pattern(transcript, PIPELINE_COMPLETED_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario == "rollback-step3":
+        after_rollback = _suffix_after_sendline_text(raw_transcript, events, args.rollback_prompt)
+        _add_acceptance_check(
+            checks,
+            "rollback reached evaluate_candidates step",
+            _has_any_pattern(transcript, EVALUATE_CANDIDATES_HEADING_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "rollback produced post-interrupt pipeline progress",
+            _has_any_pattern(after_rollback, POST_ROLLBACK_PROGRESS_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is security group",
+            _has_security_group_target_evidence(after_rollback),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is not VSwitch",
+            not _has_positive_vswitch_target_evidence(after_rollback),
+        )
+    elif scenario == "rollback-step2":
+        after_rollback = _suffix_after_sendline_text(raw_transcript, events, args.rollback_prompt)
+        _add_acceptance_check(
+            checks,
+            "rollback reached architecture_planning step",
+            _has_any_pattern(transcript, ARCHITECTURE_PLANNING_HEADING_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "rollback produced post-interrupt pipeline progress",
+            _has_any_pattern(after_rollback, POST_ROLLBACK_PROGRESS_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is security group",
+            _has_security_group_target_evidence(after_rollback),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is not VSwitch",
+            not _has_positive_vswitch_target_evidence(after_rollback),
+        )
+    elif scenario == "rollback-step4-selection":
+        after_rollback = _suffix_after_sendline_text(raw_transcript, events, args.rollback_prompt)
+        _add_acceptance_check(
+            checks,
+            "rollback reached candidate selection step",
+            _has_any_pattern(transcript, CANDIDATE_SELECTION_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "rollback produced post-interrupt pipeline progress",
+            _has_any_pattern(after_rollback, POST_ROLLBACK_PROGRESS_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is security group",
+            _has_security_group_target_evidence(after_rollback),
+        )
+        _add_acceptance_check(
+            checks,
+            "post-rollback target is not VSwitch",
+            not _has_positive_vswitch_target_evidence(after_rollback),
+        )
+    elif scenario == "evaluate-resume":
+        after_continue = _normalize_transcript(
+            _last_event_suffix(
+                raw_transcript,
+                events,
+                event_type="sendline",
+                text=args.evaluate_resume_continue_prompt,
+            )
+        )
+        _add_acceptance_check(
+            checks,
+            "evaluate_candidates was shown before resume",
+            _has_any_pattern(transcript, EVALUATE_CANDIDATES_HEADING_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "evaluate_candidates was replayed after resume",
+            _count_pattern(transcript, EVALUATE_CANDIDATES_HEADING_PATTERNS) >= 2,
+        )
+        _add_acceptance_check(checks, "resume used --continue", bool(_resume_spawns(events)))
+        _add_acceptance_check(
+            checks,
+            "resume continue input was sent",
+            _has_sendline_event(events, args.evaluate_resume_continue_prompt),
+        )
+        _add_acceptance_check(
+            checks,
+            "pipeline advanced after resume continue",
+            _has_any_pattern(after_continue or transcript, CANDIDATE_SELECTION_PATTERNS + PIPELINE_COMPLETED_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario == "ask-waiting-resume":
+        after_answer = _normalize_transcript(
+            _last_event_suffix(raw_transcript, events, event_type="sendline", text=args.ask_answer)
+        )
+        _add_acceptance_check(
+            checks,
+            "ask user question was replayed after resume",
+            _count_pattern(transcript, ASK_USER_QUESTION_HEADING_PATTERNS) >= 2,
+        )
+        _add_acceptance_check(checks, "resume used --continue", bool(_resume_spawns(events)))
+        _add_acceptance_check(
+            checks,
+            "ask answer advanced pipeline after resume",
+            _has_any_pattern(after_answer or transcript, CANDIDATE_SELECTION_PATTERNS + PIPELINE_COMPLETED_PATTERNS),
+        )
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario == "selection-invalid-then-valid":
+        _add_acceptance_check(
+            checks,
+            "invalid selection input was sent",
+            _event_index(events, "select-invalid-candidate") is not None,
+        )
+        _add_acceptance_check(
+            checks,
+            "valid selection input was sent after invalid input",
+            _event_before(events, "select-invalid-candidate", "select-default-candidate"),
+        )
+        _add_acceptance_check(checks, "pipeline completed", _has_any_pattern(transcript, PIPELINE_COMPLETED_PATTERNS))
+        _add_acceptance_check(
+            checks,
+            "VSwitch evidence found in PTY transcript",
+            _has_vswitch_business_evidence(transcript),
+        )
+    elif scenario in {"rollback-step5-cleanup", "rollback-step5-cleanup-recovery"}:
+        _add_acceptance_check(
+            checks,
+            "deploying step was reached",
+            _has_any_pattern(transcript, DEPLOYING_STEP_PATTERNS + FIRST_STACK_CREATED_PATTERNS),
+        )
+        _add_acceptance_check(checks, "cleanup started", _has_any_pattern(transcript, CLEANUP_STARTED_PATTERNS))
+        _apply_cleanup_acceptance_checks(
+            scenario=scenario,
+            transcript=transcript,
+            events=events,
+            pty=pty,
+            checks=checks,
+        )
+    _apply_stack_creating_acceptance_checks(scenario, pty, checks)
+
+
+def _select_default_candidate(pty: ReplPty, args: argparse.Namespace) -> None:
+    """Pick a candidate: send ``args.selection_prompt`` plus Enter, or a bare Enter when it is empty."""
+    chosen = args.selection_prompt
+    keystrokes = f"{chosen}\r" if chosen else "\r"
+    pty.send(keystrokes, label="select-default-candidate")
+
+
+def _expect_initial_prompt(pty: ReplPty, args: argparse.Namespace) -> None:
+    for pats, what in ((REPL_PROMPT_PATTERNS, "initial prompt"), (REPL_INPUT_READY_PATTERNS, "prompt input ready")):
+        pty.expect_any(pats, description=what, timeout=args.timeout)  # prompt first, then input readiness
+
+
+def _expect_candidate_selection(pty: ReplPty, args: argparse.Namespace, *, description: str) -> None:
+    """Wait for the candidate selection view, then optionally for its ready marker."""
+    pty.expect_any(CANDIDATE_SELECTION_PATTERNS, timeout=args.stream_timeout, description=description)
+    # The ready marker is awaited with expect_optional under its own, separate timeout.
+    ready_wait = args.candidate_selection_ready_timeout
+    ready_label = "candidate selection controls ready"
+    pty.expect_optional(CANDIDATE_SELECTION_READY_PATTERNS, description=ready_label, timeout=ready_wait)
+
+
+def _expect_raw_input_ready(pty: ReplPty, args: argparse.Namespace, *, description: str) -> None:
+    pty.expect_any(REPL_INPUT_READY_PATTERNS, timeout=args.timeout, description=description)  # not stream_timeout
+
+
+def _expect_parallel_interrupt_ready(pty: ReplPty, args: argparse.Namespace) -> None:
+    pty.expect_any(REPL_INPUT_READY_PATTERNS, description="parallel interrupt input ready", timeout=args.timeout)
+
+
+def _wait_for_cleanup_completed_and_ready(pty: ReplPty, args: argparse.Namespace, first_stack_id: str) -> None:
+    """Wait for the first stack's cleanup status, the optional completion banner, then input readiness."""
+    done_states = {"completed"}
+    _wait_for_cleanup_resource_status(pty, first_stack_id, done_states, timeout=args.stream_timeout)
+    # The banner is awaited with expect_optional; its wait is capped at 5.0 (or args.timeout if smaller).
+    banner_wait = min(args.timeout, 5.0)
+    pty.expect_optional(CLEANUP_COMPLETED_PATTERNS, description="cleanup completed", timeout=banner_wait)
+    _expect_raw_input_ready(pty, args, description="post-cleanup prompt input ready")
+
+
+def _finish_vswitch_pipeline_after_possible_selection(
+    pty: ReplPty,
+    args: argparse.Namespace,
+    checks: dict[str, bool],
+    matched_pattern: str,
+    *,
+    selection_check: str,
+    completion_check: str,
+    completion_description: str,
+) -> None:
+    """Pick the default candidate if the pipeline paused for selection, then mark completion in ``checks``."""
+    if matched_pattern in CANDIDATE_SELECTION_PATTERNS:
+        ready_label = "candidate selection controls ready after ask"
+        ready_wait = args.candidate_selection_ready_timeout
+        pty.expect_optional(CANDIDATE_SELECTION_READY_PATTERNS, description=ready_label, timeout=ready_wait)
+        _select_default_candidate(pty, args)
+        checks[selection_check] = True
+        pty.expect_any(PIPELINE_COMPLETED_PATTERNS, timeout=args.stream_timeout, description=completion_description)
+    # Any other match is recorded as completed without further waiting.
+    checks[completion_check] = True
+
+
+def _expect_post_rollback_security_group_target(
+    pty: ReplPty,
+    args: argparse.Namespace,
+    checks: dict[str, bool],
+) -> None:
+    """Require a security-group mention after rollback and record it in ``checks``."""
+    check_name = "post-rollback security group target visible"
+    # The wait is capped at 300.0 even when the stream timeout is larger.
+    capped_wait = min(args.stream_timeout, 300.0)
+    pty.expect_any(SECURITY_GROUP_MENTION_PATTERNS, description=check_name, timeout=capped_wait)
+    checks[check_name] = True
+
+
+def run_scenario1(args: argparse.Namespace, scenario: str) -> int:
+    """Happy path: run the pipeline with the default candidate, then send a normal follow-up prompt."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        # Phase 1: take the pipeline through candidate selection until it reports full completion.
+        _expect_initial_prompt(pty, args)
+        pty.sendline(_stack_creating_prompt(args.initial_prompt, pty.run_dir, scenario))
+        pty.expect_any(PIPELINE_STARTED_PATTERNS, description="pipeline started", timeout=args.stream_timeout)
+        checks["pipeline started"] = True
+        _expect_candidate_selection(pty, args, description="candidate selection visible")
+        checks["candidate selection became visible"] = True
+        _select_default_candidate(pty, args)
+        checks["candidate selection input sent"] = True
+        pty.expect_any(
+            PIPELINE_FULLY_COMPLETED_PATTERNS, description="pipeline fully completed", timeout=args.stream_timeout
+        )
+        checks["pipeline completed"] = True
+        # Phase 2: once input is accepted again, the follow-up reply must mention the VSwitch.
+        _expect_raw_input_ready(pty, args, description="normal prompt input ready")
+        checks["normal prompt input ready"] = True
+        pty.sendline(args.normal_followup_prompt)
+        # The description doubles as the check name; the wait is capped at 120.0.
+        answered = "normal follow-up answered created VSwitch"
+        pty.expect_any(VSWITCH_MENTION_PATTERNS, description=answered, timeout=min(args.stream_timeout, 120.0))
+        checks[answered] = True
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_ask_waiting(args: argparse.Namespace, scenario: str) -> int:
+    """Answer the pipeline's ask question without restarting and drive the run to completion."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        pty.sendline(args.ask_prompt)
+        pty.expect_any(ASK_PATTERNS, description="ask question visible", timeout=args.stream_timeout)
+        checks["ask question became visible"] = True
+        pty.sendline(_stack_creating_prompt(args.ask_answer, pty.run_dir, scenario))
+        checks["ask answer sent"] = True
+        # After the answer the pipeline may pause for candidate selection or finish outright.
+        next_stage = CANDIDATE_SELECTION_PATTERNS + PIPELINE_COMPLETED_PATTERNS
+        matched = pty.expect_any(next_stage, description="pipeline continued after ask", timeout=args.stream_timeout)
+        checks["pipeline continued beyond ask"] = True
+        _finish_vswitch_pipeline_after_possible_selection(
+            pty,
+            args,
+            checks,
+            matched,
+            selection_check="candidate selection input sent after ask",
+            completion_check="pipeline completed after ask",
+            completion_description="pipeline completed after ask",
+        )
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_image_initial(args: argparse.Namespace, scenario: str) -> int:
+    """Start the pipeline from an image fixture and follow it to completion."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        # The stack-name constraint is passed as the caption of the submitted image.
+        _submit_image_fixture(pty, "initial", caption=_stack_name_constraint(pty.run_dir, scenario))
+        checks["initial image fixture pasted"] = True
+        pty.expect_any(PIPELINE_STARTED_PATTERNS, description="pipeline started", timeout=args.stream_timeout)
+        checks["pipeline started"] = True
+        _expect_candidate_selection(pty, args, description="candidate selection visible")
+        checks["candidate selection became visible"] = True
+        _select_default_candidate(pty, args)
+        checks["candidate selection input sent"] = True
+        finished = "pipeline completed after image initial"
+        pty.expect_any(PIPELINE_COMPLETED_PATTERNS, description=finished, timeout=args.stream_timeout)
+        checks[finished] = True
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_image_ask_waiting_resume(args: argparse.Namespace, scenario: str) -> int:
+    """Kill the REPL at the ask question, resume with --continue, and answer with image fixtures."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        pty.sendline(args.ask_prompt)
+        pty.expect_any(ASK_PATTERNS, description="ask question visible before kill", timeout=args.stream_timeout)
+        checks["ask question became visible before kill"] = True
+        pty.terminate(force=True)  # forced stop while the question is still pending
+        checks["first process killed"] = True
+        pty.spawn(extra_args=["--continue"])
+        pty.expect_any(ASK_PATTERNS, description="ask question replayed", timeout=args.stream_timeout)
+        checks["ask question replayed"] = True
+        _expect_raw_input_ready(pty, args, description="ask image answer input ready after resume")
+        checks["ask image answer input ready after resume"] = True
+        _submit_image_fixture(pty, "ask-first-answer", caption=_stack_name_constraint(pty.run_dir, scenario))
+        checks["ask first answer image fixture pasted after resume"] = True
+        asked_again = pty.expect_optional(
+            ASK_PATTERNS, description="second ask question after image answer", timeout=min(args.timeout, 30.0)
+        )
+        if asked_again:  # a follow-up question is optional; answer it with the second fixture
+            _expect_raw_input_ready(pty, args, description="second ask image answer input ready")
+            _submit_image_fixture(pty, "ask-second-answer", caption=_stack_name_constraint(pty.run_dir, scenario))
+            checks["ask second answer image fixture pasted"] = True
+        next_stage = CANDIDATE_SELECTION_PATTERNS + PIPELINE_COMPLETED_PATTERNS
+        matched = pty.expect_any(
+            next_stage, description="pipeline continued after ask image resume", timeout=args.stream_timeout
+        )
+        checks["pipeline continued beyond ask image after resume"] = True
+        _finish_vswitch_pipeline_after_possible_selection(
+            pty,
+            args,
+            checks,
+            matched,
+            selection_check="candidate selection input sent after ask image resume",
+            completion_check="pipeline completed after ask image resume",
+            completion_description="pipeline completed after ask image resume",
+        )
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_image_selection_waiting_resume(args: argparse.Namespace, scenario: str) -> int:
+    """Start from an image fixture, kill the REPL at candidate selection, then resume and finish."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        _submit_image_fixture(pty, "initial", caption=_stack_name_constraint(pty.run_dir, scenario))
+        checks["initial image fixture pasted"] = True
+        _expect_candidate_selection(pty, args, description="candidate selection visible before image resume kill")
+        checks["candidate selection became visible before kill"] = True
+        pty.terminate(force=True)
+        checks["first process killed"] = True
+        # The respawned process gets --continue and must show the selection view again.
+        pty.spawn(extra_args=["--continue"])
+        _expect_candidate_selection(pty, args, description="candidate selection replayed after image resume")
+        checks["candidate selection replayed after resume"] = True
+        _select_default_candidate(pty, args)
+        checks["candidate selection input sent after resume"] = True
+        finished = "pipeline completed after image selection resume"
+        pty.expect_any(PIPELINE_COMPLETED_PATTERNS, description=finished, timeout=args.stream_timeout)
+        checks[finished] = True
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_image_normal_handoff(args: argparse.Namespace, scenario: str) -> int:
+    """Complete a text-driven pipeline run, then send the normal follow-up as an image fixture."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        # Phase 1: run the pipeline through candidate selection until it reports full completion.
+        _expect_initial_prompt(pty, args)
+        pty.sendline(_stack_creating_prompt(args.initial_prompt, pty.run_dir, scenario))
+        pty.expect_any(PIPELINE_STARTED_PATTERNS, description="pipeline started", timeout=args.stream_timeout)
+        checks["pipeline started"] = True
+        _expect_candidate_selection(pty, args, description="candidate selection visible")
+        checks["candidate selection became visible"] = True
+        _select_default_candidate(pty, args)
+        checks["candidate selection input sent"] = True
+        pty.expect_any(
+            PIPELINE_FULLY_COMPLETED_PATTERNS, description="pipeline fully completed", timeout=args.stream_timeout
+        )
+        checks["pipeline completed"] = True
+        # Phase 2: the follow-up is an image fixture (no caption); the reply must mention the VSwitch.
+        _expect_raw_input_ready(pty, args, description="normal prompt input ready")
+        checks["normal prompt input ready"] = True
+        _submit_image_fixture(pty, "normal-followup")
+        checks["normal follow-up image fixture pasted"] = True
+        # The description doubles as the check name; the wait is capped at 120.0.
+        answered = "normal image follow-up answered created VSwitch"
+        pty.expect_any(VSWITCH_MENTION_PATTERNS, description=answered, timeout=min(args.stream_timeout, 120.0))
+        checks[answered] = True
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_image_interrupt(args: argparse.Namespace, scenario: str) -> int:
+    """Interrupt candidate evaluation with Esc and submit the rollback request as an image fixture.
+
+    Returns whatever ``_run_with_pty`` returns for this scenario.
+    """
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        pty.sendline(args.initial_prompt)
+        pty.expect_any(
+            CANDIDATE_EVALUATION_PATTERNS, description="candidate evaluation visible", timeout=args.stream_timeout
+        )
+        checks["candidate evaluation reached"] = True
+        _expect_parallel_interrupt_ready(pty, args)
+        checks["parallel interrupt input ready"] = True
+        # Esc (0x1b) is sent next; input must be ready again before the fixture is submitted.
+        pty.send("\x1b", label="send-esc")
+        checks["esc sent"] = True
+        _expect_raw_input_ready(pty, args, description="parallel interrupt text input ready")
+        checks["parallel interrupt text input ready"] = True
+        _submit_image_fixture(pty, "rollback-interrupt")
+        checks["rollback interrupt image fixture pasted"] = True
+        # After the rollback the pipeline has to show progress again and then mention a security group.
+        progressed = "post-rollback pipeline progress visible"
+        pty.expect_any(POST_ROLLBACK_PROGRESS_PATTERNS, description=progressed, timeout=args.stream_timeout)
+        checks[progressed] = True
+        _expect_post_rollback_security_group_target(pty, args, checks)
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_selection_waiting_resume(args: argparse.Namespace, scenario: str) -> int:
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        # Scenario: kill the REPL while candidate selection is pending, resume with --continue, finish.
+        _expect_initial_prompt(pty, args)
+        pty.sendline(_stack_creating_prompt(args.initial_prompt, pty.run_dir, scenario))
+        _expect_candidate_selection(pty, args, description="candidate selection visible")
+        checks["candidate selection became visible before kill"] = True
+        pty.terminate(force=True)
+        checks["first process killed"] = True
+        pty.spawn(extra_args=["--continue"])
+        _expect_candidate_selection(pty, args, description="candidate selection replayed")
+        checks["candidate selection replayed"] = True
+        _select_default_candidate(pty, args)
+        checks["candidate selection input sent after resume"] = True
+        finished = "pipeline completed after resume"
+        pty.expect_any(PIPELINE_COMPLETED_PATTERNS, description=finished, timeout=args.stream_timeout)
+        checks[finished] = True
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_ask_waiting_resume(args: argparse.Namespace, scenario: str) -> int:
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        # Scenario: kill the REPL while the ask question is pending, resume with --continue, answer it.
+        _expect_initial_prompt(pty, args)
+        pty.sendline(args.ask_prompt)
+        pty.expect_any(ASK_PATTERNS, description="ask question visible before kill", timeout=args.stream_timeout)
+        checks["ask question became visible before kill"] = True
+        pty.terminate(force=True)
+        checks["first process killed"] = True
+        pty.spawn(extra_args=["--continue"])
+        pty.expect_any(ASK_PATTERNS, description="ask question replayed", timeout=args.stream_timeout)
+        checks["ask question replayed"] = True
+        _expect_raw_input_ready(pty, args, description="ask answer input ready after resume")
+        checks["ask answer input ready after resume"] = True
+        pty.sendline(_stack_creating_prompt(args.ask_answer, pty.run_dir, scenario))
+        checks["ask answer sent after resume"] = True
+        next_stage = CANDIDATE_SELECTION_PATTERNS + PIPELINE_COMPLETED_PATTERNS
+        matched = pty.expect_any(
+            next_stage, description="pipeline continued after ask resume", timeout=args.stream_timeout
+        )
+        checks["pipeline continued beyond ask after resume"] = True
+        _finish_vswitch_pipeline_after_possible_selection(
+            pty,
+            args,
+            checks,
+            matched,
+            selection_check="candidate selection input sent after ask resume",
+            completion_check="pipeline completed after ask resume",
+            completion_description="pipeline completed after ask resume",
+        )
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_evaluate_resume(args: argparse.Namespace, scenario: str) -> int:
+    """Kill the REPL during candidate evaluation, resume with --continue, and finish the pipeline."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        # Phase 1: reach candidate evaluation, wait for input readiness, then force-kill the process.
+        _expect_initial_prompt(pty, args)
+        pty.sendline(_stack_creating_prompt(args.initial_prompt, pty.run_dir, scenario))
+        pty.expect_any(
+            CANDIDATE_EVALUATION_PATTERNS, description="candidate evaluation visible", timeout=args.stream_timeout
+        )
+        checks["candidate evaluation reached before kill"] = True
+        _expect_parallel_interrupt_ready(pty, args)
+        checks["parallel interrupt input ready before kill"] = True
+        pty.terminate(force=True)
+        checks["first process killed"] = True
+        # Phase 2: the resumed process must replay the evaluation heading before accepting input.
+        pty.spawn(extra_args=["--continue"])
+        # The description doubles as the check name.
+        replayed = "candidate evaluation replayed after resume"
+        pty.expect_any(EVALUATE_CANDIDATES_HEADING_PATTERNS, description=replayed, timeout=args.stream_timeout)
+        checks[replayed] = True
+        _expect_raw_input_ready(pty, args, description="evaluate resume prompt input ready")
+        checks["evaluate resume prompt input ready"] = True
+        # Phase 3: send the continue prompt, then select a candidate and wait for completion.
+        pty.sendline(args.evaluate_resume_continue_prompt)
+        checks["resume continue input sent"] = True
+        _expect_candidate_selection(pty, args, description="candidate selection visible after resume continue")
+        checks["candidate selection became visible after resume continue"] = True
+        _select_default_candidate(pty, args)
+        checks["candidate selection input sent after resume"] = True
+        finished = "pipeline completed after evaluate resume"
+        pty.expect_any(PIPELINE_COMPLETED_PATTERNS, description=finished, timeout=args.stream_timeout)
+        checks[finished] = True
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_selection_invalid_then_valid(args: argparse.Namespace, scenario: str) -> int:
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        pty.sendline(_stack_creating_prompt(args.initial_prompt, pty.run_dir, scenario))
+        _expect_candidate_selection(pty, args, description="candidate selection visible")
+        checks["candidate selection became visible"] = True
+        pty.send(args.invalid_selection_prompt, label="select-invalid-candidate")  # send(), not sendline()
+        checks["invalid selection input sent"] = True
+        _select_default_candidate(pty, args)  # the valid choice follows straight after the invalid input
+        checks["valid selection input sent after invalid input"] = True
+        pty.expect_any(PIPELINE_COMPLETED_PATTERNS, timeout=args.stream_timeout, description="pipeline completed")
+        checks["pipeline completed"] = True
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_rollback_step2(args: argparse.Namespace, scenario: str) -> int:
+    """Interrupt architecture planning with Esc and redirect the pipeline via the rollback prompt."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        # This scenario sends the plain initial prompt (no stack-creating wrapper).
+        _expect_initial_prompt(pty, args)
+        pty.sendline(args.initial_prompt)
+        pty.expect_any(
+            ARCHITECTURE_PLANNING_PATTERNS, description="architecture planning visible", timeout=args.stream_timeout
+        )
+        checks["architecture planning reached"] = True
+        # Esc (0x1b) is sent next; the interrupt input must appear and be ready for typing.
+        pty.send("\x1b", label="send-esc")
+        checks["esc sent"] = True
+        pty.expect_any(INTERRUPT_INPUT_PATTERNS, description="interrupt input visible", timeout=args.timeout)
+        checks["interrupt input visible"] = True
+        _expect_raw_input_ready(pty, args, description="interrupt prompt input ready")
+        checks["interrupt prompt input ready"] = True
+        pty.sendline(args.rollback_prompt)
+        checks["rollback prompt sent"] = True
+        # After the rollback the pipeline has to show progress again and then mention a security group.
+        progressed = "post-rollback pipeline progress visible"
+        pty.expect_any(POST_ROLLBACK_PROGRESS_PATTERNS, description=progressed, timeout=args.stream_timeout)
+        checks[progressed] = True
+        _expect_post_rollback_security_group_target(pty, args, checks)
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_rollback_step3(args: argparse.Namespace, scenario: str) -> int:
+    """Interrupt candidate evaluation with Esc and redirect the pipeline via the rollback prompt.
+
+    Returns whatever ``_run_with_pty`` returns for this scenario.
+    """
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        pty.sendline(args.initial_prompt)
+        pty.expect_any(
+            CANDIDATE_EVALUATION_PATTERNS, description="candidate evaluation visible", timeout=args.stream_timeout
+        )
+        checks["candidate evaluation reached"] = True
+        # Input has to be ready before Esc (0x1b) is sent, and again before the rollback prompt.
+        _expect_parallel_interrupt_ready(pty, args)
+        checks["parallel interrupt input ready"] = True
+        pty.send("\x1b", label="send-esc")
+        checks["esc sent"] = True
+        _expect_raw_input_ready(pty, args, description="parallel interrupt text input ready")
+        checks["parallel interrupt text input ready"] = True
+        pty.sendline(args.rollback_prompt)
+        checks["rollback prompt sent"] = True
+        # After the rollback the pipeline has to show progress again and then mention a security group.
+        progressed = "post-rollback pipeline progress visible"
+        pty.expect_any(POST_ROLLBACK_PROGRESS_PATTERNS, description=progressed, timeout=args.stream_timeout)
+        checks[progressed] = True
+        _expect_post_rollback_security_group_target(pty, args, checks)
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_rollback_step4_selection(args: argparse.Namespace, scenario: str) -> int:
+    """Interrupt the candidate selection step with Esc and redirect via the rollback prompt."""
+
+    def drive(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        pty.sendline(args.initial_prompt)
+        _expect_candidate_selection(pty, args, description="candidate selection visible")
+        checks["candidate selection reached"] = True
+        _expect_raw_input_ready(pty, args, description="candidate selection input ready")
+        checks["candidate selection input ready"] = True
+        pty.send("\x1b", label="send-esc")  # Esc instead of choosing a candidate
+        checks["esc sent"] = True
+        _expect_raw_input_ready(pty, args, description="candidate selection interrupt text input ready")
+        checks["candidate selection interrupt text input ready"] = True
+        pty.sendline(args.rollback_prompt)
+        checks["rollback prompt sent"] = True
+        # After the rollback the pipeline has to show progress again and then mention a security group.
+        progressed = "post-rollback pipeline progress visible"
+        pty.expect_any(POST_ROLLBACK_PROGRESS_PATTERNS, description=progressed, timeout=args.stream_timeout)
+        checks[progressed] = True
+        _expect_post_rollback_security_group_target(pty, args, checks)
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, drive)
+
+
+def run_rollback_step5_cleanup(args: argparse.Namespace, scenario: str) -> int:
+    return _run_rollback_step5_cleanup(args, scenario, kill_during_cleanup=False)  # variant without the kill
+
+
+def run_rollback_step5_cleanup_recovery(args: argparse.Namespace, scenario: str) -> int:
+    return _run_rollback_step5_cleanup(args, scenario, kill_during_cleanup=True)  # variant with kill + resume
+
+
+def _run_rollback_step5_cleanup(  # shared driver behind both step-5 rollback cleanup scenarios
+    args: argparse.Namespace,
+    scenario: str,
+    *,
+    kill_during_cleanup: bool,  # True: force-kill the REPL once cleanup starts, then resume with --continue
+) -> int:
+    def callback(pty: ReplPty, checks: dict[str, bool]) -> None:
+        _expect_initial_prompt(pty, args)
+        _ensure_cleanup_network_target(args, pty.run_dir)
+        checks["cleanup network target prepared"] = True
+        pty.sendline(_cleanup_pipeline_prompt(args, pty.run_dir))
+        _expect_candidate_selection(pty, args, description="initial candidate selection visible")
+        checks["initial reached step4 selection"] = True
+        # First deployment: select a candidate and remember the stack id that is observed.
+        _select_default_candidate(pty, args)
+        checks["initial candidate selected"] = True
+        pty.expect_any(
+            CREATE_STACK_STARTED_PATTERNS,
+            description="first stack create started",
+            timeout=args.stream_timeout,
+        )
+        first_stack_id = _wait_for_latest_observed_stack_id(pty, exclude=set(), timeout=args.stream_timeout)
+        pty.cleanup_first_stack_id = first_stack_id  # stored on the pty object for use outside this callback
+        checks["first rollback stack observed before rollback"] = bool(first_stack_id)
+        # Interrupt the deployment with Esc (0x1b) and send the rollback prompt.
+        pty.send("\x1b", label="send-esc")
+        checks["esc sent during deploying"] = True
+        _expect_raw_input_ready(pty, args, description="deploying interrupt input ready")
+        checks["deploying interrupt input ready"] = True
+        pty.sendline(_cleanup_rollback_prompt(args, pty.run_dir))
+        checks["rollback prompt sent"] = True
+        _expect_candidate_selection(pty, args, description="post-rollback candidate selection visible")
+        checks["post-rollback candidate selection visible"] = True
+        # Cleanup targets as seen before the second deployment; presumably read from a ledger - TODO confirm.
+        cleanup_stack_ids = _wait_for_cleanup_target_stack_ids(pty, exclude=set(), timeout=args.timeout)
+        checks["rollback cleanup ledger includes first stack"] = first_stack_id in cleanup_stack_ids
+        checks["rollback cleanup target stacks observed"] = bool(cleanup_stack_ids)
+        # Second deployment after the rollback.
+        _select_default_candidate(pty, args)
+        checks["post-rollback candidate selected"] = True
+        pty.expect_any(
+            PIPELINE_FULLY_COMPLETED_PATTERNS,
+            description="pipeline completed after second deployment",
+            timeout=args.stream_timeout,
+        )
+        checks["pipeline completed after second deployment"] = True
+        # The second stack must be new: cleanup targets and the first stack are excluded from the lookup.
+        second_stack_id = _latest_observed_stack_id(pty, exclude=set(cleanup_stack_ids) | {first_stack_id})
+        pty.cleanup_second_stack_id = second_stack_id or ""  # empty string when no second stack was found
+        checks["second stack created after rollback"] = bool(second_stack_id)
+        checks["second stack differs from first rollback stack"] = (
+            bool(second_stack_id) and second_stack_id != first_stack_id
+        )
+        # Recompute the cleanup targets without the second stack; this overwrites the two checks set earlier.
+        cleanup_stack_ids = _cleanup_target_stack_ids(
+            pty,
+            exclude={stack_id for stack_id in [second_stack_id] if stack_id},
+        )
+        checks["rollback cleanup ledger includes first stack"] = first_stack_id in cleanup_stack_ids
+        checks["rollback cleanup target stacks observed"] = bool(cleanup_stack_ids)
+        checks["cleanup snapshot does not target second stack"] = (
+            bool(second_stack_id) and _cleanup_resource_for_stack(pty, second_stack_id) is None
+        )
+        # The normal follow-up prompt is sent before waiting for the cleanup-started pattern.
+        pty.sendline(args.normal_followup_prompt)
+        if kill_during_cleanup:
+            pty.expect_any(
+                CLEANUP_STARTED_PATTERNS,
+                description="cleanup started before kill",
+                timeout=args.stream_timeout,
+            )
+            checks["cleanup started before kill"] = True
+            pty.terminate(force=True)
+            checks["cleanup process killed"] = True
+            pty.spawn(extra_args=["--continue"])
+            pty.expect_any(
+                CLEANUP_RESUME_SUMMARY_PATTERNS,
+                description="cleanup resume summary",
+                timeout=args.stream_timeout,
+            )
+            if _cleanup_resource_completed(_cleanup_resource_for_stack(pty, first_stack_id)):
+                checks["cleanup already completed after restart"] = True
+            else:
+                # Cleanup is not finished for the first stack yet, so the continue prompt is sent.
+                _expect_raw_input_ready(pty, args, description="cleanup resume prompt input ready")
+                pty.sendline(args.cleanup_continue_prompt)
+                checks["cleanup continue prompt sent after restart"] = True
+        else:
+            pty.expect_any(CLEANUP_STARTED_PATTERNS, description="cleanup started", timeout=args.stream_timeout)
+            checks["cleanup started"] = True
+        # Both paths wait for the first stack's cleanup to complete before the final ledger checks.
+        _wait_for_cleanup_completed_and_ready(pty, args, first_stack_id)
+        checks["first rollback stack cleanup completed in ledger"] = _cleanup_resource_completed(
+            _cleanup_resource_for_stack(pty, first_stack_id)
+        )
+        checks["rollback cleanup stacks completed in ledger"] = bool(cleanup_stack_ids) and all(
+            _cleanup_resource_completed(_cleanup_resource_for_stack(pty, stack_id)) for stack_id in cleanup_stack_ids
+        )
+        pty.sendline("/exit")
+
+    return _run_with_pty(args, scenario, callback)
+
+
+_SCENARIOS: dict[str, Callable[[argparse.Namespace, str], int]] = {  # scenario name -> runner(args, scenario)
+    "scenario1": run_scenario1,
+    "ask-waiting": run_ask_waiting,
+    "ask-waiting-resume": run_ask_waiting_resume,
+    "image-initial": run_image_initial,
+    "image-ask-waiting-resume": run_image_ask_waiting_resume,
+    "image-selection-waiting-resume": run_image_selection_waiting_resume,
+    "image-normal-handoff": run_image_normal_handoff,
+    "image-interrupt": run_image_interrupt,
+    "evaluate-resume": run_evaluate_resume,
+    "selection-invalid-then-valid": run_selection_invalid_then_valid,
+    "selection-waiting-resume": run_selection_waiting_resume,
+    "rollback-step2": run_rollback_step2,
+    "rollback-step3": run_rollback_step3,
+    "rollback-step4-selection": run_rollback_step4_selection,
+    "rollback-step5-cleanup": run_rollback_step5_cleanup,  # same driver, kill_during_cleanup=False
+    "rollback-step5-cleanup-recovery": run_rollback_step5_cleanup_recovery,  # same driver, kill_during_cleanup=True
+}
+_REAL_CLOUD_SCENARIOS = frozenset(_SCENARIOS)  # iterating the dict yields its keys: every registered name
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())  # main()'s return value becomes the process exit status
diff --git a/src/iac_code/a2a/app.py b/src/iac_code/a2a/app.py
index 572f3b49..096b5471 100644
--- a/src/iac_code/a2a/app.py
+++ b/src/iac_code/a2a/app.py
@@ -6,6 +6,7 @@
 import hashlib
 import hmac
 import json
+import logging
 import os
 from contextlib import asynccontextmanager, suppress
 from email.utils import formatdate
@@ -25,8 +26,13 @@
 from starlette.routing import BaseRoute, Route
 
 from iac_code.a2a.agent_card import agent_card_to_client_dict
+from iac_code.a2a.jsonrpc_passthrough import (
+    install_jsonrpc_error_data_passthrough,
+    install_v03_jsonrpc_error_data_passthrough,
+)
 from iac_code.i18n import _
 
+logger = logging.getLogger(__name__)
 _V03_JSONRPC_METHODS = frozenset(
     {
         "message/send",
@@ -273,7 +279,9 @@ async def get_pipeline_state(request: Request) -> JSONResponse:
         Route(AGENT_CARD_WELL_KNOWN_PATH, get_agent_card, methods=["GET"]),
         Route("/iac-code/pipeline/state", get_pipeline_state, methods=["GET"]),
     ]
+    install_jsonrpc_error_data_passthrough()
     jsonrpc_endpoint = create_jsonrpc_routes(components.handler, rpc_url="/", enable_v0_3_compat=True)[0].endpoint
+    install_v03_jsonrpc_error_data_passthrough(jsonrpc_endpoint)
 
     async def handle_jsonrpc(request: Request) -> Response:
         await normalize_v03_jsonrpc_version(request)
diff --git a/src/iac_code/a2a/executor.py b/src/iac_code/a2a/executor.py
index 7a4821c3..f50710c9 100644
--- a/src/iac_code/a2a/executor.py
+++ b/src/iac_code/a2a/executor.py
@@ -2,10 +2,11 @@
 
 import asyncio
 import contextlib
+import json
 import logging
 import os
 import uuid
-from collections.abc import Awaitable, Callable, Mapping
+from collections.abc import AsyncIterator, Awaitable, Callable, Mapping
 from pathlib import Path
 from typing import Any, TypeAlias
 
@@ -13,15 +14,25 @@
 from a2a.server.agent_execution import AgentExecutor, RequestContext
 from a2a.server.events import EventQueue
 from a2a.types import Message, Role, Task, TaskState, TaskStatus, TaskStatusUpdateEvent
+from a2a.utils.errors import InvalidParamsError
 from google.protobuf.json_format import MessageToDict
 
 from iac_code.a2a.events import make_text_part, publish_stream_event
 from iac_code.a2a.exposure import normalize_a2a_exposure_types
 from iac_code.a2a.metrics import A2AMetrics, NoOpA2AMetrics
-from iac_code.a2a.parts import allowed_cwd_roots, is_relative_to, parts_to_prompt, resolve_workspace_path
+from iac_code.a2a.parts import (
+    allowed_cwd_roots,
+    is_relative_to,
+    parts_to_pipeline_input,
+    parts_to_prompt,
+    resolve_workspace_path,
+)
+from iac_code.a2a.pipeline_events import PipelineA2AContext, PipelineEventTranslator
 from iac_code.a2a.pipeline_executor import IacCodeA2APipelineExecutor, recoverable_task_id_from_sidecar
+from iac_code.a2a.pipeline_journal import A2APipelineJournal
 from iac_code.a2a.pipeline_paths import existing_a2a_pipeline_dir_for_session
-from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
+from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore, reduce_pipeline_events
+from iac_code.a2a.pipeline_stream import PipelineA2AEventPublisher
 from iac_code.a2a.task_store import A2ATaskStore
 from iac_code.a2a.types import (
     TASK_STATE_CANCELED,
@@ -30,17 +41,38 @@
     TASK_STATE_WORKING,
 )
 from iac_code.agent.message import Message as AgentMessage
+from iac_code.config import get_active_provider_key, get_provider_config, load_credentials
 from iac_code.i18n import _
 from iac_code.pipeline.config import RunMode, get_run_mode
+from iac_code.pipeline.constants import (
+    PIPELINE_EVENT_CLEANUP_COMPLETED,
+    PIPELINE_EVENT_CLEANUP_FAILED,
+    PIPELINE_EVENT_CLEANUP_PROGRESS,
+    PIPELINE_EVENT_CLEANUP_STARTED,
+)
+from iac_code.pipeline.engine.cleanup import (
+    CLEANUP_PROMPT_METADATA_TYPE,
+    CleanupLedger,
+    CleanupObserver,
+    cleanup_prompt_ledger_path,
+    create_cleanup_prompt_message,
+    is_active_cleanup_prompt_message,
+    mark_cleanup_prompt_message_completed,
+)
+from iac_code.pipeline.engine.user_input import PipelineUserInput, normalize_pipeline_user_input
 from iac_code.services.agent_factory import AgentFactoryOptions, create_agent_runtime
+from iac_code.services.capabilities.multimodal import is_model_multimodal
 from iac_code.services.providers.aliyun import DEFAULT_REGION, AliyunCredential, use_aliyun_credential
 from iac_code.services.session_storage import SessionStorage
 from iac_code.services.telemetry import use_session_id, use_user_id
+from iac_code.types.stream_events import TextDeltaEvent
+from iac_code.utils.file_security import atomic_write_text, ensure_private_dir, ensure_private_file
 from iac_code.utils.public_errors import public_exception_summary, sanitize_public_text
 
 logger = logging.getLogger(__name__)
 _CONTEXT_LOCK_ACQUIRE_TIMEOUT_SECONDS = 1
 _ERROR_TEXT_MAX_CHARS = 1000
+_DEFERRED_CLEANUP_PROMPTS_FILENAME = "cleanup-deferred-prompts.json"
 
 
 def _format_exception(exc: BaseException) -> str:
@@ -58,6 +90,671 @@ def _is_relative_to(path: Path, root: Path) -> bool:
     return is_relative_to(path, root)
 
 
+def _cleanup_prompt_from_handoff(handoff: dict[str, Any]) -> str | None:
+    """Return the non-empty string at ``handoff["data"]["cleanup"]["prompt"]``, or ``None``.
+
+    ``None`` is returned whenever ``data`` or ``cleanup`` is not a dict, or the prompt is
+    missing, empty, or not a string.
+    """
+    payload = handoff.get("data")
+    cleanup_section = payload.get("cleanup") if isinstance(payload, dict) else None
+    candidate = cleanup_section.get("prompt") if isinstance(cleanup_section, dict) else None
+    if isinstance(candidate, str) and candidate:
+        return candidate
+    return None
+
+
+def _cleanup_ledger_path_from_handoff(handoff: dict[str, Any]) -> str | None:
+    """Return the cleanup ledger path recorded under ``handoff["data"]["cleanup"]``, or ``None``.
+
+    ``None`` is returned when ``data`` or ``cleanup`` is not a dict, or when the selected
+    value is empty or not a string.
+    """
+    payload = handoff.get("data")
+    cleanup_section = payload.get("cleanup") if isinstance(payload, dict) else None
+    if not isinstance(cleanup_section, dict):
+        return None
+    # The camelCase key wins; the snake_case key is consulted only when it is missing or falsy.
+    candidate = cleanup_section.get("ledgerPath") or cleanup_section.get("ledger_path")
+    if isinstance(candidate, str) and candidate:
+        return candidate
+    return None
+
+
+def _cleanup_payload_from_private_ledger_or_unavailable(
+    *,
+    ledger_path: Path,
+) -> dict[str, Any]:
+    """Build the cleanup payload dict for the ledger stored at *ledger_path*.
+
+    The result has ``status`` set to ``"unavailable"`` (file missing, not stat-able, or the
+    ledger reports a load failure), ``"completed"`` (no pending prompt), or ``"pending"``
+    (with resource count, status message, prompt text and the ledger path).
+    """
+    ledger = CleanupLedger(ledger_path)
+    try:
+        readable = ledger_path.exists()
+    except OSError:
+        readable = False
+    # Short-circuit: load_failed() is only consulted when the file is present.
+    readable = readable and not ledger.load_failed()
+    if not readable:
+        return {
+            "status": "unavailable",
+            "statusMessage": _("Cleanup state unavailable. Inspect the session file and cloud resources manually."),
+        }
+
+    pending = ledger.build_pending_prompt()
+    if pending is not None:
+        return {
+            "status": "pending",
+            "resourceCount": len(pending.resources),
+            "statusMessage": pending.status_message,
+            "prompt": pending.prompt,
+            "ledgerPath": str(ledger_path),
+        }
+    return {"status": "completed", "resourceCount": 0}
+
+
+def _session_has_user_message(
+    messages: list[AgentMessage],
+    *,
+    content: str,
+    metadata_type: str | None = None,
+) -> bool:
+    """Report whether *messages* holds a user message whose content equals *content*.
+
+    When *metadata_type* is given, the message must additionally carry a dict ``metadata``
+    whose ``"type"`` equals it.
+    """
+
+    def _matches(message: Any) -> bool:
+        if getattr(message, "role", None) != "user":
+            return False
+        if getattr(message, "content", None) != content:
+            return False
+        if metadata_type is None:
+            return True
+        metadata = getattr(message, "metadata", None)
+        return isinstance(metadata, dict) and metadata.get("type") == metadata_type
+
+    return any(_matches(message) for message in messages)
+
+
+def _messages_have_cleanup_prompt(messages: list[Any]) -> bool:
+    """Return ``True`` if any entry of *messages* is a cleanup prompt message."""
+    for message in messages:
+        if _message_is_cleanup_prompt(message):
+            return True
+    return False
+
+
+def _messages_have_active_cleanup_prompt(messages: list[Any]) -> bool:
+    """Return ``True`` if ``is_active_cleanup_prompt_message`` accepts any entry of *messages*."""
+    for message in messages:
+        if is_active_cleanup_prompt_message(message):
+            return True
+    return False
+
+
+def _session_has_active_cleanup_prompt_content(messages: list[AgentMessage], *, content: str) -> bool:
+    """Report whether an active cleanup prompt with exactly this *content* is among *messages*.
+
+    Only user messages whose content equals *content* are handed to
+    ``is_active_cleanup_prompt_message``.
+    """
+    same_text_user_messages = (
+        message
+        for message in messages
+        if not (getattr(message, "role", None) != "user" or getattr(message, "content", None) != content)
+    )
+    return any(is_active_cleanup_prompt_message(message) for message in same_text_user_messages)
+
+
+def _message_is_cleanup_prompt(message: Any) -> bool:
+    """Return ``True`` when *message* has dict metadata typed as ``CLEANUP_PROMPT_METADATA_TYPE``."""
+    metadata = getattr(message, "metadata", None)
+    if not isinstance(metadata, dict):
+        return False
+    return metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE
+
+
+def _cleanup_ledger_for_a2a_normal_chat(*, cwd: str, session_id: str) -> CleanupLedger | None:
+    """Pick the cleanup ledger, if any, that a normal-chat request for this session should use.
+
+    Resolution order:
+      1. The ledger path attached to the first active cleanup prompt message that has one.
+      2. Otherwise ``<session_dir>/pipeline/cleanup.yaml`` when that file exists, returned
+         unconditionally if an active cleanup prompt was seen, and otherwise only when the
+         ledger loads and still has pending resources.
+
+    Returns ``None`` when no ledger applies or the session directory cannot be located.
+    """
+    try:
+        messages = SessionStorage().load(cwd, session_id)
+    except Exception:
+        # Best effort: an unreadable session is treated as having no messages.
+        logger.warning("Failed to inspect A2A session cleanup prompt", exc_info=True)
+        messages = []
+    has_active_cleanup_prompt = False
+    for message in messages:
+        if not is_active_cleanup_prompt_message(message):
+            continue
+        has_active_cleanup_prompt = True
+        ledger_path = cleanup_prompt_ledger_path(message)
+        if ledger_path:
+            return CleanupLedger(ledger_path)
+    # No active prompt carried a ledger path; fall back to the default location.
+    try:
+        path = SessionStorage().session_dir(cwd, session_id) / "pipeline" / "cleanup.yaml"
+    except Exception:
+        logger.warning("Failed to locate A2A pipeline cleanup ledger", exc_info=True)
+        return None
+    if not path.exists():
+        return None
+    ledger = CleanupLedger(path)
+    if has_active_cleanup_prompt:
+        # Returned even if unreadable or without pending resources; callers decide what to do.
+        return ledger
+    if ledger.load_failed():
+        return None
+    return ledger if ledger.pending_resources() else None
+
+
+def _default_cleanup_ledger_path(*, cwd: str, session_id: str) -> Path:
+    """Return ``<session_dir>/pipeline/cleanup.yaml`` for the given session."""
+    session_dir = SessionStorage().session_dir(cwd, session_id)
+    pipeline_dir = session_dir / "pipeline"
+    return pipeline_dir / "cleanup.yaml"
+
+
+def _ensure_cleanup_prompt_in_session(*, cwd: str, session_id: str, ledger: CleanupLedger, runtime: Any) -> None:
+    """Make sure the ledger's pending cleanup prompt is in the session and the runtime context.
+
+    Does nothing when the ledger has no pending prompt. The prompt message is appended to the
+    stored session (and recorded as queued in the ledger) only if no active cleanup prompt with
+    the same text is already stored; the runtime context is refreshed in either case.
+    """
+    pending = ledger.build_pending_prompt()
+    if pending is None:
+        return
+    prompt_message = create_cleanup_prompt_message(
+        pending.prompt,
+        cleanup_ledger_path=ledger.path,
+        cleanup_status="pending",
+    )
+    storage = SessionStorage()
+    history = storage.load(cwd, session_id)
+    already_stored = _session_has_active_cleanup_prompt_content(history, content=pending.prompt)
+    if not already_stored:
+        storage.append(cwd, session_id, prompt_message)
+        ledger.record_prompt_queued(pending, ui_surface="a2a")
+    _ensure_cleanup_prompt_in_runtime(runtime=runtime, message=prompt_message)
+
+
+def _ensure_cleanup_prompt_in_runtime(*, runtime: Any, message: AgentMessage) -> None:
+    """Replace any cleanup prompt in the runtime context with *message* (best effort).
+
+    A no-op when the runtime's context manager exposes no callable ``add_raw_message``.
+    Failures while removing or injecting are logged and swallowed.
+    """
+    agent_loop = getattr(runtime, "agent_loop", None)
+    context = getattr(agent_loop, "context_manager", None)
+    drop_existing = getattr(context, "remove_cleanup_prompt_messages", None)
+    inject = getattr(context, "add_raw_message", None)
+    if not callable(inject):
+        return
+
+    if callable(drop_existing):
+        try:
+            drop_existing()
+        except Exception:
+            logger.warning("Failed to replace A2A cleanup prompt in runtime context", exc_info=True)
+
+    try:
+        inject(message.to_dict())
+    except Exception:
+        logger.warning("Failed to inject A2A cleanup prompt into runtime context", exc_info=True)
+
+
+def _runtime_has_cleanup_prompt(runtime: Any) -> bool:
+    """Report whether the runtime context currently holds an active cleanup prompt.
+
+    Returns ``False`` when the context manager has no callable ``get_messages``, when that
+    call raises, or when it returns something other than a list.
+    """
+    agent_loop = getattr(runtime, "agent_loop", None)
+    context = getattr(agent_loop, "context_manager", None)
+    fetch_messages = getattr(context, "get_messages", None)
+    if not callable(fetch_messages):
+        return False
+    try:
+        live_messages = fetch_messages()
+    except Exception:
+        return False
+    if not isinstance(live_messages, list):
+        return False
+    return _messages_have_active_cleanup_prompt(live_messages)
+
+
+def _session_has_cleanup_prompt(*, cwd: str, session_id: str) -> bool:
+    """Report whether the stored session contains an active cleanup prompt.
+
+    A session that cannot be loaded is logged and treated as having none.
+    """
+    try:
+        history = SessionStorage().load(cwd, session_id)
+    except Exception:
+        logger.warning("Failed to inspect A2A session cleanup prompt", exc_info=True)
+        return False
+    else:
+        return _messages_have_active_cleanup_prompt(history)
+
+
+def _a2a_cleanup_prompt_exists(*, runtime: Any, cwd: str, session_id: str) -> bool:
+    """Return ``True`` if an active cleanup prompt is in the runtime context or the stored session."""
+    # The stored session is consulted only when the runtime context has no such prompt.
+    if _runtime_has_cleanup_prompt(runtime):
+        return True
+    return _session_has_cleanup_prompt(cwd=cwd, session_id=session_id)
+
+
+def _a2a_cleanup_ledger_unavailable(
+    ledger: CleanupLedger | None,
+    *,
+    runtime: Any,
+    cwd: str,
+    session_id: str,
+) -> bool:
+    """Report whether a cleanup prompt exists but its ledger cannot be used.
+
+    Always ``False`` when no active cleanup prompt exists. Otherwise ``True`` when *ledger*
+    is ``None``, its file is missing or cannot be checked, or the ledger reports a load failure.
+    """
+    prompt_present = _a2a_cleanup_prompt_exists(runtime=runtime, cwd=cwd, session_id=session_id)
+    if not prompt_present:
+        return False
+    if ledger is None:
+        return True
+    try:
+        ledger_file_present = ledger.path.exists()
+    except Exception:
+        return True
+    return ledger.load_failed() if ledger_file_present else True
+
+
+def _a2a_deferred_cleanup_prompts_path(*, cwd: str, session_id: str) -> Path:
+    """Return ``<session_dir>/a2a/<_DEFERRED_CLEANUP_PROMPTS_FILENAME>`` for the given session."""
+    a2a_dir = SessionStorage().session_dir(cwd, session_id) / "a2a"
+    return a2a_dir / _DEFERRED_CLEANUP_PROMPTS_FILENAME
+
+
+def _read_a2a_deferred_cleanup_prompts(*, cwd: str, session_id: str) -> tuple[list[str], bool]:
+    """Read the deferred cleanup prompts persisted for a session.
+
+    Returns:
+        ``(prompts, load_failed)``. ``prompts`` contains the non-blank strings found in the
+        file's ``"prompts"`` list, or the single ``"prompt"`` string when no list is present.
+        ``load_failed`` is ``True`` only when the file exists but cannot be read, decoded as
+        UTF-8, or parsed as JSON; a missing file yields ``([], False)``.
+    """
+    path = _a2a_deferred_cleanup_prompts_path(cwd=cwd, session_id=session_id)
+    if not path.exists():
+        return [], False
+    try:
+        data = json.loads(path.read_text(encoding="utf-8"))
+    except (OSError, UnicodeDecodeError, json.JSONDecodeError):
+        # UnicodeDecodeError is a ValueError, not an OSError: without catching it, a file holding
+        # invalid UTF-8 would raise out of here instead of being reported as a load failure.
+        logger.warning("Failed to load deferred A2A cleanup prompts", exc_info=True)
+        return [], True
+    raw_prompts = data.get("prompts") if isinstance(data, dict) else None
+    if not isinstance(raw_prompts, list):
+        # Fall back to a single "prompt" string when there is no usable "prompts" list.
+        raw_prompt = data.get("prompt") if isinstance(data, dict) else None
+        raw_prompts = [raw_prompt] if isinstance(raw_prompt, str) else []
+    return [prompt for prompt in raw_prompts if isinstance(prompt, str) and prompt.strip()], False
+
+
+def _load_a2a_deferred_cleanup_prompts(*, cwd: str, session_id: str) -> list[str]:
+    """Return the deferred cleanup prompts for a session, ignoring whether loading failed."""
+    loaded = _read_a2a_deferred_cleanup_prompts(cwd=cwd, session_id=session_id)
+    return loaded[0]
+
+
+def _save_a2a_deferred_cleanup_prompts(*, cwd: str, session_id: str, prompts: list[str]) -> None:
+    """Persist *prompts* as ``{"prompts": [...]}`` JSON, or delete the file when the list is empty.
+
+    ``OSError`` raised while writing is logged and swallowed, so callers are not told about a
+    failed save.
+    """
+    target = _a2a_deferred_cleanup_prompts_path(cwd=cwd, session_id=session_id)
+    if prompts:
+        try:
+            ensure_private_dir(target.parent)
+            serialized = json.dumps({"prompts": prompts}, ensure_ascii=False, sort_keys=True)
+            atomic_write_text(target, serialized)
+            ensure_private_file(target)
+        except OSError:
+            logger.warning("Failed to persist deferred A2A cleanup prompt", exc_info=True)
+        return
+    _clear_a2a_deferred_cleanup_prompts(cwd=cwd, session_id=session_id)
+
+
+def _append_a2a_deferred_cleanup_prompt(*, cwd: str, session_id: str, prompt: str) -> bool:
+    """Record *prompt* as the deferred prompt to run once cleanup has finished.
+
+    Despite the name, at most one prompt is retained: a "continue" prompt keeps the most
+    recently stored prompt, and any other prompt replaces whatever was stored.
+
+    Returns:
+        ``False`` only when the existing deferred-prompt file could not be read. A blank
+        *prompt* returns ``True`` without touching storage. A failed write still returns
+        ``True`` because ``_save_a2a_deferred_cleanup_prompts`` logs and swallows ``OSError``.
+    """
+    text = prompt.strip()
+    if not text:
+        return True
+    stored, unreadable = _read_a2a_deferred_cleanup_prompts(cwd=cwd, session_id=session_id)
+    if unreadable:
+        return False
+    keep_previous = bool(stored) and _is_cleanup_continue_prompt(text)
+    retained = [stored[-1]] if keep_previous else [text]
+    _save_a2a_deferred_cleanup_prompts(cwd=cwd, session_id=session_id, prompts=retained)
+    return True
+
+
+def _clear_a2a_deferred_cleanup_prompts(*, cwd: str, session_id: str) -> None:
+    """Delete the session's deferred cleanup prompt file if present.
+
+    A missing file is not an error; any other ``OSError`` is logged and swallowed.
+    """
+    target = _a2a_deferred_cleanup_prompts_path(cwd=cwd, session_id=session_id)
+    try:
+        target.unlink(missing_ok=True)
+    except OSError:
+        logger.warning("Failed to clear deferred A2A cleanup prompts", exc_info=True)
+
+
+def _a2a_prompts_after_cleanup(*, cwd: str, session_id: str, prompt: str) -> tuple[list[str], bool] | None:
+    """Decide which prompts to run now that cleanup no longer blocks the conversation.
+
+    Returns:
+        ``None`` when the deferred-prompt state cannot be read or updated. Otherwise
+        ``(prompts, used_deferred)``: ``([prompt], False)`` when nothing was deferred, else the
+        stored deferred prompts (after folding in a non-blank *prompt*) with ``True``.
+    """
+    queued, unreadable = _read_a2a_deferred_cleanup_prompts(cwd=cwd, session_id=session_id)
+    if unreadable:
+        return None
+    if not queued:
+        return [prompt], False
+    if not prompt.strip():
+        return queued, True
+    # Fold the new prompt into the stored state, then re-read what is actually persisted.
+    if not _append_a2a_deferred_cleanup_prompt(cwd=cwd, session_id=session_id, prompt=prompt):
+        return None
+    queued, unreadable = _read_a2a_deferred_cleanup_prompts(cwd=cwd, session_id=session_id)
+    return None if unreadable else (queued, True)
+
+
+def _is_cleanup_continue_prompt(prompt: str) -> bool:
+    """Return ``True`` when *prompt*, trimmed and lower-cased, is ``continue`` or ``继续``."""
+    return prompt.strip().lower() in ("continue", "继续")
+
+
+def _a2a_pipeline_state_for_session(
+    *,
+    cwd: str,
+    session_id: str,
+) -> tuple[A2APipelineSnapshotStore, A2APipelineJournal, dict[str, Any], list[dict[str, Any]] | None] | None:
+    """Load the A2A pipeline snapshot for a session, rebuilding it from the journal if needed.
+
+    Returns:
+        ``(snapshot_store, journal, snapshot, journal_events)``. ``journal_events`` is ``None``
+        when the stored snapshot was usable, and the events that were reduced into the snapshot
+        otherwise. ``None`` is returned when loading fails or the journal yields no events.
+    """
+    try:
+        pipeline_dir = existing_a2a_pipeline_dir_for_session(cwd=cwd, session_id=session_id)
+        snapshot_store = A2APipelineSnapshotStore(pipeline_dir)
+        journal = A2APipelineJournal(pipeline_dir)
+        snapshot = snapshot_store.load()
+    except Exception:
+        logger.warning("Failed to load A2A pipeline snapshot", exc_info=True)
+        return None
+
+    if isinstance(snapshot, dict):
+        return snapshot_store, journal, snapshot, None
+
+    # No usable snapshot: replay the journal and reduce it into one.
+    try:
+        replayed = journal.read_all_repairing_tail()
+    except Exception:
+        logger.warning("Failed to rebuild A2A pipeline snapshot from journal", exc_info=True)
+        return None
+    if not replayed:
+        return None
+    return snapshot_store, journal, reduce_pipeline_events(replayed), replayed
+
+
+def _prune_completed_cleanup_prompt_from_runtime(runtime: Any, ledger: CleanupLedger | None) -> None:
+    """Remove cleanup prompt messages from the runtime context once cleanup is done.
+
+    The prompt is kept when the ledger is missing or unreadable while a prompt is present, or
+    while the ledger still lists pending resources. Removal failures are logged and swallowed.
+    """
+    if ledger is None:
+        if _runtime_has_cleanup_prompt(runtime):
+            logger.warning("Keeping A2A cleanup prompt because cleanup ledger is unavailable")
+            return
+    else:
+        if ledger.load_failed():
+            logger.warning("Keeping A2A cleanup prompt because cleanup ledger is unreadable")
+            return
+        if not ledger.path.exists() and _runtime_has_cleanup_prompt(runtime):
+            logger.warning("Keeping A2A cleanup prompt because cleanup ledger is unavailable")
+            return
+        if ledger.pending_resources():
+            return
+
+    agent_loop = getattr(runtime, "agent_loop", None)
+    context = getattr(agent_loop, "context_manager", None)
+    drop_prompts = getattr(context, "remove_cleanup_prompt_messages", None)
+    if not callable(drop_prompts):
+        return
+    try:
+        drop_prompts()
+    except Exception:
+        logger.warning("Failed to remove completed A2A cleanup prompt from context", exc_info=True)
+
+
+def _mark_completed_cleanup_prompts(
+    *,
+    runtime: Any,
+    cwd: str,
+    session_id: str,
+    ledger: CleanupLedger,
+) -> None:
+    """Mark cleanup prompt messages for *ledger* as completed, in memory and in the session.
+
+    Runtime context messages are updated in place when the context manager returns a list.
+    The stored session is rewritten only if at least one stored message changed. Load and
+    save failures are logged and swallowed.
+    """
+    ledger_path = getattr(ledger, "path", None)
+
+    agent_loop = getattr(runtime, "agent_loop", None)
+    context = getattr(agent_loop, "context_manager", None)
+    fetch_messages = getattr(context, "get_messages", None)
+    if callable(fetch_messages):
+        try:
+            live_messages = fetch_messages()
+        except Exception:
+            live_messages = []
+        if isinstance(live_messages, list):
+            for entry in live_messages:
+                mark_cleanup_prompt_message_completed(entry, cleanup_ledger_path=ledger_path)
+
+    storage = SessionStorage()
+    try:
+        stored_messages = storage.load(cwd, session_id)
+    except Exception:
+        logger.warning("Failed to load A2A session while marking cleanup prompt completed", exc_info=True)
+        return
+    # A list (not a generator) so that every stored message is visited, not just the first hit.
+    outcomes = [
+        mark_cleanup_prompt_message_completed(entry, cleanup_ledger_path=ledger_path) for entry in stored_messages
+    ]
+    if not any(outcomes):
+        return
+    try:
+        storage.save(cwd, session_id, stored_messages)
+    except Exception:
+        logger.warning("Failed to mark A2A cleanup prompt completed in session", exc_info=True)
+
+
+def _cleanup_publisher_for_a2a_normal_chat(
+    *,
+    event_queue: EventQueue,
+    cwd: str,
+    session_id: str,
+    task_id: str,
+    context_id: str,
+    artifact_store: Any | None,
+    exposure_types: Any,
+) -> PipelineA2AEventPublisher | None:
+    """Create a pipeline event publisher for cleanup progress emitted during normal chat.
+
+    Returns ``None`` when the session has no loadable pipeline state. The translator is
+    hydrated from the journal on a best-effort basis: a hydration failure is logged and the
+    publisher is still returned.
+    """
+    loaded = _a2a_pipeline_state_for_session(cwd=cwd, session_id=session_id)
+    if loaded is None:
+        return None
+    snapshot_store, journal, snapshot, replay_events = loaded
+
+    # Identifiers stored in the snapshot take precedence over those of the current request.
+    a2a_context = PipelineA2AContext(
+        pipeline_run_id=_string_value(snapshot.get("pipelineRunId")) or context_id,
+        task_id=_string_value(snapshot.get("taskId")) or task_id,
+        context_id=_string_value(snapshot.get("contextId")) or context_id,
+        pipeline_name=_string_value(snapshot.get("pipelineName")) or "pipeline",
+    )
+    translator = PipelineEventTranslator(a2a_context)
+    try:
+        if replay_events is None:
+            replay_events = journal.read_all_repairing_tail()
+        translator.hydrate_from_events(replay_events)
+    except Exception:
+        logger.warning("Failed to hydrate A2A cleanup event translator", exc_info=True)
+
+    # Events are delivered under the current request's task/context ids.
+    return PipelineA2AEventPublisher(
+        event_queue,
+        translator,
+        journal,
+        snapshot_store,
+        artifact_store=artifact_store,
+        exposure_types=exposure_types,
+        delivery_task_id=task_id,
+        delivery_context_id=context_id,
+    )
+
+
+async def _observe_cleanup_stream(
+    events: AsyncIterator[Any],
+    ledger: CleanupLedger,
+    *,
+    publisher: PipelineA2AEventPublisher | None = None,
+) -> AsyncIterator[Any]:
+    """Re-yield *events* while feeding each one to a ``CleanupObserver`` bound to *ledger*.
+
+    When the ledger reports a load failure the stream is passed through untouched. When a
+    *publisher* is given, resource state changes are published once before the first event
+    and again after each observed event, before that event is yielded.
+    """
+    if ledger.load_failed():
+        async for item in events:
+            yield item
+        return
+
+    observer = CleanupObserver(ledger)
+    if publisher is None:
+        seen_states = _cleanup_resource_states(ledger)
+    else:
+        # Start from what the snapshot already reflects, then publish anything it is missing.
+        seen_states = _published_cleanup_resource_states(publisher, ledger)
+        seen_states = await _publish_cleanup_resource_changes(publisher, ledger, seen_states)
+
+    async for item in events:
+        observer.observe(item)
+        if publisher is not None:
+            seen_states = await _publish_cleanup_resource_changes(publisher, ledger, seen_states)
+        yield item
+
+
+def _cleanup_resource_state(resource: Any) -> tuple[Any, ...]:
+    """Return the five attributes of *resource* used to detect a cleanup state change.
+
+    Order: cleanup status, progress status, progress percentage, cleanup tool-use id,
+    last error. Missing attributes are reported as ``None``.
+    """
+    tracked_attributes = (
+        "cleanup_status",
+        "progress_status",
+        "progress_percentage",
+        "cleanup_tool_use_id",
+        "last_error",
+    )
+    return tuple(getattr(resource, name, None) for name in tracked_attributes)
+
+
+def _cleanup_resource_states(ledger: CleanupLedger) -> dict[str, tuple[Any, ...]]:
+    """Map each ledger cleanup resource key to its current state tuple."""
+    states: dict[str, tuple[Any, ...]] = {}
+    for resource in ledger.cleanup_resources():
+        states[resource.key] = _cleanup_resource_state(resource)
+    return states
+
+
+def _published_cleanup_resource_states(
+    publisher: PipelineA2AEventPublisher,
+    ledger: CleanupLedger,
+) -> dict[str, tuple[Any, ...]]:
+    """Return, per ledger resource key, the cleanup state already recorded in the snapshot.
+
+    Only ledger resources that have a matching entry under the snapshot's
+    ``cleanup.resources`` are included. An empty dict is returned when the publisher has no
+    loadable snapshot store, the snapshot cannot be loaded, or it has no ``cleanup`` dict.
+    """
+    snapshot_store = getattr(publisher, "snapshot_store", None)
+    load = getattr(snapshot_store, "load", None)
+    if not callable(load):
+        return {}
+    try:
+        snapshot = load()
+    except Exception:
+        logger.warning("Failed to load A2A cleanup snapshot state for catch-up", exc_info=True)
+        return {}
+    if not isinstance(snapshot, dict):
+        return {}
+    cleanup = snapshot.get("cleanup")
+    if not isinstance(cleanup, dict):
+        return {}
+    raw_resources = cleanup.get("resources")
+    if not isinstance(raw_resources, (list, tuple)):
+        # A null or otherwise malformed "resources" value must not abort the stream with a
+        # TypeError; treat it like an absent list, as the other fields here are treated.
+        raw_resources = []
+    snapshot_resources = [item for item in raw_resources if isinstance(item, dict)]
+    states: dict[str, tuple[Any, ...]] = {}
+    for resource in ledger.cleanup_resources():
+        match = _matching_snapshot_cleanup_resource(resource, snapshot_resources)
+        if match is not None:
+            states[resource.key] = _snapshot_cleanup_resource_state(match)
+    return states
+
+
+def _matching_snapshot_cleanup_resource(resource: Any, candidates: list[dict[str, Any]]) -> dict[str, Any] | None:
+    """Return the first snapshot entry in *candidates* that describes *resource*, else ``None``.
+
+    The resource id must be equal; region, provider and resource type only need to agree when
+    both sides carry a value (see ``_optional_cleanup_field_matches``).
+    """
+
+    def _describes_resource(candidate: dict[str, Any]) -> bool:
+        if candidate.get("resourceId") != getattr(resource, "resource_id", None):
+            return False
+        if not _optional_cleanup_field_matches(candidate.get("regionId"), getattr(resource, "region_id", None)):
+            return False
+        if not _optional_cleanup_field_matches(candidate.get("provider"), getattr(resource, "provider", None)):
+            return False
+        snapshot_type = candidate.get("resourceType") or candidate.get("resource_type")
+        return _optional_cleanup_field_matches(snapshot_type, getattr(resource, "resource_type", None))
+
+    return next((candidate for candidate in candidates if _describes_resource(candidate)), None)
+
+
+def _optional_cleanup_field_matches(snapshot_value: Any, ledger_value: Any) -> bool:
+    """Compare two optional string fields, treating a missing value on either side as a match.
+
+    Values that are not non-empty strings count as missing.
+    """
+
+    def _text_or_none(value: Any) -> str | None:
+        return value if isinstance(value, str) and value else None
+
+    snapshot_text = _text_or_none(snapshot_value)
+    ledger_text = _text_or_none(ledger_value)
+    if snapshot_text is None or ledger_text is None:
+        return True
+    return snapshot_text == ledger_text
+
+
+def _snapshot_cleanup_resource_state(resource: dict[str, Any]) -> tuple[Any, ...]:
+    """Return the state tuple of a snapshot cleanup resource dict.
+
+    The tuple has the same five positions as ``_cleanup_resource_state``. Where several keys
+    are accepted for one position, the first truthy value wins.
+    """
+
+    def _first_truthy(*keys: str) -> Any:
+        # Mirrors an ``a or b or c`` chain: later keys are read only if earlier ones are falsy,
+        # and the last value read is returned when none is truthy.
+        value = None
+        for key in keys:
+            value = resource.get(key)
+            if value:
+                break
+        return value
+
+    return (
+        _first_truthy("cleanupStatus", "cleanup_status", "status"),
+        _first_truthy("progressStatus", "stackStatus"),
+        resource.get("progressPercentage"),
+        _first_truthy("cleanupToolUseId", "cleanup_tool_use_id"),
+        resource.get("lastError"),
+    )
+
+
+async def _publish_cleanup_resource_changes(
+    publisher: PipelineA2AEventPublisher,
+    ledger: CleanupLedger,
+    previous: dict[str, tuple[Any, ...]],
+) -> dict[str, tuple[Any, ...]]:
+    """Publish a cleanup event for every ledger resource whose state differs from *previous*.
+
+    Returns:
+        A copy of *previous* updated with the state of each resource whose event was published
+        (``publish_manual`` returned a non-``None`` value). Resources whose status maps to no
+        event type, or whose publish raised, keep their previous entry.
+    """
+    resources = ledger.cleanup_resources()
+    latest: dict[str, tuple[Any, ...]] = {}
+    for resource in resources:
+        latest[resource.key] = _cleanup_resource_state(resource)
+
+    acknowledged = dict(previous)
+    for resource in resources:
+        state = latest.get(resource.key)
+        unchanged = state is None or previous.get(resource.key) == state
+        if unchanged:
+            continue
+        event_type = _cleanup_event_type_for_status(resource.cleanup_status)
+        if event_type is None:
+            continue
+        try:
+            published = await publisher.publish_manual(
+                event_type,
+                "cleanup",
+                status="working",
+                data=_cleanup_resource_event_data(resource, resource_count=len(resources)),
+                require_durable_metadata=True,
+            )
+        except Exception:
+            logger.warning("Failed to publish A2A cleanup progress event", exc_info=True)
+        else:
+            # Only remember the state once the publisher confirmed it.
+            if published is not None:
+                acknowledged[resource.key] = state
+    return acknowledged
+
+
+def _cleanup_event_type_for_status(status: str) -> str | None:
+    """Map a resource cleanup status to its pipeline event type, or ``None`` if it has none."""
+    event_types_by_status = (
+        ("started", PIPELINE_EVENT_CLEANUP_STARTED),
+        ("in_progress", PIPELINE_EVENT_CLEANUP_PROGRESS),
+        ("completed", PIPELINE_EVENT_CLEANUP_COMPLETED),
+        ("failed", PIPELINE_EVENT_CLEANUP_FAILED),
+    )
+    for known_status, event_type in event_types_by_status:
+        if status == known_status:
+            return event_type
+    return None
+
+
+def _cleanup_resource_event_data(resource: Any, *, resource_count: int) -> dict[str, Any]:
+    """Build the event payload for one cleanup resource, omitting fields whose value is ``None``.
+
+    ``status`` and ``cleanupStatus`` both carry the cleanup status, ``progressStatus`` and
+    ``stackStatus`` both carry the progress status, and ``lastError`` is passed through
+    ``_public_cleanup_error``.
+    """
+
+    def _attr(name: str) -> Any:
+        return getattr(resource, name, None)
+
+    fields = (
+        ("status", _attr("cleanup_status")),
+        ("resourceCount", resource_count),
+        ("provider", _attr("provider")),
+        ("resourceType", _attr("resource_type")),
+        ("resourceId", _attr("resource_id")),
+        ("resourceName", _attr("resource_name")),
+        ("regionId", _attr("region_id")),
+        ("sourceStepId", _attr("source_step_id")),
+        ("cleanupStatus", _attr("cleanup_status")),
+        ("cleanupToolUseId", _attr("cleanup_tool_use_id")),
+        ("progressStatus", _attr("progress_status")),
+        ("progressPercentage", _attr("progress_percentage")),
+        ("stackStatus", _attr("progress_status")),
+        ("lastError", _public_cleanup_error(_attr("last_error"))),
+    )
+    return {key: value for key, value in fields if value is not None}
+
+
+def _public_cleanup_error(value: Any) -> str | None:
+    """Return *value* as sanitized public text, or ``None`` when *value* is falsy.
+
+    Text longer than ``_ERROR_TEXT_MAX_CHARS`` is cut to that length and suffixed with ``...``.
+    """
+    if not value:
+        return None
+    sanitized = sanitize_public_text(str(value))
+    if len(sanitized) <= _ERROR_TEXT_MAX_CHARS:
+        return sanitized
+    return sanitized[:_ERROR_TEXT_MAX_CHARS] + "..."
+
+
+async def _stream_a2a_normal_events(
+    *,
+    runtime: Any,
+    prompt: str,
+    cleanup_ledger: CleanupLedger | None,
+    cleanup_publisher: PipelineA2AEventPublisher | None,
+    cwd: str,
+    session_id: str,
+) -> AsyncIterator[Any]:
+    """Yield the stream events for a normal-chat *prompt*, gated on rollback cleanup state.
+
+    Flow:
+      1. If a cleanup prompt exists but the ledger is unusable, the prompt is stored as
+         deferred, a single explanatory ``TextDeltaEvent`` is yielded, and the stream ends.
+      2. If the ledger has pending resources and the agent loop offers ``continue_streaming``,
+         the cleanup continuation is streamed first. Should resources still be pending
+         afterwards, the prompt is deferred and the stream ends.
+      3. Otherwise the prompts to run (the deferred ones, or just *prompt*) are streamed via
+         ``run_streaming``; completed cleanup prompts are then marked/pruned and the deferred
+         prompt file is cleared if it was used.
+    """
+    if _a2a_cleanup_ledger_unavailable(cleanup_ledger, runtime=runtime, cwd=cwd, session_id=session_id):
+        if not _append_a2a_deferred_cleanup_prompt(cwd=cwd, session_id=session_id, prompt=prompt):
+            yield TextDeltaEvent(
+                text=_("Rollback cleanup deferred prompt state is unavailable. Please repair it before continuing.")
+            )
+            return
+        yield TextDeltaEvent(
+            text=_("Rollback cleanup state is unavailable. Please repair the cleanup ledger before continuing.")
+        )
+        return
+
+    # NOTE(review): this looks like it overlaps with the check above, which already returns
+    # ledger.load_failed() when a cleanup prompt exists; confirm whether it is still reachable.
+    if cleanup_ledger is not None and cleanup_ledger.load_failed():
+        if _runtime_has_cleanup_prompt(runtime) or _session_has_cleanup_prompt(cwd=cwd, session_id=session_id):
+            if not _append_a2a_deferred_cleanup_prompt(cwd=cwd, session_id=session_id, prompt=prompt):
+                yield TextDeltaEvent(
+                    text=_("Rollback cleanup deferred prompt state is unavailable. Please repair it before continuing.")
+                )
+                return
+            yield TextDeltaEvent(
+                text=_("Rollback cleanup state is unavailable. Please repair the cleanup ledger before continuing.")
+            )
+            return
+
+    # Cleanup continuation runs only for a readable ledger with pending resources, and only
+    # when the agent loop actually exposes continue_streaming.
+    run_cleanup_continuation = (
+        cleanup_ledger is not None
+        and not cleanup_ledger.load_failed()
+        and bool(cleanup_ledger.pending_resources())
+        and callable(getattr(runtime.agent_loop, "continue_streaming", None))
+    )
+    if run_cleanup_continuation and cleanup_ledger is not None:
+        _ensure_cleanup_prompt_in_session(cwd=cwd, session_id=session_id, ledger=cleanup_ledger, runtime=runtime)
+        cleanup_stream = _observe_cleanup_stream(
+            runtime.agent_loop.continue_streaming(),
+            cleanup_ledger,
+            publisher=cleanup_publisher,
+        )
+        async for event in cleanup_stream:
+            yield event
+        if cleanup_ledger.pending_resources():
+            # Cleanup did not finish in this turn: park the user's prompt and stop here.
+            if not _append_a2a_deferred_cleanup_prompt(cwd=cwd, session_id=session_id, prompt=prompt):
+                yield TextDeltaEvent(
+                    text=_("Rollback cleanup deferred prompt state is unavailable. Please repair it before continuing.")
+                )
+                return
+            yield TextDeltaEvent(
+                text=_("Rollback cleanup is still in progress. Please continue after cleanup completes.")
+            )
+            return
+        _mark_completed_cleanup_prompts(runtime=runtime, cwd=cwd, session_id=session_id, ledger=cleanup_ledger)
+        _prune_completed_cleanup_prompt_from_runtime(runtime, cleanup_ledger)
+
+    # None means the deferred-prompt file could not be read or updated.
+    prompts_after_cleanup = _a2a_prompts_after_cleanup(cwd=cwd, session_id=session_id, prompt=prompt)
+    if prompts_after_cleanup is None:
+        yield TextDeltaEvent(
+            text=_("Rollback cleanup deferred prompt state is unavailable. Please repair it before continuing.")
+        )
+        return
+    prompts_to_run, has_deferred_prompts = prompts_after_cleanup
+    for prompt_to_run in prompts_to_run:
+        prompt_stream = runtime.agent_loop.run_streaming(prompt_to_run)
+        if cleanup_ledger is not None:
+            # Keep observing so cleanup activity during a normal prompt is still tracked.
+            prompt_stream = _observe_cleanup_stream(prompt_stream, cleanup_ledger, publisher=cleanup_publisher)
+        async for event in prompt_stream:
+            yield event
+    if cleanup_ledger is not None and not cleanup_ledger.load_failed() and not cleanup_ledger.pending_resources():
+        _mark_completed_cleanup_prompts(runtime=runtime, cwd=cwd, session_id=session_id, ledger=cleanup_ledger)
+        _prune_completed_cleanup_prompt_from_runtime(runtime, cleanup_ledger)
+    if has_deferred_prompts:
+        # The deferred prompts have now been run, so the file is no longer needed.
+        _clear_a2a_deferred_cleanup_prompts(cwd=cwd, session_id=session_id)
+
+
+def _string_value(value: Any) -> str:
+    """Return *value* if it is a non-empty string, otherwise the empty string."""
+    if isinstance(value, str) and value:
+        return value
+    return ""
+
+
 class IacCodeA2AExecutor(AgentExecutor):
     def __init__(
         self,
@@ -85,6 +782,15 @@ async def execute(self, context: RequestContext, event_queue: EventQueue) -> Non
         task_id = requested_task_id or "task-" + uuid.uuid4().hex[:12]
         context_id = context.context_id or "ctx-" + uuid.uuid4().hex[:12]
         task = None
+        initial_task_published = False
+
+        async def publish_initial_task_if_missing() -> None:  # publishes the initial task at most once
+            nonlocal initial_task_published
+            if initial_task_published or isinstance(getattr(context, "current_task", None), Task):
+                return  # already published here, or the request context already carries a Task
+            await self._publish_initial_task(event_queue, task_id=task_id, context_id=context_id, context=context)
+            initial_task_published = True
+
         try:
             metadata = getattr(context, "metadata", None) or getattr(
                 getattr(context, "message", None), "metadata", None
@@ -94,8 +800,23 @@ async def execute(self, context: RequestContext, event_queue: EventQueue) -> Non
             metadata_model = self._resolve_model(metadata)
             model = metadata_model or self._model
             aliyun_credential = self._resolve_aliyun_credential(metadata)
-            prompt = self._prompt_from_context(context, cwd=cwd)
             pipeline_mode = get_run_mode() == RunMode.PIPELINE
+            route_pipeline_handoff_to_normal = False
+            if pipeline_mode:
+                route_pipeline_handoff_to_normal = await self._should_route_pipeline_handoff_to_normal(
+                    context_id=context_id,
+                    cwd=cwd,
+                )
+            pipeline_input: PipelineUserInput | None = None
+            if pipeline_mode and not route_pipeline_handoff_to_normal:
+                try:
+                    pipeline_input = self._pipeline_input_from_context(context, cwd=cwd)
+                except ValueError as exc:
+                    raise InvalidParamsError(sanitize_public_text(str(exc))) from exc
+                prompt = pipeline_input.display_text
+                self._validate_pipeline_request_input(pipeline_input, model=model)
+            else:
+                prompt = self._prompt_from_context(context, cwd=cwd)
             if pipeline_mode and requested_task_id is None:
                 recovered_task_id = await self._recoverable_pipeline_task_id_for_context(context_id=context_id, cwd=cwd)
                 if recovered_task_id is not None:
@@ -107,10 +828,12 @@ async def execute(self, context: RequestContext, event_queue: EventQueue) -> Non
                 owner=owner,
                 restore_interrupted=not pipeline_mode,
             )
-            if not isinstance(getattr(context, "current_task", None), Task):
-                await self._publish_initial_task(event_queue, task_id=task_id, context_id=context_id, context=context)
+            await publish_initial_task_if_missing()
             await self._task_store.ensure_task_not_expired(task.task_id)
+        except InvalidParamsError:
+            raise
         except Exception as exc:
+            await publish_initial_task_if_missing()
             if _is_retryable_executor_error(exc):
                 await self._publish_status(
                     event_queue,
@@ -140,7 +863,7 @@ async def execute(self, context: RequestContext, event_queue: EventQueue) -> Non
             self._metrics.record_task_failed()
             return
 
-        if not prompt.strip():
+        if not (pipeline_mode and not route_pipeline_handoff_to_normal) and not prompt.strip():
             task.state = TASK_STATE_FAILED
             await self._publish_status(
                 event_queue,
@@ -154,11 +877,8 @@ async def execute(self, context: RequestContext, event_queue: EventQueue) -> Non
             self._metrics.record_task_failed()
             return
 
-        route_pipeline_handoff_to_normal = pipeline_mode and await self._should_route_pipeline_handoff_to_normal(
-            context_id=context_id,
-            cwd=cwd,
-        )
         if pipeline_mode and not route_pipeline_handoff_to_normal:
+            assert pipeline_input is not None
             pipeline_executor = IacCodeA2APipelineExecutor(
                 task_store=self._task_store,
                 model=model,
@@ -176,7 +896,7 @@ async def execute(self, context: RequestContext, event_queue: EventQueue) -> Non
                 task_id=task_id,
                 context_id=context_id,
                 cwd=cwd,
-                prompt=prompt,
+                pipeline_input=pipeline_input,
             )
             return
         if route_pipeline_handoff_to_normal:
@@ -288,7 +1008,28 @@ def runtime_factory(session_id: str) -> Any:
                 with use_session_id(ctx.session_id), user_id_ctx, aliyun_credential_ctx:
                     self._configure_runtime_model(runtime, model, from_metadata=metadata_model is not None)
                     self._refresh_runtime_cloud_tools(runtime)
-                    async for event in runtime.agent_loop.run_streaming(prompt):
+                    cleanup_ledger = _cleanup_ledger_for_a2a_normal_chat(cwd=cwd, session_id=ctx.session_id)
+                    _prune_completed_cleanup_prompt_from_runtime(runtime, cleanup_ledger)
+                    cleanup_publisher = None
+                    if cleanup_ledger is not None:
+                        cleanup_publisher = _cleanup_publisher_for_a2a_normal_chat(
+                            event_queue=event_queue,
+                            cwd=cwd,
+                            session_id=ctx.session_id,
+                            task_id=task_id,
+                            context_id=context_id,
+                            artifact_store=self._artifact_store,
+                            exposure_types=self._thinking_exposure_types,
+                        )
+                    stream = _stream_a2a_normal_events(
+                        runtime=runtime,
+                        prompt=prompt,
+                        cleanup_ledger=cleanup_ledger,
+                        cleanup_publisher=cleanup_publisher,
+                        cwd=cwd,
+                        session_id=ctx.session_id,
+                    )
+                    async for event in stream:
                         text_chunk = await publish_stream_event(
                             event_queue,
                             task_id=task_id,
@@ -477,6 +1218,43 @@ def _prompt_from_context(self, context: RequestContext, *, cwd: str) -> str:
             return context.get_user_input()
         return parts_to_prompt(message.parts, cwd=cwd)
 
+    def _pipeline_input_from_context(self, context: RequestContext, *, cwd: str) -> PipelineUserInput:
+        message = getattr(context, "message", None)
+        if not isinstance(message, Message):  # no Message object: fall back to the plain user input
+            return normalize_pipeline_user_input(context.get_user_input())
+        return parts_to_pipeline_input(message.parts, cwd=cwd)  # otherwise convert the message parts
+
+    def validate_pipeline_message_request(self, message: Message) -> None:
+        metadata = getattr(message, "metadata", None)
+        try:  # a ValueError from cwd resolution or part conversion is handled below
+            cwd = self._resolve_cwd(metadata)
+            pipeline_input = parts_to_pipeline_input(message.parts, cwd=cwd)
+        except ValueError as exc:  # re-raised as InvalidParamsError with sanitized text
+            raise InvalidParamsError(sanitize_public_text(str(exc))) from exc
+        model = self._resolve_model(metadata) or self._model  # model from metadata, else self._model
+        self._validate_pipeline_request_input(pipeline_input, model=model)
+
+    def _validate_pipeline_request_input(self, pipeline_input: PipelineUserInput, *, model: str | None = None) -> None:
+        if pipeline_input.is_empty:  # empty input is rejected first
+            raise InvalidParamsError("A2A server received empty input.")
+        model = model or self._model  # a falsy model falls back to self._model
+        if pipeline_input.has_images and not self._model_supports_image_input(model=model):
+            raise InvalidParamsError(_("Current model {model} does not support image input.").format(model=model))
+
+    def _model_supports_image_input(self, *, model: str | None = None) -> bool:
+        model = model or self._model  # a falsy model falls back to self._model
+        provider_key = get_active_provider_key()
+        provider_config = get_provider_config(provider_key) if provider_key else {}  # no active provider: empty config
+        api_base = provider_config.get("apiBase") if isinstance(provider_config.get("apiBase"), str) else None
+        credentials = load_credentials(model=model)
+        api_key = credentials.get(provider_key, "") if provider_key else None  # "" when the provider has no entry
+        return is_model_multimodal(  # the decision itself is delegated to is_model_multimodal
+            model,
+            provider_key=provider_key,
+            base_url=api_base,
+            api_key=api_key,
+        )
+
     def _sanitize_error(self, exc: Exception) -> str:
         if isinstance(exc, ValueError):
             msg = str(exc).lower()
@@ -496,11 +1274,10 @@ async def _should_route_pipeline_handoff_to_normal(self, *, context_id: str, cwd
             return False
         if ctx.cwd != cwd:
             return False
-        snapshot = A2APipelineSnapshotStore(
-            existing_a2a_pipeline_dir_for_session(cwd=cwd, session_id=ctx.session_id)
-        ).load()
-        if not isinstance(snapshot, dict):
+        state = _a2a_pipeline_state_for_session(cwd=cwd, session_id=ctx.session_id)
+        if state is None:
             return False
+        _snapshot_store, _journal, snapshot, _journal_events = state
         handoff = snapshot.get("normalHandoff")
         if not isinstance(handoff, dict):
             return False
@@ -513,26 +1290,47 @@ async def _ensure_pipeline_handoff_context_in_session(self, *, context_id: str,
             return
         if ctx.cwd != cwd:
             return
-        snapshot = A2APipelineSnapshotStore(
-            existing_a2a_pipeline_dir_for_session(cwd=cwd, session_id=ctx.session_id)
-        ).load()
-        if not isinstance(snapshot, dict):
+        state = _a2a_pipeline_state_for_session(cwd=cwd, session_id=ctx.session_id)
+        if state is None:
             return
+        _snapshot_store, _journal, snapshot, _journal_events = state
         handoff = snapshot.get("normalHandoff")
         if not isinstance(handoff, dict):
             return
         summary = handoff.get("summary")
-        if not isinstance(summary, str) or not summary:
+        cleanup_payload = None
+        data = handoff.get("data")
+        if isinstance(data, dict) and isinstance(data.get("cleanup"), dict):
+            cleanup_payload = _cleanup_payload_from_private_ledger_or_unavailable(
+                ledger_path=_default_cleanup_ledger_path(cwd=cwd, session_id=ctx.session_id),
+            )
+        cleanup_prompt = cleanup_payload.get("prompt") if isinstance(cleanup_payload, dict) else None
+        cleanup_ledger_path = cleanup_payload.get("ledgerPath") if isinstance(cleanup_payload, dict) else None
+        if not isinstance(cleanup_prompt, str) or not cleanup_prompt:
+            cleanup_prompt = None
+        if not isinstance(cleanup_ledger_path, str) or not cleanup_ledger_path:
+            cleanup_ledger_path = None
+        if (not isinstance(summary, str) or not summary) and cleanup_prompt is None:
             return
 
         session_storage = SessionStorage()
         messages = session_storage.load(cwd, ctx.session_id)
-        if any(
-            getattr(message, "role", None) == "user" and getattr(message, "content", None) == summary
-            for message in messages
+        if isinstance(summary, str) and summary and not _session_has_user_message(messages, content=summary):
+            session_storage.append(cwd, ctx.session_id, AgentMessage(role="user", content=summary))
+            messages.append(AgentMessage(role="user", content=summary))
+        if cleanup_prompt is not None and not _session_has_active_cleanup_prompt_content(
+            messages,
+            content=cleanup_prompt,
         ):
-            return
-        session_storage.append(cwd, ctx.session_id, AgentMessage(role="user", content=summary))
+            session_storage.append(
+                cwd,
+                ctx.session_id,
+                create_cleanup_prompt_message(
+                    cleanup_prompt,
+                    cleanup_ledger_path=cleanup_ledger_path,
+                    cleanup_status="pending" if cleanup_ledger_path else None,
+                ),
+            )
 
     async def _recoverable_pipeline_task_id_for_context(self, *, context_id: str, cwd: str) -> str | None:
         try:
diff --git a/src/iac_code/a2a/jsonrpc_passthrough.py b/src/iac_code/a2a/jsonrpc_passthrough.py
new file mode 100644
index 00000000..75898b1b
--- /dev/null
+++ b/src/iac_code/a2a/jsonrpc_passthrough.py
@@ -0,0 +1,109 @@
+from __future__ import annotations
+
+import logging
+from collections.abc import AsyncIterable, AsyncIterator, Awaitable, Callable
+from types import MethodType
+from typing import Any
+
+from a2a.server.context import ServerCallContext
+from jsonrpc.jsonrpc2 import JSONRPC20Response
+from sse_starlette.sse import EventSourceResponse
+from starlette.responses import Response
+
+logger = logging.getLogger(__name__)
+
+
+def install_jsonrpc_error_data_passthrough() -> None:
+    """Patch the A2A JSON-RPC error builder so flagged errors keep their ``data``.
+
+    Errors whose ``jsonrpc_error_data_passthrough`` attribute is truthy are
+    serialized with their own ``code``, message and ``data``; every other error
+    is delegated to the original ``build_error_response``. Installing twice is a
+    no-op, and nothing is patched when the A2A modules cannot be imported.
+    """
+    try:
+        from a2a.server.request_handlers import response_helpers
+        from a2a.server.routes import jsonrpc_dispatcher
+    except Exception:
+        logger.debug("A2A JSON-RPC response helpers are unavailable", exc_info=True)
+        return
+    current = response_helpers.build_error_response
+    if getattr(current, "_iac_code_recoverable_data_passthrough", False):
+        return
+    original = current
+
+    def build_error_response_with_passthrough(request_id: str | int | None, error: Any) -> dict[str, Any]:
+        if getattr(error, "jsonrpc_error_data_passthrough", False):
+            payload = {
+                "code": int(getattr(error, "code", -32603)),
+                "message": str(error),
+            }
+            data = getattr(error, "data", None)
+            if data is not None:
+                payload["data"] = data
+            return JSONRPC20Response(error=payload, _id=request_id).data
+        return original(request_id, error)
+
+    # The marker lets a later install call return early instead of wrapping the wrapper.
+    setattr(build_error_response_with_passthrough, "_iac_code_recoverable_data_passthrough", True)
+    # The dispatcher module gets the same patch, presumably because it binds the helper under its own name.
+    setattr(response_helpers, "build_error_response", build_error_response_with_passthrough)
+    setattr(jsonrpc_dispatcher, "build_error_response", build_error_response_with_passthrough)
+
+
+def install_v03_jsonrpc_error_data_passthrough(jsonrpc_endpoint: Callable[..., Awaitable[Response]]) -> None:
+    """Make the v0.3 streaming adapter report flagged errors with their ``data``.
+
+    The adapter is read from ``jsonrpc_endpoint.__self__._v03_adapter``. When it
+    is missing, already patched, or the v0.3 compatibility types cannot be
+    imported, the function returns without changing anything.
+
+    Args:
+        jsonrpc_endpoint: Endpoint callable; its ``__self__`` is used as the dispatcher.
+    """
+    dispatcher = getattr(jsonrpc_endpoint, "__self__", None)
+    adapter = getattr(dispatcher, "_v03_adapter", None)
+    if adapter is None or getattr(adapter, "_iac_code_recoverable_error_passthrough", False):
+        return
+
+    try:
+        from a2a.compat.v0_3 import types as types_v03
+    except Exception:
+        logger.debug("A2A v0.3 compatibility types are unavailable", exc_info=True)
+        return
+
+    async def _process_streaming_request_with_passthrough(
+        self: Any,
+        request_id: str | int | None,
+        request_obj: Any,
+        context: ServerCallContext,
+    ) -> EventSourceResponse:
+        method = request_obj.method
+        if method == "message/stream":
+            stream_gen = self.handler.on_message_send_stream(request_obj, context)
+        elif method == "tasks/resubscribe":
+            stream_gen = self.handler.on_subscribe_to_task(request_obj, context)
+        else:
+            raise ValueError(f"Unsupported streaming method {method}")
+
+        async def event_generator(stream: AsyncIterable[Any]) -> AsyncIterator[dict[str, str]]:
+            try:
+                async for item in stream:
+                    yield {"data": item.model_dump_json(by_alias=True, exclude_none=True)}
+            except Exception as exc:
+                logger.exception("Error during stream generation in v0.3 JSONRPCAdapter")
+                # Flagged errors are reported as InvalidParams carrying their data; others as InternalError.
+                if getattr(exc, "jsonrpc_error_data_passthrough", False):
+                    error = types_v03.InvalidParamsError(message=str(exc), data=getattr(exc, "data", None))
+                else:
+                    error = types_v03.InternalError(message=str(exc))
+                err_resp = types_v03.SendStreamingMessageResponse(
+                    root=types_v03.JSONRPCErrorResponse(id=request_id, error=error)
+                )
+                yield {"data": err_resp.model_dump_json(by_alias=True, exclude_none=True)}
+
+        return EventSourceResponse(event_generator(stream_gen))
+
+    # Bind as a method so the adapter is passed as ``self``; the flag makes repeated installs a no-op.
+    adapter._process_streaming_request = MethodType(_process_streaming_request_with_passthrough, adapter)
+    adapter._iac_code_recoverable_error_passthrough = True
diff --git a/src/iac_code/a2a/parts.py b/src/iac_code/a2a/parts.py
index 0b546cc2..d28fded1 100644
--- a/src/iac_code/a2a/parts.py
+++ b/src/iac_code/a2a/parts.py
@@ -13,6 +13,10 @@
 
 from google.protobuf.json_format import MessageToDict
 
+from iac_code.agent.message import ContentBlock, ImageBlock, TextBlock
+from iac_code.pipeline.engine.user_input import PipelineUserInput, content_display_text, content_has_images
+from iac_code.utils.image.resizer import maybe_resize_and_downsample
+
 MAX_INLINE_BYTES = 1024 * 1024
 MAX_FILE_BYTES = 1024 * 1024
 MAX_BINARY_INLINE_BYTES = 5 * 1024 * 1024
@@ -38,6 +42,7 @@
 )
 TEXT_LIKE_MIME_TYPES = frozenset(DEFAULT_TEXT_LIKE_MIME_TYPES)
 MULTIMODAL_MIME_TYPES = frozenset(DEFAULT_MULTIMODAL_MIME_TYPES)
+SUPPORTED_IMAGE_MIME_TYPES = frozenset(("image/png", "image/jpeg", "image/webp", "image/gif"))
 SUPPORTED_INPUT_MIME_TYPES = [*DEFAULT_TEXT_LIKE_MIME_TYPES, *DEFAULT_MULTIMODAL_MIME_TYPES]
 
 
@@ -108,6 +113,66 @@ def parts_to_prompt(message_parts: Iterable[Any], *, cwd: str | Path) -> str:
     return "\n".join(value for value in values if value)
 
 
+def parts_to_pipeline_input(message_parts: Iterable[Any], *, cwd: str | Path) -> PipelineUserInput:
+    blocks: list[ContentBlock] = []
+    for part in message_parts:
+        converted = part_to_pipeline_block(part, cwd=cwd)
+        if isinstance(converted, list):  # a list result is already content blocks
+            blocks.extend(converted)
+        elif converted:  # a non-empty string becomes a TextBlock; empty strings are dropped
+            blocks.append(TextBlock(text=converted))
+    if content_has_images(blocks):  # with images, the block list itself is the content
+        return PipelineUserInput(
+            content=blocks,
+            display_text=content_display_text(blocks),
+            has_images=True,
+        )
+    text = "\n".join(block.text for block in blocks if isinstance(block, TextBlock))
+    return PipelineUserInput(content=text, display_text=text, has_images=False)  # text-only: one joined string
+
+
+def part_to_pipeline_block(part: Any, *, cwd: str | Path) -> str | list[ContentBlock]:
+    media_type = _media_type(part)  # result is a str for text-like parts, [ImageBlock] for supported images
+    if _has_field(part, "text"):  # plain text part
+        _ensure_text_like(media_type)
+        return str(part.text)
+    if _has_field(part, "data"):  # structured data part: image payload or JSON
+        if media_type in SUPPORTED_IMAGE_MIME_TYPES:
+            return [_image_block_from_binary(_binary_data_part_bytes(part), requested_media_type=media_type)]
+        if _is_multimodal(media_type):
+            raise ValueError("A2A pipeline input has unsupported image media type.")
+        if media_type != "application/json":
+            raise ValueError("A2A data parts must use application/json media type.")
+        data = MessageToDict(part.data, preserving_proto_field_name=False)
+        serialized = json.dumps(data, ensure_ascii=False, separators=(",", ":"), sort_keys=True)
+        _ensure_size(serialized.encode("utf-8"), limit=MAX_INLINE_BYTES, label="A2A data part")
+        return serialized  # JSON is returned as compact text with sorted keys
+    if _has_field(part, "raw"):  # raw bytes part: image or UTF-8 text
+        raw = bytes(part.raw)
+        if media_type in SUPPORTED_IMAGE_MIME_TYPES:
+            _ensure_size(raw, limit=MAX_BINARY_INLINE_BYTES, label="A2A binary raw part")
+            return [_image_block_from_binary(raw, requested_media_type=media_type)]
+        if _is_multimodal(media_type):
+            raise ValueError("A2A pipeline input has unsupported image media type.")
+        _ensure_text_like(media_type)
+        _ensure_size(raw, limit=MAX_INLINE_BYTES, label="A2A raw part")
+        try:
+            return raw.decode("utf-8")
+        except UnicodeDecodeError as exc:
+            raise ValueError("A2A raw parts must contain valid UTF-8.") from exc
+    if _has_field(part, "url"):  # URL part: image file or text file
+        if media_type in SUPPORTED_IMAGE_MIME_TYPES:
+            path = _safe_file_url_path(str(part.url), cwd=Path(cwd))
+            if path.stat().st_size > MAX_BINARY_FILE_BYTES:  # size is checked before the file is read
+                raise ValueError("A2A binary file URL part content is too large.")
+            return [_image_block_from_binary(path.read_bytes(), requested_media_type=media_type)]
+        if _is_multimodal(media_type):
+            raise ValueError("A2A pipeline input has unsupported image media type.")
+        _ensure_text_like(media_type)
+        return _read_file_url_part(str(part.url), cwd=Path(cwd))
+    raise ValueError("A2A server supports text, JSON data, raw text, or workspace file URL parts only.")
+
+
 def part_to_prompt(part: Any, *, cwd: str | Path) -> str:
     media_type = _media_type(part)
     if _has_field(part, "text"):
@@ -188,6 +253,20 @@ def _filename(part: Any) -> str:
 
 
 def _binary_data_part_to_manifest(part: Any, *, media_type: str) -> str:
+    data = MessageToDict(part.data, preserving_proto_field_name=False)
+    if not isinstance(data, dict):
+        raise ValueError("A2A binary data parts must contain an object.")
+    content = _binary_data_part_bytes(part)  # payload bytes come from the shared helper
+    filename = str(data.get("filename") or _filename(part) or "inline")  # first non-empty name, else "inline"
+    return _multimodal_manifest(
+        filename=os.path.basename(filename),  # only the final path component is kept
+        media_type=media_type,
+        content=content,
+        source="data",
+    )
+
+
+def _binary_data_part_bytes(part: Any) -> bytes:
     data = MessageToDict(part.data, preserving_proto_field_name=False)
     if not isinstance(data, dict):
         raise ValueError("A2A binary data parts must contain an object.")
@@ -199,12 +278,16 @@ def _binary_data_part_to_manifest(part: Any, *, media_type: str) -> str:
     except (ValueError, UnicodeEncodeError) as exc:
         raise ValueError("A2A binary data part bytes must be valid base64.") from exc
     _ensure_size(content, limit=MAX_BINARY_INLINE_BYTES, label="A2A binary data part")
-    filename = str(data.get("filename") or _filename(part) or "inline")
-    return _multimodal_manifest(
-        filename=os.path.basename(filename),
-        media_type=media_type,
-        content=content,
-        source="data",
+    return content
+
+
+def _image_block_from_binary(raw: bytes, *, requested_media_type: str) -> ImageBlock:
+    if requested_media_type not in SUPPORTED_IMAGE_MIME_TYPES:
+        raise ValueError("A2A pipeline input has unsupported image media type.")
+    resized = maybe_resize_and_downsample(raw)
+    return ImageBlock(
+        media_type=resized.media_type,  # media type reported by the resizer, not requested_media_type
+        data=base64.b64encode(resized.data).decode("ascii"),  # image bytes as base64 text
     )
 
 
diff --git a/src/iac_code/a2a/pipeline_events.py b/src/iac_code/a2a/pipeline_events.py
index d206c967..ff011887 100644
--- a/src/iac_code/a2a/pipeline_events.py
+++ b/src/iac_code/a2a/pipeline_events.py
@@ -40,11 +40,24 @@
     "from_step": "fromStep",
     "parent_step_id": "parentStepId",
     "pipeline_type": "pipelineType",
+    "progress_status": "progressStatus",
     "rollback_target": "rollbackTarget",
+    "cleanup_status": "cleanupStatus",
+    "cleanup_tool_use_id": "cleanupToolUseId",
+    "last_error": "lastError",
+    "progress_percentage": "progressPercentage",
+    "resource_count": "resourceCount",
+    "resource_id": "resourceId",
+    "resource_name": "resourceName",
+    "resource_type": "resourceType",
+    "region_id": "regionId",
     "selected_index": "selectedIndex",
     "selected_option": "selectedOption",
     "selected_value": "selectedValue",
+    "source_step_id": "sourceStepId",
     "stale_fields": "staleFields",
+    "stack_status": "stackStatus",
+    "status_message": "statusMessage",
     "step_id": "stepId",
     "step_index": "stepIndex",
     "step_names": "stepNames",
@@ -325,6 +338,16 @@ def _translate_pipeline_event(self, event: PipelineEvent) -> list[dict[str, Any]
             return [self._envelope("pipeline_started", "pipeline", "working", _event_data(data), created_at=created_at)]
         if event.type == PipelineEventType.PIPELINE_RESUMED:
             return [self._envelope("pipeline_resumed", "pipeline", "working", _event_data(data), created_at=created_at)]
+        if event.type == PipelineEventType.PIPELINE_WARNING:
+            return [
+                self._envelope(
+                    "pipeline_warning",
+                    "pipeline",
+                    "working",
+                    _warning_event_data(data),
+                    created_at=created_at,
+                )
+            ]
         if event.type == PipelineEventType.PIPELINE_COMPLETED:
             event_type = "pipeline_failed" if data.get("failed") is True else "pipeline_completed"
             status = "failed" if event_type == "pipeline_failed" else "completed"
@@ -541,7 +564,7 @@ def _translate_sub_pipeline_stream_event(self, event: SubPipelineStreamEvent) ->
         return envelopes
 
     def _translate_text_delta_event(self, event: TextDeltaEvent) -> dict[str, Any]:
-        return self._envelope("text_delta", "pipeline", "working", {"text": event.text})
+        return self._translate_parent_scoped_display_event("text_delta", {"text": event.text})
 
     def _translate_ask_user_question_event(self, event: AskUserQuestionEvent) -> dict[str, Any]:
         envelope = self._translate_parent_scoped_display_event("input_required", _ask_user_question_data(event))
@@ -550,7 +573,7 @@ def _translate_ask_user_question_event(self, event: AskUserQuestionEvent) -> dic
         return envelope
 
     def _translate_permission_request_event(self, event: PermissionRequestEvent) -> dict[str, Any]:
-        envelope = self._envelope("permission_requested", "pipeline", "working", _permission_request_data(event))
+        envelope = self._translate_parent_scoped_display_event("permission_requested", _permission_request_data(event))
         envelope["permission"] = _permission_request_metadata(event)
         return envelope
 
@@ -586,7 +609,7 @@ def _translate_tool_result_event(self, event: ToolResultEvent) -> list[dict[str,
         stack_envelope = self._translate_stack_current_changed_event(event)
         if stack_envelope is not None:
             envelopes.append(stack_envelope)
-        envelopes.append(self._envelope("tool_result", "pipeline", "working", _tool_result_data(event)))
+        envelopes.append(self._translate_parent_scoped_display_event("tool_result", _tool_result_data(event)))
         return envelopes
 
     def _remember_tool_input(self, event: ToolUseEndEvent) -> None:
@@ -662,6 +685,11 @@ def _stack_current_changed_data(self, event: ToolResultEvent) -> dict[str, Any]
         if stack_id is None:
             return None
 
+        stack_status = _first_string_from_sources((result,), ("StackStatus", "stackStatus", "status"))
+        is_delete_complete = action in _STACK_CLEAR_ACTIONS and is_success and stack_status == "DELETE_COMPLETE"
+        if action in _STACK_CLEAR_ACTIONS and is_success and stack_status is None:
+            stack_status = "DELETE_REQUESTED"
+
         data: dict[str, Any] = {
             "toolName": event.tool_name,
             "toolUseId": event.tool_use_id,
@@ -670,11 +698,11 @@ def _stack_current_changed_data(self, event: ToolResultEvent) -> dict[str, Any]
             "regionId": operation["regionId"],
             "stackId": stack_id,
             "stackName": _first_string_from_sources((result, params), ("StackName", "stackName", "stack_name", "name")),
-            "stackStatus": _first_string_from_sources((result,), ("StackStatus", "stackStatus", "status")),
+            "stackStatus": stack_status,
             "isSuccess": is_success,
-            "current": False if action in _STACK_CLEAR_ACTIONS and is_success else True,
+            "current": False if is_delete_complete else True,
         }
-        if action in _STACK_CLEAR_ACTIONS and is_success:
+        if is_delete_complete:
             data["cleared"] = True
         return {key: value for key, value in data.items() if value is not None}
 
@@ -944,6 +972,11 @@ def _event_data(data: dict[str, Any]) -> dict[str, Any]:
     }
 
 
+def _warning_event_data(data: dict[str, Any]) -> dict[str, Any]:
+    private_keys = {"ledger_path", "ledgerPath", "load_error", "loadError"}  # removed before _event_data runs
+    return _event_data({key: value for key, value in data.items() if str(key) not in private_keys})
+
+
 def _sanitize_event_value(key: str, value: Any) -> Any:
     key_lower = key.lower()
     if isinstance(value, str):
diff --git a/src/iac_code/a2a/pipeline_executor.py b/src/iac_code/a2a/pipeline_executor.py
index 02665789..eef50b42 100644
--- a/src/iac_code/a2a/pipeline_executor.py
+++ b/src/iac_code/a2a/pipeline_executor.py
@@ -10,6 +10,7 @@
 
 import httpx
 from a2a.types import Message, Role, TaskState, TaskStatus, TaskStatusUpdateEvent
+from a2a.utils.errors import InvalidParamsError
 
 from iac_code.a2a.events import make_text_part
 from iac_code.a2a.pipeline_events import PipelineA2AContext, PipelineEventTranslator
@@ -30,15 +31,20 @@
 )
 from iac_code.agent.message import Message as AgentMessage
 from iac_code.i18n import _
-from iac_code.pipeline import create_pipeline
+from iac_code.pipeline import create_pipeline, discover_pipelines
 from iac_code.pipeline.config import get_pipeline_name
+from iac_code.pipeline.engine.cleanup import CleanupLedger
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
-from iac_code.pipeline.engine.handoff import terminal_outcome_from_completed_event
+from iac_code.pipeline.engine.handoff import build_handoff_summary, terminal_outcome_from_completed_event
+from iac_code.pipeline.engine.loader import load_pipeline_dir
 from iac_code.pipeline.engine.public_errors import public_error
+from iac_code.pipeline.engine.session import PipelineSession
+from iac_code.pipeline.engine.user_input import PipelineUserInput, normalize_pipeline_user_input
 from iac_code.services.agent_factory import AgentFactoryOptions, create_agent_runtime
 from iac_code.services.session_storage import SessionStorage
 from iac_code.services.telemetry import use_session_id
 from iac_code.types.stream_events import AskUserQuestionEvent, SubPipelineStreamEvent
+from iac_code.utils.public_errors import sanitize_public_text
 
 logger = logging.getLogger(__name__)
 _CONTEXT_LOCK_ACQUIRE_TIMEOUT_SECONDS = 1
@@ -69,6 +75,27 @@ def _auth_error_text() -> str:
     return _("Authentication required. Configure credentials and retry.")
 
 
+class RecoverablePipelineInvalidParamsError(InvalidParamsError):
+    code = -32602  # JSON-RPC 2.0 "Invalid params" error code
+    jsonrpc_error_data_passthrough = True  # attribute the JSON-RPC passthrough patches look for
+
+
+def _active_sidecar_mismatch_error(
+    *,
+    recoverable_task_id: str,
+    context_id: str,
+    sidecar_status: str,
+) -> RecoverablePipelineInvalidParamsError:
+    return RecoverablePipelineInvalidParamsError(  # built and returned; raising is left to the caller
+        _("Pipeline already running. Resume task {task_id}.").format(task_id=recoverable_task_id),
+        data={  # structured details carried in the error's data
+            "recoverableTaskId": recoverable_task_id,
+            "contextId": context_id,
+            "sidecarStatus": sidecar_status,
+        },
+    )
+
+
 @dataclass
 class A2APipelineRuntime:
     agent_runtime: Any
@@ -156,8 +183,13 @@ async def execute(
         task_id: str,
         context_id: str,
         cwd: str,
-        prompt: str,
+        pipeline_input: PipelineUserInput | str | None = None,
+        prompt: str | None = None,
     ) -> None:
+        if pipeline_input is None:
+            pipeline_input = prompt or ""
+        pipeline_input = normalize_pipeline_user_input(pipeline_input)
+        prompt = pipeline_input.display_text
         session_storage = SessionStorage()
 
         def runtime_factory(session_id: str) -> Any:
@@ -192,7 +224,7 @@ def runtime_factory(session_id: str) -> Any:
                     task_id=task_id,
                     context_id=context_id,
                     cwd=cwd,
-                    prompt=prompt,
+                    pipeline_input=pipeline_input,
                     preserve_task_record=preserve_active_task,
                 )
                 if routed:
@@ -215,11 +247,7 @@ def runtime_factory(session_id: str) -> Any:
 
         try:
             owner_task = asyncio.current_task()
-            ctx.active_task_id = task.task_id
-            task.active_task = owner_task
-            task.state = TASK_STATE_WORKING
-            self._task_store.mirror_task(task)
-            self._task_store.mirror_context(ctx)
+            task_persistence_started = False
 
             pipeline = None
             publisher: PipelineA2AEventPublisher | None = None
@@ -267,6 +295,7 @@ def fresh_pipeline_factory() -> Any:
                 selected = self._select_stream(
                     pipeline,
                     prompt,
+                    pipeline_input=pipeline_input,
                     publisher=publisher,
                     task_id=task_id,
                     context_id=context_id,
@@ -277,6 +306,12 @@ def fresh_pipeline_factory() -> Any:
                     pipeline_runtime.pipeline = pipeline
                     self._task_store.mirror_context(ctx)
                 stream = selected.stream
+                ctx.active_task_id = task.task_id
+                task.active_task = owner_task
+                task.state = TASK_STATE_WORKING
+                task_persistence_started = True
+                self._task_store.mirror_task(task)
+                self._task_store.mirror_context(ctx)
                 stream_had_events = False
                 with use_session_id(ctx.session_id):
                     while True:
@@ -291,7 +326,7 @@ def fresh_pipeline_factory() -> Any:
                         if not stream_result.restart_requested:
                             break
 
-                        stream = self._continue_after_interrupt_stream(pipeline, prompt)
+                        stream = self._continue_after_interrupt_stream(pipeline, pipeline_input)
 
                 terminal_status_published = False
                 terminal_sidecar = _is_terminal_sidecar_status(getattr(pipeline, "sidecar_status", None))
@@ -352,7 +387,10 @@ def fresh_pipeline_factory() -> Any:
                 )
                 await self._notify_terminal_task(task_id=task.task_id, context_id=task.context_id, state=task.state)
                 self._record_state(task.state)
+            except RecoverablePipelineInvalidParamsError:
+                raise
             except Exception as exc:
+                task_persistence_started = True
                 await self._publish_exception_status(
                     event_queue,
                     task=task,
@@ -367,8 +405,9 @@ def fresh_pipeline_factory() -> Any:
                     if ctx.active_task_id == task.task_id:
                         ctx.active_task_id = None
                 ctx.touch()
-                task.touch()
-                self._task_store.mirror_task(task)
+                if task_persistence_started:
+                    task.touch()
+                    self._task_store.mirror_task(task)
                 self._task_store.mirror_context(ctx)
                 await _flush_telemetry_safely()
         finally:
@@ -392,15 +431,29 @@ async def _route_active_pipeline_interrupt(
         task_id: str,
         context_id: str,
         cwd: str,
-        prompt: str,
+        pipeline_input: PipelineUserInput,
         preserve_task_record: bool,
     ) -> bool:
+        pipeline_input = normalize_pipeline_user_input(pipeline_input)
+        prompt = pipeline_input.display_text
         runtime = ctx.runtime
         pipeline = getattr(runtime, "pipeline", None)
         if pipeline is None:
             return False
 
-        pending_question_route = await self._route_pending_question_answer(runtime, prompt)
+        try:
+            pending_question_route = await self._route_pending_question_answer(runtime, pipeline_input)
+        except Exception as exc:
+            await self._publish_exception_status(
+                event_queue,
+                task=task,
+                task_id=task_id,
+                context_id=context_id,
+                exc=exc,
+                preserve_task_record=preserve_task_record,
+                pipeline_publisher=getattr(runtime, "publisher", None),
+            )
+            return True
         if pending_question_route == _PENDING_QUESTION_ANSWERED:
             task.state = TASK_STATE_WORKING
             self._task_store.mirror_task(task)
@@ -442,7 +495,7 @@ async def _route_active_pipeline_interrupt(
                 task_id=task_id,
                 context_id=context_id,
                 session_id=ctx.session_id,
-                prompt=prompt,
+                pipeline_input=pipeline_input,
                 preserve_task_record=preserve_task_record,
             )
             return True
@@ -465,12 +518,21 @@ async def _route_active_pipeline_interrupt(
                 await _maybe_await(pause_agent_loops())
                 paused = True
 
-            verdict = await _maybe_await(handler(prompt))
+            runner_input = _pipeline_runner_input(pipeline_input)
+            verdict = await _maybe_await(handler(runner_input))
             parent_rollback: bool | None = None
             if getattr(verdict, "action", "") == "hard_interrupt":
                 apply_hard_interrupt = getattr(pipeline, "apply_hard_interrupt", None)
                 if callable(apply_hard_interrupt):
-                    parent_rollback = bool(await _maybe_await(apply_hard_interrupt(verdict)))
+                    parameters = inspect.signature(apply_hard_interrupt).parameters
+                    if pipeline_input.has_images and (
+                        "source_input" in parameters
+                        or any(parameter.kind == inspect.Parameter.VAR_KEYWORD for parameter in parameters.values())
+                    ):
+                        applied = apply_hard_interrupt(verdict, source_input=runner_input)
+                    else:
+                        applied = apply_hard_interrupt(verdict)
+                    parent_rollback = bool(await _maybe_await(applied))
                     if parent_rollback:
                         runtime.restart_after_interrupt = True
                         _restart_requested_event(runtime).set()
@@ -537,9 +599,11 @@ async def _continue_active_pause_confirmation(
         task_id: str,
         context_id: str,
         session_id: str,
-        prompt: str,
+        pipeline_input: PipelineUserInput,
         preserve_task_record: bool,
     ) -> None:
+        pipeline_input = normalize_pipeline_user_input(pipeline_input)
+        prompt = pipeline_input.display_text
         owner_task = asyncio.current_task()
         task.active_task = owner_task
         ctx.active_task_id = task_id
@@ -552,7 +616,10 @@ async def _continue_active_pause_confirmation(
         self._task_store.mirror_task(task)
         self._task_store.mirror_context(ctx)
         try:
-            stream = pipeline.continue_from_sidecar(user_input=prompt) if prompt else pipeline.continue_from_sidecar()
+            if prompt:
+                stream = pipeline.continue_from_sidecar(user_input=_pipeline_runner_input(pipeline_input))
+            else:
+                stream = pipeline.continue_from_sidecar()
             task.state = TASK_STATE_WORKING
             self._task_store.mirror_task(task)
             with use_session_id(session_id):
@@ -565,7 +632,7 @@ async def _continue_active_pause_confirmation(
                     )
                     if not stream_result.restart_requested:
                         break
-                    stream = self._continue_after_interrupt_stream(pipeline, prompt)
+                    stream = self._continue_after_interrupt_stream(pipeline, pipeline_input)
 
             snapshot = publisher.snapshot_store.load() or {}
             task.state = _task_state_from_pipeline(pipeline, snapshot)
@@ -609,6 +676,7 @@ def _create_pipeline(
             session_id=session_id,
             cwd=cwd,
             resume_from_sidecar=resume_from_sidecar,
+            surface="a2a",
         )
 
     def _set_pipeline_telemetry_correlation(self, pipeline: Any, *, task_id: str, context_id: str) -> None:
@@ -620,11 +688,11 @@ def _set_pipeline_telemetry_correlation(self, pipeline: Any, *, task_id: str, co
         except Exception:
             logger.warning("A2A pipeline telemetry correlation setup failed", exc_info=True)
 
-    def _continue_after_interrupt_stream(self, pipeline: Any, prompt: str) -> AsyncIterator[Any]:
+    def _continue_after_interrupt_stream(self, pipeline: Any, pipeline_input: PipelineUserInput) -> AsyncIterator[Any]:
         continue_after_interrupt = getattr(pipeline, "continue_after_interrupt", None)
         if callable(continue_after_interrupt):
             return continue_after_interrupt()
-        return pipeline.run(prompt)
+        return pipeline.run(_pipeline_runner_input(pipeline_input))
 
     async def _consume_stream_until_restart(
         self,
@@ -757,6 +825,7 @@ def _select_stream(
         pipeline: Any,
         prompt: str,
         *,
+        pipeline_input: PipelineUserInput,
         publisher: PipelineA2AEventPublisher,
         task_id: str,
         context_id: str,
@@ -766,8 +835,11 @@ def _select_stream(
         if status == "waiting_input":
             _raise_if_sidecar_restore_failed(pipeline, status)
             if not _sidecar_matches_task(publisher, task_id=task_id, context_id=context_id, sidecar_status=status):
-                pipeline = self._fresh_pipeline_after_sidecar_mismatch(pipeline, fresh_pipeline_factory)
-                return _SelectedPipelineStream(pipeline=pipeline, stream=pipeline.run(prompt))
+                raise _active_sidecar_mismatch_error_from_publisher(
+                    publisher,
+                    context_id=context_id,
+                    sidecar_status=status,
+                )
             pending_ask = _pending_ask_input_from_sidecar(
                 publisher,
                 task_id=task_id,
@@ -781,6 +853,7 @@ def _select_stream(
                         publisher=publisher,
                         pending_input=pending_ask,
                         prompt=prompt,
+                        pipeline_input=pipeline_input,
                     ),
                 )
             pending_pause = _pending_pipeline_pause_input_from_sidecar(
@@ -790,15 +863,23 @@ def _select_stream(
             )
             if pending_pause is not None:
                 stream = (
-                    pipeline.continue_from_sidecar(user_input=prompt) if prompt else pipeline.continue_from_sidecar()
+                    pipeline.continue_from_sidecar(user_input=_pipeline_runner_input(pipeline_input))
+                    if prompt
+                    else pipeline.continue_from_sidecar()
                 )
                 return _SelectedPipelineStream(pipeline=pipeline, stream=stream)
-            return _SelectedPipelineStream(pipeline=pipeline, stream=pipeline.resume(prompt))
+            return _SelectedPipelineStream(
+                pipeline=pipeline,
+                stream=pipeline.resume(_pipeline_runner_input(pipeline_input)),
+            )
         if status == "running":
             _raise_if_sidecar_restore_failed(pipeline, status)
             if not _sidecar_matches_task(publisher, task_id=task_id, context_id=context_id, sidecar_status=status):
-                pipeline = self._fresh_pipeline_after_sidecar_mismatch(pipeline, fresh_pipeline_factory)
-                return _SelectedPipelineStream(pipeline=pipeline, stream=pipeline.run(prompt))
+                raise _active_sidecar_mismatch_error_from_publisher(
+                    publisher,
+                    context_id=context_id,
+                    sidecar_status=status,
+                )
             pending_ask = _pending_ask_input_from_sidecar(
                 publisher,
                 task_id=task_id,
@@ -812,6 +893,7 @@ def _select_stream(
                         publisher=publisher,
                         pending_input=pending_ask,
                         prompt=prompt,
+                        pipeline_input=pipeline_input,
                     ),
                 )
             pending_pause = _pending_pipeline_pause_input_from_sidecar(
@@ -821,20 +903,29 @@ def _select_stream(
             )
             if pending_pause is not None:
                 stream = (
-                    pipeline.continue_from_sidecar(user_input=prompt) if prompt else pipeline.continue_from_sidecar()
+                    pipeline.continue_from_sidecar(user_input=_pipeline_runner_input(pipeline_input))
+                    if prompt
+                    else pipeline.continue_from_sidecar()
                 )
                 return _SelectedPipelineStream(pipeline=pipeline, stream=stream)
             if prompt:
                 return _SelectedPipelineStream(
-                    pipeline=pipeline, stream=pipeline.continue_from_sidecar(user_input=prompt)
+                    pipeline=pipeline,
+                    stream=pipeline.continue_from_sidecar(user_input=_pipeline_runner_input(pipeline_input)),
                 )
             return _SelectedPipelineStream(pipeline=pipeline, stream=pipeline.continue_from_sidecar())
         if status in _TERMINAL_SIDECAR_STATUSES:
             if _terminal_sidecar_matches_task(publisher, status, task_id=task_id, context_id=context_id):
                 return _SelectedPipelineStream(pipeline=pipeline, stream=_empty_stream())
             pipeline = self._fresh_pipeline_after_sidecar_mismatch(pipeline, fresh_pipeline_factory)
-            return _SelectedPipelineStream(pipeline=pipeline, stream=pipeline.run(prompt))
-        return _SelectedPipelineStream(pipeline=pipeline, stream=pipeline.run(prompt))
+            return _SelectedPipelineStream(
+                pipeline=pipeline,
+                stream=pipeline.run(_pipeline_runner_input(pipeline_input)),
+            )
+        return _SelectedPipelineStream(
+            pipeline=pipeline,
+            stream=pipeline.run(_pipeline_runner_input(pipeline_input)),
+        )
 
     def _fresh_pipeline_after_sidecar_mismatch(
         self,
@@ -956,16 +1047,21 @@ async def _publish_normal_handoff_ready(
             logger.warning("Failed to build A2A pipeline normal handoff event", exc_info=True)
             return
 
+        data = {
+            "action": "switch_to_normal",
+            "targetMode": "normal",
+            "outcome": outcome,
+            "summary": summary,
+        }
+        cleanup = _pipeline_cleanup_handoff_data(pipeline)
+        if cleanup is not None:
+            data["cleanup"] = cleanup
+
         published = await publisher.publish_manual(
             "pipeline_handoff_ready",
             "pipeline",
             status=_handoff_status_from_outcome(outcome),
-            data={
-                "action": "switch_to_normal",
-                "targetMode": "normal",
-                "outcome": outcome,
-                "summary": summary,
-            },
+            data=data,
         )
         if published is not None:
             _persist_normal_handoff_summary(pipeline, summary)
@@ -986,7 +1082,9 @@ def _track_pending_question(
             return
         runtime.pending_question = _PendingAskUserQuestion(event=question, envelope=dict(envelope))
 
-    async def _route_pending_question_answer(self, runtime: Any, prompt: str) -> str:
+    async def _route_pending_question_answer(self, runtime: Any, pipeline_input: PipelineUserInput) -> str:
+        pipeline_input = normalize_pipeline_user_input(pipeline_input)
+        prompt = pipeline_input.display_text
         pending = getattr(runtime, "pending_question", None)
         if not isinstance(pending, _PendingAskUserQuestion):
             return _PENDING_QUESTION_NOT_ROUTED
@@ -998,11 +1096,12 @@ async def _route_pending_question_answer(self, runtime: Any, prompt: str) -> str
             return _PENDING_QUESTION_STALE_FINISHED
 
         publisher = getattr(runtime, "publisher", None)
-        if not isinstance(publisher, PipelineA2AEventPublisher):
+        publish_manual = getattr(publisher, "publish_manual", None)
+        if not callable(publish_manual):
             return _PENDING_QUESTION_NOT_ROUTED
 
         answer = _ask_user_question_answer_from_prompt(question, prompt)
-        published = await publisher.publish_manual(
+        published = await publish_manual(
             "input_received",
             str(pending.envelope.get("scope") or "pipeline"),
             status="working",
@@ -1020,10 +1119,56 @@ async def _route_pending_question_answer(self, runtime: Any, prompt: str) -> str
         if published is None:
             return _PENDING_QUESTION_NOT_ROUTED
 
+        if pipeline_input.has_images:
+            inject_pending_question_supplement = getattr(
+                getattr(runtime, "pipeline", None),
+                "inject_pending_question_supplement",
+                None,
+            )
+            if callable(inject_pending_question_supplement):
+                try:
+                    injected = inject_pending_question_supplement(pipeline_input.content, envelope=pending.envelope)
+                    if inspect.isawaitable(injected):
+                        injected = await injected
+                except Exception:
+                    await self._restore_pending_question_input_required(runtime, pending)
+                    raise
+                if injected is False:
+                    await self._restore_pending_question_input_required(runtime, pending)
+                    raise RuntimeError("A2A ask_user_question image supplement could not be delivered.")
+            else:
+                await self._restore_pending_question_input_required(runtime, pending)
+                raise RuntimeError("A2A pipeline cannot accept ask_user_question image supplement.")
         future.set_result(answer)
         runtime.pending_question = None
         return _PENDING_QUESTION_ANSWERED
 
+    async def _restore_pending_question_input_required(self, runtime: Any, pending: "_PendingAskUserQuestion") -> None:
+        publisher = getattr(runtime, "publisher", None)
+        publish_manual = getattr(publisher, "publish_manual", None)
+        if not callable(publish_manual):
+            return
+        question = pending.event
+        envelope = pending.envelope if isinstance(pending.envelope, dict) else {}
+        data = {
+            "kind": "ask_user_question",
+            "inputId": _pending_input_id(envelope, question),
+            "toolUseId": question.tool_use_id,
+            "question": question.question,
+            "prompt": question.question,
+            "options": question.options if isinstance(question.options, list) else [],
+            "allowFreeText": question.allow_free_text,
+            "freeTextPrompt": question.free_text_prompt,
+            "required": True,
+        }
+        await publish_manual(
+            "input_required",
+            str(envelope.get("scope") or "pipeline"),
+            status="input_required",
+            data=data,
+            coordinates=_coordinates_from_envelope(envelope),
+        )
+
     async def _fail_already_active(
         self,
         event_queue: Any,
@@ -1143,13 +1288,19 @@ async def _empty_stream() -> AsyncIterator[Any]:
         yield None
 
 
+def _pipeline_runner_input(pipeline_input: PipelineUserInput) -> PipelineUserInput | str:
+    return pipeline_input if pipeline_input.has_images else pipeline_input.display_text
+
+
 async def _resume_pending_ask_user_question_stream(
     *,
     pipeline: Any,
     publisher: PipelineA2AEventPublisher,
     pending_input: dict[str, Any],
     prompt: str,
+    pipeline_input: PipelineUserInput,
 ) -> AsyncIterator[Any]:
+    pipeline_input = normalize_pipeline_user_input(pipeline_input)
     resume_ask_user_question = getattr(pipeline, "resume_ask_user_question", None)
     if not callable(resume_ask_user_question):
         raise RuntimeError("Pipeline cannot resume pending ask_user_question input.")
@@ -1180,6 +1331,8 @@ async def _resume_pending_ask_user_question_stream(
 
     parameters = inspect.signature(resume_ask_user_question).parameters
     resume_kwargs: dict[str, Any] = {"tool_use_id": tool_use_id}
+    if pipeline_input.has_images:
+        resume_kwargs["supplemental_input"] = pipeline_input
     if "pending_input" in parameters or any(
         parameter.kind == inspect.Parameter.VAR_KEYWORD for parameter in parameters.values()
     ):
@@ -1382,8 +1535,23 @@ def cancel_waiting_input_task_from_sidecar(
     )
     if int(envelope.get("sequence") or 0) <= high_water_sequence:
         envelope["sequence"] = high_water_sequence + 1
+    handoff_envelope = _waiting_input_cancel_handoff_event(
+        translator,
+        snapshot=snapshot,
+        cwd=cwd,
+        session_id=session_id,
+        pipeline_name=pipeline_name,
+        reason=reason,
+    )
+    if handoff_envelope is not None and int(handoff_envelope.get("sequence") or 0) <= int(
+        envelope.get("sequence") or 0
+    ):
+        handoff_envelope["sequence"] = int(envelope.get("sequence") or 0) + 1
     try:
-        journal.append(envelope)
+        events_to_append = [envelope]
+        if handoff_envelope is not None:
+            events_to_append.append(handoff_envelope)
+        journal.append_many(events_to_append, durable=True)
         snapshot_store.save(reduce_pipeline_events(journal.read_all_repairing_tail()))
     except Exception:
         logger.warning("Failed to persist waiting A2A pipeline cancellation", exc_info=True)
@@ -1391,6 +1559,106 @@ def cancel_waiting_input_task_from_sidecar(
     return True
 
 
+def _waiting_input_cancel_handoff_event(
+    translator: PipelineEventTranslator,
+    *,
+    snapshot: dict[str, Any] | None,
+    cwd: str,
+    session_id: str,
+    pipeline_name: str,
+    reason: str,
+) -> dict[str, Any] | None:
+    loaded_pipeline = _load_pipeline_definition_for_handoff(pipeline_name)
+    if loaded_pipeline is None:
+        return None
+    policy = getattr(loaded_pipeline, "on_complete", None)
+    if policy is None or policy.action != "switch_to_normal" or "canceled" not in policy.apply_on:
+        return None
+
+    include_fields = getattr(policy.handoff_context, "include", [])
+    context_snapshot = _flat_pipeline_context_from_sidecar(cwd=cwd, session_id=session_id)
+    if not context_snapshot:
+        context_snapshot = _flat_pipeline_context_from_a2a_snapshot(snapshot, loaded_pipeline)
+    summary = build_handoff_summary(
+        pipeline_name=pipeline_name,
+        outcome="canceled",
+        context_snapshot=context_snapshot,
+        include_fields=include_fields,
+    )
+    data: dict[str, Any] = {
+        "action": "switch_to_normal",
+        "targetMode": "normal",
+        "outcome": "canceled",
+        "summary": summary,
+        "reason": reason,
+    }
+    cleanup = _pipeline_cleanup_handoff_data_from_session(cwd=cwd, session_id=session_id, public_snapshot=snapshot)
+    if cleanup is not None:
+        data["cleanup"] = cleanup
+    return translator.manual_event(
+        "pipeline_handoff_ready",
+        "pipeline",
+        status="canceled",
+        data=data,
+    )
+
+
+def _load_pipeline_definition_for_handoff(pipeline_name: str) -> Any | None:
+    try:
+        pipeline_dir = discover_pipelines().get(pipeline_name)
+        if pipeline_dir is None:
+            return None
+        return load_pipeline_dir(pipeline_dir)
+    except Exception:
+        logger.warning("Failed to load A2A pipeline handoff policy for %s", pipeline_name, exc_info=True)
+        return None
+
+
+def _flat_pipeline_context_from_sidecar(*, cwd: str, session_id: str) -> dict[str, Any]:
+    try:
+        restored = PipelineSession(SessionStorage().session_dir(cwd, session_id) / "pipeline").restore_sync()
+    except Exception:
+        logger.warning("Failed to load pipeline context for A2A cancel handoff", exc_info=True)
+        return {}
+    if not isinstance(restored, dict):
+        return {}
+    context_snapshot = restored.get("context_snapshot")
+    if not isinstance(context_snapshot, dict):
+        return {}
+    return _flatten_pipeline_context_snapshot(context_snapshot)
+
+
+def _flat_pipeline_context_from_a2a_snapshot(snapshot: dict[str, Any] | None, loaded_pipeline: Any) -> dict[str, Any]:
+    if not isinstance(snapshot, dict):
+        return {}
+    field_by_step_id = {
+        str(getattr(step, "step_id")): str(getattr(step, "conclusion_field"))
+        for step in getattr(loaded_pipeline, "steps", [])
+        if getattr(step, "step_id", None) and getattr(step, "conclusion_field", None)
+    }
+    context: dict[str, Any] = {}
+    for step in snapshot.get("steps", []) if isinstance(snapshot.get("steps"), list) else []:
+        if not isinstance(step, dict):
+            continue
+        field_name = field_by_step_id.get(str(step.get("id") or ""))
+        if not field_name:
+            continue
+        conclusion = step.get("conclusion")
+        if conclusion is not None:
+            context[field_name] = conclusion
+    return context
+
+
+def _flatten_pipeline_context_snapshot(snapshot: dict[str, Any]) -> dict[str, Any]:
+    flattened: dict[str, Any] = {}
+    for field_name, field_value in snapshot.items():
+        if isinstance(field_value, dict) and "value" in field_value:
+            value = field_value.get("value")
+            if value is not None:
+                flattened[field_name] = value
+    return flattened
+
+
 def terminal_task_state_from_sidecar(*, cwd: str, session_id: str, context_id: str, task_id: str) -> str | None:
     pipeline_dir = existing_a2a_pipeline_dir_for_session(cwd=cwd, session_id=session_id)
     journal = A2APipelineJournal(pipeline_dir)
@@ -1501,6 +1769,109 @@ def _persist_normal_handoff_summary(pipeline: Any, summary: str) -> None:
         logger.warning("Failed to persist A2A pipeline normal handoff summary", exc_info=True)
 
 
+def _pipeline_cleanup_handoff_data(pipeline: Any) -> dict[str, Any] | None:
+    cleanup_ledger = getattr(pipeline, "cleanup_ledger", None)
+    if not callable(cleanup_ledger):
+        return None
+    try:
+        ledger = cleanup_ledger()
+    except Exception:
+        logger.warning("Failed to build A2A pipeline cleanup handoff data", exc_info=True)
+        return None
+    return _pipeline_cleanup_handoff_data_from_ledger(ledger)
+
+
+def _pipeline_cleanup_handoff_data_from_session(
+    *,
+    cwd: str,
+    session_id: str,
+    public_snapshot: dict[str, Any] | None = None,
+) -> dict[str, Any] | None:
+    try:
+        ledger_path = SessionStorage().session_dir(cwd, session_id) / "pipeline" / "cleanup.yaml"
+    except Exception:
+        logger.warning("Failed to locate A2A pipeline cleanup ledger for handoff", exc_info=True)
+        return None
+    if not ledger_path.exists():
+        snapshot_cleanup = public_snapshot.get("cleanup") if isinstance(public_snapshot, dict) else None
+        if _public_cleanup_snapshot_has_pending_evidence(snapshot_cleanup):
+            return _cleanup_state_unavailable_payload()
+        return None
+    return _pipeline_cleanup_handoff_data_from_ledger(CleanupLedger(ledger_path))
+
+
+def _pipeline_cleanup_handoff_data_from_ledger(ledger: Any) -> dict[str, Any] | None:
+    try:
+        ledger_path = getattr(ledger, "path", None)
+        if ledger_path is not None and not Path(ledger_path).exists():
+            return _cleanup_state_unavailable_payload()
+        load_failed = getattr(ledger, "load_failed", None)
+        if callable(load_failed) and load_failed():
+            return _cleanup_state_unavailable_payload()
+        build_pending_prompt = getattr(ledger, "build_pending_prompt", None)
+        if not callable(build_pending_prompt):
+            return None
+        prompt = build_pending_prompt()
+    except Exception:
+        logger.warning("Failed to build A2A pipeline cleanup handoff data", exc_info=True)
+        return _cleanup_state_unavailable_payload()
+    if prompt is None:
+        return None
+
+    resources = list(getattr(prompt, "resources", []) or [])
+    if not resources:
+        return None
+    return {
+        "status": "pending",
+        "resourceCount": len(resources),
+        "statusMessage": str(getattr(prompt, "status_message", "") or ""),
+        "resources": [_cleanup_resource_handoff_data(resource) for resource in resources],
+    }
+
+
+def _cleanup_state_unavailable_payload() -> dict[str, Any]:
+    return {
+        "status": "unavailable",
+        "statusMessage": _("Cleanup state unavailable. Inspect the session file and cloud resources manually."),
+    }
+
+
+def _public_cleanup_snapshot_has_pending_evidence(cleanup: Any) -> bool:
+    if not isinstance(cleanup, dict):
+        return False
+    resources = cleanup.get("resources")
+    if isinstance(resources, list) and len(resources) > 0:
+        return True
+    resource_count = cleanup.get("resourceCount")
+    if isinstance(resource_count, int) and resource_count > 0:
+        return True
+    status = cleanup.get("status")
+    if isinstance(status, str) and status in {"pending", "started", "in_progress", "failed", "unavailable"}:
+        return True
+    return False
+
+
+def _cleanup_resource_handoff_data(resource: Any) -> dict[str, Any]:
+    return {
+        "provider": str(getattr(resource, "provider", "") or ""),
+        "resourceType": str(getattr(resource, "resource_type", "") or ""),
+        "resourceId": str(getattr(resource, "resource_id", "") or ""),
+        "resourceName": str(getattr(resource, "resource_name", "") or ""),
+        "regionId": str(getattr(resource, "region_id", "") or ""),
+        "sourceStepId": str(getattr(resource, "source_step_id", "") or ""),
+        "cleanupStatus": str(getattr(resource, "cleanup_status", "") or ""),
+        "progressStatus": getattr(resource, "progress_status", None),
+        "lastError": _public_cleanup_error(getattr(resource, "last_error", None)),
+    }
+
+
+def _public_cleanup_error(value: Any) -> str | None:
+    if not value:
+        return None
+    text = sanitize_public_text(value)
+    return text[:1000] + "..." if len(text) > 1000 else text
+
+
 async def _maybe_await(value: Any) -> Any:
     if inspect.isawaitable(value):
         return await value
@@ -1727,6 +2098,22 @@ def _sidecar_matches_task(
     return False
 
 
+def _active_sidecar_mismatch_error_from_publisher(
+    publisher: PipelineA2AEventPublisher,
+    *,
+    context_id: str,
+    sidecar_status: str,
+) -> RecoverablePipelineInvalidParamsError:
+    owner = _current_sidecar_owner(publisher, context_id=context_id)
+    recoverable_task_id = owner.task_id if owner is not None and owner.task_id else "unknown"
+    recoverable_context_id = owner.context_id if owner is not None and owner.context_id else context_id
+    return _active_sidecar_mismatch_error(
+        recoverable_task_id=recoverable_task_id,
+        context_id=recoverable_context_id,
+        sidecar_status=sidecar_status,
+    )
+
+
 def _current_sidecar_owner(publisher: PipelineA2AEventPublisher, *, context_id: str) -> _TaskContextOwner | None:
     return _current_sidecar_owner_from_stores(
         snapshot_store=publisher.snapshot_store,
diff --git a/src/iac_code/a2a/pipeline_journal.py b/src/iac_code/a2a/pipeline_journal.py
index 2a2586bf..201bc915 100644
--- a/src/iac_code/a2a/pipeline_journal.py
+++ b/src/iac_code/a2a/pipeline_journal.py
@@ -8,7 +8,11 @@
 from pathlib import Path
 from typing import Any
 
+from iac_code.utils.state_io import fsync_parent_dir
+
 logger = logging.getLogger(__name__)
+_EVENT_GROUP_RECORD_TYPE = "event_group"
+_EVENT_GROUP_RECORD_KEY = "__iac_code_record_type"
 
 
 class A2APipelineJournalReadError(ValueError):
@@ -20,8 +24,9 @@ def __init__(self, pipeline_dir: str | Path) -> None:
         self.pipeline_dir = Path(pipeline_dir)
         self.path = self.pipeline_dir / "a2a-events.jsonl"
 
-    def append(self, event: dict[str, Any]) -> None:
+    def append(self, event: dict[str, Any], durable: bool = False) -> None:
         self.pipeline_dir.mkdir(parents=True, exist_ok=True)
+        created = not self.path.exists()
         safe_event = to_json_safe(event)
         try:
             line = json.dumps(safe_event, ensure_ascii=False, separators=(",", ":"), allow_nan=False)
@@ -31,6 +36,37 @@ def append(self, event: dict[str, Any]) -> None:
         with self.path.open("a", encoding="utf-8") as handle:
             handle.write(line + "\n")
             handle.flush()
+            if durable:
+                os.fsync(handle.fileno())
+        if durable and created:
+            fsync_parent_dir(self.path)
+
+    def append_many(self, events: list[dict[str, Any]], durable: bool = False) -> None:
+        """Append ``events`` as a single ``event_group`` journal line; an empty list is a no-op."""
+        if not events:
+            return
+        self.pipeline_dir.mkdir(parents=True, exist_ok=True)
+        is_new_file = not self.path.exists()
+        grouped = []
+        for raw_event in events:
+            converted = to_json_safe(raw_event)
+            if not isinstance(converted, dict):
+                raise TypeError("A2A journal group events must be JSON objects")
+            grouped.append(converted)
+        payload = {
+            _EVENT_GROUP_RECORD_KEY: _EVENT_GROUP_RECORD_TYPE,
+            "schemaVersion": "1.0",
+            "groupId": uuid.uuid4().hex,
+            "events": grouped,
+        }
+        serialized = json.dumps(payload, ensure_ascii=False, separators=(",", ":"), allow_nan=False)
+        with self.path.open("a", encoding="utf-8") as handle:
+            handle.write(f"{serialized}\n")
+            handle.flush()
+            if durable:
+                os.fsync(handle.fileno())
+        if durable and is_new_file:
+            fsync_parent_dir(self.path)
 
     def read_all(self) -> list[dict[str, Any]]:
         return self._read_all(strict=False)
@@ -116,7 +152,7 @@ def _read_all(self, *, strict: bool) -> list[dict[str, Any]]:
                         f"Non-object A2A pipeline journal line {line_number} in {self.path}"
                     )
                 continue
-            events.append(value)
+            events.extend(_events_from_journal_record(value, strict=strict, line_number=line_number, path=self.path))
 
         events.sort(key=_sequence_value)
         return events
@@ -133,6 +169,25 @@ def _sequence_value(event: dict[str, Any]) -> int:
         return 0
 
 
+def _events_from_journal_record(
+    value: dict[str, Any],
+    *,
+    strict: bool,
+    line_number: int,
+    path: Path,
+) -> list[dict[str, Any]]:
+    """Expand an ``event_group`` record into its events; any other record is returned as ``[value]``."""
+    if value.get(_EVENT_GROUP_RECORD_KEY) != _EVENT_GROUP_RECORD_TYPE:
+        return [value]
+    members = value.get("events")
+    if isinstance(members, list) and all(isinstance(member, dict) for member in members):
+        return members
+    if strict:
+        raise A2APipelineJournalReadError(f"Invalid A2A pipeline journal event group line {line_number} in {path}")
+    logger.warning("Skipping invalid A2A pipeline journal event group in %s", path)
+    return []
+
+
 def _repairable_tail_bytes(content: bytes) -> tuple[bytes, bytes] | None:
     if not content:
         return None
diff --git a/src/iac_code/a2a/pipeline_recovery.py b/src/iac_code/a2a/pipeline_recovery.py
index 99c984ba..a9789d2b 100644
--- a/src/iac_code/a2a/pipeline_recovery.py
+++ b/src/iac_code/a2a/pipeline_recovery.py
@@ -12,6 +12,7 @@
     A2APipelineSnapshotStore,
     reduce_pipeline_events,
     sanitize_pipeline_artifact_uris,
+    sanitize_pipeline_cleanup_private_fields,
 )
 from iac_code.i18n import _
 
@@ -44,9 +45,9 @@ async def get_state(
         snapshot_store = A2APipelineSnapshotStore(pipeline_dir)
         snapshot = snapshot_store.load()
         events = journal.read_all_repairing_tail()
+        context_events = _events_for_task(events, task_id=None, context_id=context_id)
         recovery_task_id = task_id
         if recovery_task_id is None:
-            context_events = _events_for_task(events, task_id=None, context_id=context_id)
             snapshot_task_id = None
             if isinstance(snapshot, dict) and _snapshot_matches_context(snapshot, context_id=context_id):
                 snapshot_task_id = snapshot.get("taskId")
@@ -88,21 +89,45 @@ async def get_state(
                 snapshot_store.save(snapshot)
                 snapshot = snapshot_store.load() or snapshot
         elif recovery_task_id is not None and (
-            not _snapshot_matches(
+            not _snapshot_matches_or_delivery_alias(
                 snapshot,
                 task_id=recovery_task_id,
                 context_id=context_id,
+                context_events=context_events,
             )
-            or not _snapshot_seen_events_are_within_context_task(
-                snapshot,
-                _events_for_task(events, task_id=None, context_id=context_id),
-                task_id=recovery_task_id,
+            or (
+                _snapshot_matches(snapshot, task_id=recovery_task_id, context_id=context_id)
+                and not _snapshot_seen_events_are_within_context_task(
+                    snapshot,
+                    context_events,
+                    task_id=recovery_task_id,
+                )
+            )
+            or (
+                not _snapshot_matches(snapshot, task_id=recovery_task_id, context_id=context_id)
+                and _snapshot_is_missing_delivery_alias_events(
+                    snapshot,
+                    task_id=recovery_task_id,
+                    context_events=context_events,
+                )
             )
         ):
-            if not replay_events:
+            rebuild_events = _rebuild_events_for_recovery_task(
+                events,
+                snapshot=snapshot,
+                task_id=recovery_task_id,
+                context_id=context_id,
+                fallback_events=replay_events,
+            )
+            if not rebuild_events:
                 raise ValueError(_("A2A pipeline state not found"))
-            snapshot = reduce_pipeline_events(replay_events)
-            if not _snapshot_matches(snapshot, task_id=recovery_task_id, context_id=context_id):
+            snapshot = reduce_pipeline_events(rebuild_events)
+            if not _snapshot_matches_or_delivery_alias(
+                snapshot,
+                task_id=recovery_task_id,
+                context_id=context_id,
+                context_events=context_events,
+            ):
                 raise ValueError(_("A2A pipeline state not found"))
             if task_id is None:
                 snapshot_store.save(snapshot)
@@ -132,7 +157,13 @@ async def get_state(
             snapshot = snapshot_store.load() or snapshot
 
         if task_id is not None and not _snapshot_matches(snapshot, task_id=task_id, context_id=context_id):
-            raise ValueError(_("A2A pipeline state not found"))
+            if not _snapshot_matches_or_delivery_alias(
+                snapshot,
+                task_id=task_id,
+                context_id=context_id,
+                context_events=context_events,
+            ):
+                raise ValueError(_("A2A pipeline state not found"))
         if (
             task_id is None
             and recovery_task_id is not None
@@ -149,8 +180,8 @@ async def get_state(
         replay_after = after_sequence if after_sequence is not None else _int_value(snapshot.get("lastSequence"), 0)
         events_after_replay = [event for event in replay_events if _int_value(event.get("sequence"), 0) > replay_after]
         return {
-            "snapshot": _json_compatible(sanitize_pipeline_artifact_uris(snapshot)),
-            "events": _json_compatible(sanitize_pipeline_artifact_uris(events_after_replay)),
+            "snapshot": _json_compatible(_sanitize_public_recovery_payload(snapshot)),
+            "events": _json_compatible(_sanitize_public_recovery_payload(events_after_replay)),
         }
 
     async def _verify_task_owner(
@@ -182,6 +213,10 @@ def _json_compatible(value: Any) -> Any:
     return value
 
 
+def _sanitize_public_recovery_payload(value: Any) -> Any:  # scrubs get_state's returned snapshot and events
+    return sanitize_pipeline_cleanup_private_fields(sanitize_pipeline_artifact_uris(value))  # URIs first
+
+
 def _events_for_task(
     events: list[dict[str, Any]],
     *,
@@ -191,13 +226,77 @@ def _events_for_task(
     context_events = [event for event in events if event.get("contextId") == context_id]
     if task_id is None:
         return context_events
-    return [event for event in context_events if event.get("taskId") == task_id]
+    return [
+        event for event in context_events if event.get("taskId") == task_id or event.get("deliveryTaskId") == task_id
+    ]
 
 
 def _snapshot_matches(snapshot: dict[str, Any], *, task_id: str, context_id: str) -> bool:
     return snapshot.get("taskId") == task_id and snapshot.get("contextId") == context_id
 
 
+def _snapshot_matches_or_delivery_alias(
+    snapshot: dict[str, Any],
+    *,
+    task_id: str,
+    context_id: str,
+    context_events: list[dict[str, Any]],
+) -> bool:
+    """Return True when the snapshot matches ``task_id`` directly or through a delivery alias."""
+    if _snapshot_matches(snapshot, task_id=task_id, context_id=context_id):
+        return True
+    owner_task_id = snapshot.get("taskId")
+    if not _snapshot_matches_context(snapshot, context_id=context_id) or not isinstance(owner_task_id, str):
+        return False
+    # An alias is a context event owned by the snapshot's task but delivered under ``task_id``.
+    return any(
+        item.get("taskId") == owner_task_id and item.get("deliveryTaskId") == task_id for item in context_events
+    )
+
+
+def _snapshot_is_missing_delivery_alias_events(
+    snapshot: dict[str, Any],
+    *,
+    task_id: str,
+    context_events: list[dict[str, Any]],
+) -> bool:
+    """Report whether any delivery-alias event for ``task_id`` is not yet reflected in the snapshot."""
+    owner_task_id = snapshot.get("taskId")
+    if not isinstance(owner_task_id, str):
+        return False
+    # With no alias events both ``any`` calls below are False, i.e. nothing is missing.
+    aliased = [
+        item
+        for item in context_events
+        if item.get("taskId") == owner_task_id and item.get("deliveryTaskId") == task_id
+    ]
+    recorded_ids = snapshot.get("seenEventIds")
+    if isinstance(recorded_ids, list):
+        known_ids = {event_id for event_id in recorded_ids if isinstance(event_id, str)}
+        return any(isinstance(item.get("eventId"), str) and item["eventId"] not in known_ids for item in aliased)
+    last_sequence = _int_value(snapshot.get("lastSequence"), 0)
+    return any(_int_value(item.get("sequence"), 0) > last_sequence for item in aliased)
+
+
+def _rebuild_events_for_recovery_task(
+    events: list[dict[str, Any]],
+    *,
+    snapshot: dict[str, Any],
+    task_id: str,
+    context_id: str,
+    fallback_events: list[dict[str, Any]],
+) -> list[dict[str, Any]]:
+    """Choose the events used to rebuild the snapshot for ``task_id``."""
+    owner_task_id = snapshot.get("taskId")
+    if _snapshot_matches(snapshot, task_id=task_id, context_id=context_id) or not isinstance(owner_task_id, str):
+        return fallback_events
+    owner_events = _events_for_task(events, task_id=owner_task_id, context_id=context_id)
+    # The snapshot owner's events are used only when one of them was delivered under ``task_id``.
+    if any(item.get("deliveryTaskId") == task_id for item in owner_events):
+        return owner_events
+    return fallback_events
+
+
 def _snapshot_matches_context(snapshot: dict[str, Any], *, context_id: str) -> bool:
     return snapshot.get("contextId") == context_id
 
@@ -270,7 +369,15 @@ def _snapshot_seen_events_are_within_context_task(
     event_task_ids = {
         event.get("eventId"): event.get("taskId") for event in context_events if isinstance(event.get("eventId"), str)
     }
+    event_delivery_task_ids = {
+        event.get("eventId"): event.get("deliveryTaskId")
+        for event in context_events
+        if isinstance(event.get("eventId"), str)
+    }
     return all(
-        not isinstance(event_id, str) or event_id not in event_task_ids or event_task_ids[event_id] == task_id
+        not isinstance(event_id, str)
+        or event_id not in event_task_ids
+        or event_task_ids[event_id] == task_id
+        or event_delivery_task_ids.get(event_id) == task_id
         for event_id in seen_event_ids
     )
diff --git a/src/iac_code/a2a/pipeline_snapshot.py b/src/iac_code/a2a/pipeline_snapshot.py
index edef7ad6..6d54b69e 100644
--- a/src/iac_code/a2a/pipeline_snapshot.py
+++ b/src/iac_code/a2a/pipeline_snapshot.py
@@ -3,8 +3,6 @@
 import copy
 import json
 import logging
-import os
-import uuid
 from datetime import datetime, timezone
 from pathlib import Path
 from typing import Any
@@ -14,15 +12,41 @@
     sanitize_public_tool_output_data,
 )
 from iac_code.a2a.pipeline_journal import to_json_safe
+from iac_code.pipeline.constants import (
+    PIPELINE_EVENT_CLEANUP_COMPLETED,
+    PIPELINE_EVENT_CLEANUP_FAILED,
+    PIPELINE_EVENT_CLEANUP_PROGRESS,
+    PIPELINE_EVENT_CLEANUP_STARTED,
+)
+from iac_code.utils.public_errors import sanitize_public_text
+from iac_code.utils.state_io import atomic_write_json
 
 SNAPSHOT_SCHEMA_VERSION = "1.1"
 logger = logging.getLogger(__name__)
+_PUBLIC_TEXT_MAX_CHARS = 1000
 
 _TERMINAL_STATUS_BY_EVENT_TYPE = {
     "pipeline_completed": "completed",
     "pipeline_failed": "failed",
     "pipeline_canceled": "canceled",
 }
+_CLEANUP_STATUS_BY_EVENT_TYPE = {
+    PIPELINE_EVENT_CLEANUP_STARTED: "started",
+    PIPELINE_EVENT_CLEANUP_PROGRESS: "in_progress",
+    PIPELINE_EVENT_CLEANUP_COMPLETED: "completed",
+    PIPELINE_EVENT_CLEANUP_FAILED: "failed",
+}
+_KNOWN_CLEANUP_STATUSES = {"pending", "started", "in_progress", "completed", "failed", "skipped"}
+_CLEANUP_ERROR_KEYS = {
+    "error",
+    "errorMessage",
+    "errorSummary",
+    "error_message",
+    "error_summary",
+    "lastError",
+    "last_error",
+}
+_PIPELINE_WARNING_PRIVATE_DATA_KEYS = {"ledger_path", "ledgerPath", "load_error", "loadError"}
 
 
 class A2APipelineSnapshotStore:
@@ -32,29 +56,19 @@ def __init__(self, pipeline_dir: str | Path) -> None:
 
     def save(self, snapshot: dict[str, Any]) -> bool:
         previous = self.load()
-        next_snapshot = copy.deepcopy(snapshot)
+        next_snapshot = _sanitize_public_snapshot_private_cleanup_fields(snapshot)
         next_snapshot["snapshotVersion"] = _snapshot_version(previous) + 1
         next_snapshot = to_json_safe(next_snapshot)
         if not isinstance(next_snapshot, dict):
             logger.warning("Skipping invalid A2A pipeline snapshot for %s", self.path)
             return False
 
-        self.pipeline_dir.mkdir(parents=True, exist_ok=True)
-        tmp_path = self.path.with_name(f"{self.path.name}.{uuid.uuid4().hex}.tmp")
         try:
-            with tmp_path.open("w", encoding="utf-8") as handle:
-                json.dump(next_snapshot, handle, ensure_ascii=False, indent=2, sort_keys=True, allow_nan=False)
-                handle.write("\n")
-                handle.flush()
-                os.fsync(handle.fileno())
-            tmp_path.replace(self.path)
+            atomic_write_json(self.path, next_snapshot, durable=True)
             return True
         except (OSError, TypeError, ValueError):
             logger.warning("Failed to persist A2A pipeline snapshot to %s", self.path, exc_info=True)
             return False
-        finally:
-            if tmp_path.exists():
-                tmp_path.unlink()
 
     def load(self) -> dict[str, Any] | None:
         try:
@@ -71,7 +85,7 @@ def load(self) -> dict[str, Any] | None:
                 type(value).__name__,
             )
             return None
-        return value
+        return _sanitize_public_snapshot_private_cleanup_fields(value)
 
 
 def reduce_pipeline_events(
@@ -109,6 +123,25 @@ def sanitize_pipeline_artifact_uris(value: Any) -> Any:
     return sanitized
 
 
+def sanitize_pipeline_cleanup_private_fields(value: Any) -> Any:
+    """Return ``value`` with cleanup-private fields removed; non-dict, non-list values pass through."""
+    if isinstance(value, list):
+        return [sanitize_pipeline_cleanup_private_fields(entry) for entry in value]
+    if not isinstance(value, dict):
+        return value
+    result = _sanitize_cleanup_private_fields(value)
+    kind = _string_or_none(result.get("eventType")) or ""
+    is_cleanup = kind in _CLEANUP_STATUS_BY_EVENT_TYPE or result.get("scope") == "cleanup"
+    payload = _dict_or_none(result.get("data")) if is_cleanup or kind == "pipeline_warning" else None
+    if payload is not None and is_cleanup:
+        # Cleanup payloads are sanitized as the root of a cleanup section.
+        result["data"] = _sanitize_cleanup_private_fields(payload, root_is_cleanup=True)
+    elif payload is not None:
+        # Warning payloads keep only their public data keys.
+        result["data"] = _pipeline_warning_public_data(payload)
+    return result
+
+
 class _PipelineSnapshotReducer:
     def __init__(self, existing_snapshot: dict[str, Any] | None = None) -> None:
         self._snapshot = _snapshot_from_existing(existing_snapshot)
@@ -128,7 +161,9 @@ def __init__(self, existing_snapshot: dict[str, Any] | None = None) -> None:
         self._rollback_keys: set[str] = set()
         self._candidate_restart_keys: set[str] = set()
         self._handoff_history_keys: set[str] = set()
+        self._warning_history_keys: set[str] = set()
         self._stack_history_keys: set[str] = set()
+        self._cleanup_history_keys: set[str] = set()
         self._skip_sequences_through = 0
         self._hydrate_existing_snapshot(existing_snapshot)
 
@@ -178,7 +213,9 @@ def _hydrate_existing_snapshot(self, existing_snapshot: dict[str, Any] | None) -
         self._hydrate_rollbacks()
         self._hydrate_candidate_restarts()
         self._hydrate_control_history("handoffHistory", self._handoff_history_keys)
+        self._hydrate_control_history("warningHistory", self._warning_history_keys)
         self._hydrate_stack_history()
+        self._hydrate_cleanup_history()
 
     def _hydrate_steps(self) -> None:
         valid_steps: list[dict[str, Any]] = []
@@ -336,6 +373,24 @@ def _hydrate_stack_history(self) -> None:
                 self._seen_event_ids.add(event_id)
         stacks["history"] = unique_history
 
+    def _hydrate_cleanup_history(self) -> None:
+        """Deduplicate the stored cleanup history and register its keys and event ids as seen."""
+        section = self._snapshot["cleanup"]
+        kept: list[dict[str, Any]] = []
+        for entry in section["history"]:
+            if not isinstance(entry, dict):
+                continue
+            event_id = _string_or_none(entry.get("eventId"))
+            # Every stored event id counts as seen, even when its entry is a duplicate.
+            if event_id is not None:
+                self._seen_event_ids.add(event_id)
+            # Entries without a usable event id are keyed by their sequence value.
+            dedupe_key = event_id or str(_sequence_value(entry))
+            if dedupe_key not in self._cleanup_history_keys:
+                self._cleanup_history_keys.add(dedupe_key)
+                kept.append(entry)
+        section["history"] = kept
+
     def _is_legacy_replay_event(self, event: dict[str, Any]) -> bool:
         return self._skip_sequences_through > 0 and _sequence_value(event) <= self._skip_sequences_through
 
@@ -357,13 +412,22 @@ def _apply(self, event: dict[str, Any]) -> None:
         self._snapshot["lastSequence"] = max(self._snapshot["lastSequence"], _sequence_value(event))
         self._merge_pipeline_identity(event)
 
-        data = _dict_or_empty(event.get("data"))
+        data = _sanitize_cleanup_private_fields(_dict_or_empty(event.get("data")))
         if event_type == "pipeline_started":
             self._apply_pipeline_started(data)
         elif event_type == "pipeline_handoff_ready":
             handoff = _normal_handoff(event)
             self._snapshot["normalHandoff"] = handoff
             self._append_control_history("handoffHistory", self._handoff_history_keys, handoff)
+            cleanup_data = _dict_or_none(data.get("cleanup"))
+            if cleanup_data is not None:
+                self._apply_cleanup_data(cleanup_data, event)
+        elif event_type == "pipeline_warning":
+            self._append_control_history(
+                "warningHistory",
+                self._warning_history_keys,
+                _warning_history_entry(event),
+            )
 
         step = self._upsert_step(event.get("step"), event)
         candidate = self._upsert_candidate(step, event.get("candidate"), event)
@@ -396,6 +460,8 @@ def _apply(self, event: dict[str, Any]) -> None:
             self._upsert_tool_result_item(event)
         elif event_type == "stack_current_changed":
             self._apply_stack_current_changed(event)
+        elif event_type in _CLEANUP_STATUS_BY_EVENT_TYPE:
+            self._apply_cleanup_event(event)
         elif event_type == "rollback_completed":
             self._append_rollback(event)
         elif event_type == "candidate_restart_requested":
@@ -412,7 +478,7 @@ def _apply(self, event: dict[str, Any]) -> None:
             self._snapshot["status"] = terminal_status
             self._snapshot["pendingInput"] = None
             self._snapshot["control"]["activeCandidateRunIds"] = []
-        elif event_type not in {"input_required", "input_received"} and not (
+        elif event_type not in {"input_required", "input_received", *_CLEANUP_STATUS_BY_EVENT_TYPE} and not (
             event_type == "pipeline_handoff_ready" and self._snapshot["status"] in {"completed", "failed", "canceled"}
         ):
             self._apply_event_status(event)
@@ -745,6 +811,82 @@ def _apply_stack_current_changed(self, event: dict[str, Any]) -> None:
         else:
             stacks["current"] = copy.deepcopy(existing)
 
+    def _apply_cleanup_event(self, event: dict[str, Any]) -> None:
+        """Fold a cleanup event into the snapshot (the sanitizer already returns a private deep copy)."""
+        data = _sanitize_cleanup_private_fields(_dict_or_empty(event.get("data")), root_is_cleanup=True)
+        default_status = _CLEANUP_STATUS_BY_EVENT_TYPE.get(_string_or_none(event.get("eventType")) or "", "pending")
+        self._apply_cleanup_data({**data, "status": data.get("status", default_status)}, event)
+
+    def _apply_cleanup_data(self, data: dict[str, Any], event: dict[str, Any]) -> None:
+        """Merge cleanup ``data`` into the snapshot's cleanup section and log it in history once."""
+        section = self._snapshot["cleanup"]
+        reported = _string_or_none(data.get("status"))
+        if reported is not None:
+            section["status"] = reported
+        # A non-empty resource list replaces the stored one; otherwise ``data`` is merged as one resource.
+        listed = _dict_list(data.get("resources"))
+        if not listed:
+            self._merge_cleanup_resource(section, data)
+        else:
+            section["resources"] = copy.deepcopy(listed)
+        # An explicit count wins; otherwise a non-empty resource list supplies it.
+        explicit_count = _int_or_none(data.get("resourceCount"))
+        if explicit_count is not None:
+            section["resourceCount"] = explicit_count
+        elif section["resources"]:
+            section["resourceCount"] = len(section["resources"])
+        # Recognized per-resource statuses outrank the reported status, which is only a fallback.
+        section["status"] = _aggregate_cleanup_status(section["resources"], fallback=reported or section.get("status"))
+        if "statusMessage" in data:
+            section["statusMessage"] = copy.deepcopy(data["statusMessage"])
+        # History is keyed by event id, else by sequence, so a repeated event is recorded only once.
+        history_key = _string_or_none(event.get("eventId")) or str(_sequence_value(event))
+        if history_key in self._cleanup_history_keys:
+            return
+        self._cleanup_history_keys.add(history_key)
+        record = {
+            "eventType": _string_or_none(event.get("eventType")),
+            "eventId": _string_or_none(event.get("eventId")),
+            "sequence": _sequence_value(event),
+            "createdAt": _string_or_none(event.get("createdAt")),
+            "scope": _string_or_none(event.get("scope")) or "cleanup",
+            "status": section["status"],
+            "data": copy.deepcopy(data),
+        }
+        _merge_event_coordinates(record, event)
+        section["history"].append(record)
+
+    @staticmethod
+    def _merge_cleanup_resource(cleanup: dict[str, Any], data: dict[str, Any]) -> None:
+        """Update the first stored resource compatible with ``data``, or append ``data`` as a new one."""
+        incoming_id = _string_or_none(data.get("resourceId"))
+        if incoming_id is None:
+            return
+        incoming_provider = _string_or_none(data.get("provider"))
+        # The resource type is accepted under either its camelCase or snake_case key.
+        incoming_type = _string_or_none(data.get("resourceType")) or _string_or_none(data.get("resource_type"))
+        incoming_region = _string_or_none(data.get("regionId"))
+        stored_resources = cleanup["resources"]
+
+        def compatible(stored: dict[str, Any], *names: str, incoming: str | None) -> bool:
+            # A field blocks the match only when both sides have a value and the values differ.
+            candidates = (_string_or_none(stored.get(name)) for name in names)
+            present = next((found for found in candidates if found is not None), None)
+            return incoming is None or present is None or present == incoming
+
+        # Stop at the first compatible resource; with none, the incoming data is appended.
+        for stored in stored_resources:
+            if (
+                isinstance(stored, dict)
+                and stored.get("resourceId") == incoming_id
+                and compatible(stored, "provider", incoming=incoming_provider)
+                and compatible(stored, "resourceType", "resource_type", incoming=incoming_type)
+                and compatible(stored, "regionId", incoming=incoming_region)
+            ):
+                stored.update(copy.deepcopy(data))
+                return
+        stored_resources.append(copy.deepcopy(data))
+
     def _upsert_display_record(
         self,
         display_key: str,
@@ -832,7 +974,7 @@ def _pending_input(self, event: dict[str, Any]) -> dict[str, Any]:
 
 
 def _normal_handoff(event: dict[str, Any]) -> dict[str, Any]:
-    data = copy.deepcopy(_dict_or_empty(event.get("data")))
+    data = _sanitize_cleanup_private_fields(copy.deepcopy(_dict_or_empty(event.get("data"))))
     handoff = {
         "eventType": _string_or_none(event.get("eventType")),
         "eventId": _string_or_none(event.get("eventId")),
@@ -849,6 +991,23 @@ def _normal_handoff(event: dict[str, Any]) -> dict[str, Any]:
     return handoff
 
 
+def _warning_history_entry(event: dict[str, Any]) -> dict[str, Any]:
+    """Build the ``warningHistory`` record for an event, keeping only public warning data."""
+    raw_data = _dict_or_empty(event.get("data"))
+    record: dict[str, Any] = {"eventId": _string_or_none(event.get("eventId"))}
+    record["sequence"] = _sequence_value(event)
+    record["createdAt"] = _string_or_none(event.get("createdAt"))
+    record["data"] = _pipeline_warning_public_data(raw_data)
+    _merge_event_coordinates(record, event)
+    return record
+
+
+def _pipeline_warning_public_data(data: dict[str, Any]) -> dict[str, Any]:
+    """Return a deep copy of ``data`` without the private warning keys."""
+    kept = {k: v for k, v in data.items() if str(k) not in _PIPELINE_WARNING_PRIVATE_DATA_KEYS}
+    return copy.deepcopy(kept)
+
+
 def _interaction_history_entry(event: dict[str, Any]) -> dict[str, Any]:
     data = copy.deepcopy(_dict_or_empty(event.get("data")))
     input_value = copy.deepcopy(_dict_or_empty(event.get("input")))
@@ -924,6 +1083,12 @@ def _empty_snapshot() -> dict[str, Any]:
             "byId": {},
             "history": [],
         },
+        "cleanup": {
+            "status": "none",
+            "resourceCount": 0,
+            "resources": [],
+            "history": [],
+        },
         "normalHandoff": None,
         "pendingInput": None,
         "control": {
@@ -933,11 +1098,38 @@ def _empty_snapshot() -> dict[str, Any]:
             "rollbackHistory": [],
             "candidateRestarts": [],
             "handoffHistory": [],
+            "warningHistory": [],
         },
         "seenEventIds": [],
     }
 
 
+def _cleanup_resource_status(resource: dict[str, Any]) -> str | None:
+    """Return the resource's recognized cleanup status, or None when absent or unknown."""
+    for field in ("cleanupStatus", "cleanup_status", "status"):
+        candidate = _string_or_none(resource.get(field))
+        if candidate:
+            return candidate if candidate in _KNOWN_CLEANUP_STATUSES else None
+    return None
+
+
+def _aggregate_cleanup_status(resources: list[dict[str, Any]], *, fallback: Any = None) -> str:
+    """Collapse per-resource cleanup statuses into one status using a fixed precedence."""
+    recognized: set[str] = set()
+    for resource in resources:
+        current = _cleanup_resource_status(resource) if isinstance(resource, dict) else None
+        if current is not None:
+            recognized.add(current)
+    if not recognized:
+        # No resource reports a known status: use the caller's fallback, else "none".
+        return _string_or_none(fallback) or "none"
+    # Precedence: failed > in_progress > started > pending; anything else counts as completed.
+    for candidate in ("failed", "in_progress", "started", "pending"):
+        if candidate in recognized:
+            return candidate
+    return "completed"
+
+
 def _snapshot_from_existing(existing_snapshot: dict[str, Any] | None) -> dict[str, Any]:
     if not isinstance(existing_snapshot, dict):
         return _empty_snapshot()
@@ -969,9 +1161,27 @@ def _snapshot_from_existing(existing_snapshot: dict[str, Any] | None) -> dict[st
         else {},
         "history": _dict_list(stacks.get("history")),
     }
+    normal_handoff = snapshot.get("normalHandoff")
     snapshot["normalHandoff"] = (
-        copy.deepcopy(snapshot.get("normalHandoff")) if isinstance(snapshot.get("normalHandoff"), dict) else None
+        _sanitize_cleanup_private_fields(normal_handoff) if isinstance(normal_handoff, dict) else None
     )
+    cleanup = snapshot.get("cleanup")
+    if not isinstance(cleanup, dict):
+        cleanup = {}
+    cleanup = _sanitize_cleanup_private_fields(cleanup, root_is_cleanup=True)
+    cleanup_resources = _dict_list(cleanup.get("resources"))
+    cleanup_count = _int_or_none(cleanup.get("resourceCount"))
+    if cleanup_count is None:
+        cleanup_count = len(cleanup_resources)
+    snapshot["cleanup"] = {
+        "status": _string_or_none(cleanup.get("status")) or "none",
+        "resourceCount": cleanup_count,
+        "resources": cleanup_resources,
+        "history": _dict_list(cleanup.get("history")),
+    }
+    for key in ("statusMessage",):
+        if key in cleanup:
+            snapshot["cleanup"][key] = copy.deepcopy(cleanup[key])
 
     control = snapshot.get("control")
     if not isinstance(control, dict):
@@ -984,6 +1194,7 @@ def _snapshot_from_existing(existing_snapshot: dict[str, Any] | None) -> dict[st
         "rollbackHistory",
         "candidateRestarts",
         "handoffHistory",
+        "warningHistory",
     ):
         value = snapshot["control"].get(key)
         snapshot["control"][key] = copy.deepcopy(value) if isinstance(value, list) else []
@@ -998,6 +1209,71 @@ def _snapshot_from_existing(existing_snapshot: dict[str, Any] | None) -> dict[st
     return snapshot
 
 
+def _sanitize_public_snapshot_private_cleanup_fields(value: dict[str, Any]) -> dict[str, Any]:
+    """Return a deep copy of ``value`` with cleanup-private data stripped from its public sections."""
+    public = copy.deepcopy(value)  # the caller's snapshot is never mutated
+    handoff = public.get("normalHandoff")
+    if isinstance(handoff, dict):
+        public["normalHandoff"] = _sanitize_cleanup_private_fields(handoff)
+    cleanup_section = public.get("cleanup")
+    if isinstance(cleanup_section, dict):
+        public["cleanup"] = _sanitize_cleanup_private_fields(cleanup_section, root_is_cleanup=True)
+    control = public.get("control")
+    if not isinstance(control, dict):
+        return public
+    history_sanitizers = (
+        ("handoffHistory", _sanitize_cleanup_private_fields),
+        ("warningHistory", _sanitize_pipeline_warning_history),
+    )
+    for history_key, sanitize_entry in history_sanitizers:
+        entries = control.get(history_key)
+        if isinstance(entries, list):  # non-dict entries are kept as they are
+            control[history_key] = [sanitize_entry(item) if isinstance(item, dict) else item for item in entries]
+    return public
+
+
+def _sanitize_pipeline_warning_history(item: dict[str, Any]) -> dict[str, Any]:
+    """Return a deep copy of ``item`` whose dict ``data`` is replaced by ``_pipeline_warning_public_data``'s result."""
+    entry = copy.deepcopy(item)
+    if (payload := _dict_or_none(entry.get("data"))) is not None:
+        entry["data"] = _pipeline_warning_public_data(payload)
+    return entry
+
+
+def _sanitize_cleanup_private_fields(value: dict[str, Any], *, root_is_cleanup: bool = False) -> dict[str, Any]:
+    clone = copy.deepcopy(value)  # work on a copy so the caller's structure is left untouched
+    _drop_cleanup_private_fields(clone, inside_cleanup=root_is_cleanup)  # strips the copy in place
+    return clone
+
+
+def _drop_cleanup_private_fields(value: Any, *, inside_cleanup: bool) -> None:
+    """Strip cleanup-private data from ``value`` in place, walking nested dicts and lists exactly once."""
+    if isinstance(value, dict):
+        if inside_cleanup:
+            # Private keys are removed outright; error payloads are kept but sanitized.
+            for key in ("prompt", "ledgerPath", "ledger_path"):
+                value.pop(key, None)
+            for key in _CLEANUP_ERROR_KEYS & value.keys():
+                value[key] = _sanitize_cleanup_error_value(value[key])
+        for key, item in value.items():
+            # A "cleanup" child switches the flag on for its subtree (it used to be walked a second time).
+            _drop_cleanup_private_fields(item, inside_cleanup=inside_cleanup or key == "cleanup")
+    elif isinstance(value, list):
+        for item in value:
+            _drop_cleanup_private_fields(item, inside_cleanup=inside_cleanup)
+
+
+def _sanitize_cleanup_error_value(value: Any) -> Any:
+    """Return ``value`` with every nested string run through ``sanitize_public_text`` and length-capped."""
+    if isinstance(value, list):
+        return [_sanitize_cleanup_error_value(entry) for entry in value]
+    if isinstance(value, dict):
+        return {name: _sanitize_cleanup_error_value(entry) for name, entry in value.items()}
+    if isinstance(value, str) and len(value := sanitize_public_text(value)) > _PUBLIC_TEXT_MAX_CHARS:
+        return value[:_PUBLIC_TEXT_MAX_CHARS] + "..."
+    return value  # a string was rebound to its sanitized form above; other types pass through
+
+
 def _merge_coordinate(target: dict[str, Any], coordinate: dict[str, Any]) -> None:
     for key, value in coordinate.items():
         if value is not None:
@@ -1212,4 +1488,9 @@ def _utc_now() -> str:
     return datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
 
 
-__all__ = ["A2APipelineSnapshotStore", "SNAPSHOT_SCHEMA_VERSION", "reduce_pipeline_events"]
+__all__ = [
+    "A2APipelineSnapshotStore",
+    "SNAPSHOT_SCHEMA_VERSION",
+    "reduce_pipeline_events",
+    "sanitize_pipeline_cleanup_private_fields",
+]
diff --git a/src/iac_code/a2a/pipeline_stream.py b/src/iac_code/a2a/pipeline_stream.py
index 0a1d5356..8ad950fd 100644
--- a/src/iac_code/a2a/pipeline_stream.py
+++ b/src/iac_code/a2a/pipeline_stream.py
@@ -15,10 +15,53 @@
 from iac_code.a2a.pipeline_events import PipelineEventTranslator, safe_permission_metadata
 from iac_code.a2a.pipeline_journal import A2APipelineJournal, to_json_safe
 from iac_code.a2a.pipeline_snapshot import SNAPSHOT_SCHEMA_VERSION, A2APipelineSnapshotStore, reduce_pipeline_events
+from iac_code.pipeline.constants import (
+    PIPELINE_EVENT_CLEANUP_COMPLETED,
+    PIPELINE_EVENT_CLEANUP_FAILED,
+    PIPELINE_EVENT_CLEANUP_PROGRESS,
+    PIPELINE_EVENT_CLEANUP_STARTED,
+)
 from iac_code.types.stream_events import PermissionRequestEvent, SubPipelineStreamEvent, ToolResultEvent
 
 PipelinePermissionResolver = Callable[[PermissionRequestEvent], bool | Awaitable[bool]]
 logger = logging.getLogger(__name__)
+_RECOVERY_SEMANTIC_EVENT_TYPES = {  # event types for which is_recovery_semantic_event() returns True
+    "pipeline_started",
+    "pipeline_resumed",
+    "step_started",
+    "step_completed",
+    "step_failed",
+    "candidate_started",
+    "candidate_selected",
+    "candidate_completed",
+    "candidate_failed",
+    "candidate_step_started",
+    "candidate_step_completed",
+    "candidate_step_failed",
+    "input_required",
+    "input_received",
+    "pipeline_completed",
+    "pipeline_failed",
+    "pipeline_canceled",
+    "pipeline_handoff_ready",
+    "pipeline_warning",
+    PIPELINE_EVENT_CLEANUP_STARTED,
+    PIPELINE_EVENT_CLEANUP_PROGRESS,
+    PIPELINE_EVENT_CLEANUP_COMPLETED,
+    PIPELINE_EVENT_CLEANUP_FAILED,
+    "artifact_created",
+    "rollback_completed",
+    "candidate_restart_requested",
+}
+_DISPLAY_ONLY_EVENT_TYPES = {  # event types is_recovery_semantic_event() rejects before any other check
+    "candidate_detail_shown",
+    "diagram_shown",
+    "permission_requested",
+    "text_delta",
+    "tool_result",
+}
+_RECOVERY_STATE_SCOPES = {"step", "candidate", "candidateStep", "candidate_step"}  # scope half of the final check
+_RECOVERY_STATE_STATUSES = {"working"}  # status half of that same scope+status check
 
 
 class _SnapshotCatchUpUnavailableError(Exception):
@@ -38,6 +81,8 @@ def __init__(
         snapshot_store: A2APipelineSnapshotStore,
         artifact_store: Any | None = None,
         exposure_types: Any = None,
+        delivery_task_id: str | None = None,
+        delivery_context_id: str | None = None,
     ) -> None:
         self.event_queue = event_queue
         self.translator = translator
@@ -45,6 +90,8 @@ def __init__(
         self.snapshot_store = snapshot_store
         self.artifact_store = artifact_store
         self.exposure_types = normalize_a2a_exposure_types(exposure_types)
+        self.delivery_task_id = delivery_task_id
+        self.delivery_context_id = delivery_context_id
         self._sequence_lock = asyncio.Lock()
         self._last_sequence = 0
         self.last_envelope: dict[str, Any] | None = None
@@ -196,6 +243,7 @@ async def publish_manual(
         status: str = "working",
         data: dict[str, Any] | None = None,
         coordinates: dict[str, Any] | None = None,
+        require_durable_metadata: bool = False,
     ) -> dict[str, Any] | None:
         envelope = self.translator.manual_event(event_type, scope, status=status, data=data)
         if coordinates:
@@ -203,7 +251,11 @@ async def publish_manual(
                 value = coordinates.get(key)
                 if isinstance(value, dict):
                     envelope[key] = dict(value)
-        return envelope if await self._persist_and_enqueue(envelope) else None
+        return (
+            envelope
+            if await self._persist_and_enqueue(envelope, require_durable_metadata=require_durable_metadata)
+            else None
+        )
 
     def _next_snapshot(self, envelope: dict[str, Any]) -> dict[str, Any]:
         existing_snapshot = self.snapshot_store.load()
@@ -244,6 +296,7 @@ async def _persist_and_enqueue(
         require_durable_metadata: bool = False,
     ) -> bool:
         async with self._sequence_lock:
+            self._annotate_delivery_alias(envelope)
             try:
                 self._ensure_monotonic_sequence(envelope)
             except _SequenceHighWaterUnavailableError:
@@ -253,10 +306,11 @@ async def _persist_and_enqueue(
             if not isinstance(safe_envelope, dict):
                 logger.warning("Skipping invalid A2A pipeline envelope: %r", envelope)
                 return False
+            durable_required = require_durable_metadata or is_recovery_semantic_event(safe_envelope)
             journal_persisted = False
             snapshot_persisted = False
             try:
-                self.journal.append(safe_envelope)
+                self.journal.append(safe_envelope, durable=durable_required)
                 journal_persisted = True
             except Exception:
                 logger.warning("Failed to append A2A pipeline journal event", exc_info=True)
@@ -269,7 +323,7 @@ async def _persist_and_enqueue(
                 logger.warning("Failed to persist A2A pipeline snapshot", exc_info=True)
             if snapshot_persisted:
                 _maybe_inject_test_fault("after_a2a_pipeline_snapshot_saved")
-            if require_durable_metadata and not (journal_persisted or snapshot_persisted):
+            if durable_required and not (journal_persisted or snapshot_persisted):
                 logger.warning("Skipping A2A pipeline status update because durable metadata was not persisted")
                 return False
             if artifact_metadata is not None and not (journal_persisted or snapshot_persisted):
@@ -281,6 +335,14 @@ async def _persist_and_enqueue(
             self.last_envelope = safe_envelope
             return True
 
+    def _annotate_delivery_alias(self, envelope: dict[str, Any]) -> None:
+        """Record delivery ids on ``envelope`` when a configured override differs from its own ids."""
+        # No override => ids already match; this also avoids KeyError on envelopes missing taskId/contextId.
+        if self.delivery_task_id and self.delivery_task_id != str(envelope.get("taskId")):
+            envelope["deliveryTaskId"] = self.delivery_task_id
+        if self.delivery_context_id and self.delivery_context_id != str(envelope.get("contextId")):
+            envelope["deliveryContextId"] = self.delivery_context_id
+
     def _ensure_monotonic_sequence(self, envelope: dict[str, Any]) -> None:
         current = _int_value(envelope.get("sequence"), 0)
         previous = self._last_persisted_sequence()
@@ -359,8 +421,8 @@ async def _maybe_externalize_artifact(
     async def _enqueue_artifact_update(self, envelope: dict[str, Any], artifact_metadata: dict[str, Any]) -> None:
         await self.event_queue.enqueue_event(
             _artifact_update_event(
-                task_id=str(envelope["taskId"]),
-                context_id=str(envelope["contextId"]),
+                task_id=self._delivery_task_id(envelope),
+                context_id=self._delivery_context_id(envelope),
                 metadata=artifact_metadata,
             )
         )
@@ -391,17 +453,25 @@ async def _apply_permission_metadata(
         return approved
 
     async def _enqueue_status(self, envelope: dict[str, Any]) -> None:
+        task_id = self._delivery_task_id(envelope)
+        context_id = self._delivery_context_id(envelope)
         update = TaskStatusUpdateEvent(
-            task_id=str(envelope["taskId"]),
-            context_id=str(envelope["contextId"]),
+            task_id=task_id,
+            context_id=context_id,
             status=TaskStatus(
                 state=_a2a_task_state_name(envelope),
-                message=_message_for_envelope(envelope),
+                message=_message_for_envelope(envelope, task_id=task_id, context_id=context_id),
             ),
         )
         ParseDict({"iac_code": {"pipeline": envelope}}, update.metadata)
         await self.event_queue.enqueue_event(update)
 
+    def _delivery_task_id(self, envelope: dict[str, Any]) -> str:
+        return str(envelope["taskId"]) if not self.delivery_task_id else self.delivery_task_id  # override wins
+
+    def _delivery_context_id(self, envelope: dict[str, Any]) -> str:
+        return str(envelope["contextId"]) if not self.delivery_context_id else self.delivery_context_id  # override wins
+
 
 def _permission_request_from(event: Any) -> PermissionRequestEvent | None:
     inner = event.inner if isinstance(event, SubPipelineStreamEvent) else event
@@ -418,6 +488,22 @@ def _resolve_permission_future(request: PermissionRequestEvent, approved: bool)
         request.response_future.set_result(approved)
 
 
+def is_recovery_semantic_event(envelope: dict[str, Any]) -> bool:
+    """Return whether ``envelope`` is a recovery-relevant event (display-only event types never are)."""
+    # Non-string fields are treated as absent so unhashable values never reach a set lookup.
+    event_type, status, scope = (
+        field if isinstance(field, str) else None
+        for field in (envelope.get("eventType"), envelope.get("status"), envelope.get("scope"))
+    )
+    if event_type in _DISPLAY_ONLY_EVENT_TYPES:
+        return False
+    if event_type in _RECOVERY_SEMANTIC_EVENT_TYPES:
+        return True
+    if status in {"waiting_input", "input_required", "completed", "failed", "canceled"}:
+        return True
+    return scope in _RECOVERY_STATE_SCOPES and status in _RECOVERY_STATE_STATUSES
+
+
 def _should_skip_envelope(envelope: dict[str, Any]) -> bool:
     return envelope.get("eventType") == "text_delta" and _text_from_envelope(envelope) == ""
 
@@ -433,14 +519,20 @@ def _maybe_inject_test_fault(point: str) -> None:
     os._exit(97)
 
 
-def _message_for_envelope(envelope: dict[str, Any]) -> Message | None:
+def _message_for_envelope(
+    envelope: dict[str, Any],
+    *,
+    task_id: str | None = None,
+    context_id: str | None = None,
+) -> Message | None:
     if envelope.get("eventType") != "text_delta":
         return None
 
+    message_task_id = task_id or str(envelope["taskId"])
     return Message(
-        message_id=f"{envelope['taskId']}-pipeline-{envelope['sequence']}",
-        task_id=str(envelope["taskId"]),
-        context_id=str(envelope["contextId"]),
+        message_id=f"{message_task_id}-pipeline-{envelope['sequence']}",
+        task_id=message_task_id,
+        context_id=context_id or str(envelope["contextId"]),
         role=Role.ROLE_AGENT,
         parts=[make_text_part(_text_from_envelope(envelope))],
     )
@@ -488,4 +580,4 @@ def _int_value(value: Any, default: int) -> int:
         return default
 
 
-__all__ = ["PipelineA2AEventPublisher", "PipelinePermissionResolver"]
+__all__ = ["PipelineA2AEventPublisher", "PipelinePermissionResolver", "is_recovery_semantic_event"]
diff --git a/src/iac_code/a2a/transports/dispatcher.py b/src/iac_code/a2a/transports/dispatcher.py
index 23a993e0..714c8079 100644
--- a/src/iac_code/a2a/transports/dispatcher.py
+++ b/src/iac_code/a2a/transports/dispatcher.py
@@ -49,6 +49,10 @@
 from iac_code.a2a.events import make_text_part
 from iac_code.a2a.executor import IacCodeA2AExecutor
 from iac_code.a2a.exposure import normalize_a2a_exposure_types
+from iac_code.a2a.jsonrpc_passthrough import (
+    install_jsonrpc_error_data_passthrough,
+    install_v03_jsonrpc_error_data_passthrough,
+)
 from iac_code.a2a.metrics import NoOpA2AMetrics
 from iac_code.a2a.persistence import A2APersistenceStore
 from iac_code.a2a.pipeline_executor import (
@@ -237,11 +241,13 @@ async def on_list_tasks(self, params: ListTasksRequest, context):
 
     async def on_message_send(self, params: SendMessageRequest, context):
         self._validate_extensions(context)
+        self._validate_pipeline_message_request(params)
         await self._hydrate_recoverable_pipeline_task_id(params)
         return await super().on_message_send(params, context)
 
     async def on_message_send_stream(self, params: SendMessageRequest, context):
         self._validate_extensions(context)
+        self._validate_pipeline_message_request(params)
         await self._hydrate_recoverable_pipeline_task_id(params)
         task_id = params.message.task_id or None
         if task_id and isinstance(self.task_store, A2ATaskStore) and await self.task_store.is_task_active(task_id):
@@ -495,6 +501,13 @@ async def on_delete_task_push_notification_config(
         self._validate_extensions(context)
         await super().on_delete_task_push_notification_config(params, context)
 
+    def _validate_pipeline_message_request(self, params: SendMessageRequest) -> None:
+        """Ask the executor to validate ``params.message``; a no-op outside pipeline run mode."""
+        if get_run_mode() != RunMode.PIPELINE:
+            return
+        if isinstance(handler := getattr(self, "agent_executor", None), IacCodeA2AExecutor):
+            handler.validate_pipeline_message_request(params.message)
+
     def _validate_extensions(self, context) -> None:
         requested = set(getattr(context, "requested_extensions", set()) or set())
         required = sorted(extension.uri for extension in self._agent_card.capabilities.extensions if extension.required)
@@ -511,7 +524,9 @@ def _task_is_input_required(task: Task) -> bool:
 
 
 def _create_dispatch_app(handler: DefaultRequestHandler) -> Starlette:
+    install_jsonrpc_error_data_passthrough()
     jsonrpc_endpoint = create_jsonrpc_routes(handler, rpc_url="/", enable_v0_3_compat=True)[0].endpoint
+    install_v03_jsonrpc_error_data_passthrough(jsonrpc_endpoint)
 
     async def handle_jsonrpc(request):
         await normalize_v03_jsonrpc_version(request)
diff --git a/src/iac_code/agent/agent_loop.py b/src/iac_code/agent/agent_loop.py
index 9550dbe6..89b73ccd 100644
--- a/src/iac_code/agent/agent_loop.py
+++ b/src/iac_code/agent/agent_loop.py
@@ -9,7 +9,7 @@
 from collections import deque
 from collections.abc import AsyncGenerator, Callable
 from contextlib import suppress
-from dataclasses import dataclass
+from dataclasses import dataclass, replace
 from typing import Any, Literal
 
 from loguru import logger
@@ -73,6 +73,26 @@ def _normalize_memory_filename(filename: Any) -> str:
     return name
 
 
+def _extend_unique(target: list[str], values: list[str]) -> None:
+    """Append to ``target``, in order, each distinct entry of ``values`` that it does not already contain."""
+    present = set(target)
+    # dict.fromkeys() drops repeats inside ``values`` while keeping first-seen order.
+    additions = [entry for entry in dict.fromkeys(values) if entry not in present]
+    target.extend(additions)
+
+
+def _with_trusted_read_directories(permission_context: Any, directories: list[str]) -> Any:
+    """Return a context whose ``trusted_read_directories`` also cover ``directories``, copying only on change."""
+    if not directories:
+        return permission_context
+    merged = list(getattr(permission_context, "trusted_read_directories", []))
+    size_before = len(merged)
+    _extend_unique(merged, directories)
+    # An unchanged length means every directory was already trusted, so the original object is reused.
+    grew = len(merged) != size_before
+    return replace(permission_context, trusted_read_directories=merged) if grew else permission_context
+
+
 def _filter_recalled_memory_content(content: str, selected_files: list[str]) -> str:
     keep = [_normalize_memory_filename(filename) for filename in selected_files]
     keep = [filename for filename in keep if filename]
@@ -129,6 +149,9 @@ def __init__(
         memory_recall_service: Any = None,
         system_prompt_refresher: Callable[[], str] | None = None,
         pause_event: asyncio.Event | None = None,
+        tool_context_trusted_read_directories: list[str] | None = None,
+        tool_context_relative_read_directories: list[str] | None = None,
+        pipeline_mode: bool = False,
     ) -> None:
         self._provider_manager = provider_manager
         self.system_prompt = system_prompt
@@ -141,6 +164,9 @@ def __init__(
         self._session_usage_totals = self._session_usage_store.load(self._cwd, self._session_id)
         self._permission_context = permission_context
         self._permission_context_getter = permission_context_getter
+        self._tool_context_trusted_read_directories = list(tool_context_trusted_read_directories or [])
+        self._tool_context_relative_read_directories = list(tool_context_relative_read_directories or [])
+        self._pipeline_mode = pipeline_mode
         self._auto_trigger_skills = auto_trigger_skills or []
         self._auto_loaded_skills: set[str] = set()
         self._current_git_branch: str | None = None
@@ -167,7 +193,7 @@ def __init__(
         self._result_storage = ResultStorage(
             storage_dir=os.path.join(str(get_config_dir()), "tool-results", self._session_id),
         )
-        self._pending_injections: deque[str] = deque()
+        self._pending_injections: deque[str | list[ContentBlock]] = deque()
         self._current_turn_text: str = ""
         self._accepting_injected_user_messages = False
         self._pause_event = pause_event
@@ -176,7 +202,7 @@ def __init__(
     def current_turn_text(self) -> str:
         return self._current_turn_text
 
-    def inject_user_message(self, msg: str) -> None:
+    def inject_user_message(self, msg: str | list[ContentBlock]) -> None:
         """Schedule a user message to be injected before the next LLM turn."""
         self._pending_injections.append(msg)
 
@@ -185,13 +211,27 @@ def can_accept_injected_user_message(self) -> bool:
         """Whether a queued supplement can still be consumed by this run."""
         return self._accepting_injected_user_messages
 
-    def try_inject_user_message(self, msg: str) -> bool:
+    def try_inject_user_message(self, msg: str | list[ContentBlock]) -> bool:
         """Queue a supplement only when this loop still has a consumable turn."""
         if not self.can_accept_injected_user_message:
             return False
         self.inject_user_message(msg)
         return True
 
+    def _drain_pending_injections(self) -> None:
+        """Move every queued injection into the context manager, oldest first, persisting each if possible."""
+        while self._pending_injections:
+            pending = self._pending_injections.popleft()
+            self.context_manager.add_user_message(pending)
+            # Persistence is optional: without session storage the message only reaches the context.
+            if not self._session_storage:
+                continue
+            # Function-scope import kept as in the original (presumably avoids an import cycle; confirm).
+            from iac_code.agent.message import Message
+
+            record = Message(role="user", content=pending)
+            self._session_storage.append(self._cwd, self._session_id, record, git_branch=self._current_git_branch)
+
     def set_provider(self, provider_manager: Any, system_prompt: str | None = None) -> None:
         """Swap the provider manager in place, preserving conversation history.
 
@@ -347,6 +387,7 @@ def _persist_context_messages(self) -> None:
             self._session_id,
             self.context_manager.get_messages(),
             git_branch=self._current_git_branch,
+            preserve_cleanup_prompts=True,
         )
 
     def _inject_recalled_memory_result(self, result: Any) -> bool:
@@ -765,8 +806,7 @@ async def _run_streaming_inner(
             # inject supplemental user text before the next provider call.
             if self._pause_event is not None:
                 await self._pause_event.wait()
-            while self._pending_injections:
-                self.context_manager.add_user_message(self._pending_injections.popleft())
+            self._drain_pending_injections()
             self._accepting_injected_user_messages = False
             self._current_turn_text = ""
 
@@ -900,7 +940,12 @@ async def _run_streaming_inner(
                             event_queue=queue,
                         )
                     )
-                context = ToolContext(cwd=self._cwd)
+                context = ToolContext(
+                    cwd=self._cwd,
+                    trusted_read_directories=list(self._tool_context_trusted_read_directories),
+                    relative_read_directories=list(self._tool_context_relative_read_directories),
+                    pipeline_mode=self._pipeline_mode,
+                )
 
                 allowed_requests: list[ToolCallRequest] = []
                 denied_results: list[tuple[ToolCallRequest, ToolResult]] = []
@@ -919,7 +964,14 @@ async def _run_streaming_inner(
                     if perm_ctx is not None:
                         from iac_code.services.permissions.pipeline import check_tool_permission
 
-                        permission = await check_tool_permission(tool, request.input, perm_ctx)
+                        effective_perm_ctx = _with_trusted_read_directories(
+                            perm_ctx, self._tool_context_trusted_read_directories
+                        )
+                        _extend_unique(context.additional_directories, list(effective_perm_ctx.additional_directories))
+                        _extend_unique(
+                            context.trusted_read_directories, list(effective_perm_ctx.trusted_read_directories)
+                        )
+                        permission = await check_tool_permission(tool, request.input, effective_perm_ctx)
                     else:
                         permission = await tool.check_permissions(request.input, {"cwd": context.cwd})
 
@@ -1271,6 +1323,7 @@ def stamp_last_turn_elapsed(self, elapsed: float) -> None:
                         self._session_id,
                         msgs,
                         git_branch=self._current_git_branch,
+                        preserve_cleanup_prompts=True,
                     )
                 break
 
diff --git a/src/iac_code/agent/message.py b/src/iac_code/agent/message.py
index 08547cc3..7a2b0eea 100644
--- a/src/iac_code/agent/message.py
+++ b/src/iac_code/agent/message.py
@@ -48,6 +48,7 @@ class ImageBlock(BaseModel):
     type: Literal["image"] = "image"
     media_type: str  # 'image/png' | 'image/jpeg' | 'image/gif' | 'image/webp'
     data: str  # base64
+    ref_id: int | None = None
 
 
 # Union type for all content blocks
diff --git a/src/iac_code/commands/prompt.py b/src/iac_code/commands/prompt.py
index 9089dbcd..24ab7f1c 100644
--- a/src/iac_code/commands/prompt.py
+++ b/src/iac_code/commands/prompt.py
@@ -14,6 +14,7 @@
 from typing import Any, cast
 
 from iac_code.agent.message import RECALLED_MEMORY_MARKER
+from iac_code.agent.message import Message as AgentMessage
 from iac_code.agent.system_prompt import DYNAMIC_BOUNDARY
 from iac_code.i18n import _
 from iac_code.utils.file_security import ensure_private_file
@@ -83,6 +84,14 @@ def build_prompt_snapshot(repl: object) -> dict[str, Any]:
         if "provider_messages" in last_request
         else _provider_messages(agent_loop)
     )
+    cleanup_messages = _cleanup_prompt_messages(repl, agent_loop)
+    provider_messages = _with_cleanup_prompt_messages(
+        repl,
+        agent_loop,
+        provider_messages,
+        cleanup_messages=cleanup_messages,
+    )
+    cleanup_prompts = _cleanup_prompt_snapshots(cleanup_messages)
     tools = list(last_request.get("tools") or []) if "tools" in last_request else _tool_definitions(agent_loop)
     status = _status_snapshot(repl)
     metadata = {
@@ -98,12 +107,22 @@ def build_prompt_snapshot(repl: object) -> dict[str, Any]:
         "system_prompt": system_prompt,
         "system_sections": _split_system_prompt(system_prompt),
         "provider_messages": provider_messages,
+        "cleanup_prompts": cleanup_prompts,
         "tools": tools,
         "memory_sections": _memory_sections(repl),
     }
 
 
 def _pipeline_prompt_snapshot(repl: object) -> dict[str, Any] | None:
+    runtime_getter = getattr(repl, "_get_runtime_mode", None)
+    if callable(runtime_getter):
+        try:
+            runtime_mode = runtime_getter()
+        except Exception:
+            runtime_mode = None
+        if str(getattr(runtime_mode, "value", runtime_mode)) != "pipeline":
+            return None
+
     pipeline = getattr(repl, "_pipeline", None)
     get_prompt_contexts = getattr(pipeline, "get_prompt_contexts", None)
     if not callable(get_prompt_contexts):
@@ -220,6 +239,14 @@ def render_prompt_html(snapshot: dict[str, Any]) -> str:
     provider_messages = "\n".join(
         _message_card(index, message) for index, message in enumerate(snapshot.get("provider_messages", []), start=1)
     )
+    cleanup_messages = list(snapshot.get("cleanup_prompts") or [])
+    if not cleanup_messages:
+        cleanup_messages = [
+            message for message in snapshot.get("provider_messages", []) if _is_cleanup_prompt_snapshot(message)
+        ]
+    cleanup_prompts = "\n".join(
+        _message_card(index, message) for index, message in enumerate(cleanup_messages, start=1)
+    )
     tools = "\n".join(_tool_card(tool) for tool in snapshot.get("tools", []))
     raw_system_prompt = _content_card(
         _("Raw Full System Prompt"),
@@ -232,7 +259,10 @@ def render_prompt_html(snapshot: dict[str, Any]) -> str:
         raw_system_prompt=raw_system_prompt,
     )
     messages_tab = provider_messages or '<p class="empty">{}</p>'.format(escape(_("No provider messages yet.")))
+    cleanup_tab = cleanup_prompts or '<p class="empty">{}</p>'.format(escape(_("No cleanup prompts in this snapshot.")))
     tools_tab = tools or '<p class="empty">{}</p>'.format(escape(_("No tools are currently registered.")))
+    cleanup_tab_button = _tab_button("cleanup", _("Cleanup Prompts")) if cleanup_messages else ""
+    cleanup_panel = _tab_panel("cleanup", cleanup_tab) if cleanup_messages else ""
     return """<!doctype html>
 <html lang="en">
 <head>
@@ -431,11 +461,13 @@ def render_prompt_html(snapshot: dict[str, Any]) -> str:
     {all_tab_button}
     {system_tab_button}
     {messages_tab_button}
+    {cleanup_tab_button}
     {tools_tab_button}
   </nav>
   {all_panel}
   {system_panel}
   {messages_panel}
+  {cleanup_panel}
   {tools_panel}
 </main>
 <script>
@@ -474,10 +506,12 @@ def render_prompt_html(snapshot: dict[str, Any]) -> str:
         all_tab_button=_tab_button("all", _("ALL"), selected=True),
         system_tab_button=_tab_button("system", _("System Prompt")),
         messages_tab_button=_tab_button("messages", _("Provider Messages")),
+        cleanup_tab_button=cleanup_tab_button,
         tools_tab_button=_tab_button("tools", _("Tools")),
         all_panel=_tab_panel("all", all_tab, active=True),
         system_panel=_tab_panel("system", system_tab),
         messages_panel=_tab_panel("messages", messages_tab),
+        cleanup_panel=cleanup_panel,
         tools_panel=_tab_panel("tools", tools_tab),
     )
 
@@ -513,6 +547,231 @@ def _provider_messages(agent_loop: object) -> list[dict[str, Any]]:
     return [_message_snapshot(message) for message in messages]
 
 
+def _is_cleanup_prompt_snapshot(message: Mapping[str, Any]) -> bool:
+    """Return True when ``message`` is badged as a cleanup prompt, including the translated "removed" variant."""
+    badge, plain = str(message.get("badge") or ""), _("cleanup prompt")
+    return badge in (plain, _("cleanup prompt · removed")) or badge.startswith("{} · ".format(plain))
+
+
+def _cleanup_prompt_snapshots(cleanup_messages: list[AgentMessage]) -> list[dict[str, Any]]:
+    """Snapshot each cleanup message that yields a message identity and badge it as a cleanup prompt."""
+    badged: list[dict[str, Any]] = []
+    for raw_message in cleanup_messages:
+        card = _message_snapshot(raw_message)
+        if _message_identity(card):
+            card["badge"] = _("cleanup prompt")
+            badged.append(card)
+    return badged
+
+
+def _with_cleanup_prompt_messages(
+    repl: object,
+    agent_loop: object,
+    provider_messages: list[dict[str, Any]],
+    *,
+    cleanup_messages: list[AgentMessage] | None = None,
+) -> list[dict[str, Any]]:
+    """Return shallow copies of ``provider_messages`` with cleanup prompts badged or re-inserted."""
+    annotated = [dict(entry) for entry in provider_messages]
+    if cleanup_messages is None:
+        cleanup_messages = _cleanup_prompt_messages(repl, agent_loop)
+    stored = _raw_session_messages(repl)
+    in_session_order = _session_ordered_cleanup_messages(stored, cleanup_messages)
+    handled = {_raw_cleanup_prompt_identity(prompt) for prompt in in_session_order}
+    # Prompts found in the session are badged in place, or inserted as "removed" when an index can be derived.
+    for prompt in in_session_order:
+        _insert_or_mark_cleanup_prompt_message(prompt, stored, annotated)
+    for prompt in cleanup_messages:  # the remaining prompts can only be badged where they already appear
+        if _raw_cleanup_prompt_identity(prompt) not in handled:
+            _mark_existing_cleanup_prompt_message(prompt, annotated)
+    return annotated
+
+
+def _session_ordered_cleanup_messages(
+    session_messages: list[AgentMessage], cleanup_messages: list[AgentMessage]
+) -> list[AgentMessage]:
+    """Return the session's cleanup prompts that match ``cleanup_messages``, in session order, without duplicates."""
+    from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+
+    pending = {_raw_cleanup_prompt_identity(candidate) for candidate in cleanup_messages}
+    in_order: list[AgentMessage] = []
+    for candidate in session_messages:
+        if not is_cleanup_prompt_message(candidate):
+            continue
+        key = _raw_cleanup_prompt_identity(candidate)
+        if key in pending:
+            # Dropping the key keeps only the first session message per identity.
+            pending.remove(key)
+            in_order.append(candidate)
+    return in_order
+
+
+def _insert_or_mark_cleanup_prompt_message(
+    cleanup_message: AgentMessage,
+    session_messages: list[AgentMessage],
+    provider_messages: list[dict[str, Any]],
+) -> None:
+    """Badge ``cleanup_message`` in ``provider_messages``, or insert a "removed" snapshot of it in place."""
+    already_present = _mark_existing_cleanup_prompt_message(cleanup_message, provider_messages)
+    if not already_present:
+        position = _removed_cleanup_prompt_insert_index(cleanup_message, session_messages, provider_messages)
+        if position is not None:
+            removed_card = _message_snapshot(cleanup_message)
+            removed_card["badge"] = _("cleanup prompt · removed")
+            provider_messages.insert(position, removed_card)
+
+
+def _mark_existing_cleanup_prompt_message(
+    cleanup_message: AgentMessage, provider_messages: list[dict[str, Any]]
+) -> bool:
+    """Badge every provider message sharing the cleanup message's identity; return True when any was badged."""
+    target = _message_identity(_message_snapshot(cleanup_message))
+    if target is None:
+        return False
+    badged_any = False
+    for entry in provider_messages:
+        if _message_identity(entry) == target:
+            entry["badge"] = _("cleanup prompt")
+            badged_any = True
+    return badged_any
+
+
+def _removed_cleanup_prompt_insert_index(
+    cleanup_message: AgentMessage,
+    session_messages: list[AgentMessage],
+    provider_messages: list[dict[str, Any]],
+) -> int | None:
+    """Locate where a cleanup prompt missing from ``provider_messages`` belongs.
+
+    The prompt's neighbours in ``session_messages`` are mapped to their positions in
+    ``provider_messages``; the index of the following neighbour is returned. ``None`` is
+    returned when the prompt is not in the session, when either neighbour cannot be
+    mapped, or when the neighbours are not in ascending provider order.
+    """
+    wanted = _raw_cleanup_prompt_identity(cleanup_message)
+    # First session entry carrying the same raw identity as the cleanup prompt.
+    session_index = next(
+        (at for at, stored in enumerate(session_messages) if _raw_cleanup_prompt_identity(stored) == wanted),
+        None,
+    )
+    if session_index is None:
+        return None
+
+    # Positions of the provider messages that can be matched unambiguously.
+    anchors = _unique_provider_message_positions(provider_messages)
+    # Closest mappable neighbours on either side of the prompt within the session.
+    before = _nearest_session_anchor_position(session_messages[:session_index], anchors, reverse=True)
+    after = _nearest_session_anchor_position(session_messages[session_index + 1 :], anchors, reverse=False)
+    # The following neighbour's index is the insertion point, provided both neighbours exist in order.
+    in_order = before is not None and after is not None and before < after
+    return after if in_order else None
+
+
+def _unique_provider_message_positions(provider_messages: list[dict[str, Any]]) -> dict[tuple[str, str], int]:
+    """Map each identity that occurs exactly once among non-cleanup provider messages to its index."""
+    tally: dict[tuple[str, str], list[int]] = {}
+    for position, entry in enumerate(provider_messages):
+        key = _message_identity(entry)
+        # Cleanup prompts and entries without an identity are left out of the map.
+        if key is not None and not _is_cleanup_prompt_snapshot(entry):
+            tally.setdefault(key, []).append(position)
+    # An identity seen more than once is ambiguous and therefore excluded.
+    return {key: hits[0] for key, hits in tally.items() if len(hits) == 1}
+
+
+def _nearest_session_anchor_position(
+    session_messages: list[AgentMessage],
+    provider_positions: dict[tuple[str, str], int],
+    *,
+    reverse: bool,
+) -> int | None:
+    """Return the provider position of the first non-cleanup session message that has one, or ``None``."""
+    from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+
+    # ``reverse`` walks the session back to front instead of front to back.
+    scan_order = reversed(session_messages) if reverse else session_messages
+    for candidate in scan_order:
+        if is_cleanup_prompt_message(candidate):
+            continue
+        key = _message_identity(_message_snapshot(candidate))
+        hit = None if key is None else provider_positions.get(key)
+        if hit is not None:
+            return hit
+    return None
+
+
+def _cleanup_prompt_messages(repl: object, agent_loop: object) -> list[AgentMessage]:
+    """Collect the distinct cleanup prompts known to the agent loop and the stored session.
+
+    Context messages are scanned before session messages; later duplicates of an identity are dropped.
+    """
+    from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+
+    candidates = _raw_context_messages(agent_loop) + _raw_session_messages(repl)
+    # A dict keeps insertion order, so the first message seen for each identity wins.
+    unique: dict[tuple[str, str, str, str], AgentMessage] = {}
+    for candidate in candidates:
+        if is_cleanup_prompt_message(candidate):
+            unique.setdefault(_raw_cleanup_prompt_identity(candidate), candidate)
+    return list(unique.values())
+
+
+def _raw_context_messages(agent_loop: object) -> list[AgentMessage]:
+    """Best-effort read of the ``AgentMessage`` objects returned by ``agent_loop.context_manager.get_messages``."""
+    fetch = getattr(getattr(agent_loop, "context_manager", None), "get_messages", None)
+    if callable(fetch):
+        try:
+            fetched = fetch()
+        except Exception:  # a failing getter is treated like a missing one
+            return []
+        return [item for item in list(fetched or []) if isinstance(item, AgentMessage)]
+    return []
+
+
+def _raw_session_messages(repl: object) -> list[AgentMessage]:
+    """Best-effort load of the ``AgentMessage`` objects stored for the REPL's ``_original_cwd`` and ``_session_id``."""
+    load = getattr(getattr(repl, "_session_storage", None), "load", None)
+    if not callable(load):
+        return []
+    # Both lookup keys must be plain strings before storage is consulted.
+    keys = (getattr(repl, "_original_cwd", None), getattr(repl, "_session_id", None))
+    if not all(isinstance(key, str) for key in keys):
+        return []
+    try:
+        loaded = load(*keys)
+    except Exception:  # a failing load is treated as an empty session
+        return []
+    return [item for item in list(loaded or []) if isinstance(item, AgentMessage)]
+
+
+def _raw_cleanup_prompt_identity(message: AgentMessage) -> tuple[str, str, str, str]:
+    """Build a ``(role, content, ledger path, status)`` key; metadata accepts camelCase or snake_case names."""
+    meta = getattr(message, "metadata", {}) or {}
+    meta = meta if isinstance(meta, Mapping) else {}
+    role = str(getattr(message, "role", "") or "")
+    content = _content_identity(getattr(message, "content", ""))
+    # The camelCase spelling takes precedence; a falsy value falls through to snake_case.
+    ledger_path = str(meta.get("cleanupLedgerPath") or meta.get("cleanup_ledger_path") or "")
+    status = str(meta.get("cleanupStatus") or meta.get("cleanup_status") or "")
+    return (role, content, ledger_path, status)
+
+
+def _message_identity(message: dict[str, Any]) -> tuple[str, str] | None:
+    """Return the ``(role, content)`` key used to match messages, or ``None`` when the content is empty."""
+    body = _content_identity(message.get("content", ""))
+    # An empty content string cannot identify a message.
+    return (str(message.get("role") or ""), body) if body else None
+
+
+def _content_identity(content: object) -> str:
+    """Return a comparable string for ``content``: str as-is, else key-sorted JSON, else ``str(content)``."""
+    try:
+        # ValueError (circular reference) is caught as well so unusual payloads still get an identity.
+        return content if isinstance(content, str) else json.dumps(content, sort_keys=True, ensure_ascii=False)
+    except (TypeError, ValueError):
+        return str(content)
+
+
 def _last_provider_request(agent_loop: object) -> dict[str, Any]:
     getter = getattr(agent_loop, "get_last_provider_request_snapshot", None)
     if not callable(getter):
@@ -677,6 +936,9 @@ def _render_all_tab(snapshot: dict[str, Any]) -> str:
     system_sections = list(snapshot.get("system_sections") or [])
     provider_messages = list(snapshot.get("provider_messages") or [])
     tools = list(snapshot.get("tools") or [])
+    cleanup_messages = list(snapshot.get("cleanup_prompts") or [])
+    if not cleanup_messages:
+        cleanup_messages = [message for message in provider_messages if _is_cleanup_prompt_snapshot(message)]
     has_recalled_memory = any(_is_recalled_memory_content(message.get("content", "")) for message in provider_messages)
     recalled_line = (
         _("Present in Provider Messages as a hidden conversation <system-reminder>.")
@@ -697,6 +959,7 @@ def _render_all_tab(snapshot: dict[str, Any]) -> str:
             _("   Details: Provider Messages tab"),
             _("   Messages: {count}").format(count=len(provider_messages)),
             _("   Recalled memory: {status}").format(status=recalled_line),
+            _("   Cleanup prompts: {count}").format(count=len(cleanup_messages)),
             "",
             _("3. Tools"),
             _("   Provider field: tools"),
@@ -724,6 +987,17 @@ def _render_all_tab(snapshot: dict[str, Any]) -> str:
                     status=_("present") if has_recalled_memory else _("not present"),
                 ),
             )
+            + (
+                _assembly_step(
+                    _("Cleanup Prompts"),
+                    "cleanup",
+                    _("Cleanup Prompts"),
+                    _("Rollback cleanup prompts are also shown separately for quick inspection."),
+                    _("{count} cleanup prompts").format(count=len(cleanup_messages)),
+                )
+                if cleanup_messages
+                else ""
+            )
             + _assembly_step(
                 _("3. Tools"),
                 "tools",
@@ -760,7 +1034,9 @@ def _message_card(index: int, message: dict[str, Any]) -> str:
     content = message.get("content", "")
     if not isinstance(content, str):
         content = json.dumps(content, indent=2, ensure_ascii=False)
-    badge = _("recalled memory") if _is_recalled_memory_content(message.get("content", "")) else _("message")
+    badge = str(message.get("badge") or "")
+    if not badge:
+        badge = _("recalled memory") if _is_recalled_memory_content(message.get("content", "")) else _("message")
     return _content_card("#{index} {role}".format(index=index, role=role), content, badge=badge)
 
 
diff --git a/src/iac_code/i18n/locales/de/LC_MESSAGES/messages.po b/src/iac_code/i18n/locales/de/LC_MESSAGES/messages.po
index 6a483705..3b0d4e7f 100644
--- a/src/iac_code/i18n/locales/de/LC_MESSAGES/messages.po
+++ b/src/iac_code/i18n/locales/de/LC_MESSAGES/messages.po
@@ -48,6 +48,38 @@ msgstr "Unsicherer Artefaktdateiname"
 msgid "Unknown error"
 msgstr "Unbekannter Fehler"
 
+#: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
+msgid ""
+"Cleanup state unavailable. Inspect the session file and cloud resources "
+"manually."
+msgstr ""
+"Bereinigungsstatus nicht verfügbar. Prüfen Sie die Sitzungsdatei und "
+"Cloud-Ressourcen manuell."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup deferred prompt state is unavailable. Please repair it "
+"before continuing."
+msgstr ""
+"Der verzögerte Prompt-Status der Rollback-Bereinigung ist nicht "
+"verfügbar. Bitte reparieren Sie ihn, bevor Sie fortfahren."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup state is unavailable. Please repair the cleanup ledger "
+"before continuing."
+msgstr ""
+"Der Status der Rollback-Bereinigung ist nicht verfügbar. Bitte reparieren"
+" Sie das Bereinigungs-Ledger, bevor Sie fortfahren."
+
+#: src/iac_code/a2a/executor.py src/iac_code/ui/repl.py
+msgid ""
+"Rollback cleanup is still in progress. Please continue after cleanup "
+"completes."
+msgstr ""
+"Die Rollback-Bereinigung läuft noch. Bitte fahren Sie fort, nachdem die "
+"Bereinigung abgeschlossen ist."
+
 #: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
 msgid "Task is already working."
 msgstr "Die Aufgabe läuft bereits."
@@ -57,6 +89,11 @@ msgstr "Die Aufgabe läuft bereits."
 msgid "Task canceled."
 msgstr "Aufgabe abgebrochen."
 
+#: src/iac_code/a2a/executor.py
+#, python-brace-format
+msgid "Current model {model} does not support image input."
+msgstr "Aktuelles Modell {model} unterstützt keine Bildeingabe."
+
 #: src/iac_code/a2a/pipeline_executor.py
 msgid "A temporary error occurred. Please retry."
 msgstr "Ein temporärer Fehler ist aufgetreten. Bitte erneut versuchen."
@@ -67,6 +104,11 @@ msgstr ""
 "Authentifizierung erforderlich. Anmeldedaten konfigurieren und erneut "
 "versuchen."
 
+#: src/iac_code/a2a/pipeline_executor.py
+#, python-brace-format
+msgid "Pipeline already running. Resume task {task_id}."
+msgstr "Pipeline läuft bereits. Setzen Sie Aufgabe {task_id} fort."
+
 #: src/iac_code/a2a/pipeline_recovery.py
 msgid "A2A pipeline state not found"
 msgstr "A2A-Pipeline-Zustand nicht gefunden"
@@ -500,6 +542,22 @@ msgstr "KI-gestütztes Tool zur Orchestrierung von Infrastruktur"
 msgid "Use iac-code as an A2A client."
 msgstr "iac-code als A2A-Client verwenden."
 
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A client dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"A2A-Client-Abhängigkeiten fehlen. Installieren mit: pip install 'iac-"
+"code[a2a]'"
+
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A server dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"A2A-Server-Abhängigkeiten fehlen. Installieren mit: pip install 'iac-"
+"code[a2a]'"
+
 #: src/iac_code/cli/main.py
 msgid "Install Git for Windows via the npmmirror mirror (Windows only)."
 msgstr "Git for Windows über den npmmirror-Spiegel installieren (nur Windows)."
@@ -512,14 +570,6 @@ msgstr "iac-code auf die neueste Version aktualisieren."
 msgid "YAML config file containing A2A client options"
 msgstr "YAML-Konfigurationsdatei mit A2A-Client-Optionen"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A client dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"A2A-Client-Abhängigkeiten fehlen. Installieren mit: pip install 'iac-"
-"code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "LLM model to use"
 msgstr "Zu verwendendes LLM-Modell"
@@ -658,14 +708,6 @@ msgstr ""
 "Legt A2A-Thinking-Signaltypen offen; fuer mehrere Werte wiederholen. "
 "Werte: raw-thinking, tool-trace."
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A server dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"A2A-Server-Abhängigkeiten fehlen. Installieren mit: pip install 'iac-"
-"code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "Send a prompt to an A2A JSON-RPC endpoint."
 msgstr "Sendet einen Prompt an einen A2A-JSON-RPC-Endpunkt."
@@ -1562,10 +1604,18 @@ msgstr "Der System-Prompt ist leer."
 msgid "No provider messages yet."
 msgstr "Noch keine Anbieternachrichten."
 
+#: src/iac_code/commands/prompt.py
+msgid "No cleanup prompts in this snapshot."
+msgstr "In diesem Snapshot gibt es keine Bereinigungs-Prompts."
+
 #: src/iac_code/commands/prompt.py
 msgid "No tools are currently registered."
 msgstr "Derzeit sind keine Tools registriert."
 
+#: src/iac_code/commands/prompt.py
+msgid "Cleanup Prompts"
+msgstr "Bereinigungs-Prompts"
+
 #: src/iac_code/commands/prompt.py
 msgid "IAC-CODE Prompt Snapshot"
 msgstr "IAC-CODE-Prompt-Snapshot"
@@ -1602,6 +1652,14 @@ msgstr "Anbieternachrichten"
 msgid "Tools"
 msgstr "Tools"
 
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt"
+msgstr "Bereinigungs-Prompt"
+
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt · removed"
+msgstr "Bereinigungs-Prompt · entfernt"
+
 #: src/iac_code/commands/prompt.py
 msgid "Instruction Memory"
 msgstr "Anweisungsspeicher"
@@ -1681,6 +1739,11 @@ msgstr "   Nachrichten: {count}"
 msgid "   Recalled memory: {status}"
 msgstr "   Abgerufener Speicher: {status}"
 
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "   Cleanup prompts: {count}"
+msgstr "   Bereinigungs-Prompts: {count}"
+
 #: src/iac_code/commands/prompt.py
 msgid "3. Tools"
 msgstr "3. Tools"
@@ -1730,6 +1793,17 @@ msgstr "vorhanden"
 msgid "not present"
 msgstr "nicht vorhanden"
 
+#: src/iac_code/commands/prompt.py
+msgid "Rollback cleanup prompts are also shown separately for quick inspection."
+msgstr ""
+"Rollback-Bereinigungs-Prompts werden zur schnellen Prüfung auch separat "
+"angezeigt."
+
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "{count} cleanup prompts"
+msgstr "{count} Bereinigungs-Prompts"
+
 #: src/iac_code/commands/prompt.py
 msgid "Tool definitions available to the main model for this request."
 msgstr "Für diese Anfrage verfügbare Tooldefinitionen für das Hauptmodell."
@@ -1761,6 +1835,7 @@ msgid "Input schema"
 msgstr "Eingabeschema"
 
 #: src/iac_code/commands/prompt.py
+#: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid "tool"
 msgstr "Tool"
 
@@ -2055,6 +2130,25 @@ msgstr ""
 msgid "Memory name to read. Omit to list all."
 msgstr "Name des zu lesenden Speichers. Weglassen, um alle aufzulisten."
 
+#: src/iac_code/memory/memory_tools.py
+#, python-brace-format
+msgid ""
+"{base}\n"
+"\n"
+"Available memories:\n"
+"{index}\n"
+"\n"
+"Call read_memory again with one of these names, or omit name to list all "
+"memories."
+msgstr ""
+"{base}\n"
+"\n"
+"Verfügbare Speicher:\n"
+"{index}\n"
+"\n"
+"Rufen Sie read_memory erneut mit einem dieser Namen auf, oder lassen Sie "
+"name weg, um alle Speicher aufzulisten."
+
 #: src/iac_code/memory/memory_tools.py
 #, python-brace-format
 msgid ""
@@ -2157,6 +2251,148 @@ msgstr "ask_user_question erfordert eine Pipeline-Ereigniswarteschlange."
 msgid "User cancelled ask_user_question."
 msgstr "Der Benutzer hat ask_user_question abgebrochen."
 
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"Cloud resources still need cleanup after pipeline rollback. Clean them up"
+" now and keep checking until deletion completes."
+msgstr ""
+"Cloud-Ressourcen müssen nach dem Pipeline-Rollback noch bereinigt werden."
+" Bereinigen Sie sie jetzt und prüfen Sie weiter, bis die Löschung "
+"abgeschlossen ist."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Requirements:"
+msgstr "Anforderungen:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup scope is a strict allowlist: delete only ids in the cleanup "
+"resources list below."
+msgstr ""
+"- Der Bereinigungsumfang ist eine strikte Allowlist: Löschen Sie nur die "
+"IDs in der unten stehenden Bereinigungsressourcenliste."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not delete, modify, or roll back any stack or cloud resource outside"
+" the cleanup resources list."
+msgstr ""
+"- Löschen, ändern oder rollen Sie keine Stacks oder Cloud-Ressourcen "
+"außerhalb der Bereinigungsressourcenliste zurück."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not call ListStacks or search for other stacks by name; cleanup "
+"resource ids are fully listed."
+msgstr ""
+"- Rufen Sie ListStacks nicht auf und suchen Sie nicht nach anderen Stacks"
+" anhand des Namens; die Bereinigungsressourcen-IDs sind vollständig "
+"aufgeführt."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Before every GetStack/DeleteStack call, verify that StackId exactly "
+"matches an id in the cleanup resources list."
+msgstr ""
+"- Prüfen Sie vor jedem GetStack/DeleteStack-Aufruf, dass die StackId "
+"genau mit einer ID in der Bereinigungsressourcenliste übereinstimmt."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If StackId is not in the cleanup resources list, do not call "
+"DeleteStack, even if it is the current handoff or newly created stack."
+msgstr ""
+"- Wenn die StackId nicht in der Bereinigungsressourcenliste steht, rufen "
+"Sie DeleteStack nicht auf, selbst wenn es der aktuelle Handoff- oder neu "
+"erstellte Stack ist."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not infer extra cleanup targets from pipeline handoff, "
+"deployment.stack_id, current stack, or resources_created; those may be "
+"final delivered resources."
+msgstr ""
+"- Leiten Sie keine zusätzlichen Bereinigungsziele aus Pipeline-Handoff, "
+"deployment.stack_id, aktuellem Stack oder resources_created ab; das "
+"können finale Auslieferungsressourcen sein."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not expand cleanup scope for user follow-ups, continue instructions,"
+" or pipeline handoff context."
+msgstr ""
+"- Erweitern Sie den Bereinigungsumfang nicht aufgrund von Benutzer-"
+"Rückfragen, Continue-Anweisungen oder Pipeline-Handoff-Kontext."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- When resuming cleanup, still process only resources listed in this "
+"prompt; do not inspect or delete others."
+msgstr ""
+"- Verarbeiten Sie beim Fortsetzen der Bereinigung weiterhin nur die in "
+"diesem Prompt aufgeführten Ressourcen; prüfen oder löschen Sie keine "
+"anderen."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Prefer available ROS stack tools for deletion; if using aliyun_api, "
+"call DeleteStack first, then repeatedly call GetStack to check status."
+msgstr ""
+"- Verwenden Sie für die Löschung bevorzugt verfügbare ROS-Stack-Tools; "
+"wenn Sie aliyun_api verwenden, rufen Sie zuerst DeleteStack auf und "
+"anschließend wiederholt GetStack, um den Status zu prüfen."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If a resource is already deleting, call GetStack first, then decide "
+"whether DeleteStack is needed again."
+msgstr ""
+"- Wenn eine Ressource bereits gelöscht wird, rufen Sie zuerst GetStack "
+"auf und entscheiden Sie dann, ob DeleteStack erneut nötig ist."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup is complete only after DELETE_COMPLETE; for DELETE_FAILED or "
+"unknown status, tell the user the failure reason and next step."
+msgstr ""
+"- Die Bereinigung ist erst nach DELETE_COMPLETE abgeschlossen; bei "
+"DELETE_FAILED oder unbekanntem Status nennen Sie dem Benutzer den "
+"Fehlergrund und den nächsten Schritt."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- After all listed resources are DELETE_COMPLETE, stop this cleanup turn "
+"immediately."
+msgstr ""
+"- Nachdem alle aufgeführten Ressourcen DELETE_COMPLETE erreicht haben, "
+"beenden Sie diesen Bereinigungsschritt sofort."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "- Briefly update the user during cleanup."
+msgstr ""
+"- Informieren Sie den Benutzer während der Bereinigung kurz über den "
+"Fortschritt."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Cleanup resources:"
+msgstr "Bereinigungsressourcen:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid ""
+"{index}. provider={provider}, type={resource_type}, id={resource_id}, "
+"name={name}, region={region}"
+msgstr ""
+"{index}. Anbieter={provider}, Typ={resource_type}, ID={resource_id}, "
+"Name={name}, Region={region}"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid "Detected {count} rollback cleanup resources; starting cleanup."
+msgstr ""
+"{count} Rollback-Bereinigungsressourcen erkannt; Bereinigung wird "
+"gestartet."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid ""
 "Complete the current step by calling this tool to submit the conclusion. "
@@ -2260,23 +2496,52 @@ msgstr ""
 "{message} complete_step.conclusion muss eines dieser Felder enthalten: "
 "{fields}."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "A successful tool result is required before completing the current step."
+msgstr ""
+"Vor dem Abschluss des aktuellen Schritts ist ein erfolgreiches Tool-"
+"Ergebnis erforderlich."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
-msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgid ""
+"{message} complete_step.conclusion.{field} must match the {tool} result "
+"value {value}."
 msgstr ""
-"Die Anzahl der Kandidaten darf {limit} nicht überschreiten; {count} "
-"wurden übermittelt."
+"{message} complete_step.conclusion.{field} muss dem Ergebniswert {value} "
+"von {tool} entsprechen."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "<missing>"
+msgstr "<fehlt>"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " with status {statuses}"
+msgstr " mit Status {statuses}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " and is_success={expected}"
+msgstr " und is_success={expected}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " one of {actions}"
+msgstr " mit einer der Aktionen {actions}"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid ""
-"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
-"user for help or narrow the rollback targets before calling "
-"complete_step."
+"{message} Call {tool}{action} first and wait for a successful "
+"result{status_hint}{success_hint}."
 msgstr ""
-"Die Anzahl der Rücksetzungsziele darf {limit} nicht überschreiten; es "
-"gibt {count}. Bitten Sie den Benutzer um Hilfe oder grenzen Sie die Ziele"
-" ein, bevor Sie complete_step aufrufen."
+"{message} Rufen Sie zuerst {tool}{action} auf und warten Sie auf ein "
+"erfolgreiches Ergebnis{status_hint}{success_hint}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "the required tool"
+msgstr "das erforderliche Tool"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
@@ -2288,6 +2553,24 @@ msgstr ""
 "Schließen Sie den aktuellen Schritt ab oder bitten Sie den Benutzer um "
 "Hilfe."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgstr ""
+"Die Anzahl der Kandidaten darf {limit} nicht überschreiten; {count} "
+"wurden übermittelt."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid ""
+"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
+"user for help or narrow the rollback targets before calling "
+"complete_step."
+msgstr ""
+"Die Anzahl der Rücksetzungsziele darf {limit} nicht überschreiten; es "
+"gibt {count}. Bitten Sie den Benutzer um Hilfe oder grenzen Sie die Ziele"
+" ein, bevor Sie complete_step aufrufen."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid "Schema validation failed after {attempts} attempts: {error}"
@@ -2314,6 +2597,10 @@ msgstr ""
 msgid "Step {step_id} completed. Conclusion submitted."
 msgstr "Schritt {step_id} abgeschlossen. Schlussfolgerung übermittelt."
 
+#: src/iac_code/pipeline/engine/pipeline_runner.py
+msgid "Pipeline state persistence failed."
+msgstr "Persistenz des Pipeline-Zustands fehlgeschlagen."
+
 #: src/iac_code/pipeline/engine/pipeline_runner.py
 #: src/iac_code/pipeline/engine/sub_pipeline_executor.py
 #: src/iac_code/ui/repl.py
@@ -2414,6 +2701,10 @@ msgstr "Der Template-Dateipfad muss relativ zum Arbeitsverzeichnis sein"
 msgid "Template file path cannot escape the working directory"
 msgstr "Der Template-Dateipfad darf das Arbeitsverzeichnis nicht verlassen"
 
+#: src/iac_code/pipeline/engine/user_input.py
+msgid "[Image input]"
+msgstr "[Bildeingabe]"
+
 #: src/iac_code/pipeline/selling/tools/show_candidate_detail_tool.py
 msgid ""
 "Display candidate details (summary and cost breakdown) in the comparison "
@@ -3302,6 +3593,17 @@ msgstr "ROS Stack"
 msgid "CloudStackInstances"
 msgstr "CloudStackInstances"
 
+#: src/iac_code/tools/cloud/aliyun/template_source.py
+msgid ""
+"ROS template calls must use TemplateURL instead of TemplateBody. Save the"
+" template to a file and pass params.TemplateURL, for example a local file"
+" path or OSS/HTTP URL."
+msgstr ""
+"ROS-Vorlagenaufrufe müssen TemplateURL statt TemplateBody verwenden. "
+"Speichern Sie die Vorlage in einer Datei und übergeben Sie "
+"params.TemplateURL, zum Beispiel einen lokalen Dateipfad oder eine OSS"
+"/HTTP-URL."
+
 #: src/iac_code/tools/cloud/aliyun/hooks/ros_validate.py
 #, python-brace-format
 msgid "Template YAML syntax error: {}"
@@ -3418,11 +3720,11 @@ msgstr "Unterbrochen"
 msgid "Running"
 msgstr "Läuft"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Completed"
 msgstr "Abgeschlossen"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Failed"
 msgstr "Fehlgeschlagen"
 
@@ -3699,8 +4001,130 @@ msgid "Command has no handler: {name}"
 msgstr "Kein Handler für Befehl: {name}"
 
 #: src/iac_code/ui/repl.py
-msgid "Note: images are not supported in pipeline mode and will be ignored."
-msgstr "Hinweis: Bilder werden im Pipeline-Modus nicht unterstützt und ignoriert."
+#, python-brace-format
+msgid "↺ Rollback cleanup [{badge}] {label}"
+msgstr "↺ Rollback-Bereinigung [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{kind} {resource_id}"
+msgstr "{kind} {resource_id}"
+
+#: src/iac_code/ui/repl.py
+msgid "Deleting"
+msgstr "Wird gelöscht"
+
+#: src/iac_code/ui/repl.py
+msgid "Skipped"
+msgstr "Übersprungen"
+
+#: src/iac_code/ui/repl.py
+msgid "Pending"
+msgstr "Ausstehend"
+
+#: src/iac_code/ui/repl.py
+msgid "Checking"
+msgstr "Wird geprüft"
+
+#: src/iac_code/ui/repl.py
+msgid "Progress"
+msgstr "Fortschritt"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "DeleteStack submitted; waiting for deletion to complete ({progress})"
+msgstr "DeleteStack übermittelt; warte auf Abschluss der Löschung ({progress})"
+
+#: src/iac_code/ui/repl.py
+msgid "DeleteStack submitted; waiting for deletion to complete"
+msgstr "DeleteStack übermittelt; warte auf Abschluss der Löschung"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Deleting ({progress})"
+msgstr "Wird gelöscht ({progress})"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{progress}; deletion required"
+msgstr "{progress}; Löschung erforderlich"
+
+#: src/iac_code/ui/repl.py
+msgid "stack"
+msgstr "Stack"
+
+#: src/iac_code/ui/repl.py
+msgid "resource"
+msgstr "Ressource"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Could not read rollback cleanup records. The cleanup prompt was kept; "
+"retry later or inspect manually."
+msgstr ""
+"Rollback-Bereinigungsdatensätze konnten nicht gelesen werden. Der "
+"Bereinigungs-Prompt wurde beibehalten; versuchen Sie es später erneut "
+"oder prüfen Sie manuell."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} additional resources needing attention were not shown."
+msgstr ""
+"{count} weitere Ressourcen, die Aufmerksamkeit erfordern, wurden nicht "
+"angezeigt."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: all {count} records are completed."
+msgstr ""
+"↺ Rollback-Bereinigung fortsetzen: Alle {count} Datensätze sind "
+"abgeschlossen."
+
+#: src/iac_code/ui/repl.py
+msgid "failed"
+msgstr "fehlgeschlagen"
+
+#: src/iac_code/ui/repl.py
+msgid "pending"
+msgstr "ausstehend"
+
+#: src/iac_code/ui/repl.py
+msgid "in progress"
+msgstr "in Bearbeitung"
+
+#: src/iac_code/ui/repl.py
+msgid "completed"
+msgstr "abgeschlossen"
+
+#: src/iac_code/ui/repl.py
+msgid "skipped"
+msgstr "übersprungen"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} {label}"
+msgstr "{count} {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records, {summary}."
+msgstr "↺ Rollback-Bereinigung fortsetzen: {count} Datensätze, {summary}."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records."
+msgstr "↺ Rollback-Bereinigung fortsetzen: {count} Datensätze."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "  [{badge}] {label}"
+msgstr "  [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+msgid "Detected rollback cleanup resources, but cleanup prompt injection failed."
+msgstr ""
+"Rollback-Bereinigungsressourcen wurden erkannt, aber das Einfügen des "
+"Bereinigungs-Prompts ist fehlgeschlagen."
 
 #: src/iac_code/ui/repl.py
 #, python-brace-format
@@ -3709,11 +4133,28 @@ msgstr "Gespeicherter Pipeline-Zustand wird ignoriert: {reason}"
 
 #: src/iac_code/ui/repl.py
 msgid ""
-"Pipeline completed. Normal chat is active, but the handoff context could "
-"not be injected or saved."
+"Pipeline state persistence failed. The pipeline is paused; do not "
+"continue until state is durable."
 msgstr ""
-"Die Pipeline wurde abgeschlossen. Der normale Chat ist aktiv, aber der "
-"Übergabekontext konnte nicht eingefügt oder gespeichert werden."
+"Persistenz des Pipeline-Zustands fehlgeschlagen. Die Pipeline ist "
+"pausiert; fahren Sie nicht fort, bis der Zustand dauerhaft gespeichert "
+"ist."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline state persistence failed. Normal chat handoff was not marked "
+"durable."
+msgstr ""
+"Persistenz des Pipeline-Zustands fehlgeschlagen. Der Handoff zum normalen"
+" Chat wurde nicht dauerhaft markiert."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline completed, but the handoff context could not be injected or "
+"saved."
+msgstr ""
+"Pipeline abgeschlossen, aber der Handoff-Kontext konnte nicht eingefügt "
+"oder gespeichert werden."
 
 #: src/iac_code/ui/repl.py
 msgid "Judging your input..."
@@ -3893,6 +4334,11 @@ msgstr "  ✓ {name}: abgeschlossen\n"
 msgid "  ✘ {name}: Failed"
 msgstr "  ✘ {name}: fehlgeschlagen"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Pipeline warning: {reason}"
+msgstr "Pipeline-Warnung: {reason}"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Option {index}"
@@ -3974,6 +4420,15 @@ msgstr "unbekannter Fehler"
 msgid "Resumed pipeline at step: {step}"
 msgstr "Pipeline bei Schritt fortgesetzt: {step}"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Could not read pipeline state metadata: {reason}"
+msgstr "Pipeline-Zustandsmetadaten konnten nicht gelesen werden: {reason}"
+
+#: src/iac_code/ui/repl.py
+msgid "Pipeline state metadata is invalid; continuing as normal chat."
+msgstr "Pipeline-Zustandsmetadaten sind ungültig; es wird als normaler Chat fortgefahren."
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Found pipeline state in this session (paused at: {step})."
@@ -4536,3 +4991,207 @@ msgstr "Stacktrace im öffentlichen Ereignis ausgelassen; siehe error_id."
 
 #~ msgid "Project Memory Index"
 #~ msgstr "Projektspeicherindex"
+
+#~ msgid "检测到 pipeline rollback 后仍需要清理的云资源。请立即清理这些资源，并持续检查直到删除完成。"
+#~ msgstr ""
+#~ "Es wurden Cloud-Ressourcen erkannt, die"
+#~ " nach dem Pipeline-Rollback noch "
+#~ "bereinigt werden müssen. Bereinigen Sie "
+#~ "sie sofort und prüfen Sie weiter, "
+#~ "bis das Löschen abgeschlossen ist."
+
+#~ msgid "要求："
+#~ msgstr "Anforderungen:"
+
+#~ msgid "- 清理范围是严格白名单：只能删除下面“待清理资源”列表中的 id。"
+#~ msgstr ""
+#~ "- Der Bereinigungsumfang ist eine "
+#~ "strikte Positivliste: Es dürfen nur die"
+#~ " IDs in der folgenden Liste „Zu "
+#~ "bereinigende Ressourcen“ gelöscht werden."
+
+#~ msgid "- 不要删除、修改或回滚任何未列入“待清理资源”的 stack 或云资源。"
+#~ msgstr ""
+#~ "- Löschen, ändern oder rollen Sie "
+#~ "keine Stacks oder Cloud-Ressourcen "
+#~ "zurück, die nicht unter „Zu bereinigende"
+#~ " Ressourcen“ aufgeführt sind."
+
+#~ msgid "- 不要调用 ListStacks 或按名称搜索其它 stack；待清理资源 id 已完整列出。"
+#~ msgstr ""
+#~ "- ListStacks nicht aufrufen und nicht"
+#~ " nach anderen Stacks per Name suchen;"
+#~ " die IDs der zu bereinigenden "
+#~ "Ressourcen sind vollständig aufgelistet."
+
+#~ msgid "- 每次调用 GetStack/DeleteStack 前，必须核对 StackId 精确等于“待清理资源”列表中的某个 id。"
+#~ msgstr ""
+#~ "- Vor jedem Aufruf von "
+#~ "GetStack/DeleteStack muss geprüft werden, "
+#~ "dass StackId exakt einer ID in der"
+#~ " Liste der zu bereinigenden Ressourcen "
+#~ "entspricht."
+
+#~ msgid "- 如果 StackId 不在“待清理资源”列表中，禁止调用 DeleteStack，即使它是当前 handoff 或刚创建的 stack。"
+#~ msgstr ""
+#~ "- Wenn StackId nicht in der Liste"
+#~ " der zu bereinigenden Ressourcen steht, "
+#~ "darf DeleteStack nicht aufgerufen werden, "
+#~ "selbst wenn es der aktuelle Handoff-"
+#~ "Stack oder ein gerade erstellter Stack"
+#~ " ist."
+
+#~ msgid ""
+#~ "- 不要根据 pipeline handoff、deployment.stack_id、current"
+#~ " stack 或 resources_created "
+#~ "额外推断清理对象；这些可能是最终成功交付的资源。"
+#~ msgstr ""
+#~ "- Leiten Sie keine zusätzlichen "
+#~ "Bereinigungsobjekte aus pipeline handoff, "
+#~ "deployment.stack_id, current stack oder "
+#~ "resources_created ab; sie können erfolgreich"
+#~ " bereitgestellte Endressourcen sein."
+
+#~ msgid "- 即使本轮还有用户追问、继续指令或 pipeline handoff 上下文，也不能扩大清理范围。"
+#~ msgstr ""
+#~ "- Auch bei weiteren Nutzerfragen, "
+#~ "Fortsetzungsanweisungen oder Pipeline-Handoff-"
+#~ "Kontext in dieser Runde darf der "
+#~ "Bereinigungsumfang nicht erweitert werden."
+
+#~ msgid "- 恢复或继续清理时仍只处理当前提示列出的资源；不要检查或删除其它资源。"
+#~ msgstr ""
+#~ "- Beim Wiederaufnehmen oder Fortsetzen "
+#~ "der Bereinigung nur die in diesem "
+#~ "Hinweis aufgelisteten Ressourcen verarbeiten; "
+#~ "keine anderen Ressourcen prüfen oder "
+#~ "löschen."
+
+#~ msgid ""
+#~ "- 优先使用可用的 ROS stack 工具删除；如果改用 "
+#~ "aliyun_api，请先 DeleteStack，再反复 GetStack 检查状态。"
+#~ msgstr ""
+#~ "- Verwenden Sie bevorzugt das verfügbare"
+#~ " ROS-stack-Tool zum Löschen; wenn "
+#~ "Sie aliyun_api nutzen, führen Sie zuerst"
+#~ " DeleteStack aus und prüfen Sie den"
+#~ " Status wiederholt mit GetStack."
+
+#~ msgid "- 如果资源已经处于删除中，请先 GetStack 检查当前状态，再决定是否需要重新 DeleteStack。"
+#~ msgstr ""
+#~ "- Wenn die Ressource bereits gelöscht"
+#~ " wird, prüfen Sie zuerst den "
+#~ "aktuellen Status mit GetStack, bevor Sie"
+#~ " entscheiden, ob DeleteStack erneut nötig"
+#~ " ist."
+
+#~ msgid "- 只有确认 DELETE_COMPLETE 才算清理完成；DELETE_FAILED 或无法确认时要向用户说明失败原因和下一步。"
+#~ msgstr ""
+#~ "- Die Bereinigung gilt erst nach "
+#~ "Bestätigung von DELETE_COMPLETE als "
+#~ "abgeschlossen; bei DELETE_FAILED oder "
+#~ "fehlender Bestätigung erklären Sie dem "
+#~ "Nutzer die Fehlerursache und den "
+#~ "nächsten Schritt."
+
+#~ msgid "- 列表内资源全部 DELETE_COMPLETE 后，立刻停止本轮清理；不要继续删除或检查任何其他 stack。"
+#~ msgstr ""
+#~ "- Sobald alle Ressourcen in der "
+#~ "Liste DELETE_COMPLETE erreicht haben, stoppen"
+#~ " Sie diese Bereinigung sofort; löschen "
+#~ "oder prüfen Sie keine anderen Stacks."
+
+#~ msgid "- 清理过程中向用户简短同步进度。"
+#~ msgstr ""
+#~ "- Informieren Sie den Nutzer während "
+#~ "der Bereinigung kurz über den "
+#~ "Fortschritt."
+
+#~ msgid "待清理资源："
+#~ msgstr "Zu bereinigende Ressourcen:"
+
+#~ msgid "检测到 {count} 个回滚残留资源，开始清理流程。"
+#~ msgstr ""
+#~ "{count} verbleibende Rollback-Ressourcen "
+#~ "erkannt; Bereinigungsablauf wird gestartet."
+
+#~ msgid "错误：{error}"
+#~ msgstr "Fehler: {error}"
+
+#~ msgid "删除中"
+#~ msgstr "Wird gelöscht"
+
+#~ msgid "完成"
+#~ msgstr "Abgeschlossen"
+
+#~ msgid "失败"
+#~ msgstr "Fehlgeschlagen"
+
+#~ msgid "跳过"
+#~ msgstr "Übersprungen"
+
+#~ msgid "待处理"
+#~ msgstr "Ausstehend"
+
+#~ msgid "检查"
+#~ msgstr "Prüfen"
+
+#~ msgid "进度"
+#~ msgstr "Fortschritt"
+
+#~ msgid "DeleteStack 已提交，等待删除完成（{progress}）"
+#~ msgstr ""
+#~ "DeleteStack wurde übermittelt; warte auf "
+#~ "Abschluss des Löschvorgangs ({progress})"
+
+#~ msgid "DeleteStack 已提交，等待删除完成"
+#~ msgstr "DeleteStack wurde übermittelt; warte auf Abschluss des Löschvorgangs"
+
+#~ msgid "已跳过"
+#~ msgstr "Übersprungen"
+
+#~ msgid "正在删除（{progress}）"
+#~ msgstr "Wird gelöscht ({progress})"
+
+#~ msgid "{progress}，需要删除"
+#~ msgstr "{progress}, Löschen erforderlich"
+
+#~ msgid "资源栈"
+#~ msgstr "Ressourcen-Stack"
+
+#~ msgid "资源"
+#~ msgstr "Ressource"
+
+#~ msgid "无法读取回滚清理记录，已保留清理提示，请稍后继续或手动检查。"
+#~ msgstr ""
+#~ "Das Rollback-Bereinigungsprotokoll konnte "
+#~ "nicht gelesen werden; der Bereinigungs-"
+#~ "Prompt wurde beibehalten. Fahren Sie "
+#~ "später fort oder prüfen Sie manuell."
+
+#~ msgid "还有 {count} 个需要关注的资源未显示。"
+#~ msgstr ""
+#~ "{count} weitere Ressourcen, die Aufmerksamkeit"
+#~ " erfordern, werden nicht angezeigt."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录均已完成。"
+#~ msgstr ""
+#~ "↺ Wiederaufnahme der Rollback-Bereinigung: "
+#~ "Alle {count} Einträge sind abgeschlossen."
+
+#~ msgid "进行中"
+#~ msgstr "In Bearbeitung"
+
+#~ msgid "已完成"
+#~ msgstr "Abgeschlossen"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+#~ msgstr "↺ Wiederaufnahme der Rollback-Bereinigung: {count} Einträge, {summary}."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录。"
+#~ msgstr "↺ Wiederaufnahme der Rollback-Bereinigung: {count} Einträge."
+
+#~ msgid "Note: images are not supported in pipeline mode and will be ignored."
+#~ msgstr ""
+#~ "Hinweis: Bilder werden im Pipeline-Modus"
+#~ " nicht unterstützt und ignoriert."
diff --git a/src/iac_code/i18n/locales/es/LC_MESSAGES/messages.po b/src/iac_code/i18n/locales/es/LC_MESSAGES/messages.po
index bea9968e..328ccf8c 100644
--- a/src/iac_code/i18n/locales/es/LC_MESSAGES/messages.po
+++ b/src/iac_code/i18n/locales/es/LC_MESSAGES/messages.po
@@ -49,6 +49,38 @@ msgstr "Nombre de archivo de artefacto no seguro"
 msgid "Unknown error"
 msgstr "Error desconocido"
 
+#: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
+msgid ""
+"Cleanup state unavailable. Inspect the session file and cloud resources "
+"manually."
+msgstr ""
+"Estado de limpieza no disponible. Inspeccione manualmente el archivo de "
+"sesión y los recursos en la nube."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup deferred prompt state is unavailable. Please repair it "
+"before continuing."
+msgstr ""
+"El estado del prompt diferido de limpieza de rollback no está disponible."
+" Repárelo antes de continuar."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup state is unavailable. Please repair the cleanup ledger "
+"before continuing."
+msgstr ""
+"El estado de limpieza de rollback no está disponible. Repare el registro "
+"de limpieza antes de continuar."
+
+#: src/iac_code/a2a/executor.py src/iac_code/ui/repl.py
+msgid ""
+"Rollback cleanup is still in progress. Please continue after cleanup "
+"completes."
+msgstr ""
+"La limpieza de rollback sigue en curso. Continúe cuando termine la "
+"limpieza."
+
 #: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
 msgid "Task is already working."
 msgstr "La tarea ya está en ejecución."
@@ -58,6 +90,11 @@ msgstr "La tarea ya está en ejecución."
 msgid "Task canceled."
 msgstr "Tarea cancelada."
 
+#: src/iac_code/a2a/executor.py
+#, python-brace-format
+msgid "Current model {model} does not support image input."
+msgstr "El modelo actual {model} no admite entrada de imagen."
+
 #: src/iac_code/a2a/pipeline_executor.py
 msgid "A temporary error occurred. Please retry."
 msgstr "Se produjo un error temporal. Inténtalo de nuevo."
@@ -68,6 +105,11 @@ msgstr ""
 "Se requiere autenticación. Configura las credenciales e inténtalo de "
 "nuevo."
 
+#: src/iac_code/a2a/pipeline_executor.py
+#, python-brace-format
+msgid "Pipeline already running. Resume task {task_id}."
+msgstr "El pipeline ya se está ejecutando. Reanude la tarea {task_id}."
+
 #: src/iac_code/a2a/pipeline_recovery.py
 msgid "A2A pipeline state not found"
 msgstr "No se encontró el estado del pipeline A2A"
@@ -504,6 +546,22 @@ msgstr "Herramienta de orquestación de infraestructura asistida por IA"
 msgid "Use iac-code as an A2A client."
 msgstr "Usa iac-code como cliente A2A."
 
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A client dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"Faltan las dependencias del cliente A2A. Instálalas con: pip install "
+"'iac-code[a2a]'"
+
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A server dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"Faltan las dependencias del servidor A2A. Instálalas con: pip install "
+"'iac-code[a2a]'"
+
 #: src/iac_code/cli/main.py
 msgid "Install Git for Windows via the npmmirror mirror (Windows only)."
 msgstr "Instalar Git for Windows mediante el espejo npmmirror (solo Windows)."
@@ -516,14 +574,6 @@ msgstr "Actualizar iac-code a la última versión."
 msgid "YAML config file containing A2A client options"
 msgstr "Archivo de configuración YAML con opciones del cliente A2A"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A client dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"Faltan las dependencias del cliente A2A. Instálalas con: pip install "
-"'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "LLM model to use"
 msgstr "Modelo LLM a utilizar"
@@ -657,14 +707,6 @@ msgstr ""
 "Expone tipos de señal de thinking A2A; repite para varios. Valores: raw-"
 "thinking, tool-trace."
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A server dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"Faltan las dependencias del servidor A2A. Instálalas con: pip install "
-"'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "Send a prompt to an A2A JSON-RPC endpoint."
 msgstr "Envía un prompt a un endpoint JSON-RPC A2A."
@@ -1563,10 +1605,18 @@ msgstr "El prompt de sistema está vacío."
 msgid "No provider messages yet."
 msgstr "Aún no hay mensajes del proveedor."
 
+#: src/iac_code/commands/prompt.py
+msgid "No cleanup prompts in this snapshot."
+msgstr "No hay prompts de limpieza en esta instantánea."
+
 #: src/iac_code/commands/prompt.py
 msgid "No tools are currently registered."
 msgstr "No hay herramientas registradas actualmente."
 
+#: src/iac_code/commands/prompt.py
+msgid "Cleanup Prompts"
+msgstr "Prompts de limpieza"
+
 #: src/iac_code/commands/prompt.py
 msgid "IAC-CODE Prompt Snapshot"
 msgstr "Instantánea del prompt de IAC-CODE"
@@ -1603,6 +1653,14 @@ msgstr "Mensajes del proveedor"
 msgid "Tools"
 msgstr "Herramientas"
 
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt"
+msgstr "prompt de limpieza"
+
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt · removed"
+msgstr "prompt de limpieza · eliminado"
+
 #: src/iac_code/commands/prompt.py
 msgid "Instruction Memory"
 msgstr "Memoria de instrucciones"
@@ -1682,6 +1740,11 @@ msgstr "   Mensajes: {count}"
 msgid "   Recalled memory: {status}"
 msgstr "   Memoria recuperada: {status}"
 
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "   Cleanup prompts: {count}"
+msgstr "   Prompts de limpieza: {count}"
+
 #: src/iac_code/commands/prompt.py
 msgid "3. Tools"
 msgstr "3. Herramientas"
@@ -1731,6 +1794,17 @@ msgstr "presente"
 msgid "not present"
 msgstr "no presente"
 
+#: src/iac_code/commands/prompt.py
+msgid "Rollback cleanup prompts are also shown separately for quick inspection."
+msgstr ""
+"Los prompts de limpieza de rollback también se muestran por separado para"
+" una revisión rápida."
+
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "{count} cleanup prompts"
+msgstr "{count} prompts de limpieza"
+
 #: src/iac_code/commands/prompt.py
 msgid "Tool definitions available to the main model for this request."
 msgstr ""
@@ -1764,6 +1838,7 @@ msgid "Input schema"
 msgstr "Esquema de entrada"
 
 #: src/iac_code/commands/prompt.py
+#: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid "tool"
 msgstr "herramienta"
 
@@ -2060,6 +2135,25 @@ msgstr ""
 msgid "Memory name to read. Omit to list all."
 msgstr "Nombre de la memoria que se va a leer. Omítelo para listar todas."
 
+#: src/iac_code/memory/memory_tools.py
+#, python-brace-format
+msgid ""
+"{base}\n"
+"\n"
+"Available memories:\n"
+"{index}\n"
+"\n"
+"Call read_memory again with one of these names, or omit name to list all "
+"memories."
+msgstr ""
+"{base}\n"
+"\n"
+"Memorias disponibles:\n"
+"{index}\n"
+"\n"
+"Vuelve a llamar a read_memory con uno de estos nombres, u omite name para"
+" listar todas las memorias."
+
 #: src/iac_code/memory/memory_tools.py
 #, python-brace-format
 msgid ""
@@ -2162,6 +2256,143 @@ msgstr "ask_user_question requiere una cola de eventos del pipeline."
 msgid "User cancelled ask_user_question."
 msgstr "El usuario canceló ask_user_question."
 
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"Cloud resources still need cleanup after pipeline rollback. Clean them up"
+" now and keep checking until deletion completes."
+msgstr ""
+"Los recursos en la nube aún necesitan limpieza después del rollback del"
+" pipeline. Límpielos ahora y siga comprobando hasta que la eliminación se"
+" complete."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Requirements:"
+msgstr "Requisitos:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup scope is a strict allowlist: delete only ids in the cleanup "
+"resources list below."
+msgstr ""
+"- El alcance de limpieza es una lista permitida estricta: elimine solo "
+"los ID de la lista de recursos de limpieza siguiente."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not delete, modify, or roll back any stack or cloud resource outside"
+" the cleanup resources list."
+msgstr ""
+"- No elimine, modifique ni revierta ningún stack o recurso en la nube "
+"fuera de la lista de recursos de limpieza."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not call ListStacks or search for other stacks by name; cleanup "
+"resource ids are fully listed."
+msgstr ""
+"- No llame a ListStacks ni busque otros stacks por nombre; los ID de "
+"recursos de limpieza están completamente listados."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Before every GetStack/DeleteStack call, verify that StackId exactly "
+"matches an id in the cleanup resources list."
+msgstr ""
+"- Antes de cada llamada GetStack/DeleteStack, verifique que StackId "
+"coincida exactamente con un ID de la lista de recursos de limpieza."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If StackId is not in the cleanup resources list, do not call "
+"DeleteStack, even if it is the current handoff or newly created stack."
+msgstr ""
+"- Si StackId no está en la lista de recursos de limpieza, no llame a "
+"DeleteStack, aunque sea el stack actual del handoff o uno recién creado."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not infer extra cleanup targets from pipeline handoff, "
+"deployment.stack_id, current stack, or resources_created; those may be "
+"final delivered resources."
+msgstr ""
+"- No infiera objetivos de limpieza adicionales desde el handoff del "
+"pipeline, deployment.stack_id, el stack actual o resources_created; "
+"pueden ser recursos entregados finales."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not expand cleanup scope for user follow-ups, continue instructions,"
+" or pipeline handoff context."
+msgstr ""
+"- No amplíe el alcance de limpieza por seguimientos del usuario, "
+"instrucciones de continuación o contexto de handoff del pipeline."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- When resuming cleanup, still process only resources listed in this "
+"prompt; do not inspect or delete others."
+msgstr ""
+"- Al reanudar la limpieza, procese solo los recursos listados en este "
+"prompt; no inspeccione ni elimine otros."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Prefer available ROS stack tools for deletion; if using aliyun_api, "
+"call DeleteStack first, then repeatedly call GetStack to check status."
+msgstr ""
+"- Prefiera las herramientas de stack ROS disponibles para eliminar; si "
+"usa aliyun_api, llame primero a DeleteStack y luego llame repetidamente a"
+" GetStack para comprobar el estado."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If a resource is already deleting, call GetStack first, then decide "
+"whether DeleteStack is needed again."
+msgstr ""
+"- Si un recurso ya se está eliminando, llame primero a GetStack y luego "
+"decida si hace falta otra llamada DeleteStack."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup is complete only after DELETE_COMPLETE; for DELETE_FAILED or "
+"unknown status, tell the user the failure reason and next step."
+msgstr ""
+"- La limpieza solo se completa tras DELETE_COMPLETE; para DELETE_FAILED o"
+" un estado desconocido, indique al usuario el motivo del fallo y el "
+"siguiente paso."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- After all listed resources are DELETE_COMPLETE, stop this cleanup turn "
+"immediately."
+msgstr ""
+"- Cuando todos los recursos listados estén en DELETE_COMPLETE, detenga de"
+" inmediato este turno de limpieza."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "- Briefly update the user during cleanup."
+msgstr "- Actualice brevemente al usuario durante la limpieza."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Cleanup resources:"
+msgstr "Recursos de limpieza:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid ""
+"{index}. provider={provider}, type={resource_type}, id={resource_id}, "
+"name={name}, region={region}"
+msgstr ""
+"{index}. proveedor={provider}, tipo={resource_type}, id={resource_id}, "
+"nombre={name}, región={region}"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid "Detected {count} rollback cleanup resources; starting cleanup."
+msgstr ""
+"Se detectaron {count} recursos de limpieza de rollback; iniciando "
+"limpieza."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid ""
 "Complete the current step by calling this tool to submit the conclusion. "
@@ -2262,21 +2493,52 @@ msgstr ""
 "{message} complete_step.conclusion debe incluir uno de estos campos: "
 "{fields}."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "A successful tool result is required before completing the current step."
+msgstr ""
+"Se requiere un resultado de herramienta correcto antes de completar el "
+"paso actual."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
-msgid "Candidate count cannot exceed {limit}; {count} were submitted."
-msgstr "La cantidad de candidatos no puede superar {limit}; se enviaron {count}."
+msgid ""
+"{message} complete_step.conclusion.{field} must match the {tool} result "
+"value {value}."
+msgstr ""
+"{message} complete_step.conclusion.{field} debe coincidir con el valor "
+"{value} del resultado de {tool}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "<missing>"
+msgstr "<faltante>"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " with status {statuses}"
+msgstr " con estado {statuses}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " and is_success={expected}"
+msgstr " e is_success={expected}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " one of {actions}"
+msgstr " con una de las acciones {actions}"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid ""
-"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
-"user for help or narrow the rollback targets before calling "
-"complete_step."
+"{message} Call {tool}{action} first and wait for a successful "
+"result{status_hint}{success_hint}."
 msgstr ""
-"La cantidad de destinos de reversión no puede superar {limit}; hay "
-"{count}. Pide ayuda al usuario o reduce los destinos antes de llamar a "
-"complete_step."
+"{message} Llama primero a {tool}{action} y espera un resultado "
+"correcto{status_hint}{success_hint}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "the required tool"
+msgstr "la herramienta requerida"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
@@ -2287,6 +2549,22 @@ msgstr ""
 "La cantidad de reversiones no puede superar {max_rollbacks}. Completa el "
 "paso actual o pide ayuda al usuario."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgstr "La cantidad de candidatos no puede superar {limit}; se enviaron {count}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid ""
+"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
+"user for help or narrow the rollback targets before calling "
+"complete_step."
+msgstr ""
+"La cantidad de destinos de reversión no puede superar {limit}; hay "
+"{count}. Pide ayuda al usuario o reduce los destinos antes de llamar a "
+"complete_step."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid "Schema validation failed after {attempts} attempts: {error}"
@@ -2313,6 +2591,10 @@ msgstr ""
 msgid "Step {step_id} completed. Conclusion submitted."
 msgstr "Paso {step_id} completado. Conclusión enviada."
 
+#: src/iac_code/pipeline/engine/pipeline_runner.py
+msgid "Pipeline state persistence failed."
+msgstr "Error al persistir el estado del pipeline."
+
 #: src/iac_code/pipeline/engine/pipeline_runner.py
 #: src/iac_code/pipeline/engine/sub_pipeline_executor.py
 #: src/iac_code/ui/repl.py
@@ -2415,6 +2697,10 @@ msgstr ""
 msgid "Template file path cannot escape the working directory"
 msgstr "La ruta del archivo de plantilla no puede salir del directorio de trabajo"
 
+#: src/iac_code/pipeline/engine/user_input.py
+msgid "[Image input]"
+msgstr "[Entrada de imagen]"
+
 #: src/iac_code/pipeline/selling/tools/show_candidate_detail_tool.py
 msgid ""
 "Display candidate details (summary and cost breakdown) in the comparison "
@@ -3297,6 +3583,17 @@ msgstr "ROS Stack"
 msgid "CloudStackInstances"
 msgstr "CloudStackInstances"
 
+#: src/iac_code/tools/cloud/aliyun/template_source.py
+msgid ""
+"ROS template calls must use TemplateURL instead of TemplateBody. Save the"
+" template to a file and pass params.TemplateURL, for example a local file"
+" path or OSS/HTTP URL."
+msgstr ""
+"Las llamadas a plantillas ROS deben usar TemplateURL en lugar de "
+"TemplateBody. Guarda la plantilla en un archivo y pasa "
+"params.TemplateURL, por ejemplo una ruta de archivo local o una URL "
+"OSS/HTTP."
+
 #: src/iac_code/tools/cloud/aliyun/hooks/ros_validate.py
 #, python-brace-format
 msgid "Template YAML syntax error: {}"
@@ -3420,11 +3717,11 @@ msgstr "Interrumpido"
 msgid "Running"
 msgstr "En ejecución"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Completed"
 msgstr "Completado"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Failed"
 msgstr "Error"
 
@@ -3706,8 +4003,129 @@ msgid "Command has no handler: {name}"
 msgstr "El comando no tiene controlador: {name}"
 
 #: src/iac_code/ui/repl.py
-msgid "Note: images are not supported in pipeline mode and will be ignored."
-msgstr "Nota: las imágenes no son compatibles con el modo pipeline y se ignorarán."
+#, python-brace-format
+msgid "↺ Rollback cleanup [{badge}] {label}"
+msgstr "↺ Limpieza de rollback [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{kind} {resource_id}"
+msgstr "{kind} {resource_id}"
+
+#: src/iac_code/ui/repl.py
+msgid "Deleting"
+msgstr "Eliminando"
+
+#: src/iac_code/ui/repl.py
+msgid "Skipped"
+msgstr "Omitido"
+
+#: src/iac_code/ui/repl.py
+msgid "Pending"
+msgstr "Pendiente"
+
+#: src/iac_code/ui/repl.py
+msgid "Checking"
+msgstr "Comprobando"
+
+#: src/iac_code/ui/repl.py
+msgid "Progress"
+msgstr "Progreso"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "DeleteStack submitted; waiting for deletion to complete ({progress})"
+msgstr ""
+"DeleteStack enviado; esperando a que se complete la eliminación "
+"({progress})"
+
+#: src/iac_code/ui/repl.py
+msgid "DeleteStack submitted; waiting for deletion to complete"
+msgstr "DeleteStack enviado; esperando a que se complete la eliminación"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Deleting ({progress})"
+msgstr "Eliminando ({progress})"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{progress}; deletion required"
+msgstr "{progress}; se requiere eliminación"
+
+#: src/iac_code/ui/repl.py
+msgid "stack"
+msgstr "stack"
+
+#: src/iac_code/ui/repl.py
+msgid "resource"
+msgstr "recurso"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Could not read rollback cleanup records. The cleanup prompt was kept; "
+"retry later or inspect manually."
+msgstr ""
+"No se pudieron leer los registros de limpieza de rollback. Se conservó el"
+" prompt de limpieza; reintente más tarde o inspeccione manualmente."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} additional resources needing attention were not shown."
+msgstr "No se mostraron {count} recursos adicionales que requieren atención."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: all {count} records are completed."
+msgstr ""
+"↺ Reanudación de limpieza de rollback: los {count} registros están "
+"completados."
+
+#: src/iac_code/ui/repl.py
+msgid "failed"
+msgstr "fallido"
+
+#: src/iac_code/ui/repl.py
+msgid "pending"
+msgstr "pendiente"
+
+#: src/iac_code/ui/repl.py
+msgid "in progress"
+msgstr "en curso"
+
+#: src/iac_code/ui/repl.py
+msgid "completed"
+msgstr "completado"
+
+#: src/iac_code/ui/repl.py
+msgid "skipped"
+msgstr "omitido"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} {label}"
+msgstr "{count} {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records, {summary}."
+msgstr "↺ Reanudación de limpieza de rollback: {count} registros, {summary}."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records."
+msgstr "↺ Reanudación de limpieza de rollback: {count} registros."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "  [{badge}] {label}"
+msgstr "  [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+msgid "Detected rollback cleanup resources, but cleanup prompt injection failed."
+msgstr ""
+"Se detectaron recursos de limpieza de rollback, pero falló la inyección "
+"del prompt de limpieza."
 
 #: src/iac_code/ui/repl.py
 #, python-brace-format
@@ -3716,11 +4134,27 @@ msgstr "Ignorando el estado guardado del pipeline: {reason}"
 
 #: src/iac_code/ui/repl.py
 msgid ""
-"Pipeline completed. Normal chat is active, but the handoff context could "
-"not be injected or saved."
+"Pipeline state persistence failed. The pipeline is paused; do not "
+"continue until state is durable."
+msgstr ""
+"Error al persistir el estado del pipeline. El pipeline está pausado; no"
+" continúe hasta que el estado sea duradero."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline state persistence failed. Normal chat handoff was not marked "
+"durable."
+msgstr ""
+"Error al persistir el estado del pipeline. El handoff al chat normal no"
+" se marcó como duradero."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline completed, but the handoff context could not be injected or "
+"saved."
 msgstr ""
-"El pipeline se completó. El chat normal está activo, pero no se pudo "
-"inyectar ni guardar el contexto de traspaso."
+"La pipeline se completó, pero no se pudo inyectar o guardar el contexto "
+"de handoff."
 
 #: src/iac_code/ui/repl.py
 msgid "Judging your input..."
@@ -3895,6 +4329,11 @@ msgstr "  ✓ {name}: completado\n"
 msgid "  ✘ {name}: Failed"
 msgstr "  ✘ {name}: error"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Pipeline warning: {reason}"
+msgstr "Advertencia del pipeline: {reason}"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Option {index}"
@@ -3976,6 +4415,17 @@ msgstr "error desconocido"
 msgid "Resumed pipeline at step: {step}"
 msgstr "Pipeline reanudado en el paso: {step}"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Could not read pipeline state metadata: {reason}"
+msgstr "No se pudieron leer los metadatos de estado del pipeline: {reason}"
+
+#: src/iac_code/ui/repl.py
+msgid "Pipeline state metadata is invalid; continuing as normal chat."
+msgstr ""
+"Los metadatos de estado del pipeline no son válidos; se continúa como "
+"chat normal."
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Found pipeline state in this session (paused at: {step})."
@@ -4538,3 +4988,198 @@ msgstr "La traza de pila se omitió del evento público; consulta error_id."
 
 #~ msgid "Project Memory Index"
 #~ msgstr "Índice de memoria del proyecto"
+
+#~ msgid "检测到 pipeline rollback 后仍需要清理的云资源。请立即清理这些资源，并持续检查直到删除完成。"
+#~ msgstr ""
+#~ "Se detectaron recursos en la nube "
+#~ "que aún deben limpiarse después del "
+#~ "rollback del pipeline. Límpielos de "
+#~ "inmediato y siga comprobando hasta que"
+#~ " la eliminación termine."
+
+#~ msgid "要求："
+#~ msgstr "Requisitos:"
+
+#~ msgid "- 清理范围是严格白名单：只能删除下面“待清理资源”列表中的 id。"
+#~ msgstr ""
+#~ "- El alcance de limpieza es una"
+#~ " lista blanca estricta: solo se "
+#~ "pueden eliminar los id de la lista"
+#~ " \"Recursos por limpiar\" siguiente."
+
+#~ msgid "- 不要删除、修改或回滚任何未列入“待清理资源”的 stack 或云资源。"
+#~ msgstr ""
+#~ "- No elimine, modifique ni revierta "
+#~ "ningún stack o recurso de nube que"
+#~ " no esté en \"Recursos por limpiar\"."
+
+#~ msgid "- 不要调用 ListStacks 或按名称搜索其它 stack；待清理资源 id 已完整列出。"
+#~ msgstr ""
+#~ "- No llames a ListStacks ni "
+#~ "busques otros stacks por nombre; los "
+#~ "id de recursos pendientes de limpieza"
+#~ " ya están listados por completo."
+
+#~ msgid "- 每次调用 GetStack/DeleteStack 前，必须核对 StackId 精确等于“待清理资源”列表中的某个 id。"
+#~ msgstr ""
+#~ "- Antes de cada llamada a "
+#~ "GetStack/DeleteStack, debes comprobar que "
+#~ "StackId coincida exactamente con algún "
+#~ "id de la lista de recursos "
+#~ "pendientes de limpieza."
+
+#~ msgid "- 如果 StackId 不在“待清理资源”列表中，禁止调用 DeleteStack，即使它是当前 handoff 或刚创建的 stack。"
+#~ msgstr ""
+#~ "- Si StackId no está en la "
+#~ "lista de recursos pendientes de "
+#~ "limpieza, está prohibido llamar a "
+#~ "DeleteStack, aunque sea el stack del "
+#~ "handoff actual o recién creado."
+
+#~ msgid ""
+#~ "- 不要根据 pipeline handoff、deployment.stack_id、current"
+#~ " stack 或 resources_created "
+#~ "额外推断清理对象；这些可能是最终成功交付的资源。"
+#~ msgstr ""
+#~ "- No infiera objetos de limpieza "
+#~ "adicionales desde pipeline handoff, "
+#~ "deployment.stack_id, current stack o "
+#~ "resources_created; podrían ser recursos "
+#~ "entregados correctamente al final."
+
+#~ msgid "- 即使本轮还有用户追问、继续指令或 pipeline handoff 上下文，也不能扩大清理范围。"
+#~ msgstr ""
+#~ "- Aunque haya preguntas del usuario, "
+#~ "instrucciones para continuar o contexto "
+#~ "de pipeline handoff en esta ronda, "
+#~ "no amplíe el alcance de limpieza."
+
+#~ msgid "- 恢复或继续清理时仍只处理当前提示列出的资源；不要检查或删除其它资源。"
+#~ msgstr ""
+#~ "- Al reanudar o continuar la "
+#~ "limpieza, procesa solo los recursos "
+#~ "listados en este aviso; no compruebes"
+#~ " ni elimines otros recursos."
+
+#~ msgid ""
+#~ "- 优先使用可用的 ROS stack 工具删除；如果改用 "
+#~ "aliyun_api，请先 DeleteStack，再反复 GetStack 检查状态。"
+#~ msgstr ""
+#~ "- Use preferentemente la herramienta ROS"
+#~ " stack disponible para eliminar; si "
+#~ "usa aliyun_api, ejecute primero DeleteStack"
+#~ " y luego GetStack repetidamente para "
+#~ "comprobar el estado."
+
+#~ msgid "- 如果资源已经处于删除中，请先 GetStack 检查当前状态，再决定是否需要重新 DeleteStack。"
+#~ msgstr ""
+#~ "- Si el recurso ya está en "
+#~ "eliminación, use primero GetStack para "
+#~ "comprobar el estado actual antes de "
+#~ "decidir si debe ejecutar DeleteStack "
+#~ "otra vez."
+
+#~ msgid "- 只有确认 DELETE_COMPLETE 才算清理完成；DELETE_FAILED 或无法确认时要向用户说明失败原因和下一步。"
+#~ msgstr ""
+#~ "- La limpieza solo se considera "
+#~ "completa tras confirmar DELETE_COMPLETE; con"
+#~ " DELETE_FAILED o si no se puede "
+#~ "confirmar, explique al usuario el motivo"
+#~ " del fallo y el siguiente paso."
+
+#~ msgid "- 列表内资源全部 DELETE_COMPLETE 后，立刻停止本轮清理；不要继续删除或检查任何其他 stack。"
+#~ msgstr ""
+#~ "- Cuando todos los recursos de la"
+#~ " lista estén en DELETE_COMPLETE, detenga"
+#~ " inmediatamente esta limpieza; no elimine"
+#~ " ni compruebe ningún otro stack."
+
+#~ msgid "- 清理过程中向用户简短同步进度。"
+#~ msgstr "- Informe brevemente al usuario sobre el progreso durante la limpieza."
+
+#~ msgid "待清理资源："
+#~ msgstr "Recursos por limpiar:"
+
+#~ msgid "检测到 {count} 个回滚残留资源，开始清理流程。"
+#~ msgstr ""
+#~ "Se detectaron {count} recursos residuales "
+#~ "del rollback; iniciando el flujo de "
+#~ "limpieza."
+
+#~ msgid "错误：{error}"
+#~ msgstr "Error: {error}"
+
+#~ msgid "删除中"
+#~ msgstr "Eliminando"
+
+#~ msgid "完成"
+#~ msgstr "Completado"
+
+#~ msgid "失败"
+#~ msgstr "Fallido"
+
+#~ msgid "跳过"
+#~ msgstr "Omitido"
+
+#~ msgid "待处理"
+#~ msgstr "Pendiente"
+
+#~ msgid "检查"
+#~ msgstr "Comprobar"
+
+#~ msgid "进度"
+#~ msgstr "Progreso"
+
+#~ msgid "DeleteStack 已提交，等待删除完成（{progress}）"
+#~ msgstr "DeleteStack enviado; esperando que termine la eliminación ({progress})"
+
+#~ msgid "DeleteStack 已提交，等待删除完成"
+#~ msgstr "DeleteStack enviado; esperando que termine la eliminación"
+
+#~ msgid "已跳过"
+#~ msgstr "Omitido"
+
+#~ msgid "正在删除（{progress}）"
+#~ msgstr "Eliminando ({progress})"
+
+#~ msgid "{progress}，需要删除"
+#~ msgstr "{progress}, requiere eliminación"
+
+#~ msgid "资源栈"
+#~ msgstr "Stack de recursos"
+
+#~ msgid "资源"
+#~ msgstr "Recurso"
+
+#~ msgid "无法读取回滚清理记录，已保留清理提示，请稍后继续或手动检查。"
+#~ msgstr ""
+#~ "No se pudo leer el registro de "
+#~ "limpieza de rollback; se conservó el "
+#~ "prompt de limpieza. Continúe más tarde"
+#~ " o revise manualmente."
+
+#~ msgid "还有 {count} 个需要关注的资源未显示。"
+#~ msgstr "Hay {count} recursos más que requieren atención y no se muestran."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录均已完成。"
+#~ msgstr ""
+#~ "↺ Recuperación de limpieza de rollback:"
+#~ " las {count} entradas están completadas."
+
+#~ msgid "进行中"
+#~ msgstr "En curso"
+
+#~ msgid "已完成"
+#~ msgstr "Completado"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+#~ msgstr "↺ Recuperación de limpieza de rollback: {count} entradas, {summary}."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录。"
+#~ msgstr "↺ Recuperación de limpieza de rollback: {count} entradas."
+
+#~ msgid "Note: images are not supported in pipeline mode and will be ignored."
+#~ msgstr ""
+#~ "Nota: las imágenes no son compatibles"
+#~ " con el modo pipeline y se "
+#~ "ignorarán."
diff --git a/src/iac_code/i18n/locales/fr/LC_MESSAGES/messages.po b/src/iac_code/i18n/locales/fr/LC_MESSAGES/messages.po
index 2edcd6c0..339e9b9b 100644
--- a/src/iac_code/i18n/locales/fr/LC_MESSAGES/messages.po
+++ b/src/iac_code/i18n/locales/fr/LC_MESSAGES/messages.po
@@ -49,6 +49,38 @@ msgstr "Nom de fichier d’artefact non sûr"
 msgid "Unknown error"
 msgstr "Erreur inconnue"
 
+#: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
+msgid ""
+"Cleanup state unavailable. Inspect the session file and cloud resources "
+"manually."
+msgstr ""
+"État de nettoyage indisponible. Inspectez manuellement le fichier de "
+"session et les ressources cloud."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup deferred prompt state is unavailable. Please repair it "
+"before continuing."
+msgstr ""
+"L'état du prompt différé de nettoyage du rollback est indisponible. "
+"Réparez-le avant de continuer."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup state is unavailable. Please repair the cleanup ledger "
+"before continuing."
+msgstr ""
+"L'état du nettoyage du rollback est indisponible. Réparez le journal de "
+"nettoyage avant de continuer."
+
+#: src/iac_code/a2a/executor.py src/iac_code/ui/repl.py
+msgid ""
+"Rollback cleanup is still in progress. Please continue after cleanup "
+"completes."
+msgstr ""
+"Le nettoyage du rollback est encore en cours. Continuez une fois le "
+"nettoyage terminé."
+
 #: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
 msgid "Task is already working."
 msgstr "La tâche est déjà en cours."
@@ -58,6 +90,11 @@ msgstr "La tâche est déjà en cours."
 msgid "Task canceled."
 msgstr "Tâche annulée."
 
+#: src/iac_code/a2a/executor.py
+#, python-brace-format
+msgid "Current model {model} does not support image input."
+msgstr "Le modèle actuel {model} ne prend pas en charge l’entrée d’image."
+
 #: src/iac_code/a2a/pipeline_executor.py
 msgid "A temporary error occurred. Please retry."
 msgstr "Une erreur temporaire s’est produite. Veuillez réessayer."
@@ -66,6 +103,11 @@ msgstr "Une erreur temporaire s’est produite. Veuillez réessayer."
 msgid "Authentication required. Configure credentials and retry."
 msgstr "Authentification requise. Configurez les identifiants puis réessayez."
 
+#: src/iac_code/a2a/pipeline_executor.py
+#, python-brace-format
+msgid "Pipeline already running. Resume task {task_id}."
+msgstr "Le pipeline est déjà en cours d'exécution. Reprenez la tâche {task_id}."
+
 #: src/iac_code/a2a/pipeline_recovery.py
 msgid "A2A pipeline state not found"
 msgstr "État du pipeline A2A introuvable"
@@ -501,6 +543,22 @@ msgstr "Outil d’orchestration d’infrastructure assisté par IA"
 msgid "Use iac-code as an A2A client."
 msgstr "Utilise iac-code comme client A2A."
 
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A client dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"Les dépendances du client A2A sont manquantes. Installez-les avec : pip "
+"install 'iac-code[a2a]'"
+
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A server dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"Les dépendances du serveur A2A sont manquantes. Installez-les avec : pip "
+"install 'iac-code[a2a]'"
+
 #: src/iac_code/cli/main.py
 msgid "Install Git for Windows via the npmmirror mirror (Windows only)."
 msgstr "Installer Git for Windows via le miroir npmmirror (Windows uniquement)."
@@ -513,14 +571,6 @@ msgstr "Mettre à jour iac-code vers la dernière version."
 msgid "YAML config file containing A2A client options"
 msgstr "Fichier de configuration YAML contenant les options client A2A"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A client dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"Les dépendances du client A2A sont manquantes. Installez-les avec : pip "
-"install 'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "LLM model to use"
 msgstr "Modèle LLM à utiliser"
@@ -656,14 +706,6 @@ msgstr ""
 "Expose les types de signal de thinking A2A ; répétez pour en fournir "
 "plusieurs. Valeurs : raw-thinking, tool-trace."
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A server dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"Les dépendances du serveur A2A sont manquantes. Installez-les avec : pip "
-"install 'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "Send a prompt to an A2A JSON-RPC endpoint."
 msgstr "Envoie un prompt à un point de terminaison JSON-RPC A2A."
@@ -1566,10 +1608,18 @@ msgstr "Le prompt système est vide."
 msgid "No provider messages yet."
 msgstr "Aucun message fournisseur pour le moment."
 
+#: src/iac_code/commands/prompt.py
+msgid "No cleanup prompts in this snapshot."
+msgstr "Aucun prompt de nettoyage dans cet instantané."
+
 #: src/iac_code/commands/prompt.py
 msgid "No tools are currently registered."
 msgstr "Aucun outil n’est actuellement enregistré."
 
+#: src/iac_code/commands/prompt.py
+msgid "Cleanup Prompts"
+msgstr "Prompts de nettoyage"
+
 #: src/iac_code/commands/prompt.py
 msgid "IAC-CODE Prompt Snapshot"
 msgstr "Instantané du prompt IAC-CODE"
@@ -1606,6 +1656,14 @@ msgstr "Messages fournisseur"
 msgid "Tools"
 msgstr "Outils"
 
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt"
+msgstr "prompt de nettoyage"
+
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt · removed"
+msgstr "prompt de nettoyage · supprimé"
+
 #: src/iac_code/commands/prompt.py
 msgid "Instruction Memory"
 msgstr "Mémoire d’instructions"
@@ -1685,6 +1743,11 @@ msgstr "   Messages : {count}"
 msgid "   Recalled memory: {status}"
 msgstr "   Mémoire rappelée : {status}"
 
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "   Cleanup prompts: {count}"
+msgstr "   Prompts de nettoyage : {count}"
+
 #: src/iac_code/commands/prompt.py
 msgid "3. Tools"
 msgstr "3. Outils"
@@ -1734,6 +1797,17 @@ msgstr "présente"
 msgid "not present"
 msgstr "absente"
 
+#: src/iac_code/commands/prompt.py
+msgid "Rollback cleanup prompts are also shown separately for quick inspection."
+msgstr ""
+"Les prompts de nettoyage du rollback sont aussi affichés séparément pour "
+"une inspection rapide."
+
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "{count} cleanup prompts"
+msgstr "{count} prompts de nettoyage"
+
 #: src/iac_code/commands/prompt.py
 msgid "Tool definitions available to the main model for this request."
 msgstr ""
@@ -1767,6 +1841,7 @@ msgid "Input schema"
 msgstr "Schéma d’entrée"
 
 #: src/iac_code/commands/prompt.py
+#: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid "tool"
 msgstr "outil"
 
@@ -2061,6 +2136,25 @@ msgstr ""
 msgid "Memory name to read. Omit to list all."
 msgstr "Nom de la mémoire à lire. Omettez-le pour tout lister."
 
+#: src/iac_code/memory/memory_tools.py
+#, python-brace-format
+msgid ""
+"{base}\n"
+"\n"
+"Available memories:\n"
+"{index}\n"
+"\n"
+"Call read_memory again with one of these names, or omit name to list all "
+"memories."
+msgstr ""
+"{base}\n"
+"\n"
+"Mémoires disponibles :\n"
+"{index}\n"
+"\n"
+"Appelez à nouveau read_memory avec l’un de ces noms, ou omettez name pour"
+" lister toutes les mémoires."
+
 #: src/iac_code/memory/memory_tools.py
 #, python-brace-format
 msgid ""
@@ -2163,6 +2257,145 @@ msgstr "ask_user_question nécessite une file d’événements du pipeline."
 msgid "User cancelled ask_user_question."
 msgstr "L’utilisateur a annulé ask_user_question."
 
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"Cloud resources still need cleanup after pipeline rollback. Clean them up"
+" now and keep checking until deletion completes."
+msgstr ""
+"Des ressources cloud doivent encore être nettoyées après le rollback du "
+"pipeline. Nettoyez-les maintenant et continuez à vérifier jusqu'à la fin "
+"de la suppression."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Requirements:"
+msgstr "Exigences :"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup scope is a strict allowlist: delete only ids in the cleanup "
+"resources list below."
+msgstr ""
+"- Le périmètre de nettoyage est une liste autorisée stricte : supprimez "
+"uniquement les ID de la liste des ressources de nettoyage ci-dessous."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not delete, modify, or roll back any stack or cloud resource outside"
+" the cleanup resources list."
+msgstr ""
+"- Ne supprimez, modifiez ou restaurez aucun stack ni aucune ressource "
+"cloud hors de la liste des ressources de nettoyage."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not call ListStacks or search for other stacks by name; cleanup "
+"resource ids are fully listed."
+msgstr ""
+"- N’appelez pas ListStacks et ne cherchez pas d’autres stacks par nom ; "
+"les ID des ressources de nettoyage sont entièrement listés."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Before every GetStack/DeleteStack call, verify that StackId exactly "
+"matches an id in the cleanup resources list."
+msgstr ""
+"- Avant chaque appel GetStack/DeleteStack, vérifiez que StackId "
+"correspond exactement à un ID de la liste des ressources de nettoyage."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If StackId is not in the cleanup resources list, do not call "
+"DeleteStack, even if it is the current handoff or newly created stack."
+msgstr ""
+"- Si StackId n’est pas dans la liste des ressources de nettoyage, "
+"n’appelez pas DeleteStack, même s’il s’agit du stack courant du handoff "
+"ou d’un stack récemment créé."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not infer extra cleanup targets from pipeline handoff, "
+"deployment.stack_id, current stack, or resources_created; those may be "
+"final delivered resources."
+msgstr ""
+"- N’inférez aucune cible de nettoyage supplémentaire depuis le handoff du"
+" pipeline, deployment.stack_id, le stack courant ou resources_created ; "
+"il peut s’agir de ressources livrées finales."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not expand cleanup scope for user follow-ups, continue instructions,"
+" or pipeline handoff context."
+msgstr ""
+"- N’élargissez pas le périmètre de nettoyage en raison d’un suivi "
+"utilisateur, d’instructions de continuation ou du contexte de handoff du "
+"pipeline."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- When resuming cleanup, still process only resources listed in this "
+"prompt; do not inspect or delete others."
+msgstr ""
+"- Lors de la reprise du nettoyage, traitez uniquement les ressources "
+"listées dans ce prompt ; n’inspectez et ne supprimez pas les autres."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Prefer available ROS stack tools for deletion; if using aliyun_api, "
+"call DeleteStack first, then repeatedly call GetStack to check status."
+msgstr ""
+"- Préférez les outils de stack ROS disponibles pour la suppression ; si "
+"vous utilisez aliyun_api, appelez d’abord DeleteStack, puis appelez "
+"GetStack à plusieurs reprises pour vérifier le statut."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If a resource is already deleting, call GetStack first, then decide "
+"whether DeleteStack is needed again."
+msgstr ""
+"- Si une ressource est déjà en cours de suppression, appelez d’abord "
+"GetStack, puis décidez si DeleteStack est à nouveau nécessaire."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup is complete only after DELETE_COMPLETE; for DELETE_FAILED or "
+"unknown status, tell the user the failure reason and next step."
+msgstr ""
+"- Le nettoyage n’est terminé qu’après DELETE_COMPLETE ; pour "
+"DELETE_FAILED ou un statut inconnu, indiquez à l’utilisateur la raison de"
+" l’échec et l’étape suivante."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- After all listed resources are DELETE_COMPLETE, stop this cleanup turn "
+"immediately."
+msgstr ""
+"- Une fois toutes les ressources listées en DELETE_COMPLETE, arrêtez "
+"immédiatement ce tour de nettoyage."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "- Briefly update the user during cleanup."
+msgstr "- Tenez brièvement l’utilisateur informé pendant le nettoyage."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Cleanup resources:"
+msgstr "Ressources de nettoyage :"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid ""
+"{index}. provider={provider}, type={resource_type}, id={resource_id}, "
+"name={name}, region={region}"
+msgstr ""
+"{index}. fournisseur={provider}, type={resource_type}, id={resource_id}, "
+"nom={name}, région={region}"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid "Detected {count} rollback cleanup resources; starting cleanup."
+msgstr ""
+"{count} ressources de nettoyage du rollback détectées ; démarrage du "
+"nettoyage."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid ""
 "Complete the current step by calling this tool to submit the conclusion. "
@@ -2261,23 +2494,50 @@ msgstr ""
 "{message} complete_step.conclusion doit inclure l’un de ces champs : "
 "{fields}."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "A successful tool result is required before completing the current step."
+msgstr "Un résultat d’outil réussi est requis avant de terminer l’étape actuelle."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
-msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgid ""
+"{message} complete_step.conclusion.{field} must match the {tool} result "
+"value {value}."
 msgstr ""
-"Le nombre de candidats ne peut pas dépasser {limit} ; {count} ont été "
-"soumis."
+"{message} complete_step.conclusion.{field} doit correspondre à la valeur "
+"de résultat {value} de {tool}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "<missing>"
+msgstr "<manquant>"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " with status {statuses}"
+msgstr " avec le statut {statuses}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " and is_success={expected}"
+msgstr " et is_success={expected}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " one of {actions}"
+msgstr " avec l’une des actions {actions}"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid ""
-"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
-"user for help or narrow the rollback targets before calling "
-"complete_step."
+"{message} Call {tool}{action} first and wait for a successful "
+"result{status_hint}{success_hint}."
 msgstr ""
-"Le nombre de cibles de retour arrière ne peut pas dépasser {limit} ; il y"
-" en a {count}. Demandez l’aide de l’utilisateur ou réduisez les cibles "
-"avant d’appeler complete_step."
+"{message} Appelez d’abord {tool}{action} et attendez un résultat "
+"réussi{status_hint}{success_hint}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "the required tool"
+msgstr "l’outil requis"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
@@ -2288,6 +2548,24 @@ msgstr ""
 "Le nombre de retours arrière ne peut pas dépasser {max_rollbacks}. "
 "Terminez l’étape actuelle ou demandez l’aide de l’utilisateur."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgstr ""
+"Le nombre de candidats ne peut pas dépasser {limit} ; {count} ont été "
+"soumis."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid ""
+"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
+"user for help or narrow the rollback targets before calling "
+"complete_step."
+msgstr ""
+"Le nombre de cibles de retour arrière ne peut pas dépasser {limit} ; il y"
+" en a {count}. Demandez l’aide de l’utilisateur ou réduisez les cibles "
+"avant d’appeler complete_step."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid "Schema validation failed after {attempts} attempts: {error}"
@@ -2314,6 +2592,10 @@ msgstr ""
 msgid "Step {step_id} completed. Conclusion submitted."
 msgstr "Étape {step_id} terminée. Conclusion soumise."
 
+#: src/iac_code/pipeline/engine/pipeline_runner.py
+msgid "Pipeline state persistence failed."
+msgstr "Échec de la persistance de l’état du pipeline."
+
 #: src/iac_code/pipeline/engine/pipeline_runner.py
 #: src/iac_code/pipeline/engine/sub_pipeline_executor.py
 #: src/iac_code/ui/repl.py
@@ -2414,6 +2696,10 @@ msgstr "Le chemin du fichier de modèle doit être relatif au répertoire de tra
 msgid "Template file path cannot escape the working directory"
 msgstr "Le chemin du fichier de modèle ne peut pas sortir du répertoire de travail"
 
+#: src/iac_code/pipeline/engine/user_input.py
+msgid "[Image input]"
+msgstr "[Entrée d'image]"
+
 #: src/iac_code/pipeline/selling/tools/show_candidate_detail_tool.py
 msgid ""
 "Display candidate details (summary and cost breakdown) in the comparison "
@@ -3299,6 +3585,17 @@ msgstr "ROS Stack"
 msgid "CloudStackInstances"
 msgstr "CloudStackInstances"
 
+#: src/iac_code/tools/cloud/aliyun/template_source.py
+msgid ""
+"ROS template calls must use TemplateURL instead of TemplateBody. Save the"
+" template to a file and pass params.TemplateURL, for example a local file"
+" path or OSS/HTTP URL."
+msgstr ""
+"Les appels de modèle ROS doivent utiliser TemplateURL au lieu de "
+"TemplateBody. Enregistrez le modèle dans un fichier et transmettez "
+"params.TemplateURL, par exemple un chemin de fichier local ou une URL "
+"OSS/HTTP."
+
 #: src/iac_code/tools/cloud/aliyun/hooks/ros_validate.py
 #, python-brace-format
 msgid "Template YAML syntax error: {}"
@@ -3422,11 +3719,11 @@ msgstr "Interrompu"
 msgid "Running"
 msgstr "En cours"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Completed"
 msgstr "Terminé"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Failed"
 msgstr "Échec"
 
@@ -3707,10 +4004,130 @@ msgid "Command has no handler: {name}"
 msgstr "Aucun gestionnaire pour la commande : {name}"
 
 #: src/iac_code/ui/repl.py
-msgid "Note: images are not supported in pipeline mode and will be ignored."
+#, python-brace-format
+msgid "↺ Rollback cleanup [{badge}] {label}"
+msgstr "↺ Nettoyage du rollback [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{kind} {resource_id}"
+msgstr "{kind} {resource_id}"
+
+#: src/iac_code/ui/repl.py
+msgid "Deleting"
+msgstr "Suppression"
+
+#: src/iac_code/ui/repl.py
+msgid "Skipped"
+msgstr "Ignoré"
+
+#: src/iac_code/ui/repl.py
+msgid "Pending"
+msgstr "En attente"
+
+#: src/iac_code/ui/repl.py
+msgid "Checking"
+msgstr "Vérification"
+
+#: src/iac_code/ui/repl.py
+msgid "Progress"
+msgstr "Progression"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "DeleteStack submitted; waiting for deletion to complete ({progress})"
+msgstr "DeleteStack envoyé ; attente de la fin de la suppression ({progress})"
+
+#: src/iac_code/ui/repl.py
+msgid "DeleteStack submitted; waiting for deletion to complete"
+msgstr "DeleteStack envoyé ; attente de la fin de la suppression"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Deleting ({progress})"
+msgstr "Suppression en cours ({progress})"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{progress}; deletion required"
+msgstr "{progress} ; suppression requise"
+
+#: src/iac_code/ui/repl.py
+msgid "stack"
+msgstr "stack"
+
+#: src/iac_code/ui/repl.py
+msgid "resource"
+msgstr "ressource"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Could not read rollback cleanup records. The cleanup prompt was kept; "
+"retry later or inspect manually."
+msgstr ""
+"Impossible de lire les enregistrements de nettoyage du rollback. Le "
+"prompt de nettoyage a été conservé ; réessayez plus tard ou inspectez "
+"manuellement."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} additional resources needing attention were not shown."
+msgstr ""
+"{count} ressources supplémentaires nécessitant une attention n'ont pas "
+"été affichées."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: all {count} records are completed."
 msgstr ""
-"Remarque : les images ne sont pas prises en charge en mode pipeline et "
-"seront ignorées."
+"↺ Reprise du nettoyage du rollback : les {count} enregistrements sont "
+"terminés."
+
+#: src/iac_code/ui/repl.py
+msgid "failed"
+msgstr "échoué"
+
+#: src/iac_code/ui/repl.py
+msgid "pending"
+msgstr "en attente"
+
+#: src/iac_code/ui/repl.py
+msgid "in progress"
+msgstr "en cours"
+
+#: src/iac_code/ui/repl.py
+msgid "completed"
+msgstr "terminé"
+
+#: src/iac_code/ui/repl.py
+msgid "skipped"
+msgstr "ignoré"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} {label}"
+msgstr "{count} {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records, {summary}."
+msgstr "↺ Reprise du nettoyage du rollback : {count} enregistrements, {summary}."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records."
+msgstr "↺ Reprise du nettoyage du rollback : {count} enregistrements."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "  [{badge}] {label}"
+msgstr "  [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+msgid "Detected rollback cleanup resources, but cleanup prompt injection failed."
+msgstr ""
+"Des ressources de nettoyage du rollback ont été détectées, mais "
+"l’injection du prompt de nettoyage a échoué."
 
 #: src/iac_code/ui/repl.py
 #, python-brace-format
@@ -3719,11 +4136,27 @@ msgstr "État de pipeline enregistré ignoré : {reason}"
 
 #: src/iac_code/ui/repl.py
 msgid ""
-"Pipeline completed. Normal chat is active, but the handoff context could "
-"not be injected or saved."
+"Pipeline state persistence failed. The pipeline is paused; do not "
+"continue until state is durable."
+msgstr ""
+"Échec de la persistance de l'état du pipeline. Le pipeline est en pause ;"
+" ne continuez pas tant que l'état n'est pas durable."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline state persistence failed. Normal chat handoff was not marked "
+"durable."
 msgstr ""
-"Le pipeline est terminé. Le chat normal est actif, mais le contexte de "
-"transfert n'a pas pu être injecté ou enregistré."
+"Échec de la persistance de l'état du pipeline. Le handoff vers le chat "
+"normal n'a pas été marqué comme durable."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline completed, but the handoff context could not be injected or "
+"saved."
+msgstr ""
+"Le pipeline est terminé, mais le contexte de handoff n’a pas pu être "
+"injecté ou enregistré."
 
 #: src/iac_code/ui/repl.py
 msgid "Judging your input..."
@@ -3903,6 +4336,11 @@ msgstr "  ✓ {name} : terminé\n"
 msgid "  ✘ {name}: Failed"
 msgstr "  ✘ {name} : échec"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Pipeline warning: {reason}"
+msgstr "Avertissement du pipeline : {reason}"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Option {index}"
@@ -3984,6 +4422,17 @@ msgstr "erreur inconnue"
 msgid "Resumed pipeline at step: {step}"
 msgstr "Pipeline repris à l'étape : {step}"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Could not read pipeline state metadata: {reason}"
+msgstr "Impossible de lire les métadonnées d'état du pipeline : {reason}"
+
+#: src/iac_code/ui/repl.py
+msgid "Pipeline state metadata is invalid; continuing as normal chat."
+msgstr ""
+"Les métadonnées d’état du pipeline sont invalides ; poursuite en chat "
+"normal."
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Found pipeline state in this session (paused at: {step})."
@@ -4531,3 +4980,210 @@ msgstr "Trace de pile omise de l’événement public ; consultez error_id."
 
 #~ msgid "Project Memory Index"
 #~ msgstr "Index de mémoire du projet"
+
+#~ msgid "检测到 pipeline rollback 后仍需要清理的云资源。请立即清理这些资源，并持续检查直到删除完成。"
+#~ msgstr ""
+#~ "Des ressources cloud nécessitant encore "
+#~ "un nettoyage après le rollback du "
+#~ "pipeline ont été détectées. Nettoyez-les"
+#~ " immédiatement et vérifiez jusqu’à la "
+#~ "fin de la suppression."
+
+#~ msgid "要求："
+#~ msgstr "Exigences :"
+
+#~ msgid "- 清理范围是严格白名单：只能删除下面“待清理资源”列表中的 id。"
+#~ msgstr ""
+#~ "- Le périmètre de nettoyage est "
+#~ "une liste blanche stricte : seuls "
+#~ "les id listés dans « Ressources à"
+#~ " nettoyer » ci-dessous peuvent être"
+#~ " supprimés."
+
+#~ msgid "- 不要删除、修改或回滚任何未列入“待清理资源”的 stack 或云资源。"
+#~ msgstr ""
+#~ "- Ne supprimez, modifiez ni annulez "
+#~ "aucun stack ou ressource cloud non "
+#~ "listé dans « Ressources à nettoyer "
+#~ "»."
+
+#~ msgid "- 不要调用 ListStacks 或按名称搜索其它 stack；待清理资源 id 已完整列出。"
+#~ msgstr ""
+#~ "- N'appelez pas ListStacks et ne "
+#~ "recherchez pas d'autres stacks par nom"
+#~ " ; les id des ressources à "
+#~ "nettoyer sont déjà tous listés."
+
+#~ msgid "- 每次调用 GetStack/DeleteStack 前，必须核对 StackId 精确等于“待清理资源”列表中的某个 id。"
+#~ msgstr ""
+#~ "- Avant chaque appel à "
+#~ "GetStack/DeleteStack, vérifiez que StackId "
+#~ "correspond exactement à un id de "
+#~ "la liste des ressources à nettoyer."
+
+#~ msgid "- 如果 StackId 不在“待清理资源”列表中，禁止调用 DeleteStack，即使它是当前 handoff 或刚创建的 stack。"
+#~ msgstr ""
+#~ "- Si StackId n'est pas dans la "
+#~ "liste des ressources à nettoyer, il "
+#~ "est interdit d'appeler DeleteStack, même "
+#~ "s'il s'agit du stack du handoff "
+#~ "actuel ou d'un stack tout juste "
+#~ "créé."
+
+#~ msgid ""
+#~ "- 不要根据 pipeline handoff、deployment.stack_id、current"
+#~ " stack 或 resources_created "
+#~ "额外推断清理对象；这些可能是最终成功交付的资源。"
+#~ msgstr ""
+#~ "- Ne déduisez pas d’autres objets "
+#~ "à nettoyer depuis pipeline handoff, "
+#~ "deployment.stack_id, current stack ou "
+#~ "resources_created ; ils peuvent être les"
+#~ " ressources finalement livrées avec succès."
+
+#~ msgid "- 即使本轮还有用户追问、继续指令或 pipeline handoff 上下文，也不能扩大清理范围。"
+#~ msgstr ""
+#~ "- Même s’il existe des questions "
+#~ "utilisateur, des instructions de poursuite "
+#~ "ou un contexte de pipeline handoff "
+#~ "dans ce tour, n’élargissez pas le "
+#~ "périmètre de nettoyage."
+
+#~ msgid "- 恢复或继续清理时仍只处理当前提示列出的资源；不要检查或删除其它资源。"
+#~ msgstr ""
+#~ "- Lors de la reprise ou de "
+#~ "la poursuite du nettoyage, traitez "
+#~ "uniquement les ressources listées dans "
+#~ "cette invite ; ne vérifiez ni ne"
+#~ " supprimez d'autres ressources."
+
+#~ msgid ""
+#~ "- 优先使用可用的 ROS stack 工具删除；如果改用 "
+#~ "aliyun_api，请先 DeleteStack，再反复 GetStack 检查状态。"
+#~ msgstr ""
+#~ "- Utilisez en priorité l’outil ROS "
+#~ "stack disponible pour supprimer ; si "
+#~ "vous utilisez aliyun_api, lancez d’abord "
+#~ "DeleteStack puis vérifiez l’état avec "
+#~ "GetStack à plusieurs reprises."
+
+#~ msgid "- 如果资源已经处于删除中，请先 GetStack 检查当前状态，再决定是否需要重新 DeleteStack。"
+#~ msgstr ""
+#~ "- Si la ressource est déjà en "
+#~ "cours de suppression, utilisez d’abord "
+#~ "GetStack pour vérifier son état actuel"
+#~ " avant de décider s’il faut relancer"
+#~ " DeleteStack."
+
+#~ msgid "- 只有确认 DELETE_COMPLETE 才算清理完成；DELETE_FAILED 或无法确认时要向用户说明失败原因和下一步。"
+#~ msgstr ""
+#~ "- Le nettoyage n’est terminé qu’après"
+#~ " confirmation de DELETE_COMPLETE ; en "
+#~ "cas de DELETE_FAILED ou d’impossibilité "
+#~ "de confirmer, expliquez à l’utilisateur "
+#~ "la cause de l’échec et la suite."
+
+#~ msgid "- 列表内资源全部 DELETE_COMPLETE 后，立刻停止本轮清理；不要继续删除或检查任何其他 stack。"
+#~ msgstr ""
+#~ "- Lorsque toutes les ressources de "
+#~ "la liste sont en DELETE_COMPLETE, "
+#~ "arrêtez immédiatement ce nettoyage ; ne"
+#~ " supprimez ni ne vérifiez aucun autre"
+#~ " stack."
+
+#~ msgid "- 清理过程中向用户简短同步进度。"
+#~ msgstr ""
+#~ "- Tenez brièvement l’utilisateur informé "
+#~ "de la progression pendant le nettoyage."
+
+#~ msgid "待清理资源："
+#~ msgstr "Ressources à nettoyer :"
+
+#~ msgid "检测到 {count} 个回滚残留资源，开始清理流程。"
+#~ msgstr ""
+#~ "{count} ressources résiduelles du rollback "
+#~ "détectées ; démarrage du flux de "
+#~ "nettoyage."
+
+#~ msgid "错误：{error}"
+#~ msgstr "Erreur : {error}"
+
+#~ msgid "删除中"
+#~ msgstr "Suppression"
+
+#~ msgid "完成"
+#~ msgstr "Terminé"
+
+#~ msgid "失败"
+#~ msgstr "Échec"
+
+#~ msgid "跳过"
+#~ msgstr "Ignoré"
+
+#~ msgid "待处理"
+#~ msgstr "En attente"
+
+#~ msgid "检查"
+#~ msgstr "Vérifier"
+
+#~ msgid "进度"
+#~ msgstr "Progression"
+
+#~ msgid "DeleteStack 已提交，等待删除完成（{progress}）"
+#~ msgstr "DeleteStack envoyé ; attente de la fin de la suppression ({progress})"
+
+#~ msgid "DeleteStack 已提交，等待删除完成"
+#~ msgstr "DeleteStack envoyé ; attente de la fin de la suppression"
+
+#~ msgid "已跳过"
+#~ msgstr "Ignoré"
+
+#~ msgid "正在删除（{progress}）"
+#~ msgstr "Suppression ({progress})"
+
+#~ msgid "{progress}，需要删除"
+#~ msgstr "{progress}, suppression requise"
+
+#~ msgid "资源栈"
+#~ msgstr "Stack de ressources"
+
+#~ msgid "资源"
+#~ msgstr "Ressource"
+
+#~ msgid "无法读取回滚清理记录，已保留清理提示，请稍后继续或手动检查。"
+#~ msgstr ""
+#~ "Impossible de lire le journal de "
+#~ "nettoyage du rollback ; le prompt "
+#~ "de nettoyage a été conservé. Continuez"
+#~ " plus tard ou vérifiez manuellement."
+
+#~ msgid "还有 {count} 个需要关注的资源未显示。"
+#~ msgstr ""
+#~ "{count} autres ressources nécessitant une "
+#~ "attention ne sont pas affichées."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录均已完成。"
+#~ msgstr ""
+#~ "↺ Reprise du nettoyage du rollback "
+#~ ": les {count} enregistrements sont "
+#~ "terminés."
+
+#~ msgid "进行中"
+#~ msgstr "En cours"
+
+#~ msgid "已完成"
+#~ msgstr "Terminé"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+#~ msgstr ""
+#~ "↺ Reprise du nettoyage du rollback "
+#~ ": {count} enregistrements, {summary}."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录。"
+#~ msgstr "↺ Reprise du nettoyage du rollback : {count} enregistrements."
+
+#~ msgid "Note: images are not supported in pipeline mode and will be ignored."
+#~ msgstr ""
+#~ "Remarque : les images ne sont pas"
+#~ " prises en charge en mode pipeline"
+#~ " et seront ignorées."
diff --git a/src/iac_code/i18n/locales/ja/LC_MESSAGES/messages.po b/src/iac_code/i18n/locales/ja/LC_MESSAGES/messages.po
index c45c6214..bf22dd73 100644
--- a/src/iac_code/i18n/locales/ja/LC_MESSAGES/messages.po
+++ b/src/iac_code/i18n/locales/ja/LC_MESSAGES/messages.po
@@ -44,6 +44,30 @@ msgstr "安全でないアーティファクトファイル名"
 msgid "Unknown error"
 msgstr "不明なエラー"
 
+#: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
+msgid ""
+"Cleanup state unavailable. Inspect the session file and cloud resources "
+"manually."
+msgstr "クリーンアップ状態を利用できません。セッションファイルとクラウドリソースを手動で確認してください。"
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup deferred prompt state is unavailable. Please repair it "
+"before continuing."
+msgstr "ロールバッククリーンアップの遅延プロンプト状態を利用できません。続行する前に修復してください。"
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup state is unavailable. Please repair the cleanup ledger "
+"before continuing."
+msgstr "ロールバッククリーンアップ状態を利用できません。続行する前にクリーンアップ台帳を修復してください。"
+
+#: src/iac_code/a2a/executor.py src/iac_code/ui/repl.py
+msgid ""
+"Rollback cleanup is still in progress. Please continue after cleanup "
+"completes."
+msgstr "ロールバッククリーンアップはまだ進行中です。完了後に続行してください。"
+
 #: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
 msgid "Task is already working."
 msgstr "タスクはすでに実行中です。"
@@ -53,6 +77,11 @@ msgstr "タスクはすでに実行中です。"
 msgid "Task canceled."
 msgstr "タスクがキャンセルされました。"
 
+#: src/iac_code/a2a/executor.py
+#, python-brace-format
+msgid "Current model {model} does not support image input."
+msgstr "現在のモデル {model} は画像入力をサポートしていません。"
+
 #: src/iac_code/a2a/pipeline_executor.py
 msgid "A temporary error occurred. Please retry."
 msgstr "一時的なエラーが発生しました。再試行してください。"
@@ -61,6 +90,11 @@ msgstr "一時的なエラーが発生しました。再試行してください
 msgid "Authentication required. Configure credentials and retry."
 msgstr "認証が必要です。認証情報を設定して再試行してください。"
 
+#: src/iac_code/a2a/pipeline_executor.py
+#, python-brace-format
+msgid "Pipeline already running. Resume task {task_id}."
+msgstr "パイプラインはすでに実行中です。タスク {task_id} を再開してください。"
+
 #: src/iac_code/a2a/pipeline_recovery.py
 msgid "A2A pipeline state not found"
 msgstr "A2A パイプライン状態が見つかりません"
@@ -479,6 +513,18 @@ msgstr "AI 駆動のインフラストラクチャ・オーケストレーショ
 msgid "Use iac-code as an A2A client."
 msgstr "iac-code を A2A クライアントとして使用します。"
 
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A client dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr "A2A クライアントの依存関係が不足しています。次のコマンドでインストールしてください: pip install 'iac-code[a2a]'"
+
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A server dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr "A2A サーバーの依存関係が不足しています。次のコマンドでインストールしてください: pip install 'iac-code[a2a]'"
+
 #: src/iac_code/cli/main.py
 msgid "Install Git for Windows via the npmmirror mirror (Windows only)."
 msgstr "npmmirror ミラー経由で Git for Windows をインストールします（Windows 専用）。"
@@ -491,12 +537,6 @@ msgstr "iac-code を最新バージョンに更新します。"
 msgid "YAML config file containing A2A client options"
 msgstr "A2A クライアントオプションを含む YAML 設定ファイル"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A client dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr "A2A クライアントの依存関係が不足しています。次のコマンドでインストールしてください: pip install 'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "LLM model to use"
 msgstr "使用する LLM モデル"
@@ -622,12 +662,6 @@ msgid ""
 "thinking, tool-trace."
 msgstr "A2A thinking 信号タイプを公開します。複数指定するには繰り返します。値：raw-thinking、tool-trace。"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A server dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr "A2A サーバーの依存関係が不足しています。次のコマンドでインストールしてください: pip install 'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "Send a prompt to an A2A JSON-RPC endpoint."
 msgstr "A2A JSON-RPC エンドポイントにプロンプトを送信します。"
@@ -1526,10 +1560,18 @@ msgstr "システムプロンプトは空です。"
 msgid "No provider messages yet."
 msgstr "プロバイダーメッセージはまだありません。"
 
+#: src/iac_code/commands/prompt.py
+msgid "No cleanup prompts in this snapshot."
+msgstr "このスナップショットにはクリーンアッププロンプトがありません。"
+
 #: src/iac_code/commands/prompt.py
 msgid "No tools are currently registered."
 msgstr "現在登録されているツールはありません。"
 
+#: src/iac_code/commands/prompt.py
+msgid "Cleanup Prompts"
+msgstr "クリーンアッププロンプト"
+
 #: src/iac_code/commands/prompt.py
 msgid "IAC-CODE Prompt Snapshot"
 msgstr "IAC-CODE プロンプトスナップショット"
@@ -1564,6 +1606,14 @@ msgstr "プロバイダーメッセージ"
 msgid "Tools"
 msgstr "ツール"
 
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt"
+msgstr "クリーンアッププロンプト"
+
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt · removed"
+msgstr "クリーンアッププロンプト · 削除済み"
+
 #: src/iac_code/commands/prompt.py
 msgid "Instruction Memory"
 msgstr "指示メモリ"
@@ -1641,6 +1691,11 @@ msgstr "   メッセージ: {count}"
 msgid "   Recalled memory: {status}"
 msgstr "   呼び出されたメモリ: {status}"
 
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "   Cleanup prompts: {count}"
+msgstr "   クリーンアッププロンプト: {count}"
+
 #: src/iac_code/commands/prompt.py
 msgid "3. Tools"
 msgstr "3. ツール"
@@ -1686,6 +1741,15 @@ msgstr "存在します"
 msgid "not present"
 msgstr "存在しません"
 
+#: src/iac_code/commands/prompt.py
+msgid "Rollback cleanup prompts are also shown separately for quick inspection."
+msgstr "ロールバッククリーンアッププロンプトは、すばやく確認できるよう別途表示されます。"
+
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "{count} cleanup prompts"
+msgstr "{count} 件のクリーンアッププロンプト"
+
 #: src/iac_code/commands/prompt.py
 msgid "Tool definitions available to the main model for this request."
 msgstr "このリクエストでメインモデルが利用できるツール定義です。"
@@ -1717,6 +1781,7 @@ msgid "Input schema"
 msgstr "入力スキーマ"
 
 #: src/iac_code/commands/prompt.py
+#: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid "tool"
 msgstr "ツール"
 
@@ -1999,6 +2064,24 @@ msgstr "永続メモリを読み取ります。すべてを一覧表示するに
 msgid "Memory name to read. Omit to list all."
 msgstr "読み取るメモリ名。すべてを一覧表示するには省略します。"
 
+#: src/iac_code/memory/memory_tools.py
+#, python-brace-format
+msgid ""
+"{base}\n"
+"\n"
+"Available memories:\n"
+"{index}\n"
+"\n"
+"Call read_memory again with one of these names, or omit name to list all "
+"memories."
+msgstr ""
+"{base}\n"
+"\n"
+"利用可能なメモリ:\n"
+"{index}\n"
+"\n"
+"これらの名前のいずれかを指定して read_memory を再度呼び出すか、すべてのメモリを一覧表示するには name を省略してください。"
+
 #: src/iac_code/memory/memory_tools.py
 #, python-brace-format
 msgid ""
@@ -2097,6 +2180,121 @@ msgstr "ask_user_question にはパイプラインイベントキューが必要
 msgid "User cancelled ask_user_question."
 msgstr "ユーザーが ask_user_question をキャンセルしました。"
 
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"Cloud resources still need cleanup after pipeline rollback. Clean them up"
+" now and keep checking until deletion completes."
+msgstr "パイプラインのロールバック後もクラウドリソースのクリーンアップが必要です。今すぐクリーンアップし、削除が完了するまで確認を続けてください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Requirements:"
+msgstr "要件:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup scope is a strict allowlist: delete only ids in the cleanup "
+"resources list below."
+msgstr "- クリーンアップ範囲は厳密な許可リストです。下のクリーンアップリソース一覧にある ID だけを削除してください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not delete, modify, or roll back any stack or cloud resource outside"
+" the cleanup resources list."
+msgstr "- クリーンアップリソース一覧にないスタックやクラウドリソースを削除、変更、ロールバックしないでください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not call ListStacks or search for other stacks by name; cleanup "
+"resource ids are fully listed."
+msgstr "- ListStacks を呼び出したり、名前で他のスタックを検索したりしないでください。クリーンアップリソース ID は完全に列挙されています。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Before every GetStack/DeleteStack call, verify that StackId exactly "
+"matches an id in the cleanup resources list."
+msgstr ""
+"- GetStack/DeleteStack を呼び出す前に、StackId がクリーンアップリソース一覧内の ID "
+"と完全に一致することを確認してください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If StackId is not in the cleanup resources list, do not call "
+"DeleteStack, even if it is the current handoff or newly created stack."
+msgstr ""
+"- StackId がクリーンアップリソース一覧にない場合は、それが現在の handoff や新規作成スタックでも DeleteStack "
+"を呼び出さないでください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not infer extra cleanup targets from pipeline handoff, "
+"deployment.stack_id, current stack, or resources_created; those may be "
+"final delivered resources."
+msgstr ""
+"- pipeline handoff、deployment.stack_id、現在のスタック、resources_created "
+"から追加のクリーンアップ対象を推測しないでください。それらは最終納品リソースの可能性があります。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not expand cleanup scope for user follow-ups, continue instructions,"
+" or pipeline handoff context."
+msgstr "- ユーザーの追加質問、continue 指示、pipeline handoff コンテキストを理由にクリーンアップ範囲を広げないでください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- When resuming cleanup, still process only resources listed in this "
+"prompt; do not inspect or delete others."
+msgstr "- クリーンアップを再開するときも、このプロンプトに列挙されたリソースだけを処理し、それ以外を調査または削除しないでください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Prefer available ROS stack tools for deletion; if using aliyun_api, "
+"call DeleteStack first, then repeatedly call GetStack to check status."
+msgstr ""
+"- 削除には利用可能な ROS スタックツールを優先してください。aliyun_api を使う場合は、最初に DeleteStack "
+"を呼び出し、その後 GetStack を繰り返し呼び出して状態を確認してください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If a resource is already deleting, call GetStack first, then decide "
+"whether DeleteStack is needed again."
+msgstr "- リソースがすでに削除中の場合は、まず GetStack を呼び出し、その後 DeleteStack が再度必要か判断してください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup is complete only after DELETE_COMPLETE; for DELETE_FAILED or "
+"unknown status, tell the user the failure reason and next step."
+msgstr ""
+"- クリーンアップは DELETE_COMPLETE 後にのみ完了です。DELETE_FAILED "
+"または不明な状態の場合は、失敗理由と次の手順をユーザーに伝えてください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- After all listed resources are DELETE_COMPLETE, stop this cleanup turn "
+"immediately."
+msgstr "- 列挙されたすべてのリソースが DELETE_COMPLETE になったら、このクリーンアップターンを直ちに停止してください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "- Briefly update the user during cleanup."
+msgstr "- クリーンアップ中はユーザーに簡潔に進捗を伝えてください。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Cleanup resources:"
+msgstr "クリーンアップリソース:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid ""
+"{index}. provider={provider}, type={resource_type}, id={resource_id}, "
+"name={name}, region={region}"
+msgstr ""
+"{index}. プロバイダー={provider}, 種別={resource_type}, ID={resource_id}, "
+"名前={name}, リージョン={region}"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid "Detected {count} rollback cleanup resources; starting cleanup."
+msgstr "{count} 件のロールバッククリーンアップリソースを検出しました。クリーンアップを開始します。"
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid ""
 "Complete the current step by calling this tool to submit the conclusion. "
@@ -2185,20 +2383,50 @@ msgid ""
 "{fields}."
 msgstr "{message} complete_step.conclusion には次のいずれかのフィールドが必要です: {fields}。"
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "A successful tool result is required before completing the current step."
+msgstr "現在のステップを完了する前に、成功したツール結果が必要です。"
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
-msgid "Candidate count cannot exceed {limit}; {count} were submitted."
-msgstr "候補数は {limit} を超えられません。{count} 件が送信されました。"
+msgid ""
+"{message} complete_step.conclusion.{field} must match the {tool} result "
+"value {value}."
+msgstr ""
+"{message} complete_step.conclusion.{field} は {tool} の結果値 {value} "
+"と一致する必要があります。"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "<missing>"
+msgstr "<欠落>"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " with status {statuses}"
+msgstr "（ステータス: {statuses}）"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " and is_success={expected}"
+msgstr "、かつ is_success={expected}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " one of {actions}"
+msgstr "（アクションは {actions} のいずれか）"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid ""
-"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
-"user for help or narrow the rollback targets before calling "
-"complete_step."
+"{message} Call {tool}{action} first and wait for a successful "
+"result{status_hint}{success_hint}."
 msgstr ""
-"ロールバック対象数は {limit} を超えられません。現在 {count} 件あります。complete_step "
-"を呼ぶ前にユーザーに支援を求めるか、対象を絞ってください。"
+"{message} まず {tool}{action} "
+"を呼び出し、成功した結果{status_hint}{success_hint}を待ってください。"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "the required tool"
+msgstr "必須ツール"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
@@ -2207,6 +2435,21 @@ msgid ""
 "or ask the user for help."
 msgstr "ロールバック回数は {max_rollbacks} を超えられません。現在のステップを完了するか、ユーザーに支援を求めてください。"
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgstr "候補数は {limit} を超えられません。{count} 件が送信されました。"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid ""
+"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
+"user for help or narrow the rollback targets before calling "
+"complete_step."
+msgstr ""
+"ロールバック対象数は {limit} を超えられません。現在 {count} 件あります。complete_step "
+"を呼ぶ前にユーザーに支援を求めるか、対象を絞ってください。"
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid "Schema validation failed after {attempts} attempts: {error}"
@@ -2229,6 +2472,10 @@ msgstr "conclusion の検証に失敗しました。修正して complete_step 
 msgid "Step {step_id} completed. Conclusion submitted."
 msgstr "ステップ {step_id} が完了しました。結論を送信しました。"
 
+#: src/iac_code/pipeline/engine/pipeline_runner.py
+msgid "Pipeline state persistence failed."
+msgstr "パイプライン状態の永続化に失敗しました。"
+
 #: src/iac_code/pipeline/engine/pipeline_runner.py
 #: src/iac_code/pipeline/engine/sub_pipeline_executor.py
 #: src/iac_code/ui/repl.py
@@ -2324,6 +2571,10 @@ msgstr "テンプレートファイルのパスは作業ディレクトリから
 msgid "Template file path cannot escape the working directory"
 msgstr "テンプレートファイルのパスは作業ディレクトリの外に出られません"
 
+#: src/iac_code/pipeline/engine/user_input.py
+msgid "[Image input]"
+msgstr "[画像入力]"
+
 #: src/iac_code/pipeline/selling/tools/show_candidate_detail_tool.py
 msgid ""
 "Display candidate details (summary and cost breakdown) in the comparison "
@@ -3183,6 +3434,16 @@ msgstr "ROS スタック"
 msgid "CloudStackInstances"
 msgstr "CloudStackInstances"
 
+#: src/iac_code/tools/cloud/aliyun/template_source.py
+msgid ""
+"ROS template calls must use TemplateURL instead of TemplateBody. Save the"
+" template to a file and pass params.TemplateURL, for example a local file"
+" path or OSS/HTTP URL."
+msgstr ""
+"ROS テンプレート呼び出しでは TemplateBody ではなく TemplateURL "
+"を使用する必要があります。テンプレートをファイルに保存し、ローカルファイルパスまたは OSS/HTTP URL などを "
+"params.TemplateURL として渡してください。"
+
 #: src/iac_code/tools/cloud/aliyun/hooks/ros_validate.py
 #, python-brace-format
 msgid "Template YAML syntax error: {}"
@@ -3293,11 +3554,11 @@ msgstr "中断済み"
 msgid "Running"
 msgstr "実行中"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Completed"
 msgstr "完了"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Failed"
 msgstr "失敗"
 
@@ -3570,8 +3831,121 @@ msgid "Command has no handler: {name}"
 msgstr "ハンドラーがないコマンドです：{name}"
 
 #: src/iac_code/ui/repl.py
-msgid "Note: images are not supported in pipeline mode and will be ignored."
-msgstr "注: パイプラインモードでは画像はサポートされておらず、無視されます。"
+#, python-brace-format
+msgid "↺ Rollback cleanup [{badge}] {label}"
+msgstr "↺ ロールバッククリーンアップ [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{kind} {resource_id}"
+msgstr "{kind} {resource_id}"
+
+#: src/iac_code/ui/repl.py
+msgid "Deleting"
+msgstr "削除中"
+
+#: src/iac_code/ui/repl.py
+msgid "Skipped"
+msgstr "スキップ済み"
+
+#: src/iac_code/ui/repl.py
+msgid "Pending"
+msgstr "保留中"
+
+#: src/iac_code/ui/repl.py
+msgid "Checking"
+msgstr "確認中"
+
+#: src/iac_code/ui/repl.py
+msgid "Progress"
+msgstr "進捗"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "DeleteStack submitted; waiting for deletion to complete ({progress})"
+msgstr "DeleteStack を送信しました。削除完了を待機しています ({progress})"
+
+#: src/iac_code/ui/repl.py
+msgid "DeleteStack submitted; waiting for deletion to complete"
+msgstr "DeleteStack を送信しました。削除完了を待機しています"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Deleting ({progress})"
+msgstr "削除中 ({progress})"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{progress}; deletion required"
+msgstr "{progress}、削除が必要です"
+
+#: src/iac_code/ui/repl.py
+msgid "stack"
+msgstr "スタック"
+
+#: src/iac_code/ui/repl.py
+msgid "resource"
+msgstr "リソース"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Could not read rollback cleanup records. The cleanup prompt was kept; "
+"retry later or inspect manually."
+msgstr "ロールバッククリーンアップレコードを読み取れませんでした。クリーンアッププロンプトは保持されています。後で再試行するか、手動で確認してください。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} additional resources needing attention were not shown."
+msgstr "対応が必要な追加リソース {count} 件は表示されませんでした。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: all {count} records are completed."
+msgstr "↺ ロールバッククリーンアップ再開: {count} 件のレコードはすべて完了しています。"
+
+#: src/iac_code/ui/repl.py
+msgid "failed"
+msgstr "失敗"
+
+#: src/iac_code/ui/repl.py
+msgid "pending"
+msgstr "保留中"
+
+#: src/iac_code/ui/repl.py
+msgid "in progress"
+msgstr "進行中"
+
+#: src/iac_code/ui/repl.py
+msgid "completed"
+msgstr "完了"
+
+#: src/iac_code/ui/repl.py
+msgid "skipped"
+msgstr "スキップ済み"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} {label}"
+msgstr "{count} 件の{label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records, {summary}."
+msgstr "↺ ロールバッククリーンアップ再開: {count} 件のレコード、{summary}。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records."
+msgstr "↺ ロールバッククリーンアップ再開: {count} 件のレコード。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "  [{badge}] {label}"
+msgstr "  [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+msgid "Detected rollback cleanup resources, but cleanup prompt injection failed."
+msgstr "ロールバッククリーンアップリソースを検出しましたが、クリーンアッププロンプトの注入に失敗しました。"
 
 #: src/iac_code/ui/repl.py
 #, python-brace-format
@@ -3580,9 +3954,21 @@ msgstr "保存済みのパイプライン状態を無視しています: {reason
 
 #: src/iac_code/ui/repl.py
 msgid ""
-"Pipeline completed. Normal chat is active, but the handoff context could "
-"not be injected or saved."
-msgstr "パイプラインが完了しました。通常チャットは有効ですが、引き継ぎコンテキストを注入または保存できませんでした。"
+"Pipeline state persistence failed. The pipeline is paused; do not "
+"continue until state is durable."
+msgstr "パイプライン状態の永続化に失敗しました。パイプラインは一時停止中です。状態が永続化されるまで続行しないでください。"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline state persistence failed. Normal chat handoff was not marked "
+"durable."
+msgstr "パイプライン状態の永続化に失敗しました。通常チャットへのハンドオフは永続化済みとしてマークされていません。"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline completed, but the handoff context could not be injected or "
+"saved."
+msgstr "パイプラインは完了しましたが、handoff コンテキストを注入または保存できませんでした。"
 
 #: src/iac_code/ui/repl.py
 msgid "Judging your input..."
@@ -3748,6 +4134,11 @@ msgstr "  ✓ {name}: 完了\n"
 msgid "  ✘ {name}: Failed"
 msgstr "  ✘ {name}: 失敗"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Pipeline warning: {reason}"
+msgstr "パイプライン警告: {reason}"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Option {index}"
@@ -3827,6 +4218,15 @@ msgstr "不明なエラー"
 msgid "Resumed pipeline at step: {step}"
 msgstr "パイプラインをステップ {step} から再開しました"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Could not read pipeline state metadata: {reason}"
+msgstr "パイプライン状態メタデータを読み取れませんでした: {reason}"
+
+#: src/iac_code/ui/repl.py
+msgid "Pipeline state metadata is invalid; continuing as normal chat."
+msgstr "パイプライン状態メタデータが無効です。通常チャットとして続行します。"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Found pipeline state in this session (paused at: {step})."
@@ -4367,3 +4767,153 @@ msgstr "公開イベントではスタックトレースを省略しました。
 
 #~ msgid "Project Memory Index"
 #~ msgstr "プロジェクトメモリ索引"
+
+#~ msgid "检测到 pipeline rollback 后仍需要清理的云资源。请立即清理这些资源，并持续检查直到删除完成。"
+#~ msgstr ""
+#~ "pipeline rollback "
+#~ "後もクリーンアップが必要なクラウドリソースを検出しました。直ちにこれらを削除し、削除完了まで継続して確認してください。"
+
+#~ msgid "要求："
+#~ msgstr "要件:"
+
+#~ msgid "- 清理范围是严格白名单：只能删除下面“待清理资源”列表中的 id。"
+#~ msgstr "- クリーンアップ範囲は厳密なホワイトリストです。以下の「クリーンアップ対象リソース」一覧の id だけを削除できます。"
+
+#~ msgid "- 不要删除、修改或回滚任何未列入“待清理资源”的 stack 或云资源。"
+#~ msgstr "- 「クリーンアップ対象リソース」に記載されていない stack やクラウドリソースは削除、変更、ロールバックしないでください。"
+
+#~ msgid "- 不要调用 ListStacks 或按名称搜索其它 stack；待清理资源 id 已完整列出。"
+#~ msgstr ""
+#~ "- ListStacks を呼び出したり、名前で他の stack "
+#~ "を検索したりしないでください。クリーンアップ対象リソースの id はすべて列挙されています。"
+
+#~ msgid "- 每次调用 GetStack/DeleteStack 前，必须核对 StackId 精确等于“待清理资源”列表中的某个 id。"
+#~ msgstr ""
+#~ "- GetStack/DeleteStack を呼び出す前に、StackId "
+#~ "が「クリーンアップ対象リソース」リスト内のいずれかの id と完全に一致することを必ず確認してください。"
+
+#~ msgid "- 如果 StackId 不在“待清理资源”列表中，禁止调用 DeleteStack，即使它是当前 handoff 或刚创建的 stack。"
+#~ msgstr ""
+#~ "- StackId が「クリーンアップ対象リソース」リストにない場合、それが現在の handoff"
+#~ " や作成直後の stack であっても DeleteStack "
+#~ "を呼び出してはいけません。"
+
+#~ msgid ""
+#~ "- 不要根据 pipeline handoff、deployment.stack_id、current"
+#~ " stack 或 resources_created "
+#~ "额外推断清理对象；这些可能是最终成功交付的资源。"
+#~ msgstr ""
+#~ "- pipeline handoff、deployment.stack_id、current "
+#~ "stack、resources_created "
+#~ "から追加のクリーンアップ対象を推測しないでください。これらは最終的に正常提供されたリソースかもしれません。"
+
+#~ msgid "- 即使本轮还有用户追问、继续指令或 pipeline handoff 上下文，也不能扩大清理范围。"
+#~ msgstr ""
+#~ "- このラウンドにユーザーの追加質問、続行指示、pipeline handoff "
+#~ "コンテキストがあっても、クリーンアップ範囲を広げないでください。"
+
+#~ msgid "- 恢复或继续清理时仍只处理当前提示列出的资源；不要检查或删除其它资源。"
+#~ msgstr ""
+#~ "- "
+#~ "クリーンアップを再開または続行する場合も、このプロンプトに列挙されたリソースだけを処理してください。他のリソースを確認または削除しないでください。"
+
+#~ msgid ""
+#~ "- 优先使用可用的 ROS stack 工具删除；如果改用 "
+#~ "aliyun_api，请先 DeleteStack，再反复 GetStack 检查状态。"
+#~ msgstr ""
+#~ "- 利用可能な ROS stack ツールでの削除を優先してください。aliyun_api"
+#~ " を使う場合は、まず DeleteStack を実行し、その後 GetStack "
+#~ "で状態を繰り返し確認してください。"
+
+#~ msgid "- 如果资源已经处于删除中，请先 GetStack 检查当前状态，再决定是否需要重新 DeleteStack。"
+#~ msgstr ""
+#~ "- リソースがすでに削除中の場合は、まず GetStack で現在状態を確認し、DeleteStack"
+#~ " を再実行する必要があるか判断してください。"
+
+#~ msgid "- 只有确认 DELETE_COMPLETE 才算清理完成；DELETE_FAILED 或无法确认时要向用户说明失败原因和下一步。"
+#~ msgstr ""
+#~ "- DELETE_COMPLETE を確認した場合のみクリーンアップ完了です。DELETE_FAILED "
+#~ "または確認不能の場合は、失敗原因と次の手順をユーザーに説明してください。"
+
+#~ msgid "- 列表内资源全部 DELETE_COMPLETE 后，立刻停止本轮清理；不要继续删除或检查任何其他 stack。"
+#~ msgstr ""
+#~ "- 一覧内のすべてのリソースが DELETE_COMPLETE "
+#~ "になったら、このクリーンアップを直ちに停止してください。他の stack を削除または確認しないでください。"
+
+#~ msgid "- 清理过程中向用户简短同步进度。"
+#~ msgstr "- クリーンアップ中は進捗を簡潔にユーザーへ共有してください。"
+
+#~ msgid "待清理资源："
+#~ msgstr "クリーンアップ対象リソース:"
+
+#~ msgid "检测到 {count} 个回滚残留资源，开始清理流程。"
+#~ msgstr "{count} 件のロールバック残留リソースを検出しました。クリーンアップフローを開始します。"
+
+#~ msgid "错误：{error}"
+#~ msgstr "エラー: {error}"
+
+#~ msgid "删除中"
+#~ msgstr "削除中"
+
+#~ msgid "完成"
+#~ msgstr "完了"
+
+#~ msgid "失败"
+#~ msgstr "失敗"
+
+#~ msgid "跳过"
+#~ msgstr "スキップ"
+
+#~ msgid "待处理"
+#~ msgstr "保留中"
+
+#~ msgid "检查"
+#~ msgstr "確認"
+
+#~ msgid "进度"
+#~ msgstr "進捗"
+
+#~ msgid "DeleteStack 已提交，等待删除完成（{progress}）"
+#~ msgstr "DeleteStack を送信しました。削除完了を待機中（{progress}）"
+
+#~ msgid "DeleteStack 已提交，等待删除完成"
+#~ msgstr "DeleteStack を送信しました。削除完了を待機中"
+
+#~ msgid "已跳过"
+#~ msgstr "スキップ済み"
+
+#~ msgid "正在删除（{progress}）"
+#~ msgstr "削除中（{progress}）"
+
+#~ msgid "{progress}，需要删除"
+#~ msgstr "{progress}、削除が必要"
+
+#~ msgid "资源栈"
+#~ msgstr "リソーススタック"
+
+#~ msgid "资源"
+#~ msgstr "リソース"
+
+#~ msgid "无法读取回滚清理记录，已保留清理提示，请稍后继续或手动检查。"
+#~ msgstr "ロールバッククリーンアップ記録を読み取れませんでした。クリーンアッププロンプトは保持されています。後で続行するか手動で確認してください。"
+
+#~ msgid "还有 {count} 个需要关注的资源未显示。"
+#~ msgstr "注意が必要な未表示のリソースがさらに {count} 件あります。"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录均已完成。"
+#~ msgstr "↺ ロールバッククリーンアップ復元: {count} 件の記録はすべて完了済みです。"
+
+#~ msgid "进行中"
+#~ msgstr "進行中"
+
+#~ msgid "已完成"
+#~ msgstr "完了済み"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+#~ msgstr "↺ ロールバッククリーンアップ復元: {count} 件の記録、{summary}。"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录。"
+#~ msgstr "↺ ロールバッククリーンアップ復元: {count} 件の記録。"
+
+#~ msgid "Note: images are not supported in pipeline mode and will be ignored."
+#~ msgstr "注: パイプラインモードでは画像はサポートされておらず、無視されます。"
diff --git a/src/iac_code/i18n/locales/pt/LC_MESSAGES/messages.po b/src/iac_code/i18n/locales/pt/LC_MESSAGES/messages.po
index 7ceb3c1b..55b40178 100644
--- a/src/iac_code/i18n/locales/pt/LC_MESSAGES/messages.po
+++ b/src/iac_code/i18n/locales/pt/LC_MESSAGES/messages.po
@@ -48,6 +48,38 @@ msgstr "Nome de arquivo de artefato inseguro"
 msgid "Unknown error"
 msgstr "Erro desconhecido"
 
+#: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
+msgid ""
+"Cleanup state unavailable. Inspect the session file and cloud resources "
+"manually."
+msgstr ""
+"Estado de limpeza indisponível. Inspecione manualmente o arquivo de "
+"sessão e os recursos de nuvem."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup deferred prompt state is unavailable. Please repair it "
+"before continuing."
+msgstr ""
+"O estado do prompt adiado de limpeza de rollback não está disponível. "
+"Corrija-o antes de continuar."
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup state is unavailable. Please repair the cleanup ledger "
+"before continuing."
+msgstr ""
+"O estado de limpeza de rollback não está disponível. Corrija o ledger de "
+"limpeza antes de continuar."
+
+#: src/iac_code/a2a/executor.py src/iac_code/ui/repl.py
+msgid ""
+"Rollback cleanup is still in progress. Please continue after cleanup "
+"completes."
+msgstr ""
+"A limpeza de rollback ainda está em andamento. Continue após a limpeza "
+"terminar."
+
 #: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
 msgid "Task is already working."
 msgstr "A tarefa já está em execução."
@@ -57,6 +89,11 @@ msgstr "A tarefa já está em execução."
 msgid "Task canceled."
 msgstr "Tarefa cancelada."
 
+#: src/iac_code/a2a/executor.py
+#, python-brace-format
+msgid "Current model {model} does not support image input."
+msgstr "O modelo atual {model} não oferece suporte a entrada de imagem."
+
 #: src/iac_code/a2a/pipeline_executor.py
 msgid "A temporary error occurred. Please retry."
 msgstr "Ocorreu um erro temporário. Tente novamente."
@@ -65,6 +102,11 @@ msgstr "Ocorreu um erro temporário. Tente novamente."
 msgid "Authentication required. Configure credentials and retry."
 msgstr "Autenticação necessária. Configure as credenciais e tente novamente."
 
+#: src/iac_code/a2a/pipeline_executor.py
+#, python-brace-format
+msgid "Pipeline already running. Resume task {task_id}."
+msgstr "O pipeline já está em execução. Retome a tarefa {task_id}."
+
 #: src/iac_code/a2a/pipeline_recovery.py
 msgid "A2A pipeline state not found"
 msgstr "Estado do pipeline A2A não encontrado"
@@ -497,6 +539,22 @@ msgstr "Ferramenta de orquestração de infraestrutura com IA"
 msgid "Use iac-code as an A2A client."
 msgstr "Usa o iac-code como cliente A2A."
 
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A client dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"As dependências do cliente A2A estão ausentes. Instale com: pip install "
+"'iac-code[a2a]'"
+
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A server dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr ""
+"As dependências do servidor A2A estão ausentes. Instale com: pip install "
+"'iac-code[a2a]'"
+
 #: src/iac_code/cli/main.py
 msgid "Install Git for Windows via the npmmirror mirror (Windows only)."
 msgstr "Instalar Git for Windows pelo espelho npmmirror (somente Windows)."
@@ -509,14 +567,6 @@ msgstr "Atualizar o iac-code para a versão mais recente."
 msgid "YAML config file containing A2A client options"
 msgstr "Arquivo de configuração YAML com opções do cliente A2A"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A client dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"As dependências do cliente A2A estão ausentes. Instale com: pip install "
-"'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "LLM model to use"
 msgstr "Modelo LLM a utilizar"
@@ -650,14 +700,6 @@ msgstr ""
 "Expõe tipos de sinal de thinking A2A; repita para múltiplos. Valores: "
 "raw-thinking, tool-trace."
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A server dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr ""
-"As dependências do servidor A2A estão ausentes. Instale com: pip install "
-"'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "Send a prompt to an A2A JSON-RPC endpoint."
 msgstr "Envia um prompt para um endpoint JSON-RPC A2A."
@@ -1554,10 +1596,18 @@ msgstr "O prompt de sistema está vazio."
 msgid "No provider messages yet."
 msgstr "Ainda não há mensagens do provedor."
 
+#: src/iac_code/commands/prompt.py
+msgid "No cleanup prompts in this snapshot."
+msgstr "Não há prompts de limpeza neste snapshot."
+
 #: src/iac_code/commands/prompt.py
 msgid "No tools are currently registered."
 msgstr "Nenhuma ferramenta está registrada no momento."
 
+#: src/iac_code/commands/prompt.py
+msgid "Cleanup Prompts"
+msgstr "Prompts de limpeza"
+
 #: src/iac_code/commands/prompt.py
 msgid "IAC-CODE Prompt Snapshot"
 msgstr "Instantâneo do prompt do IAC-CODE"
@@ -1594,6 +1644,14 @@ msgstr "Mensagens do provedor"
 msgid "Tools"
 msgstr "Ferramentas"
 
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt"
+msgstr "prompt de limpeza"
+
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt · removed"
+msgstr "prompt de limpeza · removido"
+
 #: src/iac_code/commands/prompt.py
 msgid "Instruction Memory"
 msgstr "Memória de instruções"
@@ -1673,6 +1731,11 @@ msgstr "   Mensagens: {count}"
 msgid "   Recalled memory: {status}"
 msgstr "   Memória recuperada: {status}"
 
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "   Cleanup prompts: {count}"
+msgstr "   Prompts de limpeza: {count}"
+
 #: src/iac_code/commands/prompt.py
 msgid "3. Tools"
 msgstr "3. Ferramentas"
@@ -1722,6 +1785,17 @@ msgstr "presente"
 msgid "not present"
 msgstr "não presente"
 
+#: src/iac_code/commands/prompt.py
+msgid "Rollback cleanup prompts are also shown separately for quick inspection."
+msgstr ""
+"Os prompts de limpeza de rollback também são exibidos separadamente para "
+"inspeção rápida."
+
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "{count} cleanup prompts"
+msgstr "{count} prompts de limpeza"
+
 #: src/iac_code/commands/prompt.py
 msgid "Tool definitions available to the main model for this request."
 msgstr ""
@@ -1755,6 +1829,7 @@ msgid "Input schema"
 msgstr "Esquema de entrada"
 
 #: src/iac_code/commands/prompt.py
+#: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid "tool"
 msgstr "ferramenta"
 
@@ -2049,6 +2124,25 @@ msgstr ""
 msgid "Memory name to read. Omit to list all."
 msgstr "Nome da memória a ler. Omita para listar todas."
 
+#: src/iac_code/memory/memory_tools.py
+#, python-brace-format
+msgid ""
+"{base}\n"
+"\n"
+"Available memories:\n"
+"{index}\n"
+"\n"
+"Call read_memory again with one of these names, or omit name to list all "
+"memories."
+msgstr ""
+"{base}\n"
+"\n"
+"Memórias disponíveis:\n"
+"{index}\n"
+"\n"
+"Chame read_memory novamente com um destes nomes, ou omita name para "
+"listar todas as memórias."
+
 #: src/iac_code/memory/memory_tools.py
 #, python-brace-format
 msgid ""
@@ -2151,6 +2245,141 @@ msgstr "ask_user_question requer uma fila de eventos do pipeline."
 msgid "User cancelled ask_user_question."
 msgstr "O usuário cancelou ask_user_question."
 
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"Cloud resources still need cleanup after pipeline rollback. Clean them up"
+" now and keep checking until deletion completes."
+msgstr ""
+"Os recursos de nuvem ainda precisam de limpeza após o rollback do "
+"pipeline. Limpe-os agora e continue verificando até que a exclusão seja "
+"concluída."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Requirements:"
+msgstr "Requisitos:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup scope is a strict allowlist: delete only ids in the cleanup "
+"resources list below."
+msgstr ""
+"- O escopo de limpeza é uma allowlist estrita: exclua apenas os IDs na "
+"lista de recursos de limpeza abaixo."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not delete, modify, or roll back any stack or cloud resource outside"
+" the cleanup resources list."
+msgstr ""
+"- Não exclua, modifique nem reverta stacks ou recursos de nuvem fora da "
+"lista de recursos de limpeza."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not call ListStacks or search for other stacks by name; cleanup "
+"resource ids are fully listed."
+msgstr ""
+"- Não chame ListStacks nem pesquise outros stacks por nome; os IDs dos "
+"recursos de limpeza estão totalmente listados."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Before every GetStack/DeleteStack call, verify that StackId exactly "
+"matches an id in the cleanup resources list."
+msgstr ""
+"- Antes de cada chamada GetStack/DeleteStack, verifique se StackId "
+"corresponde exatamente a um ID na lista de recursos de limpeza."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If StackId is not in the cleanup resources list, do not call "
+"DeleteStack, even if it is the current handoff or newly created stack."
+msgstr ""
+"- Se StackId não estiver na lista de recursos de limpeza, não chame "
+"DeleteStack, mesmo que seja o stack atual do handoff ou recém-criado."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not infer extra cleanup targets from pipeline handoff, "
+"deployment.stack_id, current stack, or resources_created; those may be "
+"final delivered resources."
+msgstr ""
+"- Não infira alvos de limpeza extras a partir do handoff do pipeline, "
+"deployment.stack_id, stack atual ou resources_created; eles podem ser "
+"recursos finais entregues."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not expand cleanup scope for user follow-ups, continue instructions,"
+" or pipeline handoff context."
+msgstr ""
+"- Não expanda o escopo de limpeza por causa de acompanhamento do usuário,"
+" instruções de continue ou contexto de handoff do pipeline."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- When resuming cleanup, still process only resources listed in this "
+"prompt; do not inspect or delete others."
+msgstr ""
+"- Ao retomar a limpeza, processe apenas os recursos listados neste "
+"prompt; não inspecione nem exclua outros."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Prefer available ROS stack tools for deletion; if using aliyun_api, "
+"call DeleteStack first, then repeatedly call GetStack to check status."
+msgstr ""
+"- Prefira as ferramentas de stack ROS disponíveis para exclusão; se usar "
+"aliyun_api, chame DeleteStack primeiro e depois chame GetStack "
+"repetidamente para verificar o status."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If a resource is already deleting, call GetStack first, then decide "
+"whether DeleteStack is needed again."
+msgstr ""
+"- Se um recurso já estiver sendo excluído, chame GetStack primeiro e "
+"depois decida se DeleteStack é necessário novamente."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup is complete only after DELETE_COMPLETE; for DELETE_FAILED or "
+"unknown status, tell the user the failure reason and next step."
+msgstr ""
+"- A limpeza só está completa após DELETE_COMPLETE; para DELETE_FAILED ou "
+"status desconhecido, informe ao usuário o motivo da falha e o próximo "
+"passo."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- After all listed resources are DELETE_COMPLETE, stop this cleanup turn "
+"immediately."
+msgstr ""
+"- Depois que todos os recursos listados estiverem em DELETE_COMPLETE, "
+"pare este turno de limpeza imediatamente."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "- Briefly update the user during cleanup."
+msgstr "- Atualize brevemente o usuário durante a limpeza."
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Cleanup resources:"
+msgstr "Recursos de limpeza:"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid ""
+"{index}. provider={provider}, type={resource_type}, id={resource_id}, "
+"name={name}, region={region}"
+msgstr ""
+"{index}. provedor={provider}, tipo={resource_type}, id={resource_id}, "
+"nome={name}, região={region}"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid "Detected {count} rollback cleanup resources; starting cleanup."
+msgstr "{count} recursos de limpeza de rollback detectados; iniciando limpeza."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid ""
 "Complete the current step by calling this tool to submit the conclusion. "
@@ -2246,23 +2475,52 @@ msgstr ""
 "{message} complete_step.conclusion deve incluir um destes campos: "
 "{fields}."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "A successful tool result is required before completing the current step."
+msgstr ""
+"É necessário um resultado de ferramenta bem-sucedido antes de concluir a "
+"etapa atual."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
-msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgid ""
+"{message} complete_step.conclusion.{field} must match the {tool} result "
+"value {value}."
 msgstr ""
-"A quantidade de candidatos não pode exceder {limit}; {count} foram "
-"enviados."
+"{message} complete_step.conclusion.{field} deve corresponder ao valor de "
+"resultado {value} de {tool}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "<missing>"
+msgstr "<ausente>"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " with status {statuses}"
+msgstr " com status {statuses}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " and is_success={expected}"
+msgstr " e is_success={expected}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " one of {actions}"
+msgstr " com uma das ações {actions}"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid ""
-"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
-"user for help or narrow the rollback targets before calling "
-"complete_step."
+"{message} Call {tool}{action} first and wait for a successful "
+"result{status_hint}{success_hint}."
 msgstr ""
-"A quantidade de destinos de reversão não pode exceder {limit}; há "
-"{count}. Peça ajuda ao usuário ou reduza os destinos antes de chamar "
-"complete_step."
+"{message} Chame {tool}{action} primeiro e aguarde um resultado bem-"
+"sucedido{status_hint}{success_hint}."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "the required tool"
+msgstr "a ferramenta obrigatória"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
@@ -2273,6 +2531,24 @@ msgstr ""
 "A quantidade de reversões não pode exceder {max_rollbacks}. Conclua a "
 "etapa atual ou peça ajuda ao usuário."
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgstr ""
+"A quantidade de candidatos não pode exceder {limit}; {count} foram "
+"enviados."
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid ""
+"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
+"user for help or narrow the rollback targets before calling "
+"complete_step."
+msgstr ""
+"A quantidade de destinos de reversão não pode exceder {limit}; há "
+"{count}. Peça ajuda ao usuário ou reduza os destinos antes de chamar "
+"complete_step."
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid "Schema validation failed after {attempts} attempts: {error}"
@@ -2299,6 +2575,10 @@ msgstr ""
 msgid "Step {step_id} completed. Conclusion submitted."
 msgstr "Etapa {step_id} concluída. Conclusão enviada."
 
+#: src/iac_code/pipeline/engine/pipeline_runner.py
+msgid "Pipeline state persistence failed."
+msgstr "Falha ao persistir o estado do pipeline."
+
 #: src/iac_code/pipeline/engine/pipeline_runner.py
 #: src/iac_code/pipeline/engine/sub_pipeline_executor.py
 #: src/iac_code/ui/repl.py
@@ -2401,6 +2681,10 @@ msgstr ""
 msgid "Template file path cannot escape the working directory"
 msgstr "O caminho do arquivo de template não pode sair do diretório de trabalho"
 
+#: src/iac_code/pipeline/engine/user_input.py
+msgid "[Image input]"
+msgstr "[Entrada de imagem]"
+
 #: src/iac_code/pipeline/selling/tools/show_candidate_detail_tool.py
 msgid ""
 "Display candidate details (summary and cost breakdown) in the comparison "
@@ -3279,6 +3563,16 @@ msgstr "ROS Stack"
 msgid "CloudStackInstances"
 msgstr "CloudStackInstances"
 
+#: src/iac_code/tools/cloud/aliyun/template_source.py
+msgid ""
+"ROS template calls must use TemplateURL instead of TemplateBody. Save the"
+" template to a file and pass params.TemplateURL, for example a local file"
+" path or OSS/HTTP URL."
+msgstr ""
+"As chamadas de template ROS devem usar TemplateURL em vez de TemplateBody. "
+"Salve o template em um arquivo e passe params.TemplateURL, por exemplo um "
+"caminho de arquivo local ou uma URL OSS/HTTP."
+
 #: src/iac_code/tools/cloud/aliyun/hooks/ros_validate.py
 #, python-brace-format
 msgid "Template YAML syntax error: {}"
@@ -3397,11 +3691,11 @@ msgstr "Interrompido"
 msgid "Running"
 msgstr "Em execução"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Completed"
 msgstr "Concluído"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Failed"
 msgstr "Falhou"
 
@@ -3676,8 +3970,128 @@ msgid "Command has no handler: {name}"
 msgstr "Comando sem tratador: {name}"
 
 #: src/iac_code/ui/repl.py
-msgid "Note: images are not supported in pipeline mode and will be ignored."
-msgstr "Observação: imagens não são suportadas no modo pipeline e serão ignoradas."
+#, python-brace-format
+msgid "↺ Rollback cleanup [{badge}] {label}"
+msgstr "↺ Limpeza de rollback [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{kind} {resource_id}"
+msgstr "{kind} {resource_id}"
+
+#: src/iac_code/ui/repl.py
+msgid "Deleting"
+msgstr "Excluindo"
+
+#: src/iac_code/ui/repl.py
+msgid "Skipped"
+msgstr "Ignorado"
+
+#: src/iac_code/ui/repl.py
+msgid "Pending"
+msgstr "Pendente"
+
+#: src/iac_code/ui/repl.py
+msgid "Checking"
+msgstr "Verificando"
+
+#: src/iac_code/ui/repl.py
+msgid "Progress"
+msgstr "Progresso"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "DeleteStack submitted; waiting for deletion to complete ({progress})"
+msgstr "DeleteStack enviado; aguardando a conclusão da exclusão ({progress})"
+
+#: src/iac_code/ui/repl.py
+msgid "DeleteStack submitted; waiting for deletion to complete"
+msgstr "DeleteStack enviado; aguardando a conclusão da exclusão"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Deleting ({progress})"
+msgstr "Excluindo ({progress})"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{progress}; deletion required"
+msgstr "{progress}; exclusão necessária"
+
+#: src/iac_code/ui/repl.py
+msgid "stack"
+msgstr "stack"
+
+#: src/iac_code/ui/repl.py
+msgid "resource"
+msgstr "recurso"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Could not read rollback cleanup records. The cleanup prompt was kept; "
+"retry later or inspect manually."
+msgstr ""
+"Não foi possível ler os registros de limpeza de rollback. O prompt de "
+"limpeza foi mantido; tente novamente mais tarde ou inspecione "
+"manualmente."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} additional resources needing attention were not shown."
+msgstr "{count} recursos adicionais que precisam de atenção não foram exibidos."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: all {count} records are completed."
+msgstr ""
+"↺ Retomada da limpeza de rollback: todos os {count} registros foram "
+"concluídos."
+
+#: src/iac_code/ui/repl.py
+msgid "failed"
+msgstr "falhou"
+
+#: src/iac_code/ui/repl.py
+msgid "pending"
+msgstr "pendente"
+
+#: src/iac_code/ui/repl.py
+msgid "in progress"
+msgstr "em andamento"
+
+#: src/iac_code/ui/repl.py
+msgid "completed"
+msgstr "concluído"
+
+#: src/iac_code/ui/repl.py
+msgid "skipped"
+msgstr "ignorado"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} {label}"
+msgstr "{count} {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records, {summary}."
+msgstr "↺ Retomada da limpeza de rollback: {count} registros, {summary}."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records."
+msgstr "↺ Retomada da limpeza de rollback: {count} registros."
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "  [{badge}] {label}"
+msgstr "  [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+msgid "Detected rollback cleanup resources, but cleanup prompt injection failed."
+msgstr ""
+"Recursos de limpeza de rollback foram detectados, mas a injeção do prompt"
+" de limpeza falhou."
 
 #: src/iac_code/ui/repl.py
 #, python-brace-format
@@ -3686,11 +4100,27 @@ msgstr "Ignorando estado salvo do pipeline: {reason}"
 
 #: src/iac_code/ui/repl.py
 msgid ""
-"Pipeline completed. Normal chat is active, but the handoff context could "
-"not be injected or saved."
+"Pipeline state persistence failed. The pipeline is paused; do not "
+"continue until state is durable."
+msgstr ""
+"Falha ao persistir o estado do pipeline. O pipeline está pausado; não "
+"continue até que o estado esteja durável."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline state persistence failed. Normal chat handoff was not marked "
+"durable."
+msgstr ""
+"Falha ao persistir o estado do pipeline. O handoff para chat normal não "
+"foi marcado como durável."
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline completed, but the handoff context could not be injected or "
+"saved."
 msgstr ""
-"O pipeline foi concluído. O chat normal está ativo, mas o contexto de "
-"transferência não pôde ser injetado ou salvo."
+"O pipeline foi concluído, mas o contexto de handoff não pôde ser injetado"
+" ou salvo."
 
 #: src/iac_code/ui/repl.py
 msgid "Judging your input..."
@@ -3868,6 +4298,11 @@ msgstr "  ✓ {name}: concluído\n"
 msgid "  ✘ {name}: Failed"
 msgstr "  ✘ {name}: falhou"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Pipeline warning: {reason}"
+msgstr "Aviso do pipeline: {reason}"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Option {index}"
@@ -3949,6 +4384,17 @@ msgstr "erro desconhecido"
 msgid "Resumed pipeline at step: {step}"
 msgstr "Pipeline retomado na etapa: {step}"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Could not read pipeline state metadata: {reason}"
+msgstr "Não foi possível ler os metadados de estado do pipeline: {reason}"
+
+#: src/iac_code/ui/repl.py
+msgid "Pipeline state metadata is invalid; continuing as normal chat."
+msgstr ""
+"Os metadados de estado do pipeline são inválidos; continuando como chat "
+"normal."
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Found pipeline state in this session (paused at: {step})."
@@ -4496,3 +4942,199 @@ msgstr "Rastreamento de pilha omitido do evento público; veja error_id."
 
 #~ msgid "Project Memory Index"
 #~ msgstr "Índice de memória do projeto"
+
+#~ msgid "检测到 pipeline rollback 后仍需要清理的云资源。请立即清理这些资源，并持续检查直到删除完成。"
+#~ msgstr ""
+#~ "Foram detectados recursos de nuvem que"
+#~ " ainda precisam de limpeza após o "
+#~ "rollback do pipeline. Limpe-os "
+#~ "imediatamente e verifique continuamente até"
+#~ " a exclusão terminar."
+
+#~ msgid "要求："
+#~ msgstr "Requisitos:"
+
+#~ msgid "- 清理范围是严格白名单：只能删除下面“待清理资源”列表中的 id。"
+#~ msgstr ""
+#~ "- O escopo da limpeza é uma "
+#~ "lista branca estrita: somente os ids "
+#~ "na lista \"Recursos a limpar\" abaixo"
+#~ " podem ser excluídos."
+
+#~ msgid "- 不要删除、修改或回滚任何未列入“待清理资源”的 stack 或云资源。"
+#~ msgstr ""
+#~ "- Não exclua, modifique nem faça "
+#~ "rollback de nenhum stack ou recurso "
+#~ "de nuvem que não esteja em "
+#~ "\"Recursos a limpar\"."
+
+#~ msgid "- 不要调用 ListStacks 或按名称搜索其它 stack；待清理资源 id 已完整列出。"
+#~ msgstr ""
+#~ "- Não chame ListStacks nem pesquise "
+#~ "outros stacks por nome; os ids dos"
+#~ " recursos pendentes de limpeza já "
+#~ "estão completamente listados."
+
+#~ msgid "- 每次调用 GetStack/DeleteStack 前，必须核对 StackId 精确等于“待清理资源”列表中的某个 id。"
+#~ msgstr ""
+#~ "- Antes de cada chamada a "
+#~ "GetStack/DeleteStack, verifique se StackId "
+#~ "corresponde exatamente a algum id da "
+#~ "lista de recursos pendentes de limpeza."
+
+#~ msgid "- 如果 StackId 不在“待清理资源”列表中，禁止调用 DeleteStack，即使它是当前 handoff 或刚创建的 stack。"
+#~ msgstr ""
+#~ "- Se StackId não estiver na lista"
+#~ " de recursos pendentes de limpeza, é"
+#~ " proibido chamar DeleteStack, mesmo que "
+#~ "seja o stack do handoff atual ou"
+#~ " recém-criado."
+
+#~ msgid ""
+#~ "- 不要根据 pipeline handoff、deployment.stack_id、current"
+#~ " stack 或 resources_created "
+#~ "额外推断清理对象；这些可能是最终成功交付的资源。"
+#~ msgstr ""
+#~ "- Não deduza objetos extras de "
+#~ "limpeza a partir de pipeline handoff,"
+#~ " deployment.stack_id, current stack ou "
+#~ "resources_created; eles podem ser recursos "
+#~ "entregues com sucesso no final."
+
+#~ msgid "- 即使本轮还有用户追问、继续指令或 pipeline handoff 上下文，也不能扩大清理范围。"
+#~ msgstr ""
+#~ "- Mesmo que haja perguntas do "
+#~ "usuário, instruções para continuar ou "
+#~ "contexto de pipeline handoff nesta "
+#~ "rodada, não amplie o escopo da "
+#~ "limpeza."
+
+#~ msgid "- 恢复或继续清理时仍只处理当前提示列出的资源；不要检查或删除其它资源。"
+#~ msgstr ""
+#~ "- Ao retomar ou continuar a "
+#~ "limpeza, processe apenas os recursos "
+#~ "listados neste aviso; não verifique nem"
+#~ " exclua outros recursos."
+
+#~ msgid ""
+#~ "- 优先使用可用的 ROS stack 工具删除；如果改用 "
+#~ "aliyun_api，请先 DeleteStack，再反复 GetStack 检查状态。"
+#~ msgstr ""
+#~ "- Prefira usar a ferramenta ROS "
+#~ "stack disponível para excluir; se usar"
+#~ " aliyun_api, execute DeleteStack primeiro e"
+#~ " depois verifique o estado repetidamente"
+#~ " com GetStack."
+
+#~ msgid "- 如果资源已经处于删除中，请先 GetStack 检查当前状态，再决定是否需要重新 DeleteStack。"
+#~ msgstr ""
+#~ "- Se o recurso já estiver sendo"
+#~ " excluído, use GetStack primeiro para "
+#~ "verificar o estado atual antes de "
+#~ "decidir se precisa executar DeleteStack "
+#~ "novamente."
+
+#~ msgid "- 只有确认 DELETE_COMPLETE 才算清理完成；DELETE_FAILED 或无法确认时要向用户说明失败原因和下一步。"
+#~ msgstr ""
+#~ "- A limpeza só é concluída após"
+#~ " confirmar DELETE_COMPLETE; em caso de "
+#~ "DELETE_FAILED ou impossibilidade de confirmar,"
+#~ " explique ao usuário a causa da "
+#~ "falha e o próximo passo."
+
+#~ msgid "- 列表内资源全部 DELETE_COMPLETE 后，立刻停止本轮清理；不要继续删除或检查任何其他 stack。"
+#~ msgstr ""
+#~ "- Quando todos os recursos da "
+#~ "lista estiverem em DELETE_COMPLETE, interrompa"
+#~ " imediatamente esta limpeza; não exclua "
+#~ "nem verifique nenhum outro stack."
+
+#~ msgid "- 清理过程中向用户简短同步进度。"
+#~ msgstr "- Informe brevemente o progresso ao usuário durante a limpeza."
+
+#~ msgid "待清理资源："
+#~ msgstr "Recursos a limpar:"
+
+#~ msgid "检测到 {count} 个回滚残留资源，开始清理流程。"
+#~ msgstr ""
+#~ "{count} recursos residuais de rollback "
+#~ "detectados; iniciando o fluxo de "
+#~ "limpeza."
+
+#~ msgid "错误：{error}"
+#~ msgstr "Erro: {error}"
+
+#~ msgid "删除中"
+#~ msgstr "Excluindo"
+
+#~ msgid "完成"
+#~ msgstr "Concluído"
+
+#~ msgid "失败"
+#~ msgstr "Falhou"
+
+#~ msgid "跳过"
+#~ msgstr "Ignorado"
+
+#~ msgid "待处理"
+#~ msgstr "Pendente"
+
+#~ msgid "检查"
+#~ msgstr "Verificar"
+
+#~ msgid "进度"
+#~ msgstr "Progresso"
+
+#~ msgid "DeleteStack 已提交，等待删除完成（{progress}）"
+#~ msgstr "DeleteStack enviado; aguardando a exclusão terminar ({progress})"
+
+#~ msgid "DeleteStack 已提交，等待删除完成"
+#~ msgstr "DeleteStack enviado; aguardando a exclusão terminar"
+
+#~ msgid "已跳过"
+#~ msgstr "Ignorado"
+
+#~ msgid "正在删除（{progress}）"
+#~ msgstr "Excluindo ({progress})"
+
+#~ msgid "{progress}，需要删除"
+#~ msgstr "{progress}, requer exclusão"
+
+#~ msgid "资源栈"
+#~ msgstr "Stack de recursos"
+
+#~ msgid "资源"
+#~ msgstr "Recurso"
+
+#~ msgid "无法读取回滚清理记录，已保留清理提示，请稍后继续或手动检查。"
+#~ msgstr ""
+#~ "Não foi possível ler o registro de"
+#~ " limpeza de rollback; o prompt de "
+#~ "limpeza foi preservado. Continue mais "
+#~ "tarde ou verifique manualmente."
+
+#~ msgid "还有 {count} 个需要关注的资源未显示。"
+#~ msgstr "Há mais {count} recursos que precisam de atenção e não são exibidos."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录均已完成。"
+#~ msgstr ""
+#~ "↺ Recuperação da limpeza de rollback:"
+#~ " todos os {count} registros foram "
+#~ "concluídos."
+
+#~ msgid "进行中"
+#~ msgstr "Em andamento"
+
+#~ msgid "已完成"
+#~ msgstr "Concluído"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+#~ msgstr "↺ Recuperação da limpeza de rollback: {count} registros, {summary}."
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录。"
+#~ msgstr "↺ Recuperação da limpeza de rollback: {count} registros."
+
+#~ msgid "Note: images are not supported in pipeline mode and will be ignored."
+#~ msgstr ""
+#~ "Observação: imagens não são suportadas "
+#~ "no modo pipeline e serão ignoradas."
diff --git a/src/iac_code/i18n/locales/zh/LC_MESSAGES/messages.po b/src/iac_code/i18n/locales/zh/LC_MESSAGES/messages.po
index bce338f6..a9b40763 100644
--- a/src/iac_code/i18n/locales/zh/LC_MESSAGES/messages.po
+++ b/src/iac_code/i18n/locales/zh/LC_MESSAGES/messages.po
@@ -44,6 +44,30 @@ msgstr "不安全的工件文件名"
 msgid "Unknown error"
 msgstr "未知错误"
 
+#: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
+msgid ""
+"Cleanup state unavailable. Inspect the session file and cloud resources "
+"manually."
+msgstr "清理状态不可用。请手动检查会话文件和云资源。"
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup deferred prompt state is unavailable. Please repair it "
+"before continuing."
+msgstr "回滚清理延迟提示状态不可用。请修复后再继续。"
+
+#: src/iac_code/a2a/executor.py
+msgid ""
+"Rollback cleanup state is unavailable. Please repair the cleanup ledger "
+"before continuing."
+msgstr "回滚清理状态不可用。请修复清理记录后再继续。"
+
+#: src/iac_code/a2a/executor.py src/iac_code/ui/repl.py
+msgid ""
+"Rollback cleanup is still in progress. Please continue after cleanup "
+"completes."
+msgstr "回滚清理仍在进行中。请在清理完成后继续。"
+
 #: src/iac_code/a2a/executor.py src/iac_code/a2a/pipeline_executor.py
 msgid "Task is already working."
 msgstr "任务已在运行。"
@@ -53,6 +77,11 @@ msgstr "任务已在运行。"
 msgid "Task canceled."
 msgstr "任务已取消。"
 
+#: src/iac_code/a2a/executor.py
+#, python-brace-format
+msgid "Current model {model} does not support image input."
+msgstr "当前模型 {model} 不支持图片输入。"
+
 #: src/iac_code/a2a/pipeline_executor.py
 msgid "A temporary error occurred. Please retry."
 msgstr "发生临时错误，请重试。"
@@ -61,6 +90,11 @@ msgstr "发生临时错误，请重试。"
 msgid "Authentication required. Configure credentials and retry."
 msgstr "需要身份验证。请配置凭据后重试。"
 
+#: src/iac_code/a2a/pipeline_executor.py
+#, python-brace-format
+msgid "Pipeline already running. Resume task {task_id}."
+msgstr "pipeline 已在运行。请恢复任务 {task_id}。"
+
 #: src/iac_code/a2a/pipeline_recovery.py
 msgid "A2A pipeline state not found"
 msgstr "未找到 A2A pipeline 状态"
@@ -473,6 +507,18 @@ msgstr "AI 驱动的基础设施编排工具"
 msgid "Use iac-code as an A2A client."
 msgstr "将 iac-code 作为 A2A 客户端使用。"
 
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A client dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr "缺少 A2A 客户端依赖。请使用以下命令安装：pip install 'iac-code[a2a]'"
+
+#: src/iac_code/cli/main.py
+msgid ""
+"A2A server dependencies are missing. Install with: pip install 'iac-"
+"code[a2a]'"
+msgstr "缺少 A2A 服务器依赖。请使用以下命令安装：pip install 'iac-code[a2a]'"
+
 #: src/iac_code/cli/main.py
 msgid "Install Git for Windows via the npmmirror mirror (Windows only)."
 msgstr "通过 npmmirror 镜像安装 Git for Windows（仅 Windows）。"
@@ -485,12 +531,6 @@ msgstr "将 iac-code 更新到最新版本。"
 msgid "YAML config file containing A2A client options"
 msgstr "包含 A2A 客户端选项的 YAML 配置文件"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A client dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr "缺少 A2A 客户端依赖。请使用以下命令安装：pip install 'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "LLM model to use"
 msgstr "使用的 LLM 模型"
@@ -612,12 +652,6 @@ msgid ""
 "thinking, tool-trace."
 msgstr "暴露 A2A thinking 信号类型；可重复指定多个。取值：raw-thinking、tool-trace。"
 
-#: src/iac_code/cli/main.py
-msgid ""
-"A2A server dependencies are missing. Install with: pip install 'iac-"
-"code[a2a]'"
-msgstr "缺少 A2A 服务器依赖。请使用以下命令安装：pip install 'iac-code[a2a]'"
-
 #: src/iac_code/cli/main.py
 msgid "Send a prompt to an A2A JSON-RPC endpoint."
 msgstr "向 A2A JSON-RPC 端点发送提示。"
@@ -1512,10 +1546,18 @@ msgstr "系统提示词为空。"
 msgid "No provider messages yet."
 msgstr "暂无提供商消息。"
 
+#: src/iac_code/commands/prompt.py
+msgid "No cleanup prompts in this snapshot."
+msgstr "此快照中没有清理提示词。"
+
 #: src/iac_code/commands/prompt.py
 msgid "No tools are currently registered."
 msgstr "当前未注册任何工具。"
 
+#: src/iac_code/commands/prompt.py
+msgid "Cleanup Prompts"
+msgstr "清理提示词"
+
 #: src/iac_code/commands/prompt.py
 msgid "IAC-CODE Prompt Snapshot"
 msgstr "IAC-CODE Prompt 快照"
@@ -1550,6 +1592,14 @@ msgstr "提供商消息"
 msgid "Tools"
 msgstr "工具"
 
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt"
+msgstr "清理提示词"
+
+#: src/iac_code/commands/prompt.py
+msgid "cleanup prompt · removed"
+msgstr "清理提示词 · 已移除"
+
 #: src/iac_code/commands/prompt.py
 msgid "Instruction Memory"
 msgstr "指令记忆"
@@ -1627,6 +1677,11 @@ msgstr "   消息：{count}"
 msgid "   Recalled memory: {status}"
 msgstr "   已召回记忆：{status}"
 
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "   Cleanup prompts: {count}"
+msgstr "   清理提示词：{count}"
+
 #: src/iac_code/commands/prompt.py
 msgid "3. Tools"
 msgstr "3. 工具"
@@ -1672,6 +1727,15 @@ msgstr "存在"
 msgid "not present"
 msgstr "不存在"
 
+#: src/iac_code/commands/prompt.py
+msgid "Rollback cleanup prompts are also shown separately for quick inspection."
+msgstr "回滚清理提示词也会单独展示，便于快速检查。"
+
+#: src/iac_code/commands/prompt.py
+#, python-brace-format
+msgid "{count} cleanup prompts"
+msgstr "{count} 个清理提示词"
+
 #: src/iac_code/commands/prompt.py
 msgid "Tool definitions available to the main model for this request."
 msgstr "本次请求中主模型可用的工具定义。"
@@ -1703,6 +1767,7 @@ msgid "Input schema"
 msgstr "输入 schema"
 
 #: src/iac_code/commands/prompt.py
+#: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid "tool"
 msgstr "工具"
 
@@ -1985,6 +2050,24 @@ msgstr "读取持久记忆。省略 name 可列出全部，提供 name 可读取
 msgid "Memory name to read. Omit to list all."
 msgstr "要读取的记忆名称。省略则列出全部。"
 
+#: src/iac_code/memory/memory_tools.py
+#, python-brace-format
+msgid ""
+"{base}\n"
+"\n"
+"Available memories:\n"
+"{index}\n"
+"\n"
+"Call read_memory again with one of these names, or omit name to list all "
+"memories."
+msgstr ""
+"{base}\n"
+"\n"
+"可用记忆：\n"
+"{index}\n"
+"\n"
+"请使用其中一个名称再次调用 read_memory，或省略 name 以列出所有记忆。"
+
 #: src/iac_code/memory/memory_tools.py
 #, python-brace-format
 msgid ""
@@ -2081,6 +2164,115 @@ msgstr "ask_user_question 需要 pipeline 事件队列。"
 msgid "User cancelled ask_user_question."
 msgstr "用户取消了 ask_user_question。"
 
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"Cloud resources still need cleanup after pipeline rollback. Clean them up"
+" now and keep checking until deletion completes."
+msgstr "管道回滚后仍有云资源需要清理。请立即清理，并持续检查直到删除完成。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Requirements:"
+msgstr "要求："
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup scope is a strict allowlist: delete only ids in the cleanup "
+"resources list below."
+msgstr "- 清理范围是严格白名单：只删除下面清理资源列表中的 ID。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not delete, modify, or roll back any stack or cloud resource outside"
+" the cleanup resources list."
+msgstr "- 不要删除、修改或回滚清理资源列表之外的任何资源栈或云资源。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not call ListStacks or search for other stacks by name; cleanup "
+"resource ids are fully listed."
+msgstr "- 不要调用 ListStacks，也不要按名称搜索其他资源栈；清理资源 ID 已完整列出。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Before every GetStack/DeleteStack call, verify that StackId exactly "
+"matches an id in the cleanup resources list."
+msgstr "- 每次调用 GetStack/DeleteStack 前，确认 StackId 与清理资源列表中的某个 ID 完全一致。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If StackId is not in the cleanup resources list, do not call "
+"DeleteStack, even if it is the current handoff or newly created stack."
+msgstr "- 如果 StackId 不在清理资源列表中，不要调用 DeleteStack，即使它是当前 handoff 或新创建的资源栈。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not infer extra cleanup targets from pipeline handoff, "
+"deployment.stack_id, current stack, or resources_created; those may be "
+"final delivered resources."
+msgstr ""
+"- 不要从管道 handoff、deployment.stack_id、当前资源栈或 resources_created "
+"推断额外清理目标；它们可能是最终交付资源。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Do not expand cleanup scope for user follow-ups, continue instructions,"
+" or pipeline handoff context."
+msgstr "- 不要因为用户追问、continue 指令或管道 handoff 上下文而扩大清理范围。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- When resuming cleanup, still process only resources listed in this "
+"prompt; do not inspect or delete others."
+msgstr "- 恢复清理时，仍然只处理此提示中列出的资源；不要检查或删除其他资源。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Prefer available ROS stack tools for deletion; if using aliyun_api, "
+"call DeleteStack first, then repeatedly call GetStack to check status."
+msgstr ""
+"- 删除时优先使用可用的 ROS 资源栈工具；如果使用 aliyun_api，请先调用 DeleteStack，然后反复调用 GetStack "
+"检查状态。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- If a resource is already deleting, call GetStack first, then decide "
+"whether DeleteStack is needed again."
+msgstr "- 如果资源已在删除中，请先调用 GetStack，再判断是否需要再次调用 DeleteStack。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- Cleanup is complete only after DELETE_COMPLETE; for DELETE_FAILED or "
+"unknown status, tell the user the failure reason and next step."
+msgstr "- 只有达到 DELETE_COMPLETE 后清理才算完成；如果是 DELETE_FAILED 或未知状态，请告诉用户失败原因和下一步。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid ""
+"- After all listed resources are DELETE_COMPLETE, stop this cleanup turn "
+"immediately."
+msgstr "- 所有列出的资源达到 DELETE_COMPLETE 后，立即停止本轮清理。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "- Briefly update the user during cleanup."
+msgstr "- 清理过程中简要向用户更新进展。"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+msgid "Cleanup resources:"
+msgstr "清理资源："
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid ""
+"{index}. provider={provider}, type={resource_type}, id={resource_id}, "
+"name={name}, region={region}"
+msgstr ""
+"{index}. 提供方={provider}, 类型={resource_type}, ID={resource_id}, 名称={name},"
+" 地域={region}"
+
+#: src/iac_code/pipeline/engine/cleanup.py
+#, python-brace-format
+msgid "Detected {count} rollback cleanup resources; starting cleanup."
+msgstr "检测到 {count} 个回滚清理资源；开始清理。"
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 msgid ""
 "Complete the current step by calling this tool to submit the conclusion. "
@@ -2167,18 +2359,46 @@ msgid ""
 "{fields}."
 msgstr "{message} complete_step.conclusion 必须包含以下字段之一: {fields}。"
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "A successful tool result is required before completing the current step."
+msgstr "完成当前步骤前需要成功的工具结果。"
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
-msgid "Candidate count cannot exceed {limit}; {count} were submitted."
-msgstr "候选方案数量不能超过 {limit} 个，当前提交了 {count} 个。"
+msgid ""
+"{message} complete_step.conclusion.{field} must match the {tool} result "
+"value {value}."
+msgstr "{message} complete_step.conclusion.{field} 必须与 {tool} 结果值 {value} 匹配。"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "<missing>"
+msgstr "<缺失>"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " with status {statuses}"
+msgstr "，状态为 {statuses}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " and is_success={expected}"
+msgstr "，且 is_success={expected}"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid " one of {actions}"
+msgstr "，动作为 {actions} 之一"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid ""
-"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
-"user for help or narrow the rollback targets before calling "
-"complete_step."
-msgstr "可回滚目标数量不能超过 {limit} 个，当前有 {count} 个。请请求用户介入或收窄回滚目标后再调用 complete_step。"
+"{message} Call {tool}{action} first and wait for a successful "
+"result{status_hint}{success_hint}."
+msgstr "{message} 请先调用 {tool}{action}，并等待成功结果{status_hint}{success_hint}。"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+msgid "the required tool"
+msgstr "必需工具"
 
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
@@ -2187,6 +2407,19 @@ msgid ""
 "or ask the user for help."
 msgstr "回滚次数不能超过 {max_rollbacks} 次。请完成当前步骤或请求用户介入。"
 
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid "Candidate count cannot exceed {limit}; {count} were submitted."
+msgstr "候选方案数量不能超过 {limit} 个，当前提交了 {count} 个。"
+
+#: src/iac_code/pipeline/engine/complete_step_tool.py
+#, python-brace-format
+msgid ""
+"Rollback target count cannot exceed {limit}; there are {count}. Ask the "
+"user for help or narrow the rollback targets before calling "
+"complete_step."
+msgstr "可回滚目标数量不能超过 {limit} 个，当前有 {count} 个。请请求用户介入或收窄回滚目标后再调用 complete_step。"
+
 #: src/iac_code/pipeline/engine/complete_step_tool.py
 #, python-brace-format
 msgid "Schema validation failed after {attempts} attempts: {error}"
@@ -2209,6 +2442,10 @@ msgstr "conclusion 校验失败；请修正后重新调用 complete_step: {error
 msgid "Step {step_id} completed. Conclusion submitted."
 msgstr "步骤 {step_id} 已完成。结论已提交。"
 
+#: src/iac_code/pipeline/engine/pipeline_runner.py
+msgid "Pipeline state persistence failed."
+msgstr "Pipeline 状态持久化失败。"
+
 #: src/iac_code/pipeline/engine/pipeline_runner.py
 #: src/iac_code/pipeline/engine/sub_pipeline_executor.py
 #: src/iac_code/ui/repl.py
@@ -2302,6 +2539,10 @@ msgstr "模板文件路径必须是相对于工作目录的路径"
 msgid "Template file path cannot escape the working directory"
 msgstr "模板文件路径不能跳出工作目录"
 
+#: src/iac_code/pipeline/engine/user_input.py
+msgid "[Image input]"
+msgstr "[图片输入]"
+
 #: src/iac_code/pipeline/selling/tools/show_candidate_detail_tool.py
 msgid ""
 "Display candidate details (summary and cost breakdown) in the comparison "
@@ -3149,6 +3390,15 @@ msgstr "ROS 资源栈"
 msgid "CloudStackInstances"
 msgstr "云资源栈实例"
 
+#: src/iac_code/tools/cloud/aliyun/template_source.py
+msgid ""
+"ROS template calls must use TemplateURL instead of TemplateBody. Save the"
+" template to a file and pass params.TemplateURL, for example a local file"
+" path or OSS/HTTP URL."
+msgstr ""
+"ROS 模板调用必须使用 TemplateURL，而不能使用 TemplateBody。请将模板保存到文件，并传入 "
+"params.TemplateURL，例如本地文件路径或 OSS/HTTP URL。"
+
 #: src/iac_code/tools/cloud/aliyun/hooks/ros_validate.py
 #, python-brace-format
 msgid "Template YAML syntax error: {}"
@@ -3257,11 +3507,11 @@ msgstr "已中断"
 msgid "Running"
 msgstr "进行中"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Completed"
 msgstr "已完成"
 
-#: src/iac_code/ui/pipeline_display_replay.py
+#: src/iac_code/ui/pipeline_display_replay.py src/iac_code/ui/repl.py
 msgid "Failed"
 msgstr "失败"
 
@@ -3532,8 +3782,121 @@ msgid "Command has no handler: {name}"
 msgstr "命令没有处理器：{name}"
 
 #: src/iac_code/ui/repl.py
-msgid "Note: images are not supported in pipeline mode and will be ignored."
-msgstr "注意：pipeline 模式不支持图像，将忽略图像。"
+#, python-brace-format
+msgid "↺ Rollback cleanup [{badge}] {label}"
+msgstr "↺ 回滚清理 [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{kind} {resource_id}"
+msgstr "{kind} {resource_id}"
+
+#: src/iac_code/ui/repl.py
+msgid "Deleting"
+msgstr "删除中"
+
+#: src/iac_code/ui/repl.py
+msgid "Skipped"
+msgstr "已跳过"
+
+#: src/iac_code/ui/repl.py
+msgid "Pending"
+msgstr "待处理"
+
+#: src/iac_code/ui/repl.py
+msgid "Checking"
+msgstr "检查中"
+
+#: src/iac_code/ui/repl.py
+msgid "Progress"
+msgstr "进度"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "DeleteStack submitted; waiting for deletion to complete ({progress})"
+msgstr "DeleteStack 已提交；等待删除完成（{progress}）"
+
+#: src/iac_code/ui/repl.py
+msgid "DeleteStack submitted; waiting for deletion to complete"
+msgstr "DeleteStack 已提交；等待删除完成"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Deleting ({progress})"
+msgstr "删除中（{progress}）"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{progress}; deletion required"
+msgstr "{progress}；需要删除"
+
+#: src/iac_code/ui/repl.py
+msgid "stack"
+msgstr "资源栈"
+
+#: src/iac_code/ui/repl.py
+msgid "resource"
+msgstr "资源"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Could not read rollback cleanup records. The cleanup prompt was kept; "
+"retry later or inspect manually."
+msgstr "无法读取回滚清理记录。清理提示词已保留；请稍后重试或手动检查。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} additional resources needing attention were not shown."
+msgstr "还有 {count} 个需要注意的资源未显示。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: all {count} records are completed."
+msgstr "↺ 回滚清理恢复：所有 {count} 条记录都已完成。"
+
+#: src/iac_code/ui/repl.py
+msgid "failed"
+msgstr "已失败"
+
+#: src/iac_code/ui/repl.py
+msgid "pending"
+msgstr "待处理"
+
+#: src/iac_code/ui/repl.py
+msgid "in progress"
+msgstr "进行中"
+
+#: src/iac_code/ui/repl.py
+msgid "completed"
+msgstr "已完成"
+
+#: src/iac_code/ui/repl.py
+msgid "skipped"
+msgstr "已跳过"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "{count} {label}"
+msgstr "{count} 个{label}"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records, {summary}."
+msgstr "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "↺ Rollback cleanup resume: {count} records."
+msgstr "↺ 回滚清理恢复：{count} 条记录。"
+
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "  [{badge}] {label}"
+msgstr "  [{badge}] {label}"
+
+#: src/iac_code/ui/repl.py
+msgid "Detected rollback cleanup resources, but cleanup prompt injection failed."
+msgstr "检测到回滚清理资源，但清理提示词注入失败。"
 
 #: src/iac_code/ui/repl.py
 #, python-brace-format
@@ -3542,9 +3905,21 @@ msgstr "正在忽略已保存的 pipeline 状态：{reason}"
 
 #: src/iac_code/ui/repl.py
 msgid ""
-"Pipeline completed. Normal chat is active, but the handoff context could "
-"not be injected or saved."
-msgstr "Pipeline 已完成。普通聊天已启用，但交接上下文无法注入或保存。"
+"Pipeline state persistence failed. The pipeline is paused; do not "
+"continue until state is durable."
+msgstr "Pipeline 状态持久化失败。Pipeline 已暂停；在状态可靠持久化之前不要继续。"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline state persistence failed. Normal chat handoff was not marked "
+"durable."
+msgstr "Pipeline 状态持久化失败。普通聊天 handoff 未标记为已持久化。"
+
+#: src/iac_code/ui/repl.py
+msgid ""
+"Pipeline completed, but the handoff context could not be injected or "
+"saved."
+msgstr "Pipeline 已完成，但无法注入或保存 handoff 上下文。"
 
 #: src/iac_code/ui/repl.py
 msgid "Judging your input..."
@@ -3708,6 +4083,11 @@ msgstr "  ✓ {name}: 已完成\n"
 msgid "  ✘ {name}: Failed"
 msgstr "  ✘ {name}: 失败"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Pipeline warning: {reason}"
+msgstr "Pipeline 警告：{reason}"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Option {index}"
@@ -3787,6 +4167,15 @@ msgstr "未知错误"
 msgid "Resumed pipeline at step: {step}"
 msgstr "已恢复 pipeline 到步骤：{step}"
 
+#: src/iac_code/ui/repl.py
+#, python-brace-format
+msgid "Could not read pipeline state metadata: {reason}"
+msgstr "无法读取 pipeline 状态元数据：{reason}"
+
+#: src/iac_code/ui/repl.py
+msgid "Pipeline state metadata is invalid; continuing as normal chat."
+msgstr "Pipeline 状态元数据无效；继续按普通聊天处理。"
+
 #: src/iac_code/ui/repl.py
 #, python-brace-format
 msgid "Found pipeline state in this session (paused at: {step})."
@@ -4325,3 +4714,133 @@ msgstr "公开事件中已省略堆栈跟踪；请查看 error_id。"
 
 #~ msgid "Project Memory Index"
 #~ msgstr "项目记忆索引"
+
+#~ msgid "检测到 pipeline rollback 后仍需要清理的云资源。请立即清理这些资源，并持续检查直到删除完成。"
+#~ msgstr "检测到 pipeline rollback 后仍需要清理的云资源。请立即清理这些资源，并持续检查直到删除完成。"
+
+#~ msgid "要求："
+#~ msgstr "要求："
+
+#~ msgid "- 清理范围是严格白名单：只能删除下面“待清理资源”列表中的 id。"
+#~ msgstr "- 清理范围是严格白名单：只能删除下面“待清理资源”列表中的 id。"
+
+#~ msgid "- 不要删除、修改或回滚任何未列入“待清理资源”的 stack 或云资源。"
+#~ msgstr "- 不要删除、修改或回滚任何未列入“待清理资源”的 stack 或云资源。"
+
+#~ msgid "- 不要调用 ListStacks 或按名称搜索其它 stack；待清理资源 id 已完整列出。"
+#~ msgstr "- 不要调用 ListStacks 或按名称搜索其它 stack；待清理资源 id 已完整列出。"
+
+#~ msgid "- 每次调用 GetStack/DeleteStack 前，必须核对 StackId 精确等于“待清理资源”列表中的某个 id。"
+#~ msgstr "- 每次调用 GetStack/DeleteStack 前，必须核对 StackId 精确等于“待清理资源”列表中的某个 id。"
+
+#~ msgid "- 如果 StackId 不在“待清理资源”列表中，禁止调用 DeleteStack，即使它是当前 handoff 或刚创建的 stack。"
+#~ msgstr "- 如果 StackId 不在“待清理资源”列表中，禁止调用 DeleteStack，即使它是当前 handoff 或刚创建的 stack。"
+
+#~ msgid ""
+#~ "- 不要根据 pipeline handoff、deployment.stack_id、current"
+#~ " stack 或 resources_created "
+#~ "额外推断清理对象；这些可能是最终成功交付的资源。"
+#~ msgstr ""
+#~ "- 不要根据 pipeline handoff、deployment.stack_id、current"
+#~ " stack 或 resources_created "
+#~ "额外推断清理对象；这些可能是最终成功交付的资源。"
+
+#~ msgid "- 即使本轮还有用户追问、继续指令或 pipeline handoff 上下文，也不能扩大清理范围。"
+#~ msgstr "- 即使本轮还有用户追问、继续指令或 pipeline handoff 上下文，也不能扩大清理范围。"
+
+#~ msgid "- 恢复或继续清理时仍只处理当前提示列出的资源；不要检查或删除其它资源。"
+#~ msgstr "- 恢复或继续清理时仍只处理当前提示列出的资源；不要检查或删除其它资源。"
+
+#~ msgid ""
+#~ "- 优先使用可用的 ROS stack 工具删除；如果改用 "
+#~ "aliyun_api，请先 DeleteStack，再反复 GetStack 检查状态。"
+#~ msgstr ""
+#~ "- 优先使用可用的 ROS stack 工具删除；如果改用 "
+#~ "aliyun_api，请先 DeleteStack，再反复 GetStack 检查状态。"
+
+#~ msgid "- 如果资源已经处于删除中，请先 GetStack 检查当前状态，再决定是否需要重新 DeleteStack。"
+#~ msgstr "- 如果资源已经处于删除中，请先 GetStack 检查当前状态，再决定是否需要重新 DeleteStack。"
+
+#~ msgid "- 只有确认 DELETE_COMPLETE 才算清理完成；DELETE_FAILED 或无法确认时要向用户说明失败原因和下一步。"
+#~ msgstr "- 只有确认 DELETE_COMPLETE 才算清理完成；DELETE_FAILED 或无法确认时要向用户说明失败原因和下一步。"
+
+#~ msgid "- 列表内资源全部 DELETE_COMPLETE 后，立刻停止本轮清理；不要继续删除或检查任何其他 stack。"
+#~ msgstr "- 列表内资源全部 DELETE_COMPLETE 后，立刻停止本轮清理；不要继续删除或检查任何其他 stack。"
+
+#~ msgid "- 清理过程中向用户简短同步进度。"
+#~ msgstr "- 清理过程中向用户简短同步进度。"
+
+#~ msgid "待清理资源："
+#~ msgstr "待清理资源："
+
+#~ msgid "检测到 {count} 个回滚残留资源，开始清理流程。"
+#~ msgstr "检测到 {count} 个回滚残留资源，开始清理流程。"
+
+#~ msgid "错误：{error}"
+#~ msgstr "错误：{error}"
+
+#~ msgid "删除中"
+#~ msgstr "删除中"
+
+#~ msgid "完成"
+#~ msgstr "完成"
+
+#~ msgid "失败"
+#~ msgstr "失败"
+
+#~ msgid "跳过"
+#~ msgstr "跳过"
+
+#~ msgid "待处理"
+#~ msgstr "待处理"
+
+#~ msgid "检查"
+#~ msgstr "检查"
+
+#~ msgid "进度"
+#~ msgstr "进度"
+
+#~ msgid "DeleteStack 已提交，等待删除完成（{progress}）"
+#~ msgstr "DeleteStack 已提交，等待删除完成（{progress}）"
+
+#~ msgid "DeleteStack 已提交，等待删除完成"
+#~ msgstr "DeleteStack 已提交，等待删除完成"
+
+#~ msgid "已跳过"
+#~ msgstr "已跳过"
+
+#~ msgid "正在删除（{progress}）"
+#~ msgstr "正在删除（{progress}）"
+
+#~ msgid "{progress}，需要删除"
+#~ msgstr "{progress}，需要删除"
+
+#~ msgid "资源栈"
+#~ msgstr "资源栈"
+
+#~ msgid "资源"
+#~ msgstr "资源"
+
+#~ msgid "无法读取回滚清理记录，已保留清理提示，请稍后继续或手动检查。"
+#~ msgstr "无法读取回滚清理记录，已保留清理提示，请稍后继续或手动检查。"
+
+#~ msgid "还有 {count} 个需要关注的资源未显示。"
+#~ msgstr "还有 {count} 个需要关注的资源未显示。"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录均已完成。"
+#~ msgstr "↺ 回滚清理恢复：{count} 条记录均已完成。"
+
+#~ msgid "进行中"
+#~ msgstr "进行中"
+
+#~ msgid "已完成"
+#~ msgstr "已完成"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+#~ msgstr "↺ 回滚清理恢复：{count} 条记录，{summary}。"
+
+#~ msgid "↺ 回滚清理恢复：{count} 条记录。"
+#~ msgstr "↺ 回滚清理恢复：{count} 条记录。"
+
+#~ msgid "Note: images are not supported in pipeline mode and will be ignored."
+#~ msgstr "注意：pipeline 模式不支持图像，将忽略图像。"
diff --git a/src/iac_code/memory/memory_tools.py b/src/iac_code/memory/memory_tools.py
index c634fda1..c6b87f82 100644
--- a/src/iac_code/memory/memory_tools.py
+++ b/src/iac_code/memory/memory_tools.py
@@ -40,7 +40,17 @@ async def execute(self, *, tool_input: dict[str, Any], context: ToolContext) ->
         if name:
             mem = self._manager.load(name)
             if mem is None:
-                return ToolResult.error(_("Memory '{name}' not found.").format(name=name))
+                base = _("Memory '{name}' not found.").format(name=name)
+                index = self._manager.get_index_content()
+                if index:
+                    return ToolResult.error(
+                        _(
+                            "{base}\n\n"
+                            "Available memories:\n{index}\n\n"
+                            "Call read_memory again with one of these names, or omit name to list all memories."
+                        ).format(base=base, index=index.rstrip())
+                    )
+                return ToolResult.error("{base}\n\n{empty}".format(base=base, empty=_("No memories saved yet.")))
             return ToolResult.success(f"[{mem.get('type', '')}] {mem.get('description', '')}\n\n{mem['content']}")
         else:
             index = self._manager.get_index_content()
diff --git a/src/iac_code/pipeline/__init__.py b/src/iac_code/pipeline/__init__.py
index 024628eb..e34a3533 100644
--- a/src/iac_code/pipeline/__init__.py
+++ b/src/iac_code/pipeline/__init__.py
@@ -33,6 +33,7 @@ def create_pipeline(
     memory_content_getter: Callable[[], str] | None = None,
     auto_trigger_skills: list[Any] | None = None,
     resume_from_sidecar: bool = False,
+    surface: str = "repl",
 ) -> PipelineRunner:
     """Factory: create a pipeline runner by name.
 
@@ -60,6 +61,7 @@ def create_pipeline(
         memory_content_getter=memory_content_getter,
         auto_trigger_skills=auto_trigger_skills,
         resume_from_sidecar=resume_from_sidecar,
+        surface=surface,
     )
 
 
diff --git a/src/iac_code/pipeline/constants.py b/src/iac_code/pipeline/constants.py
new file mode 100644
index 00000000..bc704b14
--- /dev/null
+++ b/src/iac_code/pipeline/constants.py
@@ -0,0 +1,8 @@
+"""Low-dependency pipeline constants."""
+
+CLEANUP_PROMPT_METADATA_TYPE = "pipeline_cleanup_prompt"
+
+PIPELINE_EVENT_CLEANUP_STARTED = "cleanup_started"
+PIPELINE_EVENT_CLEANUP_PROGRESS = "cleanup_progress"
+PIPELINE_EVENT_CLEANUP_COMPLETED = "cleanup_completed"
+PIPELINE_EVENT_CLEANUP_FAILED = "cleanup_failed"
diff --git a/src/iac_code/pipeline/engine/__init__.py b/src/iac_code/pipeline/engine/__init__.py
index 1325b1df..b95db431 100644
--- a/src/iac_code/pipeline/engine/__init__.py
+++ b/src/iac_code/pipeline/engine/__init__.py
@@ -1,19 +1,34 @@
 """Generic pipeline engine — state machine, context, step execution."""
 
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Any
+
 from iac_code.pipeline.engine.complete_step_tool import CompleteStepTool
 from iac_code.pipeline.engine.context import PipelineContext, VersionedField
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
 from iac_code.pipeline.engine.interrupt import InterruptController, InterruptVerdict
 from iac_code.pipeline.engine.loader import load_pipeline_dir
-from iac_code.pipeline.engine.pipeline_runner import PipelineRunner
 from iac_code.pipeline.engine.session import PipelineSession
 from iac_code.pipeline.engine.state_machine import StateMachine
 from iac_code.pipeline.engine.step_executor import StepExecutor
 from iac_code.pipeline.engine.step_spec import A2AArtifactSpec, LoadedPipeline, StepSpec, SubPipelineSpec, render_prompt
 from iac_code.pipeline.engine.sub_pipeline_executor import SubPipelineExecutor, SubPipelineResult
-from iac_code.pipeline.engine.types import RollbackRule, StepConfig, StepResult, StepStatus
+from iac_code.pipeline.engine.types import StepConfig, StepResult, StepStatus
 from iac_code.pipeline.engine.ui_contract import PipelineStepType, PipelineUiMode
 
+if TYPE_CHECKING:
+    from iac_code.pipeline.engine.pipeline_runner import PipelineRunner
+
+
+def __getattr__(name: str) -> Any:
+    """Import and return ``PipelineRunner`` when that name is looked up; reject any other name."""
+    if name != "PipelineRunner":
+        raise AttributeError(f"module {__name__!r} has no attribute {name!r}")
+    from iac_code.pipeline.engine.pipeline_runner import PipelineRunner
+    return PipelineRunner
+
+
 __all__ = [
     "CompleteStepTool",
     "A2AArtifactSpec",
@@ -27,7 +42,6 @@
     "PipelineSession",
     "PipelineStepType",
     "PipelineUiMode",
-    "RollbackRule",
     "StateMachine",
     "StepConfig",
     "StepExecutor",
diff --git a/src/iac_code/pipeline/engine/cleanup.py b/src/iac_code/pipeline/engine/cleanup.py
new file mode 100644
index 00000000..3e19a637
--- /dev/null
+++ b/src/iac_code/pipeline/engine/cleanup.py
@@ -0,0 +1,1054 @@
+"""Cleanup ledger and observer for pipeline rollback leftovers."""
+
+from __future__ import annotations
+
+import json
+import logging
+import time
+from dataclasses import asdict, dataclass, field, replace
+from pathlib import Path
+from typing import Any, Literal, cast
+
+import yaml
+
+from iac_code.agent.message import Message
+from iac_code.i18n import _
+from iac_code.pipeline.constants import (
+    CLEANUP_PROMPT_METADATA_TYPE,
+    PIPELINE_EVENT_CLEANUP_COMPLETED,
+    PIPELINE_EVENT_CLEANUP_FAILED,
+    PIPELINE_EVENT_CLEANUP_PROGRESS,
+    PIPELINE_EVENT_CLEANUP_STARTED,
+)
+from iac_code.types.stream_events import StackProgressEvent, ToolResultEvent, ToolUseEndEvent
+from iac_code.utils.path_locks import PathLockRegistry
+from iac_code.utils.public_errors import sanitize_public_text
+from iac_code.utils.state_io import atomic_write_text
+
+logger = logging.getLogger(__name__)
+
+CleanupStatus = Literal["pending", "started", "in_progress", "completed", "failed", "skipped"]
+_LOAD_FAILED_KEY = "_load_failed"
+_LOAD_ERROR_KEY = "_load_error"
+_RETRYABLE_CLEANUP_STATUSES = {"pending", "failed"}
+_ACTIVE_CLEANUP_STATUSES = {"started", "in_progress"}
+_FOLLOWUP_CLEANUP_STATUSES = _RETRYABLE_CLEANUP_STATUSES | _ACTIVE_CLEANUP_STATUSES
+_TERMINAL_CLEANUP_STATUSES = {"completed", "skipped"}
+_DELETE_COMPLETE_STATUSES = {"DELETE_COMPLETE"}
+_DELETE_FAILED_STATUSES = {"DELETE_FAILED"}
+_LEDGER_LOCKS = PathLockRegistry()
+
+
+@dataclass(frozen=True)
+class ObservedResource:
+    """Cloud resource observed during a side-effecting pipeline step."""
+
+    provider: str  # part of `key`
+    resource_type: str  # part of `key`
+    resource_id: str  # part of `key`; CleanupLedger.record_observed skips records where this is empty
+    resource_name: str = ""
+    region_id: str = ""  # part of `key`
+    source_step_id: str = ""
+    source_attempt_id: str | None = None
+    observed_action: str = ""
+    observed_at: float = 0.0  # NOTE(review): presumably epoch seconds (time.time()) — confirm at the writer
+    metadata: dict[str, Any] = field(default_factory=dict)  # fresh dict per instance
+
+    @property
+    def key(self) -> str:  # identity string built from provider, type, id and region
+        return _resource_key(self.provider, self.resource_type, self.resource_id, self.region_id)
+
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> "ObservedResource":  # rebuild a record from a plain mapping
+        return cls(
+            provider=str(data.get("provider") or ""),  # missing or falsy text values collapse to ""
+            resource_type=str(data.get("resource_type") or ""),
+            resource_id=str(data.get("resource_id") or ""),
+            resource_name=str(data.get("resource_name") or ""),
+            region_id=str(data.get("region_id") or ""),
+            source_step_id=str(data.get("source_step_id") or ""),
+            source_attempt_id=_optional_str(data.get("source_attempt_id")),
+            observed_action=str(data.get("observed_action") or ""),
+            observed_at=_float_value(data.get("observed_at")),
+            metadata=dict(data.get("metadata") or {}),  # copy, so the record does not alias the input dict
+        )
+
+
+@dataclass(frozen=True)
+class CleanupResource:
+    """Resource that may need cleanup after rollback or handoff."""
+
+    provider: str  # part of `key`
+    resource_type: str  # part of `key`
+    resource_id: str  # part of `key`; mark_cleanup_required skips entries where this is empty
+    resource_name: str = ""
+    region_id: str = ""  # part of `key`
+    source_step_id: str = ""
+    source_attempt_id: str | None = None
+    cleanup_reason: str = ""
+    cleanup_required: bool = True  # pending_resources/active_resources only return entries with this set
+    cleanup_status: CleanupStatus = "pending"  # from_dict resets unrecognised values to "pending"
+    cleanup_tool_use_id: str | None = None
+    cleanup_action: str | None = None
+    progress_status: str | None = None
+    progress_percentage: float | None = None
+    last_error: str | None = None
+    observed_at: float = 0.0  # copied from the ObservedResource in from_observed
+    updated_at: float = 0.0  # from_observed stamps this with time.time()
+    metadata: dict[str, Any] = field(default_factory=dict)  # fresh dict per instance
+
+    @property
+    def key(self) -> str:  # identity string built from provider, type, id and region
+        return _resource_key(self.provider, self.resource_type, self.resource_id, self.region_id)
+
+    @classmethod
+    def from_observed(cls, resource: ObservedResource, *, reason: str) -> "CleanupResource":
+        now = time.time()  # becomes updated_at; cleanup_status/cleanup_required keep their defaults
+        return cls(
+            provider=resource.provider,
+            resource_type=resource.resource_type,
+            resource_id=resource.resource_id,
+            resource_name=resource.resource_name,
+            region_id=resource.region_id,
+            source_step_id=resource.source_step_id,
+            source_attempt_id=resource.source_attempt_id,
+            cleanup_reason=reason,
+            observed_at=resource.observed_at,
+            updated_at=now,
+            metadata=dict(resource.metadata),  # shallow copy so the two records do not share one dict
+        )
+
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> "CleanupResource":  # rebuild an entry from a plain mapping
+        status = str(data.get("cleanup_status") or "pending")
+        if status not in {"pending", "started", "in_progress", "completed", "failed", "skipped"}:
+            status = "pending"  # unrecognised value: fall back to the default status
+        return cls(
+            provider=str(data.get("provider") or ""),  # missing or falsy text values collapse to ""
+            resource_type=str(data.get("resource_type") or ""),
+            resource_id=str(data.get("resource_id") or ""),
+            resource_name=str(data.get("resource_name") or ""),
+            region_id=str(data.get("region_id") or ""),
+            source_step_id=str(data.get("source_step_id") or ""),
+            source_attempt_id=_optional_str(data.get("source_attempt_id")),
+            cleanup_reason=str(data.get("cleanup_reason") or ""),
+            cleanup_required=bool(data.get("cleanup_required", True)),  # an absent key means cleanup is required
+            cleanup_status=cast(CleanupStatus, status),  # cast is for the type checker; status was validated above
+            cleanup_tool_use_id=_optional_str(data.get("cleanup_tool_use_id")),
+            cleanup_action=_optional_str(data.get("cleanup_action")),
+            progress_status=_optional_str(data.get("progress_status")),
+            progress_percentage=_optional_float(data.get("progress_percentage")),
+            last_error=_optional_str(data.get("last_error")),
+            observed_at=_float_value(data.get("observed_at")),
+            updated_at=_float_value(data.get("updated_at")),
+            metadata=dict(data.get("metadata") or {}),  # copy, so the entry does not alias the input dict
+        )
+
+
+@dataclass(frozen=True)
+class CleanupPrompt:
+    """Hidden user message content that constrains cleanup to ledger resources."""
+
+    resources: list[CleanupResource]  # ledger entries this prompt is about
+    prompt: str  # NOTE(review): presumably the full prompt text given to the model — confirm at the builder
+    status_message: str  # NOTE(review): presumably a short user-facing status line — confirm at the builder
+
+
+@dataclass(frozen=True)
+class CleanupLedgerWriteStatus:
+    """Result of a cleanup ledger write attempt."""
+
+    written: bool  # True only on the status returned after the ledger was saved
+    unavailable: bool = False  # set when the ledger could not be loaded for writing
+    reason: str | None = None  # short cause code; "load_failed" is the value produced by the write methods here
+    load_error: str | None = None  # text from CleanupLedger.load_error() when the load failed
+
+
+_WRITE_SKIPPED = CleanupLedgerWriteStatus(written=False)
+_WRITE_OK = CleanupLedgerWriteStatus(written=True)
+
+
+class CleanupLedger:
+    """Durable cleanup state for rollback leftovers.
+
+    The ledger is fail-closed for writes: corrupt or unreadable files are never
+    replaced with empty state. Key write methods return
+    `CleanupLedgerWriteStatus` so callers can surface unavailable cleanup
+    tracking without broadening cleanup scope.
+    """
+
+    def __init__(self, path: str | Path) -> None:
+        self.path = Path(path)  # accept str or Path, always store a Path
+
+    def observed_resources(self) -> list[ObservedResource]:
+        """Return the ledger's ``observed_resources`` entries parsed into ``ObservedResource``."""
+        return list(map(ObservedResource.from_dict, _dict_list(self._load().get("observed_resources"))))
+
+    def cleanup_resources(self) -> list[CleanupResource]:
+        """Return the ledger's ``cleanup_resources`` entries parsed into ``CleanupResource``."""
+        return list(map(CleanupResource.from_dict, _dict_list(self._load().get("cleanup_resources"))))
+
+    def history_entries(self) -> list[dict[str, Any]]:
+        """Return a copy of each entry stored under the ledger's ``history`` key."""
+        return [dict(entry) for entry in _dict_list(self._load().get("history"))]
+
+    def pending_resources(self, *, include_failed: bool = True, include_active: bool = True) -> list[CleanupResource]:
+        """Return cleanup-required resources that still need follow-up.
+
+        "pending" always qualifies; "failed" and the active statuses ("started",
+        "in_progress") are included only when the matching flag is set.
+        """
+        wanted = {"pending"}
+        if include_failed:
+            wanted |= _RETRYABLE_CLEANUP_STATUSES
+        if include_active:
+            wanted |= _ACTIVE_CLEANUP_STATUSES
+        return [item for item in self.cleanup_resources() if item.cleanup_required and item.cleanup_status in wanted]
+
+    def load_failed(self) -> bool:  # True when the loaded data carries a truthy "_load_failed" marker
+        return bool(self._load().get(_LOAD_FAILED_KEY))
+
+    def load_error(self) -> str | None:
+        detail = self._load().get(_LOAD_ERROR_KEY)  # anything but a non-empty str counts as "no error"
+        return detail if (isinstance(detail, str) and detail != "") else None
+
+    def active_resources(self) -> list[CleanupResource]:
+        """Return cleanup-required resources whose status is "started" or "in_progress"."""
+        def is_active(entry: CleanupResource) -> bool:
+            return entry.cleanup_required and entry.cleanup_status in _ACTIVE_CLEANUP_STATUSES
+
+        return list(filter(is_active, self.cleanup_resources()))
+
+    def record_observed(self, resource: ObservedResource) -> CleanupLedgerWriteStatus:
+        """Store ``resource`` in the ledger, replacing any entry that shares its key.
+
+        An empty ``resource_id`` is skipped; a ledger that cannot be loaded for
+        writing yields an "unavailable" status and nothing is saved.
+        """
+        if not resource.resource_id:
+            return _WRITE_SKIPPED
+        with self._write_lock():
+            ledger = self._load_for_write()
+            if ledger is None:
+                return CleanupLedgerWriteStatus(
+                    written=False, unavailable=True, reason="load_failed", load_error=self.load_error()
+                )
+            by_key: dict[str, ObservedResource] = {}
+            for raw in _dict_list(ledger.get("observed_resources")):
+                parsed = ObservedResource.from_dict(raw)
+                by_key[parsed.key] = parsed
+            by_key[resource.key] = resource
+            ledger["observed_resources"] = [asdict(entry) for entry in by_key.values()]
+            self._save(ledger)
+            return _WRITE_OK
+
+    def mark_cleanup_required(
+        self,
+        resources: list[CleanupResource],
+        *,
+        source_step_id: str,
+        reason: str,
+    ) -> CleanupLedgerWriteStatus:
+        """Merge resources into the ledger as cleanup-required and log one history entry.
+
+        Resources without a ``resource_id`` are ignored. The write is skipped when the
+        input is empty or when merging changes nothing. If the ledger cannot be loaded
+        for writing, nothing is saved and an ``unavailable`` status is returned.
+        """
+
+        if not resources:
+            return _WRITE_SKIPPED
+        with self._write_lock():
+            ledger = self._load_for_write()
+            if ledger is None:
+                return CleanupLedgerWriteStatus(
+                    written=False,
+                    unavailable=True,
+                    reason="load_failed",
+                    load_error=self.load_error(),
+                )
+            tracked: dict[Any, CleanupResource] = {}
+            for raw_entry in _dict_list(ledger.get("cleanup_resources")):
+                parsed = CleanupResource.from_dict(raw_entry)
+                tracked[parsed.key] = parsed
+            timestamp = time.time()
+            changed_count = 0
+            for incoming in resources:
+                if not incoming.resource_id:
+                    continue
+                previous = tracked.get(incoming.key)
+                merged = _merge_cleanup_required(
+                    previous,
+                    incoming,
+                    source_step_id=source_step_id,
+                    reason=reason,
+                    now=timestamp,
+                )
+                unchanged = previous == merged
+                if unchanged:
+                    continue
+                tracked[incoming.key] = merged
+                changed_count += 1
+            if changed_count == 0:
+                return _WRITE_SKIPPED
+            ledger["cleanup_resources"] = [asdict(entry) for entry in tracked.values()]
+            history_entry = {
+                "type": "cleanup_required",
+                "source_step_id": source_step_id,
+                "reason": reason,
+                "resource_count": changed_count,
+                "timestamp": timestamp,
+            }
+            self._append_history(ledger, history_entry)
+            self._save(ledger)
+            return _WRITE_OK
+
+    def update_resource(
+        self,
+        *,
+        provider: str,
+        resource_type: str,
+        resource_id: str,
+        region_id: str | None = None,
+        cleanup_status: CleanupStatus | None = None,
+        cleanup_tool_use_id: str | None = None,
+        cleanup_action: str | None = None,
+        progress_status: str | None = None,
+        progress_percentage: float | None = None,
+        last_error: str | None = None,
+        clear_last_error: bool = False,
+    ) -> bool:
+        """Apply lifecycle field updates to every cleanup resource matching the given identity.
+
+        Matching is delegated to ``_matches_resource``. A resource whose status is in
+        ``_TERMINAL_CLEANUP_STATUSES`` is left untouched unless ``cleanup_status`` equals
+        its current status. Arguments left as ``None`` are not written. ``last_error`` is
+        passed through ``_safe_history_error`` and takes precedence over
+        ``clear_last_error``.
+
+        Returns:
+            ``True`` when at least one resource was updated and the ledger was saved;
+            ``False`` when nothing was updated or the ledger could not be loaded for writing.
+        """
+        with self._write_lock():
+            data = self._load_for_write()
+            if data is None:
+                return False
+            changed = False
+            history_entries: list[dict[str, Any]] = []
+            updated_items: list[CleanupResource] = []
+            for item in _dict_list(data.get("cleanup_resources")):
+                resource = CleanupResource.from_dict(item)
+                if not _matches_resource(resource, provider, resource_type, resource_id, region_id):
+                    updated_items.append(resource)
+                    continue
+                # Terminal resources only accept updates that keep the same status.
+                if resource.cleanup_status in _TERMINAL_CLEANUP_STATUSES and cleanup_status != resource.cleanup_status:
+                    updated_items.append(resource)
+                    continue
+                updates: dict[str, Any] = {"updated_at": time.time()}
+                if cleanup_status is not None:
+                    updates["cleanup_status"] = cleanup_status
+                if cleanup_tool_use_id is not None:
+                    updates["cleanup_tool_use_id"] = cleanup_tool_use_id
+                if cleanup_action is not None:
+                    updates["cleanup_action"] = cleanup_action
+                if progress_status is not None:
+                    updates["progress_status"] = progress_status
+                if progress_percentage is not None:
+                    updates["progress_percentage"] = progress_percentage
+                if last_error is not None:
+                    updates["last_error"] = _safe_history_error(last_error)
+                elif clear_last_error:
+                    updates["last_error"] = None
+                updated = replace(resource, **updates)
+                updated_items.append(updated)
+                # A match always counts as a change because ``updated_at`` is refreshed.
+                changed = True
+                # History is appended only when the lifecycle tuple actually differs.
+                if _cleanup_lifecycle_state(updated) != _cleanup_lifecycle_state(resource):
+                    history_entries.append(_cleanup_lifecycle_history_entry(updated))
+            if changed:
+                data["cleanup_resources"] = [asdict(item) for item in updated_items]
+                for entry in history_entries:
+                    self._append_history(data, entry)
+                self._save(data)
+            return changed
+
+    def record_prompt_queued(self, prompt: CleanupPrompt, *, ui_surface: str) -> None:
+        """Append a ``cleanup_prompt_queued`` history entry describing the prompt's resources.
+
+        Nothing is written when the ledger cannot be loaded for writing.
+        """
+        with self._write_lock():
+            ledger = self._load_for_write()
+            if ledger is None:
+                return
+            queued = list(prompt.resources or [])
+            history_entry = {
+                "type": "cleanup_prompt_queued",
+                "ui_surface": ui_surface,
+                "resource_count": len(queued),
+                "resources": [_cleanup_resource_history_data(item) for item in queued],
+                "timestamp": time.time(),
+            }
+            self._append_history(ledger, history_entry)
+            self._save(ledger)
+
+    def record_tool_use_mapping(
+        self,
+        *,
+        tool_use_id: str,
+        provider: str,
+        resource_type: str,
+        resource_id: str,
+        region_id: str,
+        action: str,
+        tool_name: str,
+        tool_input: dict[str, Any],
+    ) -> None:
+        """Persist the association between a tool call id and the resource it targets.
+
+        An existing mapping with the same ``tool_use_id`` is replaced. The tool input is
+        stored only as a sanitized JSON summary. Nothing is written when either id is
+        empty or the ledger cannot be loaded for writing.
+        """
+        if not tool_use_id or not resource_id:
+            return
+        with self._write_lock():
+            ledger = self._load_for_write()
+            if ledger is None:
+                return
+            by_id: dict[str, dict[str, Any]] = {}
+            for raw_entry in _dict_list(ledger.get("tool_uses")):
+                if raw_entry.get("tool_use_id"):
+                    by_id[str(raw_entry.get("tool_use_id"))] = dict(raw_entry)
+            summary_json = json.dumps(
+                _cleanup_tool_input_summary(tool_input, resource_id=resource_id, region_id=region_id),
+                ensure_ascii=False,
+                sort_keys=True,
+            )
+            by_id[tool_use_id] = {
+                "tool_use_id": tool_use_id,
+                "provider": provider,
+                "resource_type": resource_type,
+                "resource_id": resource_id,
+                "region_id": region_id,
+                "action": action,
+                "tool_name": tool_name,
+                "input_summary": _safe_history_error(summary_json),
+            }
+            ledger["tool_uses"] = list(by_id.values())
+            self._save(ledger)
+
+    def tool_use_mapping(self, tool_use_id: str) -> dict[str, Any] | None:
+        """Return a copy of the first stored mapping for ``tool_use_id``, or ``None`` if absent."""
+        if not tool_use_id:
+            return None
+        stored = _dict_list(self._load().get("tool_uses"))
+        match = next((entry for entry in stored if entry.get("tool_use_id") == tool_use_id), None)
+        return None if match is None else dict(match)
+
+    def record_tool_result_unmatched(self, *, tool_use_id: str, tool_name: str) -> None:
+        """Append a ``cleanup_tool_result_unmatched`` history entry for a tool result.
+
+        Nothing is written when the ledger cannot be loaded for writing.
+        """
+        with self._write_lock():
+            ledger = self._load_for_write()
+            if ledger is None:
+                return
+            history_entry = {
+                "type": "cleanup_tool_result_unmatched",
+                "tool_use_id": tool_use_id,
+                "tool_name": tool_name,
+                "timestamp": time.time(),
+            }
+            self._append_history(ledger, history_entry)
+            self._save(ledger)
+
+    def record_tool_result_mismatch(
+        self,
+        *,
+        tool_use_id: str,
+        tool_name: str,
+        mapped_resource_id: str,
+        result_resource_id: str,
+    ) -> None:
+        """Append a ``cleanup_tool_result_mismatch`` history entry with sanitized fields.
+
+        Each string field is passed through ``_safe_history_error`` before being stored.
+        Nothing is written when the ledger cannot be loaded for writing.
+        """
+        with self._write_lock():
+            ledger = self._load_for_write()
+            if ledger is None:
+                return
+            history_entry = {
+                "type": "cleanup_tool_result_mismatch",
+                "tool_use_id": _safe_history_error(tool_use_id),
+                "tool_name": _safe_history_error(tool_name),
+                "mapped_resource_id": _safe_history_error(mapped_resource_id),
+                "result_resource_id": _safe_history_error(result_resource_id),
+                "timestamp": time.time(),
+            }
+            self._append_history(ledger, history_entry)
+            self._save(ledger)
+
+    def build_pending_prompt(self) -> CleanupPrompt | None:
+        """Build the cleanup prompt covering every resource from ``pending_resources()``.
+
+        The prompt text is a fixed list of translated instructions followed by one
+        numbered line per resource.
+
+        Returns:
+            A ``CleanupPrompt`` with the resources, the prompt text and a status message,
+            or ``None`` when there are no pending resources.
+        """
+        resources = self.pending_resources()
+        if not resources:
+            return None
+        count = len(resources)
+        # Each literal is wrapped in ``_()`` individually so it is translated as its own message.
+        lines = [
+            _(
+                "Cloud resources still need cleanup after pipeline rollback. "
+                "Clean them up now and keep checking until deletion completes."
+            ),
+            "",
+            _("Requirements:"),
+            _("- Cleanup scope is a strict allowlist: delete only ids in the cleanup resources list below."),
+            _("- Do not delete, modify, or roll back any stack or cloud resource outside the cleanup resources list."),
+            _("- Do not call ListStacks or search for other stacks by name; cleanup resource ids are fully listed."),
+            _(
+                "- Before every GetStack/DeleteStack call, verify that StackId exactly matches an id in "
+                "the cleanup resources list."
+            ),
+            _(
+                "- If StackId is not in the cleanup resources list, do not call DeleteStack, even if it is "
+                "the current handoff or newly created stack."
+            ),
+            _(
+                "- Do not infer extra cleanup targets from pipeline handoff, deployment.stack_id, current stack, "
+                "or resources_created; those may be final delivered resources."
+            ),
+            _("- Do not expand cleanup scope for user follow-ups, continue instructions, or pipeline handoff context."),
+            _(
+                "- When resuming cleanup, still process only resources listed in this prompt; "
+                "do not inspect or delete others."
+            ),
+            _(
+                "- Prefer available ROS stack tools for deletion; if using aliyun_api, call DeleteStack first, "
+                "then repeatedly call GetStack to check status."
+            ),
+            _(
+                "- If a resource is already deleting, call GetStack first, "
+                "then decide whether DeleteStack is needed again."
+            ),
+            _(
+                "- Cleanup is complete only after DELETE_COMPLETE; for DELETE_FAILED or unknown status, "
+                "tell the user the failure reason and next step."
+            ),
+            _("- After all listed resources are DELETE_COMPLETE, stop this cleanup turn immediately."),
+            _("- Briefly update the user during cleanup."),
+            "",
+            _("Cleanup resources:"),
+        ]
+        for index, resource in enumerate(resources, start=1):
+            # Fall back to the id when the resource has no name.
+            label = resource.resource_name or resource.resource_id
+            lines.append(
+                _(
+                    "{index}. provider={provider}, type={resource_type}, id={resource_id}, name={name}, region={region}"
+                ).format(
+                    index=index,
+                    provider=resource.provider,
+                    resource_type=resource.resource_type,
+                    resource_id=resource.resource_id,
+                    name=label,
+                    region=resource.region_id or "unknown",
+                )
+            )
+        return CleanupPrompt(
+            resources=resources,
+            prompt="\n".join(lines),
+            status_message=_("Detected {count} rollback cleanup resources; starting cleanup.").format(count=count),
+        )
+
+    def _load(self) -> dict[str, Any]:
+        """Read and parse the ledger file, always returning a ledger-shaped mapping.
+
+        Returns:
+            * an empty ledger when the file does not exist;
+            * a "failed" ledger (see ``_failed_ledger_data``) when the file cannot be
+              read, is not valid UTF-8/YAML, or does not contain a mapping;
+            * otherwise the parsed mapping with any missing top-level sections defaulted.
+        """
+        # Attempt the read directly instead of checking ``exists()`` first. That removes
+        # the window in which the file can vanish between check and read, and keeps
+        # errors that ``exists()`` itself may raise (e.g. ``PermissionError``) inside
+        # the handled path.
+        try:
+            raw_text = self.path.read_text(encoding="utf-8")
+        except (FileNotFoundError, NotADirectoryError):
+            # No ledger on disk yet; treated as an empty ledger, not as a failure.
+            return _empty_ledger_data()
+        except (OSError, UnicodeDecodeError) as exc:
+            logger.warning("Failed to load cleanup ledger %s: %s", self.path, exc)
+            return _failed_ledger_data(str(exc))
+        try:
+            loaded = yaml.safe_load(raw_text)
+        except yaml.YAMLError as exc:
+            logger.warning("Failed to load cleanup ledger %s: %s", self.path, exc)
+            return _failed_ledger_data(str(exc))
+        if not isinstance(loaded, dict):
+            logger.warning(
+                "Failed to load cleanup ledger %s: expected mapping, got %s",
+                self.path,
+                type(loaded).__name__,
+            )
+            return _failed_ledger_data(f"expected mapping, got {type(loaded).__name__}")
+        loaded.setdefault("schema_version", 1)
+        loaded.setdefault("observed_resources", [])
+        loaded.setdefault("cleanup_resources", [])
+        loaded.setdefault("tool_uses", [])
+        loaded.setdefault("history", [])
+        return loaded
+
+    def _load_for_write(self) -> dict[str, Any] | None:
+        """Load the ledger for modification; return ``None`` if the load was flagged as failed."""
+        ledger = self._load()
+        return None if ledger.get(_LOAD_FAILED_KEY) else ledger
+
+    def _save(self, data: dict[str, Any]) -> None:
+        """Serialize ``data`` as YAML (key order kept) and write it via ``atomic_write_text``."""
+        serialized = yaml.safe_dump(data, allow_unicode=True, sort_keys=False)
+        atomic_write_text(self.path, serialized, durable=True)
+
+    @staticmethod
+    def _append_history(data: dict[str, Any], entry: dict[str, Any]) -> None:
+        """Append ``entry`` to ``data["history"]``, creating the list if the key is missing.
+
+        If ``history`` exists but is not a list, the entry is dropped.
+        """
+        entries = data.setdefault("history", [])
+        if not isinstance(entries, list):
+            return
+        entries.append(entry)
+
+    def _write_lock(self):
+        """Return the lock obtained from ``_ledger_path_lock`` for this ledger's path."""
+        ledger_path = self.path
+        return _ledger_path_lock(ledger_path)
+
+
+class CleanupObserver:
+    """Observe tool calls/results and update cleanup resource lifecycle state."""
+
+    def __init__(self, ledger: CleanupLedger) -> None:
+        """Bind the observer to ``ledger`` and start with no remembered tool inputs."""
+        self._ledger = ledger
+        # tool_use_id -> {"tool_name": ..., "input": ...} captured when the tool call ends.
+        # NOTE(review): entries are added in _observe_tool_use and never removed within this
+        # class; confirm that unbounded growth is acceptable for long-running sessions.
+        self._tool_inputs: dict[str, dict[str, Any]] = {}
+
+    def observe(self, event: Any) -> None:
+        """Dispatch ``event`` to the matching handler; other event types are ignored."""
+        if isinstance(event, ToolUseEndEvent):
+            self._observe_tool_use(event)
+        elif isinstance(event, ToolResultEvent):
+            self._observe_tool_result(event)
+        elif isinstance(event, StackProgressEvent):
+            self._observe_stack_progress(event)
+
+    def _observe_tool_use(self, event: ToolUseEndEvent) -> None:
+        """Remember the tool input and, for DeleteStack/GetStack calls, persist the mapping.
+
+        A DeleteStack call additionally moves the matching ledger resource to ``started``.
+        """
+        # Every tool call is remembered, not only stack operations.
+        self._tool_inputs[event.tool_use_id] = {"tool_name": event.name, "input": dict(event.input)}
+        operation = _stack_operation_from_tool_input(event.name, event.input)
+        if operation is None or operation["action"] not in {"DeleteStack", "GetStack"}:
+            return
+        stack_id = _stack_id_from_sources(operation["params"])
+        if stack_id is None:
+            return
+        self._ledger.record_tool_use_mapping(
+            tool_use_id=event.tool_use_id,
+            provider=operation["provider"],
+            resource_type="stack",
+            resource_id=stack_id,
+            region_id=operation["region_id"],
+            action=operation["action"],
+            tool_name=event.name,
+            tool_input=event.input,
+        )
+        if operation["action"] != "DeleteStack":
+            return
+        self._ledger.update_resource(
+            provider=operation["provider"],
+            resource_type="stack",
+            resource_id=stack_id,
+            region_id=operation["region_id"],
+            cleanup_status="started",
+            cleanup_tool_use_id=event.tool_use_id,
+            cleanup_action="DeleteStack",
+            progress_status="DELETE_STARTED",
+            clear_last_error=True,
+        )
+
+    def _observe_tool_result(self, event: ToolResultEvent) -> None:
+        """Translate a DeleteStack/GetStack tool result into a ledger resource update.
+
+        The originating call is resolved from the in-memory record first and from the
+        ledger's persisted tool-use mapping otherwise. A result naming a different stack
+        id than the call is recorded as a mismatch and not applied.
+        """
+        record = self._tool_inputs.get(event.tool_use_id)
+        result = _json_object(event.result) or {}
+        operation: dict[str, Any] | None = None
+        stack_id: str | None = None
+        result_stack_id = _stack_id_from_sources(result)
+        if isinstance(record, dict):
+            # The call was seen by this observer instance: re-derive the operation from its input.
+            tool_name = str(record.get("tool_name") or event.tool_name)
+            tool_input = record.get("input")
+            if not isinstance(tool_input, dict):
+                return
+            operation = _stack_operation_from_tool_input(tool_name, tool_input)
+            if operation is None or operation["action"] not in {"DeleteStack", "GetStack"}:
+                return
+            stack_id = _stack_id_from_sources(operation["params"])
+            if stack_id is None:
+                return
+            if result_stack_id is not None and result_stack_id != stack_id:
+                self._record_tool_result_mismatch(
+                    tool_use_id=event.tool_use_id,
+                    tool_name=tool_name,
+                    mapped_resource_id=stack_id,
+                    result_resource_id=result_stack_id,
+                )
+                return
+        else:
+            # No in-memory record: fall back to the mapping persisted in the ledger.
+            mapping = self._ledger.tool_use_mapping(event.tool_use_id)
+            if mapping is None:
+                # Only results from stack-capable tools are reported as unmatched.
+                if _is_cleanup_stack_tool_name(event.tool_name):
+                    logger.warning(
+                        "Unmatched cleanup tool result: tool_use_id=%s tool_name=%s",
+                        event.tool_use_id,
+                        event.tool_name,
+                    )
+                    self._ledger.record_tool_result_unmatched(
+                        tool_use_id=event.tool_use_id,
+                        tool_name=event.tool_name,
+                    )
+                return
+            operation = _stack_operation_from_tool_mapping(mapping)
+            if operation is None:
+                return
+            stack_id = operation["resource_id"]
+            if result_stack_id is not None and result_stack_id != stack_id:
+                self._record_tool_result_mismatch(
+                    tool_use_id=event.tool_use_id,
+                    tool_name=event.tool_name,
+                    mapped_resource_id=stack_id,
+                    result_resource_id=result_stack_id,
+                )
+                return
+        if stack_id is None:
+            return
+        status = _status_from_result(result)
+        # A successful DeleteStack result without a status means deletion was only requested.
+        if operation["action"] == "DeleteStack" and status is None and not event.is_error:
+            self._ledger.update_resource(
+                provider=operation["provider"],
+                resource_type="stack",
+                resource_id=stack_id,
+                region_id=operation["region_id"],
+                cleanup_status="in_progress",
+                cleanup_tool_use_id=event.tool_use_id,
+                cleanup_action="DeleteStack",
+                progress_status="DELETE_REQUESTED",
+                clear_last_error=True,
+            )
+            return
+        cleanup_status = _cleanup_status_from_stack_status(status, event.is_error)
+        self._ledger.update_resource(
+            provider=operation["provider"],
+            resource_type="stack",
+            resource_id=stack_id,
+            region_id=operation["region_id"],
+            cleanup_status=cleanup_status,
+            cleanup_tool_use_id=event.tool_use_id,
+            cleanup_action=operation["action"],
+            progress_status=status,
+            # The raw result is kept as the error only for failures; otherwise any old error is cleared.
+            last_error=event.result if cleanup_status == "failed" else None,
+            clear_last_error=cleanup_status != "failed",
+        )
+
+    def _observe_stack_progress(self, event: StackProgressEvent) -> None:
+        """Apply a stack progress event to the matching ``ros`` stack resource in the ledger."""
+        status = event.status
+        self._ledger.update_resource(
+            provider="ros",
+            resource_type="stack",
+            resource_id=event.stack_id,
+            cleanup_status=_cleanup_status_from_stack_status(status, False),
+            progress_status=status,
+            progress_percentage=event.progress_percentage,
+            # For delete-failed statuses the status string itself is stored as the error.
+            last_error=status if status in _DELETE_FAILED_STATUSES else None,
+            clear_last_error=status not in _DELETE_FAILED_STATUSES,
+        )
+
+    def _record_tool_result_mismatch(
+        self,
+        *,
+        tool_use_id: str,
+        tool_name: str,
+        mapped_resource_id: str,
+        result_resource_id: str,
+    ) -> None:
+        """Log a warning with sanitized values and record the mismatch in the ledger."""
+        safe_tool_use_id = _safe_history_error(tool_use_id) or ""
+        safe_tool_name = _safe_history_error(tool_name) or ""
+        safe_mapped_resource_id = _safe_history_error(mapped_resource_id) or ""
+        safe_result_resource_id = _safe_history_error(result_resource_id) or ""
+        logger.warning(
+            "Mismatched cleanup tool result: tool_use_id=%s tool_name=%s mapped_resource_id=%s result_resource_id=%s",
+            safe_tool_use_id,
+            safe_tool_name,
+            safe_mapped_resource_id,
+            safe_result_resource_id,
+        )
+        # Raw values are passed on; the ledger method applies its own sanitization.
+        self._ledger.record_tool_result_mismatch(
+            tool_use_id=tool_use_id,
+            tool_name=tool_name,
+            mapped_resource_id=mapped_resource_id,
+            result_resource_id=result_resource_id,
+        )
+
+
+def create_cleanup_prompt_message(
+    prompt: str,
+    *,
+    cleanup_ledger_path: str | Path | None = None,
+    cleanup_status: str | None = None,
+) -> Message:
+    """Create a user ``Message`` carrying ``prompt`` and cleanup-prompt metadata.
+
+    ``cleanupLedgerPath`` (stringified) and ``cleanupStatus`` are added to the metadata
+    only when the corresponding argument is not ``None``.
+    """
+    optional_fields = {
+        "cleanupLedgerPath": None if cleanup_ledger_path is None else str(cleanup_ledger_path),
+        "cleanupStatus": cleanup_status,
+    }
+    metadata = {"type": CLEANUP_PROMPT_METADATA_TYPE, "source": "pipeline_cleanup"}
+    metadata.update({key: value for key, value in optional_fields.items() if value is not None})
+    return Message(role="user", content=prompt, metadata=metadata)
+
+
+def is_cleanup_prompt_message(message: Message) -> bool:
+    """Return whether the message metadata ``type`` marks it as a cleanup prompt."""
+    message_type = message.metadata.get("type")
+    return message_type == CLEANUP_PROMPT_METADATA_TYPE
+
+
+def cleanup_prompt_ledger_path(message: Message) -> str | None:
+    """Return the ledger path stored on a cleanup prompt message, if any.
+
+    Both the ``cleanupLedgerPath`` and ``cleanup_ledger_path`` metadata keys are
+    accepted; non-cleanup messages and empty or non-string values yield ``None``.
+    """
+    if not is_cleanup_prompt_message(message):
+        return None
+    metadata = message.metadata
+    stored_path = metadata.get("cleanupLedgerPath") or metadata.get("cleanup_ledger_path")
+    if isinstance(stored_path, str) and stored_path:
+        return stored_path
+    return None
+
+
+def is_active_cleanup_prompt_message(message: Message) -> bool:
+    """Return whether a cleanup prompt message is neither ``completed`` nor ``skipped``.
+
+    The status is read from the ``cleanupStatus`` or ``cleanup_status`` metadata key;
+    non-cleanup messages are never active.
+    """
+    if not is_cleanup_prompt_message(message):
+        return False
+    metadata = message.metadata
+    status = metadata.get("cleanupStatus") or metadata.get("cleanup_status")
+    finished = status in {"completed", "skipped"}
+    return not finished
+
+
+def mark_cleanup_prompt_message_completed(message: Message, *, cleanup_ledger_path: str | Path | None = None) -> bool:
+    """Set ``cleanupStatus`` to ``completed`` on a cleanup prompt message.
+
+    Returns ``False`` without changing anything when the message is not a cleanup
+    prompt, when it references a different ledger path than ``cleanup_ledger_path``,
+    or when ``cleanupStatus`` is already ``completed``. Otherwise the metadata is
+    replaced with an updated copy and ``True`` is returned.
+    """
+    if not is_cleanup_prompt_message(message):
+        return False
+    if cleanup_ledger_path is not None:
+        recorded_path = cleanup_prompt_ledger_path(message)
+        belongs_elsewhere = recorded_path is not None and recorded_path != str(cleanup_ledger_path)
+        if belongs_elsewhere:
+            return False
+    already_completed = message.metadata.get("cleanupStatus") == "completed"
+    if already_completed:
+        return False
+    updated_metadata = {**message.metadata, "cleanupStatus": "completed"}
+    message.metadata = updated_metadata
+    return True
+
+
+def _ledger_path_lock(path: Path):
+    """Return the lock that ``_LEDGER_LOCKS`` hands out for ``path``."""
+    lock = _LEDGER_LOCKS.lock_for(path)
+    return lock
+
+
+def _merge_cleanup_required(
+    existing: CleanupResource | None,
+    incoming: CleanupResource,
+    *,
+    source_step_id: str,
+    reason: str,
+    now: float,
+) -> CleanupResource:
+    """Combine an incoming cleanup request with the ledger's existing entry, if any.
+
+    * No existing entry: the incoming resource is marked cleanup-required, with
+      ``reason`` / ``source_step_id`` filling in fields it leaves empty.
+    * Existing entry in a terminal status: returned unchanged.
+    * Otherwise: incoming data wins for descriptive fields, while lifecycle progress
+      (tool use id, action, progress, last error) is carried over from the existing
+      entry. An active or ``failed`` existing status is kept over the incoming one.
+    """
+    if existing is None:
+        fresh_fields = {
+            "cleanup_required": True,
+            "cleanup_reason": incoming.cleanup_reason or reason,
+            "source_step_id": incoming.source_step_id or source_step_id,
+            "updated_at": now,
+        }
+        return replace(incoming, **fresh_fields)
+
+    previous_status = existing.cleanup_status
+    if previous_status in _TERMINAL_CLEANUP_STATUSES:
+        return existing
+
+    keep_previous_status = previous_status in _ACTIVE_CLEANUP_STATUSES or previous_status == "failed"
+    merged_status = previous_status if keep_previous_status else incoming.cleanup_status
+    merged_fields = {
+        "cleanup_required": True,
+        "cleanup_reason": incoming.cleanup_reason or existing.cleanup_reason or reason,
+        "source_step_id": incoming.source_step_id or existing.source_step_id or source_step_id,
+        "source_attempt_id": incoming.source_attempt_id or existing.source_attempt_id,
+        "cleanup_status": merged_status,
+        "cleanup_tool_use_id": existing.cleanup_tool_use_id,
+        "cleanup_action": existing.cleanup_action,
+        "progress_status": existing.progress_status,
+        "progress_percentage": existing.progress_percentage,
+        "last_error": existing.last_error,
+        "observed_at": existing.observed_at or incoming.observed_at,
+        "updated_at": now,
+    }
+    return replace(incoming, **merged_fields)
+
+
+def _resource_key(provider: str, resource_type: str, resource_id: str, region_id: str) -> str:
+    """Build the ``provider|type|region|id`` key; provider and type are lower-cased, all parts stripped."""
+    parts = (
+        provider.strip().lower(),
+        resource_type.strip().lower(),
+        region_id.strip(),
+        resource_id.strip(),
+    )
+    return "|".join(parts)
+
+
+def _matches_resource(
+    resource: CleanupResource,
+    provider: str,
+    resource_type: str,
+    resource_id: str,
+    region_id: str | None,
+) -> bool:
+    """Return whether ``resource`` has the given identity.
+
+    Provider and type compare case-insensitively and the id compares exactly. The
+    region is only compared when both sides have a non-empty region.
+    """
+    same_identity = (
+        resource.provider.lower() == provider.lower()
+        and resource.resource_type.lower() == resource_type.lower()
+        and resource.resource_id == resource_id
+    )
+    if not same_identity:
+        return False
+    if not region_id or not resource.region_id:
+        return True
+    return resource.region_id == region_id
+
+
+def _stack_operation_from_tool_input(tool_name: str, tool_input: dict[str, Any]) -> dict[str, Any] | None:
+    """Describe the ROS stack operation a tool call performs, or ``None`` if it is not one.
+
+    Only the ``ros_stack`` tool and ``aliyun_api`` calls whose product is ROS are
+    recognized, and only for the known stack actions. The result holds ``provider``,
+    ``action``, ``params`` and ``region_id`` (empty string when no region is given).
+    """
+    params = _dict_value(tool_input.get("params") or tool_input.get("parameters"))
+    tool = tool_name.lower()
+    if tool not in ("ros_stack", "aliyun_api"):
+        return None
+    if tool == "aliyun_api":
+        product = _first_string(tool_input, ("product", "Product", "service", "Service"))
+        if product is None or product.lower() != "ros":
+            return None
+    action = _first_string(tool_input, ("action", "Action"))
+    if action not in {"CreateStack", "UpdateStack", "ContinueCreateStack", "DeleteStack", "GetStack"}:
+        return None
+    region_keys = ("region_id", "regionId", "RegionId")
+    # The top-level region wins over one nested in params.
+    region = _first_string(tool_input, region_keys) or _first_string(params, region_keys) or ""
+    return {
+        "provider": "ros",
+        "action": action,
+        "params": params,
+        "region_id": region,
+    }
+
+
+def _stack_operation_from_tool_mapping(mapping: dict[str, Any]) -> dict[str, Any] | None:
+    """Rebuild a stack operation from a persisted tool-use mapping.
+
+    Returns ``None`` unless the mapping's action is ``DeleteStack`` or ``GetStack``
+    and it has a non-empty string ``resource_id``. Missing provider and type default
+    to ``"ros"`` and ``"stack"``; a missing region becomes an empty string.
+    """
+    action = mapping.get("action")
+    if action not in {"DeleteStack", "GetStack"}:
+        return None
+    target_id = _optional_str(mapping.get("resource_id"))
+    if target_id is None:
+        return None
+    provider = str(mapping.get("provider") or "ros")
+    kind = str(mapping.get("resource_type") or "stack")
+    region = str(mapping.get("region_id") or "")
+    return {
+        "provider": provider,
+        "resource_type": kind,
+        "resource_id": target_id,
+        "action": action,
+        "region_id": region,
+    }
+
+
+def _cleanup_tool_input_summary(
+    tool_input: dict[str, Any],
+    *,
+    resource_id: str,
+    region_id: str,
+) -> dict[str, Any]:
+    """Summarize a tool input for storage: action, product, region, stack id and param key names.
+
+    Parameter values are not included, only the sorted parameter keys.
+    """
+    params = _dict_value(tool_input.get("params") or tool_input.get("parameters"))
+    action = _first_string(tool_input, ("action", "Action"))
+    product = _first_string(tool_input, ("product", "Product", "service", "Service"))
+    param_keys = sorted(str(key) for key in params)
+    return {
+        "action": action,
+        "product": product,
+        "region_id": region_id,
+        "stack_id": resource_id,
+        "param_keys": param_keys,
+    }
+
+
+def _is_cleanup_stack_tool_name(tool_name: str) -> bool:
+    """Return whether ``tool_name`` is ``ros_stack`` or ``aliyun_api``, ignoring case."""
+    normalized = tool_name.lower()
+    return normalized in {"ros_stack", "aliyun_api"}
+
+
+def _cleanup_status_from_stack_status(status: str | None, is_error: bool) -> CleanupStatus:
+    """Map a stack status (plus an error flag) to a cleanup status.
+
+    A delete-complete status wins; a delete-failed status or ``is_error`` gives
+    ``failed``; everything else is ``in_progress``.
+    """
+    if status in _DELETE_COMPLETE_STATUSES:
+        return "completed"
+    failed = status in _DELETE_FAILED_STATUSES or is_error
+    return "failed" if failed else "in_progress"
+
+
+def _cleanup_lifecycle_state(resource: CleanupResource) -> tuple[Any, ...]:
+    """Return the tuple of lifecycle fields used to detect a lifecycle change."""
+    lifecycle_fields = (
+        "cleanup_status",
+        "cleanup_tool_use_id",
+        "cleanup_action",
+        "progress_status",
+        "progress_percentage",
+        "last_error",
+    )
+    return tuple(getattr(resource, field_name) for field_name in lifecycle_fields)
+
+
+def _cleanup_lifecycle_history_entry(resource: CleanupResource) -> dict[str, Any]:
+    """Build the history entry describing a resource's current lifecycle state.
+
+    The entry type follows the cleanup status (unknown statuses fall back to the
+    progress event type). Fields whose value is ``None`` are omitted.
+    """
+    type_by_status = {
+        "started": PIPELINE_EVENT_CLEANUP_STARTED,
+        "in_progress": PIPELINE_EVENT_CLEANUP_PROGRESS,
+        "completed": PIPELINE_EVENT_CLEANUP_COMPLETED,
+        "failed": PIPELINE_EVENT_CLEANUP_FAILED,
+        "skipped": "cleanup_skipped",
+        "pending": "cleanup_pending",
+    }
+    event_type = type_by_status.get(resource.cleanup_status, PIPELINE_EVENT_CLEANUP_PROGRESS)
+    candidate_fields = {
+        "type": event_type,
+        "resource": _cleanup_resource_history_data(resource),
+        "cleanup_status": resource.cleanup_status,
+        "cleanup_tool_use_id": resource.cleanup_tool_use_id,
+        "cleanup_action": resource.cleanup_action,
+        "progress_status": resource.progress_status,
+        "progress_percentage": resource.progress_percentage,
+        "last_error": _safe_history_error(resource.last_error),
+        "timestamp": resource.updated_at or time.time(),
+    }
+    compact: dict[str, Any] = {}
+    for field_name, field_value in candidate_fields.items():
+        if field_value is not None:
+            compact[field_name] = field_value
+    return compact
+
+
+def _cleanup_resource_history_data(resource: CleanupResource) -> dict[str, Any]:
+    """Return the subset of resource fields that is recorded in history entries."""
+    recorded_fields = (
+        "provider",
+        "resource_type",
+        "resource_id",
+        "resource_name",
+        "region_id",
+        "source_step_id",
+        "source_attempt_id",
+        "cleanup_status",
+        "progress_status",
+    )
+    return {field_name: getattr(resource, field_name) for field_name in recorded_fields}
+
+
+def _safe_history_error(value: str | None) -> str | None:
+    """Sanitize ``value`` for storage and cap it at 1000 characters plus ``...``.
+
+    Empty or ``None`` input yields ``None``.
+    """
+    if not value:
+        return None
+    sanitized = sanitize_public_text(value)
+    if len(sanitized) <= 1000:
+        return sanitized
+    return sanitized[:1000] + "..."
+
+
+def _status_from_result(result: dict[str, Any]) -> str | None:
+    """Extract a stack status from a tool result, checking the top level before ``Stack``/``stack``."""
+    status_keys = ("StackStatus", "stackStatus", "stack_status", "Status", "status")
+    nested = _dict_value(result.get("Stack") or result.get("stack"))
+    top_level_status = _first_string(result, status_keys)
+    if top_level_status:
+        return top_level_status
+    return _first_string(nested, status_keys)
+
+
+def _stack_id_from_sources(*sources: dict[str, Any]) -> str | None:
+    """Return the first stack id found in ``sources``.
+
+    Each source is checked at its top level and then inside its ``Stack``/``stack``
+    mapping before moving on to the next source.
+    """
+    id_keys = ("StackId", "stackId", "stack_id")
+    for source in sources:
+        direct_id = _first_string(source, id_keys)
+        if direct_id:
+            return direct_id
+        nested_id = _first_string(_dict_value(source.get("Stack") or source.get("stack")), id_keys)
+        if nested_id:
+            return nested_id
+    return None
+
+
+def _json_object(value: Any) -> dict[str, Any] | None:
+    """Return ``value`` as a dict: dicts pass through, JSON object strings are parsed.
+
+    Anything else (including invalid JSON or JSON that is not an object) yields ``None``.
+    """
+    if isinstance(value, dict):
+        return value
+    if isinstance(value, str) and value:
+        try:
+            decoded = json.loads(value)
+        except json.JSONDecodeError:
+            return None
+        if isinstance(decoded, dict):
+            return decoded
+    return None
+
+
+def _empty_ledger_data() -> dict[str, Any]:
+    """Return a fresh schema-version-1 ledger with every section empty."""
+    ledger: dict[str, Any] = {"schema_version": 1}
+    for section in ("observed_resources", "cleanup_resources", "tool_uses", "history"):
+        ledger[section] = []
+    return ledger
+
+
+def _failed_ledger_data(reason: str) -> dict[str, Any]:
+    """Return an empty ledger flagged as failed to load, carrying ``reason`` as the error."""
+    return {
+        **_empty_ledger_data(),
+        _LOAD_FAILED_KEY: True,
+        _LOAD_ERROR_KEY: reason,
+    }
+
+
+def _dict_list(value: Any) -> list[dict[str, Any]]:
+    """Return the dict items of ``value`` when it is a list; otherwise an empty list."""
+    if not isinstance(value, list):
+        return []
+    return [entry for entry in value if isinstance(entry, dict)]
+
+
+def _dict_value(value: Any) -> dict[str, Any]:
+    """Return ``value`` itself when it is a dict; otherwise a new empty dict."""
+    if isinstance(value, dict):
+        return value
+    return {}
+
+
+def _first_string(data: dict[str, Any], keys: tuple[str, ...]) -> str | None:
+    """Return the first non-empty string found in ``data`` under ``keys``, in key order."""
+    candidates = (data.get(key) for key in keys)
+    return next((found for found in candidates if isinstance(found, str) and found), None)
+
+
+def _optional_str(value: Any) -> str | None:
+    """Return ``value`` when it is a non-empty string; otherwise ``None``."""
+    if isinstance(value, str) and value:
+        return value
+    return None
+
+
+def _float_value(value: Any) -> float:
+    """Convert an int or float to ``float``; booleans and all other types give ``0.0``."""
+    # bool is a subclass of int, so it has to be excluded explicitly.
+    is_number = isinstance(value, (int, float)) and not isinstance(value, bool)
+    return float(value) if is_number else 0.0
+
+
+def _optional_float(value: Any) -> float | None:
+    """Convert an int or float to ``float``; booleans and all other types give ``None``."""
+    # bool is a subclass of int, so it has to be excluded explicitly.
+    is_number = isinstance(value, (int, float)) and not isinstance(value, bool)
+    return float(value) if is_number else None
diff --git a/src/iac_code/pipeline/engine/complete_step_tool.py b/src/iac_code/pipeline/engine/complete_step_tool.py
index 9e5236f0..e7f99752 100644
--- a/src/iac_code/pipeline/engine/complete_step_tool.py
+++ b/src/iac_code/pipeline/engine/complete_step_tool.py
@@ -249,6 +249,7 @@ def _validate_completion_guards(self, conclusion: dict) -> str | None:
                 continue
 
             required_tool = guard.get("require_tool")
+            required_tool_result = guard.get("require_tool_result")
             required_field = guard.get("required_conclusion_field")
             required_any_of = guard.get("required_conclusion_any_of") or []
             successful_tools = self._completion_guard_state.get("successful_tools", set())
@@ -279,8 +280,117 @@ def _validate_completion_guards(self, conclusion: dict) -> str | None:
                     message=message,
                     fields=fields,
                 )
+            if isinstance(required_tool_result, dict):
+                validation_error = self._validate_required_tool_result(
+                    required_tool_result,
+                    conclusion,
+                    guard.get("message"),
+                )
+                if validation_error is not None:
+                    return validation_error
         return None
 
+    def _validate_required_tool_result(
+        self,
+        requirement: dict[str, Any],
+        conclusion: dict[str, Any],
+        message: str | None,
+    ) -> str | None:
+        """Check a ``require_tool_result`` guard against the recorded tool results.
+
+        Returns ``None`` as soon as one entry of ``tool_result_records`` passes every configured
+        filter (tool, action, is_success, status_in, conclusion match). Otherwise returns a
+        translated error, preferring the latest value-mismatch message over the generic hint.
+        """
+        tool_name = str(requirement.get("tool") or "")
+        actions = self._expected_actions(requirement)
+        expected_success = requirement.get("is_success")
+        status_in = {str(status) for status in requirement.get("status_in") or [] if status is not None}
+        match_conclusion_field = requirement.get("match_conclusion_field")
+        match_result_field = str(requirement.get("match_result_field") or "stack_id")
+        base_message = message or _("A successful tool result is required before completing the current step.")
+
+        records = self._completion_guard_state.get("tool_result_records") or []
+        mismatch_message: str | None = None
+        for record in records:
+            if not isinstance(record, dict) or (tool_name and record.get("tool_name") != tool_name):
+                continue
+            tool_input = record.get("input") if isinstance(record.get("input"), dict) else {}
+            if actions and self._first_string(tool_input, ("action", "Action")) not in actions:
+                continue
+            result = record.get("result")
+            if record.get("is_error") or not isinstance(result, dict):
+                continue
+            if expected_success is not None and self._bool_from_result(result) is not bool(expected_success):
+                continue
+            if status_in and self._status_from_result(result) not in status_in:
+                continue
+            if isinstance(match_conclusion_field, str) and match_conclusion_field:
+                conclusion_value = self._resolve_dotted(conclusion, match_conclusion_field)
+                result_value = (
+                    self._stack_id_from_result(result)
+                    if match_result_field == "stack_id"
+                    else self._resolve_dotted(result, match_result_field)
+                )
+                # A result that carries no value cannot confirm the conclusion: without this
+                # check two missing values (None == None) would satisfy the guard vacuously.
+                if result_value is None or conclusion_value != result_value:
+                    mismatch_message = _(
+                        "{message} complete_step.conclusion.{field} must match the {tool} result value {value}."
+                    ).format(
+                        message=base_message,
+                        field=match_conclusion_field,
+                        tool=tool_name or _("tool"),
+                        value=result_value or _("<missing>"),
+                    )
+                    continue
+            return None
+
+        if mismatch_message is not None:
+            return mismatch_message
+        status_hint = _(" with status {statuses}").format(statuses=", ".join(sorted(status_in))) if status_in else ""
+        success_hint = ""
+        if expected_success is not None:
+            success_hint = _(" and is_success={expected}").format(expected=str(bool(expected_success)).lower())
+        action_hint = ""
+        if len(actions) == 1:
+            action_hint = f" {next(iter(actions))}"
+        elif actions:
+            action_hint = _(" one of {actions}").format(actions=", ".join(sorted(actions)))
+        return _(
+            "{message} Call {tool}{action} first and wait for a successful result{status_hint}{success_hint}."
+        ).format(
+            message=base_message,
+            tool=tool_name or _("the required tool"),
+            action=action_hint,
+            status_hint=status_hint,
+            success_hint=success_hint,
+        )
+
+    def validate_completion_input(self, tool_input: dict[str, Any]) -> str | None:
+        """Dry-run the complete_step checks on ``tool_input`` and return the first error, if any.
+
+        The input is passed through ``normalize_input`` first; retry counters are not mutated.
+        """
+        self.normalize_input(tool_input)
+        target_limit_error = self._validate_rollback_target_limit()
+        if target_limit_error is not None:
+            return target_limit_error
+
+        conclusion = tool_input["conclusion"]
+        request = tool_input.get("rollback_request")
+        rollback_tuple = (request["target_step"], request["reason"]) if request else None
+        if rollback_tuple and self._step_config.rollback_count >= self._step_config.max_rollbacks:
+            return _(
+                "Rollback count cannot exceed {max_rollbacks}. Complete the current step or ask the user for help."
+            ).format(max_rollbacks=self._step_config.max_rollbacks)
+
+        for check in (self._validate_conclusion, self._validate_completion_guards, self._validate_candidate_limit):
+            error = check(conclusion)
+            if error is not None:
+                return error
+        return None
+
     def _guard_applies(self, guard: dict, conclusion: dict) -> bool:
         unless_patterns = guard.get("unless_user_message_matches_any") or []
         if any(self._matches(pattern, self._user_message) for pattern in unless_patterns):
@@ -330,6 +440,64 @@ def _resolve_dotted(value: dict, path: str) -> Any:
                 return None
         return current
 
+    @classmethod
+    def _status_from_result(cls, result: dict[str, Any]) -> str | None:
+        """Return the stack status from ``result``, falling back to its nested ``Stack``/``stack`` mapping."""
+        status_keys = ("StackStatus", "stackStatus", "stack_status", "Status", "status")
+        nested = cls._dict_value(result.get("Stack") or result.get("stack"))
+        top_level = cls._first_string(result, status_keys)
+        return top_level if top_level else cls._first_string(nested, status_keys)
+
+    @classmethod
+    def _stack_id_from_result(cls, result: dict[str, Any]) -> str | None:
+        """Return the stack id from ``result``, falling back to its nested ``Stack``/``stack`` mapping."""
+        id_keys = ("StackId", "stackId", "stack_id")
+        nested = cls._dict_value(result.get("Stack") or result.get("stack"))
+        top_level = cls._first_string(result, id_keys)
+        return top_level if top_level else cls._first_string(nested, id_keys)
+
+    @classmethod
+    def _bool_from_result(cls, result: dict[str, Any]) -> bool | None:
+        """Read ``is_success`` (or ``isSuccess``) from ``result`` as a tri-state flag.
+
+        Booleans pass through and the strings true/1/yes and false/0/no are recognised
+        case-insensitively; anything else yields ``None``.
+        """
+        raw = result.get("is_success")
+        raw = result.get("isSuccess") if raw is None else raw
+        if isinstance(raw, bool):
+            return raw
+        if not isinstance(raw, str):
+            return None
+        return {"true": True, "1": True, "yes": True, "false": False, "0": False, "no": False}.get(raw.strip().lower())
+
+    @staticmethod
+    def _dict_value(value: Any) -> dict[str, Any]:
+        return {} if not isinstance(value, dict) else value
+
+    @staticmethod
+    def _first_string(source: dict[str, Any], keys: tuple[str, ...]) -> str | None:
+        """Return the first non-empty string found in ``source`` under ``keys``.
+
+        Keys are tried in order; ``None`` is returned when none of them qualifies.
+        """
+        return next((item for item in map(source.get, keys) if isinstance(item, str) and item), None)
+
+    @classmethod
+    def _expected_actions(cls, requirement: dict[str, Any]) -> set[str]:
+        """Collect the accepted action names from the ``action``, ``action_in`` and ``actions`` keys."""
+        per_key = (cls._string_set(requirement.get(key)) for key in ("action", "action_in", "actions"))
+        # ``set().union()`` with no matching input still yields a fresh empty set.
+        return set().union(*per_key)
+
+    @staticmethod
+    def _string_set(value: Any) -> set[str]:
+        """Normalise a string or a list/tuple/set of items into a set of non-empty strings."""
+        items = [value] if isinstance(value, str) else value
+        if not isinstance(items, list | tuple | set):
+            return set()
+        return {str(entry) for entry in items if entry not in (None, "")}
+
     async def execute(self, *, tool_input: dict[str, Any], context: ToolContext) -> ToolResult:
         self.normalize_input(tool_input)
         rollback_target_error = self._validate_rollback_target_limit()
diff --git a/src/iac_code/pipeline/engine/completion_guard_state.py b/src/iac_code/pipeline/engine/completion_guard_state.py
new file mode 100644
index 00000000..ffc9a997
--- /dev/null
+++ b/src/iac_code/pipeline/engine/completion_guard_state.py
@@ -0,0 +1,83 @@
+"""State helpers for completion guards that depend on prior tool results."""
+
+from __future__ import annotations
+
+import json
+import logging
+from typing import Any
+
+logger = logging.getLogger(__name__)
+
+
+def ensure_completion_guard_state(state: dict[str, Any]) -> dict[str, Any]:
+    """Fill in any missing completion-guard containers on ``state`` in place and return it."""
+    for key, factory in (("successful_tools", set), ("tool_results", dict), ("tool_result_records", list)):
+        state.setdefault(key, factory())
+    return state
+
+
+def record_completion_guard_tool_result(
+    state: dict[str, Any],
+    *,
+    tool_name: str,
+    tool_input: dict[str, Any],
+    content: Any,
+    is_error: bool,
+) -> None:
+    """Record an ``ask_user_question`` or ``ros_stack`` result in ``state``; other tools are ignored."""
+
+    try:
+        ensure_completion_guard_state(state)
+        if tool_name == "ask_user_question":
+            _record_ask_user_question(state, content, is_error=is_error)
+        elif tool_name == "ros_stack":
+            _record_ros_stack(state, tool_input, content, is_error=is_error)
+    except Exception:
+        # Best-effort bookkeeping: failures are logged instead of propagating.
+        logger.warning("Failed to rebuild completion guard state", exc_info=True)
+
+
+def _record_ask_user_question(state: dict[str, Any], content: Any, *, is_error: bool) -> None:
+    """Mark ``ask_user_question`` as successful and keep its answer under ``tool_results``.
+
+    Error results are ignored entirely. Content that is not a JSON object is stored as a
+    free-text answer with empty selection fields.
+    """
+    if is_error:
+        return
+    state.setdefault("successful_tools", set()).add("ask_user_question")
+    results: dict[str, Any] = state.setdefault("tool_results", {})
+    answer = _json_object(content)
+    if answer is None:
+        answer = {"selected_id": "", "selected_label": "", "free_text": str(content)}
+    results["ask_user_question"] = answer
+
+
+def _record_ros_stack(state: dict[str, Any], tool_input: dict[str, Any], content: Any, *, is_error: bool) -> None:
+    """Append a ``ros_stack`` result record and refresh the latest-result entry for the tool.
+
+    Content that is not a JSON object is skipped. Error results are still recorded (flagged
+    ``is_error``) but do not mark the tool as successful.
+    """
+    payload = _json_object(content)
+    if payload is None:
+        return
+    state.setdefault("tool_result_records", []).append(
+        {"tool_name": "ros_stack", "input": dict(tool_input), "result": payload, "is_error": bool(is_error)}
+    )
+    state.setdefault("tool_results", {})["ros_stack"] = payload
+    if not is_error:
+        state.setdefault("successful_tools", set()).add("ros_stack")
+
+
+def _json_object(value: Any) -> dict[str, Any] | None:
+    """Return ``value`` as a dict, decoding a JSON string when needed; ``None`` otherwise."""
+    if isinstance(value, str) and value:
+        try:
+            value = json.loads(value)
+        except json.JSONDecodeError:
+            logger.warning("Failed to parse completion guard state", exc_info=True)
+            return None
+    elif not isinstance(value, dict):
+        return None
+    return value if isinstance(value, dict) else None
diff --git a/src/iac_code/pipeline/engine/events.py b/src/iac_code/pipeline/engine/events.py
index fc90116b..8999fc78 100644
--- a/src/iac_code/pipeline/engine/events.py
+++ b/src/iac_code/pipeline/engine/events.py
@@ -11,6 +11,7 @@ class PipelineEventType(str, Enum):
     PIPELINE_COMPLETED = "pipeline_completed"
     PIPELINE_RESUMED = "pipeline_resumed"
     PIPELINE_ERROR = "pipeline_error"
+    PIPELINE_WARNING = "pipeline_warning"
 
     STEP_STARTED = "step_started"
     STEP_COMPLETED = "step_completed"
diff --git a/src/iac_code/pipeline/engine/interrupt.py b/src/iac_code/pipeline/engine/interrupt.py
index 3f15f903..5cc3c120 100644
--- a/src/iac_code/pipeline/engine/interrupt.py
+++ b/src/iac_code/pipeline/engine/interrupt.py
@@ -10,6 +10,13 @@
 from pathlib import Path
 from typing import Any, Callable, Literal
 
+from iac_code.agent.message import ImageBlock
+from iac_code.pipeline.engine.user_input import (
+    IMAGE_INPUT_PLACEHOLDER,
+    PipelineUserInput,
+    normalize_pipeline_user_input,
+)
+
 logger = logging.getLogger(__name__)
 
 # LLM judge calls typically take 2-8s, but in parallel-pipeline mode candidate
@@ -72,15 +79,16 @@ def __init__(
         self._get_state = pipeline_state_getter
         self._pipeline_dir = pipeline_dir
 
-    async def judge(self, user_message: str) -> InterruptVerdict:
+    async def judge(self, user_message: str | PipelineUserInput) -> InterruptVerdict:
         """Judge a user message. Returns verdict. Defaults to 'continue' on failure."""
         import time
 
+        pipeline_input = normalize_pipeline_user_input(user_message)
         started = time.monotonic()
-        logger.info("interrupt judge START: message=%r", user_message[:200])
+        logger.info("interrupt judge START: message=%r", pipeline_input.display_text[:200])
         try:
             verdict = await asyncio.wait_for(
-                self._call_judge_llm(user_message),
+                self._call_judge_llm(pipeline_input),
                 timeout=JUDGE_TIMEOUT_SECONDS,
             )
             logger.info(
@@ -105,19 +113,32 @@ async def judge(self, user_message: str) -> InterruptVerdict:
             logger.warning("interrupt judge FAILED: %s", e, exc_info=True)
             return InterruptVerdict(action="continue", reason=f"judge failed: {type(e).__name__}: {e}")
 
-    async def _call_judge_llm(self, user_message: str) -> InterruptVerdict:
+    async def _call_judge_llm(self, user_message: str | PipelineUserInput) -> InterruptVerdict:
         """Make the actual LLM call and parse the response."""
+        from iac_code.providers.base import ContentBlock as ProviderContentBlock
         from iac_code.providers.base import Message as ProviderMessage
 
+        pipeline_input = normalize_pipeline_user_input(user_message)
         state = self._get_state()
         system_prompt = self._build_judge_system_prompt(state)
-        user_prompt = self._build_judge_user_prompt(user_message, state)
+        user_prompt = self._build_judge_user_prompt(pipeline_input, state)
+        provider_content: str | list[ProviderContentBlock]
+        if pipeline_input.has_images and isinstance(pipeline_input.content, list):
+            provider_blocks = [ProviderContentBlock(type="text", text=user_prompt)]
+            for block in pipeline_input.content:
+                if isinstance(block, ImageBlock):
+                    provider_blocks.append(
+                        ProviderContentBlock(type="image", media_type=block.media_type, data=block.data)
+                    )
+            provider_content = provider_blocks
+        else:
+            provider_content = user_prompt
 
         max_attempts = 2
         last_response_text = ""
         for attempt in range(max_attempts):
             response = await self._provider_manager.complete(
-                messages=[ProviderMessage.user(user_prompt)],
+                messages=[ProviderMessage(role="user", content=provider_content)],
                 system=system_prompt,
             )
             last_response_text = response.text
@@ -187,8 +208,9 @@ def _default_judge_system_prompt(self) -> str:
             "输出严格的 JSON 格式，不要包含其他文字。"
         )
 
-    def _build_judge_user_prompt(self, user_message: str, state: dict) -> str:
+    def _build_judge_user_prompt(self, user_message: str | PipelineUserInput, state: dict) -> str:
         """Build the user prompt with full pipeline context."""
+        pipeline_input = normalize_pipeline_user_input(user_message)
         sections = []
 
         # Pipeline structure
@@ -229,7 +251,14 @@ def _build_judge_user_prompt(self, user_message: str, state: dict) -> str:
             sections.append("=== Sub-pipeline 可回滚步骤 ===\n" + "\n".join(lines))
 
         # User message
-        sections.append(f"=== 用户新消息 ===\n{user_message}")
+        user_text = pipeline_input.display_text
+        if pipeline_input.has_images:
+            user_text = user_text if user_text.strip() else IMAGE_INPUT_PLACEHOLDER
+            user_text += (
+                "\n\n用户同时提供了图片输入。请检查图片内容，并在 reason 或 rollback_context "
+                "中写出与路由相关的图像信息。"
+            )
+        sections.append(f"=== 用户新消息 ===\n{user_text}")
 
         # Available actions
         sections.append(
diff --git a/src/iac_code/pipeline/engine/loader.py b/src/iac_code/pipeline/engine/loader.py
index 309c86d2..c1cc59c1 100644
--- a/src/iac_code/pipeline/engine/loader.py
+++ b/src/iac_code/pipeline/engine/loader.py
@@ -20,9 +20,9 @@
     LoadedPipeline,
     OnCompletePolicy,
     StepSpec,
+    StepSurfaceOverride,
     SubPipelineSpec,
 )
-from iac_code.pipeline.engine.types import RollbackRule
 
 logger = logging.getLogger(__name__)
 
@@ -195,10 +195,6 @@ def _parse_sub_pipelines(
 def _parse_steps(raw_steps: list[dict]) -> list[StepSpec]:
     steps: list[StepSpec] = []
     for raw in raw_steps:
-        rollback_rules = [
-            RollbackRule(target_step=r["target"], condition=r["condition"]) for r in raw.get("rollback", [])
-        ]
-
         raw_tools = raw.get("tools")
         if raw_tools is not None:
             tools = IncludeExcludeConfig(
@@ -217,6 +213,7 @@ def _parse_steps(raw_steps: list[dict]) -> list[StepSpec]:
         else:
             step_sections = None
 
+        step_id = raw.get("id", "?")
         steps.append(
             StepSpec(
                 step_id=raw["id"],
@@ -227,7 +224,6 @@ def _parse_steps(raw_steps: list[dict]) -> list[StepSpec]:
                 step_type=raw.get("type", "normal"),
                 sub_pipeline_name=raw.get("sub_pipeline"),
                 tools=tools,
-                rollback_rules=rollback_rules,
                 auto_advance=raw.get("auto_advance", True),
                 max_agent_turns=raw.get("max_agent_turns", 50),
                 context_fields=raw.get("context_fields", []),
@@ -244,13 +240,55 @@ def _parse_steps(raw_steps: list[dict]) -> list[StepSpec]:
                 ),
                 completion_guards=raw.get("completion_guards", []),
                 description=raw.get("description", ""),
-                exit_condition=_parse_exit_condition(raw.get("exit_condition"), raw.get("id", "?")),
-                a2a_artifacts=_parse_a2a_artifacts(raw.get("a2a_artifacts"), raw.get("id", "?")),
+                exit_condition=_parse_exit_condition(raw.get("exit_condition"), step_id),
+                a2a_artifacts=_parse_a2a_artifacts(raw.get("a2a_artifacts"), step_id),
+                surface_overrides=_parse_surface_overrides(raw.get("surface_overrides"), step_id),
             )
         )
     return steps
 
 
+def _parse_surface_overrides(raw: object, step_id: str) -> dict[str, StepSurfaceOverride]:
+    """Validate a step's ``surface_overrides`` mapping and build one override per surface.
+
+    Raises ``ValueError`` naming the step for any malformed key, entry, ``prompt`` or ``inject_tools``.
+    """
+    if raw is None:
+        return {}
+    if not isinstance(raw, dict):
+        raise ValueError(f"Step '{step_id}': surface_overrides must be a mapping, got {raw!r}")
+
+    supported_keys = {"prompt", "inject_tools"}
+    parsed: dict[str, StepSurfaceOverride] = {}
+    for surface, entry in raw.items():
+        if not isinstance(surface, str) or not surface:
+            raise ValueError(f"Step '{step_id}': surface_overrides keys must be non-empty strings, got {surface!r}")
+        if not isinstance(entry, dict):
+            raise ValueError(f"Step '{step_id}': surface_overrides.{surface} must be a mapping, got {entry!r}")
+        override = cast(dict[str, Any], entry)
+        unknown_keys = set(override) - supported_keys
+        if unknown_keys:
+            raise ValueError(
+                f"Step '{step_id}': surface_overrides.{surface} contains unsupported key(s): "
+                f"{', '.join(sorted(unknown_keys))}; supported: {', '.join(sorted(supported_keys))}"
+            )
+
+        prompt = override.get("prompt")
+        if not (prompt is None or isinstance(prompt, str)):
+            raise ValueError(f"Step '{step_id}': surface_overrides.{surface}.prompt must be a string")
+
+        tool_names = override.get("inject_tools")
+        if tool_names is not None:
+            if not (isinstance(tool_names, list) and all(isinstance(name, str) for name in tool_names)):
+                raise ValueError(
+                    f"Step '{step_id}': surface_overrides.{surface}.inject_tools must be a list of strings"
+                )
+            tool_names = list(cast(list[str], tool_names))
+
+        parsed[surface] = StepSurfaceOverride(prompt_file=prompt, inject_tools=tool_names)
+    return parsed
+
+
 def _parse_a2a_artifacts(raw: object, step_id: str) -> list[A2AArtifactSpec]:
     if raw is None:
         return []
@@ -321,7 +359,7 @@ def _find_next_enabled(all_steps: list[StepSpec], start_id: str, enabled_ids: se
 
 
 def _bind_hooks(steps: list[StepSpec], pipeline_dir: Path) -> None:
-    """Load hook files and bind on_enter/on_exit callables."""
+    """Load hook files and bind optional step hook callables."""
     for step in steps:
         if not step.hooks_file:
             continue
@@ -333,6 +371,10 @@ def _bind_hooks(steps: list[StepSpec], pipeline_dir: Path) -> None:
             step.on_enter = module.on_enter
         if hasattr(module, "on_exit"):
             step.on_exit = module.on_exit
+        if hasattr(module, "on_resource_observed"):
+            step.on_resource_observed = module.on_resource_observed
+        if hasattr(module, "on_rollback_cleanup_required"):
+            step.on_rollback_cleanup_required = module.on_rollback_cleanup_required
 
 
 def _load_module_from_file(path: Path, module_name: str) -> ModuleType:
@@ -346,11 +388,16 @@ def _load_module_from_file(path: Path, module_name: str) -> ModuleType:
 
 def _validate_prompts_exist(steps: list[StepSpec], pipeline_dir: Path) -> None:
     for step in steps:
-        if not step.prompt_file:
-            continue
-        prompt_path = pipeline_dir / step.prompt_file
-        if not prompt_path.exists():
-            raise FileNotFoundError(f"Prompt file not found: {prompt_path}")
+        prompt_files = [step.prompt_file]
+        prompt_files.extend(
+            override.prompt_file for override in step.surface_overrides.values() if override.prompt_file is not None
+        )
+        for prompt_file in prompt_files:
+            if not prompt_file:
+                continue
+            prompt_path = pipeline_dir / prompt_file
+            if not prompt_path.exists():
+                raise FileNotFoundError(f"Prompt file not found: {prompt_path}")
 
 
 def _discover_pipeline_tools(pipeline_dir: Path) -> dict[str, type]:
diff --git a/src/iac_code/pipeline/engine/pipeline_runner.py b/src/iac_code/pipeline/engine/pipeline_runner.py
index 529e8477..5e8d7a6d 100644
--- a/src/iac_code/pipeline/engine/pipeline_runner.py
+++ b/src/iac_code/pipeline/engine/pipeline_runner.py
@@ -16,6 +16,12 @@
 
 from iac_code.agent.message import ContentBlock, Message, ToolResultBlock
 from iac_code.i18n import _
+from iac_code.pipeline.engine.cleanup import (
+    CleanupLedger,
+    CleanupLedgerWriteStatus,
+    CleanupResource,
+    ObservedResource,
+)
 from iac_code.pipeline.engine.context import PipelineContext
 from iac_code.pipeline.engine.display_replay import DISPLAY_TRANSCRIPT_FILENAME
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
@@ -24,20 +30,30 @@
 from iac_code.pipeline.engine.loader import load_pipeline_dir
 from iac_code.pipeline.engine.observability import PipelineObservability
 from iac_code.pipeline.engine.public_errors import public_error, public_error_from_exception
+from iac_code.pipeline.engine.resume_recovery import reconcile_resume_messages, user_message_already_in_resume
 from iac_code.pipeline.engine.session import PipelineIdentity, PipelineSession, RestoreResult
 from iac_code.pipeline.engine.state_machine import StateMachine
 from iac_code.pipeline.engine.step_executor import StepExecutor
 from iac_code.pipeline.engine.step_spec import AllowUserEscapes, LoadedPipeline, OnCompletePolicy, StepSpec
 from iac_code.pipeline.engine.sub_pipeline_executor import SubPipelineExecutor
 from iac_code.pipeline.engine.types import StepResult, StepStatus
-from iac_code.pipeline.engine.ui_contract import PipelineStepType
-from iac_code.types.stream_events import StreamEvent
+from iac_code.pipeline.engine.ui_contract import PipelineStepType, parse_selected_candidate
+from iac_code.pipeline.engine.user_input import (
+    PipelineInputContent,
+    PipelineUserInput,
+    normalize_pipeline_user_input,
+)
+from iac_code.types.stream_events import ResourceObservedEvent, StreamEvent
 from iac_code.utils.public_errors import sanitize_public_text
 
 logger = logging.getLogger(__name__)
 
 _TERMINAL_SIDECAR_STATUSES = {"completed", "user_aborted", "failed", "discarded"}
 _CURRENT_STEP_USER_INPUT_KEY = "current_step_user_input"
+_CURRENT_STEP_USER_INPUT_CONTENT_KEY = "current_step_user_input_content"
+_CURRENT_STEP_RESUME_MESSAGES_KEY = "current_step_resume_messages"
+_CURRENT_STEP_PRECOMPLETED_TOOLS_KEY = "current_step_precompleted_tools"
+_PENDING_ASK_USER_QUESTION_RESUME_KEY = "pending_ask_user_question_resume"
 _PENDING_INPUT_KIND_KEY = "pending_input_kind"
 _PIPELINE_PAUSE_CONFIRMATION_KIND = "pipeline_pause_confirmation"
 _REAL_RESTORE_FAILURE_REASONS = {
@@ -50,24 +66,34 @@
 }
 
 
+class PipelineStatePersistenceError(RuntimeError):
+    """Raised when recovery-critical pipeline state cannot be persisted; ``step_id`` is optional context."""
+
+    def __init__(self, message: str, *, step_id: str | None = None) -> None:
+        super().__init__(message)
+        self.step_id = step_id
+
+
 def _string_answer_value(value: Any) -> str:
     return value if isinstance(value, str) else ""
 
 
 def _user_input_received_data(
-    user_input: str,
+    user_input: PipelineUserInput,
     *,
     ui_mode: str | None,
     selected_index: int | None,
     waiting_options: list[Any],
 ) -> dict[str, Any]:
-    data: dict[str, Any] = {"user_input_length": len(user_input)}
+    data: dict[str, Any] = {"user_input_length": len(user_input.display_text)}
+    if user_input.has_images:
+        data["has_images"] = True
     if ui_mode != "candidate_selection":
         return data
     data.update(
         {
             "kind": "candidate_selection",
-            "selected_value": user_input,
+            "selected_value": user_input.display_text,
         }
     )
     if selected_index is not None:
@@ -79,10 +105,85 @@ def _user_input_received_data(
     return data
 
 
-def _pipeline_pause_input_received_data(user_input: str) -> dict[str, Any]:
-    return {
+def _pipeline_pause_input_received_data(user_input: PipelineUserInput) -> dict[str, Any]:
+    data: dict[str, Any] = {
         "kind": _PIPELINE_PAUSE_CONFIRMATION_KIND,
-        "user_input_length": len(user_input),
+        "user_input_length": len(user_input.display_text),
+    }
+    if user_input.has_images:
+        data["has_images"] = True
+    return data
+
+
+def _serialize_pipeline_input_content(content: PipelineInputContent) -> str | list[dict[str, Any]]:
+    """Serialize input content by wrapping it in a user ``Message`` and taking its ``to_dict()`` content."""
+    return cast(str | list[dict[str, Any]], Message(role="user", content=content).to_dict()["content"])
+
+
+def _deserialize_pipeline_input_content(value: Any) -> PipelineInputContent | None:
+    """Rebuild pipeline input content from its serialized form; ``None`` when it cannot be restored."""
+    if not isinstance(value, list):
+        return value if isinstance(value, str) else None
+    try:
+        content = Message(role="user", content=value).content
+    except Exception:
+        # Best-effort restore: any failure while rebuilding the message means "no content".
+        return None
+    return content if isinstance(content, list) else None
+
+
+def _serialize_pipeline_messages(messages: list[Message]) -> list[dict[str, Any]]:
+    return [msg.to_dict() for msg in messages]
+
+
+def _deserialize_pipeline_messages(value: Any) -> list[Message] | None:
+    """Restore a list of ``Message`` objects from serialized dicts.
+
+    Returns ``None`` unless ``value`` is a list whose items are all dicts that ``Message.from_dict`` accepts.
+    """
+    if not isinstance(value, list) or not all(isinstance(item, dict) for item in value):
+        return None
+    try:
+        return [Message.from_dict(item) for item in value]
+    except Exception:
+        # Malformed payloads are treated as "nothing to restore".
+        return None
+
+
+def _deserialize_precompleted_tools(value: Any) -> dict[str, dict[str, Any]] | None:
+    """Copy the well-formed ``name -> payload`` entries of ``value``; ``None`` if ``value`` is not a dict.
+
+    Entries whose name is not a string or whose payload is not a dict are dropped silently.
+    """
+    if not isinstance(value, dict):
+        return None
+    return {name: dict(data) for name, data in value.items() if isinstance(name, str) and isinstance(data, dict)}
+
+
+def _serialize_ask_user_question_resume_state(
+    *,
+    user_message: PipelineInputContent,
+    resume_messages: list[Message] | None,
+    precompleted_tools: dict[str, dict[str, Any]] | None,
+) -> dict[str, Any]:
+    """Build the persisted resume payload for a pending ask_user_question; ``None`` parts are omitted."""
+    payload: dict[str, Any] = {"user_message": _serialize_pipeline_input_content(user_message)}
+    if resume_messages is not None:
+        payload["resume_messages"] = _serialize_pipeline_messages(resume_messages)
+    payload.update({} if precompleted_tools is None else {"precompleted_tools": precompleted_tools})
+    return payload
+
+
+def _deserialize_ask_user_question_resume_state(value: Any) -> dict[str, Any] | None:
+    """Restore the ask_user_question resume payload; ``None`` if it or its ``user_message`` is invalid."""
+    restored = _deserialize_pipeline_input_content(value.get("user_message")) if isinstance(value, dict) else None
+    if restored is None:
+        return None
+    # Optional parts come back as ``None`` when absent or unreadable.
+    return {
+        "user_message": restored,
+        "resume_messages": _deserialize_pipeline_messages(value.get("resume_messages")),
+        "precompleted_tools": _deserialize_precompleted_tools(value.get("precompleted_tools")),
     }
 
 
@@ -193,6 +294,7 @@ class RestartInfo:
     start_from_step: str | None
     preserved_conclusions: dict[str, Any]
     rollback_context: str | None = None
+    rollback_input: PipelineInputContent | None = None
 
 
 @dataclass
@@ -225,6 +327,7 @@ def __init__(
         memory_content_getter: Callable[[], str] | None = None,
         auto_trigger_skills: list[Any] | None = None,
         resume_from_sidecar: bool = False,
+        surface: str = "repl",
     ) -> None:
         self._session_storage = session_storage
         self._session_id = session_id
@@ -232,6 +335,7 @@ def __init__(
         self._permission_context_getter = permission_context_getter
         self._memory_content_getter = memory_content_getter
         self._auto_trigger_skills = auto_trigger_skills or []
+        self._surface = surface
 
         self._pipeline_dir = pipeline_dir
         self._loaded: LoadedPipeline = load_pipeline_dir(pipeline_dir)
@@ -247,7 +351,9 @@ def __init__(
         self._sidecar_status: str | None = None
         self._sidecar_restore_result: RestoreResult | None = None
         self._current_step_user_input: str | None = None
-        self._restored_current_step_user_input: str | None = None
+        self._restored_current_step_user_input: PipelineUserInput | None = None
+        self._restored_current_step_resume_messages: list[Message] | None = None
+        self._restored_current_step_precompleted_tools: dict[str, dict[str, Any]] | None = None
         self._last_applied_interrupt_verdict: InterruptVerdict | None = None
         self._waiting_input_started_at: dict[str, float] = {}
         self._waiting_input_options_by_step: dict[str, list[Any]] = {}
@@ -292,6 +398,7 @@ def __init__(
             permission_context_getter=self._permission_context_getter,
             memory_content_getter=self._memory_content_getter,
             auto_trigger_skills=self._auto_trigger_skills,
+            surface=self._surface,
         )
         self._apply_telemetry_correlation(self._step_executor)
 
@@ -307,7 +414,11 @@ def __init__(
         self._active_candidates: dict[int, Any] = {}
         self._pending_candidate_restarts: dict[int, RestartInfo] = {}
         self._rollback_context: str | None = None
-        self._restored_supplement: dict[str, str | None] | None = None
+        self._rollback_input: PipelineInputContent | None = None
+        self._current_step_user_input_content: PipelineInputContent | None = None
+        self._current_step_resume_messages: list[Message] | None = None
+        self._current_step_precompleted_tools: dict[str, dict[str, Any]] | None = None
+        self._restored_supplement: dict[str, Any] | None = None
         # Total candidate count for the currently-executing parallel sub-pipeline
         # step. 0 when no parallel step is in flight. Used by apply_hard_interrupt
         # to detect scope="all" with partial completion and escalate to parent
@@ -383,6 +494,165 @@ def display_transcript_path(self) -> Path | None:
             return None
         return self.session.session_dir / DISPLAY_TRANSCRIPT_FILENAME
 
+    def cleanup_ledger(self) -> CleanupLedger | None:
+        """Return a ledger bound to the session's ``cleanup.yaml``, or None without a usable session dir."""
+        session = getattr(self, "session", None)
+        session_dir = None if session is None else getattr(session, "session_dir", None)
+        if isinstance(session_dir, (str, Path)):
+            # Only str/Path session directories can be turned into a ledger path.
+            return CleanupLedger(Path(session_dir) / "cleanup.yaml")
+        return None
+
+    def _handle_resource_observed(
+        self,
+        step: StepSpec,
+        event: ResourceObservedEvent,
+        *,
+        attempt_id: str | None,
+    ) -> list[PipelineEvent]:
+        """Run the step's ``on_resource_observed`` hook and record what it reports.
+
+        Without a ledger or callable hook, or when the hook raises (logged), returns
+        ``[]``. Otherwise returns a warning event per ledger write reporting
+        ``unavailable``; a raising ledger write becomes ``PipelineStatePersistenceError``.
+        """
+        observer = getattr(step, "on_resource_observed", None)
+        ledger = self.cleanup_ledger()
+        if ledger is None or not callable(observer):
+            return []
+        try:
+            hook_result = observer(self.context, event, ledger=ledger, step_id=step.step_id, attempt_id=attempt_id)
+        except Exception:
+            logger.warning("Pipeline resource-observed hook failed: step_id=%s", step.step_id, exc_info=True)
+            return []
+        warning_events: list[PipelineEvent] = []
+        for resource in self._observed_resources_from_hook_result(hook_result):
+            try:
+                write_status = ledger.record_observed(resource)
+            except Exception as exc:
+                logger.warning(
+                    "Failed to persist observed cleanup resource: step_id=%s resource_id=%s error=%s",
+                    step.step_id,
+                    resource.resource_id,
+                    exc,
+                    exc_info=True,
+                )
+                raise PipelineStatePersistenceError(
+                    "pipeline state persistence failed during record_observed_cleanup_resource",
+                    step_id=step.step_id,
+                ) from exc
+            if not write_status.unavailable:
+                continue
+            unavailable_event = self._cleanup_tracking_unavailable_event(
+                step_id=step.step_id,
+                operation="record_observed",
+                ledger=ledger,
+                status=write_status,
+                resource_id=resource.resource_id,
+            )
+            warning_events.append(unavailable_event)
+        return warning_events
+
+    def _mark_rollback_cleanup_required(
+        self,
+        step: StepSpec,
+        to_step: str,
+        reason: str,
+        *,
+        from_attempt_id: str | None,
+    ) -> list[PipelineEvent]:
+        """Mark resources named by the step's rollback-cleanup hook in the ledger; return any warning event."""
+        rollback_hook = getattr(step, "on_rollback_cleanup_required", None)
+        ledger = self.cleanup_ledger()
+        if ledger is None or not callable(rollback_hook):
+            return []
+        try:
+            hook_result = rollback_hook(
+                self.context,
+                ledger=ledger,
+                from_step=step.step_id,
+                from_attempt_id=from_attempt_id,
+                to_step=to_step,
+                reason=reason,
+            )
+        except Exception:
+            logger.warning("Pipeline rollback cleanup hook failed: step_id=%s", step.step_id, exc_info=True)
+            return []
+        to_clean = self._cleanup_resources_from_hook_result(hook_result)
+        if to_clean:
+            try:
+                write_status = ledger.mark_cleanup_required(to_clean, source_step_id=step.step_id, reason=reason)
+            except Exception as exc:
+                logger.warning(
+                    "Failed to persist rollback cleanup resources: step_id=%s target_step_id=%s error=%s",
+                    step.step_id,
+                    to_step,
+                    exc,
+                    exc_info=True,
+                )
+                raise PipelineStatePersistenceError(
+                    "pipeline state persistence failed during mark_rollback_cleanup_required",
+                    step_id=step.step_id,
+                ) from exc
+            if write_status.unavailable:
+                unavailable_event = self._cleanup_tracking_unavailable_event(
+                    step_id=step.step_id,
+                    operation="mark_cleanup_required",
+                    ledger=ledger,
+                    status=write_status,
+                    resource_count=len(to_clean),
+                )
+                return [unavailable_event]
+        return []
+
+    def _cleanup_tracking_unavailable_event(
+        self,
+        *,
+        step_id: str,
+        operation: str,
+        ledger: CleanupLedger,
+        status: CleanupLedgerWriteStatus,
+        resource_id: str | None = None,
+        resource_count: int | None = None,
+    ) -> PipelineEvent:
+        """Log that cleanup tracking is unavailable and build the matching ``PIPELINE_WARNING`` event."""
+        payload: dict[str, Any] = {"reason": "cleanup_tracking_unavailable", "operation": operation}
+        # Optional identifiers are attached only when given (truthy id / non-None count).
+        if resource_id:
+            payload["resource_id"] = resource_id
+        if resource_count is not None:
+            payload["resource_count"] = resource_count
+        # The ledger path and load error go to the log only, not into the event data.
+        logger.warning(
+            "Pipeline cleanup tracking unavailable: step_id=%s operation=%s ledger_path=%s error=%s",
+            step_id,
+            operation,
+            ledger.path,
+            status.load_error,
+        )
+        return PipelineEvent(
+            type=PipelineEventType.PIPELINE_WARNING,
+            step_id=step_id,
+            timestamp=time.time(),
+            data=payload,
+        )
+
+    @staticmethod
+    def _observed_resources_from_hook_result(result: object) -> list[ObservedResource]:
+        """Normalize a hook result to a list: one resource is wrapped, a list is filtered, else empty."""
+        candidates = [result] if isinstance(result, ObservedResource) else result
+        if not isinstance(candidates, list):
+            return []
+        return [entry for entry in candidates if isinstance(entry, ObservedResource)]
+
+    @staticmethod
+    def _cleanup_resources_from_hook_result(result: object) -> list[CleanupResource]:
+        """Normalize a hook result to a list: one resource is wrapped, a list is filtered, else empty."""
+        candidates = [result] if isinstance(result, CleanupResource) else result
+        if not isinstance(candidates, list):
+            return []
+        return [entry for entry in candidates if isinstance(entry, CleanupResource)]
+
     def _build_pipeline_identity(self, pipeline_dir: Path) -> PipelineIdentity:
         yaml_path = pipeline_dir / "pipeline.yaml"
         digest = hashlib.sha256(yaml_path.read_bytes()).hexdigest()
@@ -426,7 +696,7 @@ def mark_normal_handoff(self, status: str, failed_reason: str | None = None) ->
         current_step = self._terminal_current_step_id()
         normal_handoff = {
             "status": status,
-            "switched_to_normal": True,
+            "switched_to_normal": status in {"succeeded", "failed"},
             "root_session_id": self._session_id,
             "summary_message_appended": status == "succeeded",
             "failed_reason": failed_reason,
@@ -490,9 +760,7 @@ def restore_from_sidecar_sync(self) -> RestoreResult:
             max_rollbacks=self._loaded.max_rollbacks,
         )
         self._step_attempts = self._step_attempts_from_snapshot(result.state_machine_snapshot)
-        restored_user_input = result.state_machine_snapshot.get(_CURRENT_STEP_USER_INPUT_KEY)
-        self._restored_current_step_user_input = restored_user_input if isinstance(restored_user_input, str) else None
-        self._current_step_user_input = self._restored_current_step_user_input
+        self._restore_current_step_user_input_from_snapshot(result.state_machine_snapshot)
         self.context = PipelineContext.from_snapshot(result.context_snapshot, self._loaded.context_dependencies)
         if result.execution is not None:
             self._execution = dict(result.execution)
@@ -521,52 +789,61 @@ async def restore_from_sidecar(self) -> RestoreResult:
         return self.restore_from_sidecar_sync()
 
     def continue_from_sidecar(
-        self, user_input: str | None = None
+        self, user_input: str | list[ContentBlock] | PipelineUserInput | None = None
     ) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
         if not user_input:
             return self._continue_from_current(resume_running_step=True)
         return self._continue_from_sidecar_with_input(user_input)
 
     async def _continue_from_sidecar_with_input(
-        self, user_input: str
+        self, user_input: str | list[ContentBlock] | PipelineUserInput
     ) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
+        pipeline_input = normalize_pipeline_user_input(user_input)
+        user_text = pipeline_input.display_text
         was_pause_confirmation = self.has_pending_pipeline_pause_confirmation()
         if was_pause_confirmation:
             self._set_pending_input_kind(None)
             current_step = getattr(self.state_machine, "current_step", None)
             step_id = getattr(current_step, "step_id", None)
+            self._set_current_step_user_input(pipeline_input)
+            try:
+                await self._save_running(str(step_id or ""), reason="pipeline pause confirmation received")
+            except PipelineStatePersistenceError as exc:
+                yield self._persistence_failure_event(exc)
+                return
             yield PipelineEvent(
                 type=PipelineEventType.USER_INPUT_RECEIVED,
                 step_id=step_id,
                 timestamp=time.time(),
-                data=_pipeline_pause_input_received_data(user_input),
+                data=_pipeline_pause_input_received_data(pipeline_input),
             )
-            if user_input.strip().lower() == "continue":
+            if user_text.strip().lower() == "continue":
                 self.resume_agent_loops()
                 async for event in self._continue_from_current(user_input=None, resume_running_step=True):
                     yield event
                 return
         try:
-            verdict = await self._interrupt_controller.judge(user_input)
+            judge_input: str | PipelineUserInput = pipeline_input if pipeline_input.has_images else user_text
+            verdict = await self._interrupt_controller.judge(judge_input)
         except Exception as exc:
             logger.warning("Interrupt judge failed during sidecar continuation: %s", exc, exc_info=True)
             verdict = self._apply_interrupt_judge_failure_policy(
                 InterruptVerdict(action="continue", reason=f"judge failed: {exc}")
             )
-            async for event in self._continue_after_sidecar_judgment_failure(verdict, user_input=user_input):
+            async for event in self._continue_after_sidecar_judgment_failure(verdict, user_input=pipeline_input):
                 yield event
             return
 
         if self._is_judgment_error_verdict(verdict):
             verdict = self._apply_interrupt_judge_failure_policy(verdict)
-            async for event in self._continue_after_sidecar_judgment_failure(verdict, user_input=user_input):
+            async for event in self._continue_after_sidecar_judgment_failure(verdict, user_input=pipeline_input):
                 yield event
             return
         if verdict.action == "supplement":
             self.resume_agent_loops()
             if self._current_step_is_parallel_sub_pipeline():
                 self._restored_supplement = {
-                    "message": user_input,
+                    "message": pipeline_input.content,
                     "target": verdict.supplement_target,
                 }
                 try:
@@ -575,11 +852,14 @@ async def _continue_from_sidecar_with_input(
                 finally:
                     self._restored_supplement = None
                 return
-            async for event in self._continue_from_current(user_input=user_input, resume_running_step=True):
+            async for event in self._continue_from_current(
+                **self._continue_input_kwargs(pipeline_input),
+                resume_running_step=True,
+            ):
                 yield event
             return
         if verdict.action == "hard_interrupt":
-            async for event in self._continue_after_sidecar_hard_interrupt(verdict):
+            async for event in self._continue_after_sidecar_hard_interrupt(verdict, source_input=pipeline_input):
                 yield event
             return
 
@@ -588,23 +868,36 @@ async def _continue_from_sidecar_with_input(
             yield event
 
     async def _continue_after_sidecar_judgment_failure(
-        self, verdict: InterruptVerdict, *, user_input: str
+        self, verdict: InterruptVerdict, *, user_input: PipelineUserInput
     ) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
         if verdict.paused:
-            yield await self._save_and_emit_interrupt_pause(verdict)
+            try:
+                yield await self._save_and_emit_interrupt_pause(verdict)
+            except PipelineStatePersistenceError as exc:
+                yield self._persistence_failure_event(exc)
             return
         if verdict.action == "hard_interrupt":
-            async for event in self._continue_after_sidecar_hard_interrupt(verdict):
+            async for event in self._continue_after_sidecar_hard_interrupt(verdict, source_input=user_input):
                 yield event
             return
         self.resume_agent_loops()
-        async for event in self._continue_from_current(user_input=user_input, resume_running_step=True):
+        async for event in self._continue_from_current(
+            **self._continue_input_kwargs(user_input),
+            resume_running_step=True,
+        ):
             yield event
 
     async def _continue_after_sidecar_hard_interrupt(
-        self, verdict: InterruptVerdict
+        self, verdict: InterruptVerdict, *, source_input: PipelineUserInput | None = None
     ) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
-        parent_rollback = self.apply_hard_interrupt(verdict)
+        try:
+            if source_input is not None and source_input.has_images:
+                parent_rollback = self.apply_hard_interrupt(verdict, source_input=source_input)
+            else:
+                parent_rollback = self.apply_hard_interrupt(verdict)
+        except PipelineStatePersistenceError as exc:
+            yield self._persistence_failure_event(exc)
+            return
         if self.sidecar_status == "failed":
             current_step = getattr(self.state_machine, "current_step", None)
             yield PipelineEvent(
@@ -717,10 +1010,12 @@ def _persisted_candidate_restart_info(state: dict[str, Any]) -> RestartInfo | No
         preserved_conclusions = restart.get("preserved_conclusions")
         if not isinstance(preserved_conclusions, dict):
             preserved_conclusions = {}
+        rollback_input = _deserialize_pipeline_input_content(restart.get("rollback_input"))
         return RestartInfo(
             start_from_step=start_from_step,
             preserved_conclusions=preserved_conclusions,
             rollback_context=rollback_context,
+            rollback_input=rollback_input,
         )
 
     def _persisted_parallel_candidate_indices(self) -> list[int]:
@@ -761,16 +1056,91 @@ def _state_machine_snapshot_for_sidecar(self) -> dict[str, Any]:
         current_step_user_input = getattr(self, "_current_step_user_input", None)
         if current_step_user_input is not None:
             snapshot[_CURRENT_STEP_USER_INPUT_KEY] = current_step_user_input
+        current_step_user_input_content = getattr(self, "_current_step_user_input_content", None)
+        if current_step_user_input_content is not None:
+            snapshot[_CURRENT_STEP_USER_INPUT_CONTENT_KEY] = _serialize_pipeline_input_content(
+                current_step_user_input_content
+            )
+        current_step_resume_messages = getattr(self, "_current_step_resume_messages", None)
+        if current_step_resume_messages is not None:
+            snapshot[_CURRENT_STEP_RESUME_MESSAGES_KEY] = _serialize_pipeline_messages(current_step_resume_messages)
+        current_step_precompleted_tools = getattr(self, "_current_step_precompleted_tools", None)
+        if current_step_precompleted_tools is not None:
+            snapshot[_CURRENT_STEP_PRECOMPLETED_TOOLS_KEY] = current_step_precompleted_tools
         return snapshot
 
-    def _set_current_step_user_input(self, user_input: str | list[ContentBlock] | None) -> None:
-        self._current_step_user_input = user_input if isinstance(user_input, str) else None
+    def _restore_current_step_user_input_from_snapshot(self, snapshot: dict[str, Any]) -> None:
+        """Load the current step's user input and resume state from a state-machine snapshot.
+
+        Fills both the ``_restored_*`` fields and the live ``_current_step_*`` fields.
+        """
+        display_text = snapshot.get(_CURRENT_STEP_USER_INPUT_KEY)
+        if not isinstance(display_text, str):
+            display_text = None
+        content = _deserialize_pipeline_input_content(snapshot.get(_CURRENT_STEP_USER_INPUT_CONTENT_KEY))
+        if content is None:
+            # No structured content could be restored; fall back to the display text.
+            content = display_text
+        restored: PipelineUserInput | None = None
+        if content is not None:
+            restored = normalize_pipeline_user_input(content, display_text=display_text)
+        self._restored_current_step_user_input = restored
+        self._current_step_user_input = display_text
+        # Structured content is kept only when the restored input has images.
+        keep_content = restored is not None and restored.has_images
+        self._current_step_user_input_content = restored.content if keep_content else None
+        resume_messages = _deserialize_pipeline_messages(snapshot.get(_CURRENT_STEP_RESUME_MESSAGES_KEY))
+        self._restored_current_step_resume_messages = resume_messages
+        precompleted = _deserialize_precompleted_tools(snapshot.get(_CURRENT_STEP_PRECOMPLETED_TOOLS_KEY))
+        self._restored_current_step_precompleted_tools = precompleted
+        self._current_step_resume_messages = resume_messages
+        self._current_step_precompleted_tools = precompleted
+
+    def _set_current_step_user_input(
+        self,
+        user_input: str | list[ContentBlock] | PipelineUserInput | None,
+        *,
+        display_text: str | None = None,
+    ) -> None:
+        """Record the current step's input; ``None`` also clears stored content and resume state."""
+        if user_input is not None:
+            normalized = normalize_pipeline_user_input(user_input, display_text=display_text)
+            self._current_step_user_input = normalized.display_text if display_text is None else display_text
+            self._current_step_user_input_content = normalized.content if normalized.has_images else None
+            return
+        self._current_step_user_input = self._current_step_user_input_content = None
+        self._set_current_step_resume_state()
 
-    def _consume_restored_current_step_user_input(self) -> str | None:
+    def _set_current_step_resume_state(
+        self,
+        *,
+        resume_messages: list[Message] | None = None,
+        precompleted_tools: dict[str, dict[str, Any]] | None = None,
+    ) -> None:  # stores shallow copies of the given values; None clears the corresponding field
+        self._current_step_resume_messages = list(resume_messages) if resume_messages is not None else None
+        self._current_step_precompleted_tools = dict(precompleted_tools) if precompleted_tools is not None else None
+
+    @staticmethod
+    def _continue_input_kwargs(user_input: PipelineUserInput) -> dict[str, Any]:
+        """Build continuation kwargs; the display text is added only when it differs from plain-string content."""
+        content, text = user_input.content, user_input.display_text
+        extra = {} if isinstance(content, str) and text == content else {"user_input_display_text": text}
+        return {"user_input": content, **extra}
+
+    def _consume_restored_current_step_user_input(self) -> PipelineUserInput | None:
         user_input = self._restored_current_step_user_input
         self._restored_current_step_user_input = None
         return user_input
 
+    def _consume_restored_current_step_resume_state(
+        self,
+    ) -> tuple[list[Message] | None, dict[str, dict[str, Any]] | None]:
+        """Return the restored ``(resume_messages, precompleted_tools)`` pair and clear both fields."""
+        restored = (self._restored_current_step_resume_messages, self._restored_current_step_precompleted_tools)
+        self._restored_current_step_resume_messages = None
+        self._restored_current_step_precompleted_tools = None
+        return restored
+
     def _step_attempts_from_snapshot(self, snapshot: dict[str, Any]) -> dict[str, int]:
         attempts = snapshot.get("step_attempts", {})
         if not isinstance(attempts, dict):
@@ -968,61 +1338,99 @@ def _attempt_has_resume_transcript(self, attempt: dict[str, Any] | None) -> bool
             return False
         return bool(self._transcript_storage.load(self._cwd, transcript_id))
 
+    def _record_sidecar_save_failure(self, status: str, operation: str, exc: Exception) -> None:
+        self._sidecar_status = None  # clear the recorded sidecar status
+        observability = getattr(self, "_observability", None)  # tolerates a missing attribute
+        if observability is not None:
+            failure = public_error_from_exception(exc)
+            observability.sidecar_failed(
+                operation=operation,
+                status=status,
+                error_type=failure.details["type"],
+                error_summary=failure.summary,
+                error_id=failure.error_id,
+            )
+        logger.warning(
+            "Failed to persist pipeline sidecar during %s (pipeline=%s, session_id=%s, status=%s)",
+            operation,
+            getattr(getattr(self, "_loaded", None), "name", ""),  # "" when the pipeline is not loaded or unnamed
+            getattr(self, "_session_id", ""),
+            status,
+            exc_info=True,
+        )
+
+    def _append_pipeline_session_meta_best_effort(self, meta: dict[str, Any], *, operation: str) -> None:
+        try:
+            self._session_storage.append_meta(self._cwd, self._session_id, meta)
+        except Exception:  # best effort: a failed append is logged and not re-raised
+            logger.warning(
+                "Failed to append pipeline session metadata during %s (pipeline=%s, session_id=%s, meta_type=%s)",
+                operation,
+                getattr(getattr(self, "_loaded", None), "name", ""),
+                getattr(self, "_session_id", ""),
+                meta.get("type"),
+                exc_info=True,
+            )
+
+    def _persistence_failure_event(self, exc: PipelineStatePersistenceError) -> PipelineEvent:
+        step_id = exc.step_id  # prefer the step recorded on the exception
+        try:
+            current_step = getattr(self.state_machine, "current_step", None)
+            step_id = step_id or getattr(current_step, "step_id", None)
+        except (AttributeError, IndexError):  # lookup failed; fall back to the terminal step id
+            step_id = step_id or self._terminal_current_step_id() or None
+        return PipelineEvent(
+            type=PipelineEventType.STEP_FAILED,
+            step_id=step_id,
+            timestamp=time.time(),
+            data={
+                "error": _("Pipeline state persistence failed."),
+                "error_summary": _("Pipeline state persistence failed."),
+                "error_details": {"type": "PipelineStatePersistenceError"},  # matched by _is_persistence_failure_event
+            },
+        )
+
+    @staticmethod
+    def _is_persistence_failure_event(event: object) -> bool:
+        """True only for STEP_FAILED events whose ``error_details`` type is PipelineStatePersistenceError."""
+        is_step_failure = isinstance(event, PipelineEvent) and event.type == PipelineEventType.STEP_FAILED
+        details = event.data.get("error_details", {}) if is_step_failure else None
+        return isinstance(details, dict) and details.get("type") == "PipelineStatePersistenceError"
+
     async def _try_save_sidecar(
         self,
         status: str,
         operation: str,
         save: Callable[[], Awaitable[None]],
+        *,
+        step_id: str | None = None,
     ) -> None:
         try:
             await save()
         except Exception as exc:
-            self._sidecar_status = None
-            observability = getattr(self, "_observability", None)
-            if observability is not None:
-                failure = public_error_from_exception(exc)
-                observability.sidecar_failed(
-                    operation=operation,
-                    status=status,
-                    error_type=failure.details["type"],
-                    error_summary=failure.summary,
-                    error_id=failure.error_id,
-                )
-            logger.warning(
-                "Failed to persist pipeline sidecar during %s (pipeline=%s, session_id=%s, status=%s)",
-                operation,
-                getattr(getattr(self, "_loaded", None), "name", ""),
-                getattr(self, "_session_id", ""),
-                status,
-                exc_info=True,
-            )
-            return
+            self._record_sidecar_save_failure(status, operation, exc)
+            raise PipelineStatePersistenceError(
+                f"pipeline state persistence failed during {operation}",
+                step_id=step_id,
+            ) from exc
         self._sidecar_status = status
 
-    def _try_save_sidecar_sync(self, status: str, operation: str, save: Callable[[], None]) -> None:
+    def _try_save_sidecar_sync(
+        self,
+        status: str,
+        operation: str,
+        save: Callable[[], None],
+        *,
+        step_id: str | None = None,
+    ) -> None:
         try:
             save()
         except Exception as exc:
-            self._sidecar_status = None
-            observability = getattr(self, "_observability", None)
-            if observability is not None:
-                failure = public_error_from_exception(exc)
-                observability.sidecar_failed(
-                    operation=operation,
-                    status=status,
-                    error_type=failure.details["type"],
-                    error_summary=failure.summary,
-                    error_id=failure.error_id,
-                )
-            logger.warning(
-                "Failed to persist pipeline sidecar during %s (pipeline=%s, session_id=%s, status=%s)",
-                operation,
-                getattr(getattr(self, "_loaded", None), "name", ""),
-                getattr(self, "_session_id", ""),
-                status,
-                exc_info=True,
-            )
-            return
+            self._record_sidecar_save_failure(status, operation, exc)
+            raise PipelineStatePersistenceError(
+                f"pipeline state persistence failed during {operation}",
+                step_id=step_id,
+            ) from exc
         self._sidecar_status = status
 
     async def _save_running(self, current_step: str, reason: str | None = None) -> None:
@@ -1045,7 +1453,7 @@ async def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        await self._try_save_sidecar("running", "save_running", save)
+        await self._try_save_sidecar("running", "save_running", save, step_id=current_step)
 
     def _save_running_sync(self, current_step: str, reason: str | None = None) -> None:
         if not self.session:
@@ -1067,7 +1475,7 @@ def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        self._try_save_sidecar_sync("running", "save_running_sync", save)
+        self._try_save_sidecar_sync("running", "save_running_sync", save, step_id=current_step)
 
     async def _save_waiting_input(self, current_step: str) -> None:
         if not self.session:
@@ -1089,7 +1497,7 @@ async def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        await self._try_save_sidecar("waiting_input", "save_waiting_input", save)
+        await self._try_save_sidecar("waiting_input", "save_waiting_input", save, step_id=current_step)
 
     async def _save_completed(self, current_step: str, reason: str | None = None) -> None:
         if not self.session:
@@ -1111,7 +1519,7 @@ async def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        await self._try_save_sidecar("completed", "save_completed", save)
+        await self._try_save_sidecar("completed", "save_completed", save, step_id=current_step)
 
     async def _save_failed(self, current_step: str, reason: str) -> None:
         self._mark_active_attempt_failed()
@@ -1134,7 +1542,7 @@ async def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        await self._try_save_sidecar("failed", "save_failed", save)
+        await self._try_save_sidecar("failed", "save_failed", save, step_id=current_step)
 
     def _save_failed_sync(self, current_step: str, reason: str) -> None:
         self._mark_active_attempt_failed()
@@ -1157,7 +1565,7 @@ def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        self._try_save_sidecar_sync("failed", "save_failed_sync", save)
+        self._try_save_sidecar_sync("failed", "save_failed_sync", save, step_id=current_step)
 
     def mark_user_aborted(self, reason: str) -> None:
         self._mark_active_attempt_failed_preserve_execution()
@@ -1193,7 +1601,7 @@ def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        self._try_save_sidecar_sync("user_aborted", "save_user_aborted_sync", save)
+        self._try_save_sidecar_sync("user_aborted", "save_user_aborted_sync", save, step_id=current_step or None)
 
     async def _save_rollback(self, from_step: str, to_step: str, reason: str) -> None:
         if not self.session:
@@ -1216,7 +1624,7 @@ async def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        await self._try_save_sidecar("running", "save_rollback", save)
+        await self._try_save_sidecar("running", "save_rollback", save, step_id=from_step)
 
     def _save_rollback_sync(self, from_step: str, to_step: str, reason: str) -> None:
         session = getattr(self, "session", None)
@@ -1239,17 +1647,21 @@ def save() -> None:
                 attempts=dict(self._attempts),
             )
 
-        self._try_save_sidecar_sync("running", "save_rollback_sync", save)
+        self._try_save_sidecar_sync("running", "save_rollback_sync", save, step_id=from_step)
 
     async def _save_after_advance(self, completed_step_id: str) -> None:
         self._set_current_step_user_input(None)
-        if self.state_machine.is_complete:
-            await self._save_completed(completed_step_id, reason="pipeline completed")
-            return
-        await self._save_running(
-            self.state_machine.current_step.step_id,
-            reason=f"advanced from {completed_step_id}",
-        )
+        try:
+            if self.state_machine.is_complete:
+                await self._save_completed(completed_step_id, reason="pipeline completed")
+                return
+            await self._save_running(
+                self.state_machine.current_step.step_id,
+                reason=f"advanced from {completed_step_id}",
+            )
+        except PipelineStatePersistenceError as exc:
+            exc.step_id = completed_step_id  # re-attribute the failure to the step that just completed
+            raise
 
     def iter_active_agent_loops(self):
         """Yield all currently-active AgentLoops (problem 6 — /status aggregation).
@@ -1362,6 +1774,7 @@ def _restored_parallel_prompt_contexts(self, current_step: StepSpec) -> list[Pro
             permission_context_getter=self._permission_context_getter,
             memory_content_getter=self._memory_content_getter,
             auto_trigger_skills=self._auto_trigger_skills,
+            surface=self._surface,
         )
         self._apply_telemetry_correlation(sub_context_executor)
         sub_context_dependencies = sub_context_executor._sub_context_dependencies(sub_spec)
@@ -1404,6 +1817,7 @@ def _restored_parallel_prompt_contexts(self, current_step: StepSpec) -> list[Pro
                 permission_context_getter=self._permission_context_getter,
                 memory_content_getter=self._memory_content_getter,
                 auto_trigger_skills=self._auto_trigger_skills,
+                surface=self._surface,
             )
             self._apply_telemetry_correlation(step_executor)
             agent_context = step_executor.build_agent_loop_context(
@@ -1448,6 +1862,11 @@ def _option_display_value(option: Any) -> str | None:
         return None
 
     def _infer_selected_index(self, selected_value: str, options: list[Any]) -> int | None:
+        structured = parse_selected_candidate(selected_value)
+        if structured is not None and structured.selected_candidate_index is not None:
+            idx = structured.selected_candidate_index
+            if 0 <= idx < len(options):
+                return idx
         matches = [idx for idx, option in enumerate(options) if self._option_display_value(option) == selected_value]
         if len(matches) == 1:
             return matches[0]
@@ -1504,15 +1923,21 @@ def _prompt_context_from_agent_loop(
             sub_pipeline_id=sub_pipeline_id,
         )
 
-    async def run(self, user_input: str) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
+    async def run(
+        self, user_input: str | list[ContentBlock] | PipelineUserInput
+    ) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
         """Start the pipeline from the first step."""
-        self._session_storage.append_meta(
-            self._cwd,
-            self._session_id,
+        pipeline_input = normalize_pipeline_user_input(user_input)
+        self._set_current_step_user_input(pipeline_input)
+        try:
+            await self._save_running(self.state_machine.current_step.step_id, reason="pipeline started")
+        except PipelineStatePersistenceError as exc:
+            yield self._persistence_failure_event(exc)
+            return
+        self._append_pipeline_session_meta_best_effort(
             {"type": "pipeline_init", "pipeline_type": self._loaded.name},
+            operation="pipeline_init",
         )
-        self._set_current_step_user_input(user_input)
-        await self._save_running(self.state_machine.current_step.step_id, reason="pipeline started")
         self._observability.pipeline_started(
             total_steps=self.state_machine.total_steps,
             step_names=list(self.state_machine._order),
@@ -1528,16 +1953,20 @@ async def run(self, user_input: str) -> AsyncGenerator[StreamEvent | PipelineEve
             },
         )
         with self._observability.pipeline_run_span(total_steps=self.state_machine.total_steps):
-            async for event in self._continue_from_current(user_input=user_input):
+            async for event in self._continue_from_current(**self._continue_input_kwargs(pipeline_input)):
                 yield event
 
-    async def resume(self, user_input: str) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
+    async def resume(
+        self, user_input: str | list[ContentBlock] | PipelineUserInput
+    ) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
         """Resume after user input at a USER_INPUT_REQUIRED pause."""
         if self.has_pending_pipeline_pause_confirmation():
             async for event in self._continue_from_sidecar_with_input(user_input):
                 yield event
             return
 
+        pipeline_input = normalize_pipeline_user_input(user_input)
+        user_text = pipeline_input.display_text
         step = self.state_machine.current_step
         step_index = self.state_machine.current_step_index + 1
         step_attempt = self._current_step_attempt(step.step_id)
@@ -1552,48 +1981,57 @@ async def resume(self, user_input: str) -> AsyncGenerator[StreamEvent | Pipeline
             if isinstance(restored_options, list):
                 waiting_options = restored_options
         selected_index: int | None = None
-        self._observability.user_input_received(
-            step_id=step.step_id,
-            step_index=step_index,
-            step_attempt=step_attempt,
-            total_steps=self.state_machine.total_steps,
-            ui_mode=step.ui_mode,
-            user_input=user_input,
-            wait_duration_ms=wait_duration_ms,
-        )
         if step.ui_mode == "candidate_selection":
-            selected_index = self._infer_selected_index(user_input, waiting_options)
+            selected_index = self._infer_selected_index(user_text, waiting_options)
             if selected_index is None:
                 logger.debug(
                     "Pipeline candidate selection did not match a unique option: step_id=%s option_count=%d",
                     step.step_id,
                     len(waiting_options),
                 )
-            else:
-                self._observability.selection_made(
-                    step_id=step.step_id,
-                    step_attempt=step_attempt,
-                    ui_mode=step.ui_mode,
-                    option_count=len(waiting_options),
-                    selected_index=selected_index,
-                    selected_value=user_input,
-                )
-        current_conclusion["user_input"] = user_input
+        current_conclusion["user_input"] = user_text
         self.context.set_conclusion(step.conclusion_field, current_conclusion)
+        self._set_current_step_user_input(pipeline_input)
+        try:
+            await self._save_running(step.step_id, reason="user input received")
+        except PipelineStatePersistenceError as exc:
+            yield self._persistence_failure_event(exc)
+            return
+        self._observability.user_input_received(
+            step_id=step.step_id,
+            step_index=step_index,
+            step_attempt=step_attempt,
+            total_steps=self.state_machine.total_steps,
+            ui_mode=step.ui_mode,
+            user_input=user_text,
+            wait_duration_ms=wait_duration_ms,
+        )
+        if step.ui_mode == "candidate_selection" and selected_index is not None:
+            self._observability.selection_made(
+                step_id=step.step_id,
+                step_attempt=step_attempt,
+                ui_mode=step.ui_mode,
+                option_count=len(waiting_options),
+                selected_index=selected_index,
+                selected_value=user_text,
+            )
 
         yield PipelineEvent(
             type=PipelineEventType.USER_INPUT_RECEIVED,
             step_id=step.step_id,
             timestamp=time.time(),
             data=_user_input_received_data(
-                user_input,
+                pipeline_input,
                 ui_mode=step.ui_mode,
                 selected_index=selected_index,
                 waiting_options=waiting_options,
             ),
         )
 
-        async for event in self._continue_from_current(user_input=user_input, resume_waiting_step=True):
+        async for event in self._continue_from_current(
+            **self._continue_input_kwargs(pipeline_input),
+            resume_waiting_step=True,
+        ):
             yield event
 
     async def resume_ask_user_question(
@@ -1602,6 +2040,7 @@ async def resume_ask_user_question(
         *,
         tool_use_id: str,
         pending_input: dict[str, Any] | None = None,
+        supplemental_input: str | list[ContentBlock] | PipelineUserInput | None = None,
     ) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
         """Resume an in-step ask_user_question after process restart."""
         payload = {
@@ -1621,16 +2060,32 @@ async def resume_ask_user_question(
             content=json.dumps(payload, ensure_ascii=False),
             is_error=False,
         )
+        supplemental = normalize_pipeline_user_input(supplemental_input) if supplemental_input is not None else None
+        if supplemental is not None and not supplemental.has_images:
+            supplemental = None
+        tool_result_message = Message(role="user", content=[tool_result])
+        user_message: str | list[ContentBlock] | None = (
+            supplemental.content if supplemental is not None else [tool_result]
+        )
         candidate_index = _candidate_index_from_pending_input(pending_input)
         if candidate_index is not None:
             step = self.state_machine.current_step
             if step.step_type == PipelineStepType.PARALLEL_SUB_PIPELINE.value:
                 previous = getattr(self, "_restored_ask_user_question", None)
+                candidate_resume_messages = [tool_result_message] if supplemental is not None else None
+                candidate_precompleted_tools = {"ask_user_question": payload}
                 self._restored_ask_user_question = {
                     "candidate_index": candidate_index,
-                    "user_message": [tool_result],
-                    "precompleted_tools": {"ask_user_question": payload},
+                    "user_message": user_message,
+                    "resume_messages": candidate_resume_messages,
+                    "precompleted_tools": candidate_precompleted_tools,
                 }
+                self._set_candidate_ask_user_question_resume_state(
+                    candidate_index,
+                    user_message=user_message,
+                    resume_messages=candidate_resume_messages,
+                    precompleted_tools=candidate_precompleted_tools,
+                )
                 try:
                     async for event in self._continue_from_current(resume_running_step=True):
                         yield event
@@ -1642,8 +2097,19 @@ async def resume_ask_user_question(
                         self._restored_ask_user_question = previous
                 return
 
+        if supplemental is not None:
+            async for event in self._continue_from_current(
+                **self._continue_input_kwargs(supplemental),
+                resume_messages=[*resume_messages, tool_result_message],
+                precompleted_tools={"ask_user_question": payload},
+                resume_waiting_step=True,
+            ):
+                yield event
+            return
+
+        resume_kwargs: dict[str, Any] = {"user_input": user_message}
         async for event in self._continue_from_current(
-            user_input=[tool_result],
+            **resume_kwargs,
             resume_messages=resume_messages,
             precompleted_tools={"ask_user_question": payload},
             resume_waiting_step=True,
@@ -1767,16 +2233,20 @@ def _get_state_for_judge(self) -> dict:
 
         return state
 
-    async def handle_user_interrupt(self, message: str) -> InterruptVerdict:
+    async def handle_user_interrupt(self, message: str | list[ContentBlock] | PipelineUserInput) -> InterruptVerdict:
         """Engine-layer interrupt entry point. All clients call this uniformly."""
 
-        verdict = await self._interrupt_controller.judge(message)
+        pipeline_input = normalize_pipeline_user_input(message)
+        judge_input: str | PipelineUserInput = (
+            pipeline_input if pipeline_input.has_images else pipeline_input.display_text
+        )
+        verdict = await self._interrupt_controller.judge(judge_input)
 
         if self._is_judgment_error_verdict(verdict):
             return self._apply_interrupt_judge_failure_policy(verdict)
 
         if verdict.action == "supplement":
-            injected = self._inject_supplement(verdict, message)
+            injected = self._inject_supplement(verdict, pipeline_input.content)
             if not injected:
                 # Don't silently lose the user's message — flag it via reason
                 # prefix so the UI can render a clear "supplement was dropped"
@@ -1829,7 +2299,25 @@ def resume_agent_loops(self) -> None:
         """
         self._agent_pause_event.set()
 
-    def apply_hard_interrupt(self, verdict: InterruptVerdict) -> bool:
+    @staticmethod
+    def _input_for_interrupt_verdict(
+        verdict: InterruptVerdict,
+        source_input: str | list[ContentBlock] | PipelineUserInput | None,
+    ) -> PipelineUserInput | None:
+        source = normalize_pipeline_user_input(source_input) if source_input is not None else None
+        rollback_context = verdict.rollback_context or ""
+        if source is None:
+            return normalize_pipeline_user_input(rollback_context) if rollback_context else None
+        if rollback_context:
+            return source.with_prepended_text(rollback_context)
+        return source
+
+    def apply_hard_interrupt(
+        self,
+        verdict: InterruptVerdict,
+        *,
+        source_input: str | list[ContentBlock] | PipelineUserInput | None = None,
+    ) -> bool:
         """Execute state rollback after hard interrupt.
 
         Returns True if a parent-level rollback was performed (caller should
@@ -1844,6 +2332,7 @@ def apply_hard_interrupt(self, verdict: InterruptVerdict) -> bool:
                 getattr(self, "_session_id", ""),
             )
             self._rollback_context = None
+            self._rollback_input = None
             return False
 
         target = verdict.rollback_target or self.state_machine.current_step.step_id
@@ -1889,7 +2378,10 @@ def apply_hard_interrupt(self, verdict: InterruptVerdict) -> bool:
                 target = self.state_machine.current_step.step_id
 
         if is_candidate_restart:
-            self._schedule_candidate_restart(verdict)
+            if source_input is None:
+                self._schedule_candidate_restart(verdict)
+            else:
+                self._schedule_candidate_restart(verdict, source_input=source_input)
             self._emit_hard_interrupt_telemetry(
                 rollback_scope="candidate",
                 from_step=from_step,
@@ -1928,9 +2420,11 @@ def apply_hard_interrupt(self, verdict: InterruptVerdict) -> bool:
                 logger.warning("Cannot apply hard interrupt fallback target %r: %s", target, validation_error)
                 self._save_failed_sync(from_step, fallback_reason)
                 self._rollback_context = None
+                self._rollback_input = None
                 return False
             verdict = replace(verdict, rollback_target=target, reason=fallback_reason)
 
+        cleanup_from_step = self.state_machine.current_step
         self.state_machine.interrupt_rollback(target, verdict.reason)
         current_attempt_id = self._execution.get("active_attempt_id")
         self._mark_attempt_status(current_attempt_id, "discarded")
@@ -1938,8 +2432,16 @@ def apply_hard_interrupt(self, verdict: InterruptVerdict) -> bool:
         target_field = next((s.conclusion_field for s in self._loaded.steps if s.step_id == target), None)
         if target_field:
             self.context.mark_stale(target_field)
-        self._rollback_context = verdict.rollback_context
-        self._set_current_step_user_input(verdict.rollback_context)
+        rollback_input = self._input_for_interrupt_verdict(verdict, source_input)
+        self._rollback_context = rollback_input.display_text if rollback_input is not None else None
+        self._rollback_input = rollback_input.content if rollback_input is not None else None
+        self._set_current_step_user_input(rollback_input)
+        self._mark_rollback_cleanup_required(
+            cleanup_from_step,
+            target,
+            verdict.reason,
+            from_attempt_id=current_attempt_id if isinstance(current_attempt_id, str) else None,
+        )
         self._save_rollback_sync(from_step, target, verdict.reason)
         hard_interrupt_attrs = {
             "rollback_scope": "parent",
@@ -2030,19 +2532,26 @@ def _cancel_active_candidates(self, reason: str = "cancelled") -> list[asyncio.T
 
     def continue_after_interrupt(self) -> AsyncGenerator[StreamEvent | PipelineEvent | StepResult, None]:
         """Create a new event stream after interrupt rollback."""
+        rollback_input = self._rollback_input
         context = self._rollback_context
+        self._rollback_input = None
         self._rollback_context = None
+        if rollback_input is not None:
+            kwargs: dict[str, Any] = {"user_input": rollback_input}
+            if not isinstance(rollback_input, str) or context != rollback_input:
+                kwargs["user_input_display_text"] = context
+            return self._continue_from_current(**kwargs)
         return self._continue_from_current(user_input=context)
 
     @staticmethod
-    def _try_inject_into_agent_loop(agent_loop: object | None, message: str) -> bool:
+    def _try_inject_into_agent_loop(agent_loop: object | None, message: PipelineInputContent) -> bool:
         if agent_loop is None:
             return False
 
         if inspect.getattr_static(agent_loop, "try_inject_user_message", None) is not None:
             try_inject = getattr(agent_loop, "try_inject_user_message", None)
             if callable(try_inject):
-                return bool(try_inject(message))
+                return try_inject(message) is not False
 
         can_accept = getattr(agent_loop, "can_accept_injected_user_message", True)
         if can_accept is False:
@@ -2054,7 +2563,7 @@ def _try_inject_into_agent_loop(agent_loop: object | None, message: str) -> bool
         inject(message)
         return True
 
-    def _inject_supplement(self, verdict: InterruptVerdict, message: str) -> bool:
+    def _inject_supplement(self, verdict: InterruptVerdict, message: PipelineInputContent) -> bool:
         """Inject supplement message into the correct AgentLoop.
 
         Returns True if the message was injected into at least one AgentLoop,
@@ -2095,6 +2604,39 @@ def _inject_supplement(self, verdict: InterruptVerdict, message: str) -> bool:
                 return self._try_inject_into_agent_loop(al, message)
         return False
 
+    @staticmethod
+    def _candidate_target_from_pending_question_envelope(envelope: dict[str, Any] | None) -> str | None:
+        if not isinstance(envelope, dict):
+            return None
+        candidate = envelope.get("candidate")
+        if not isinstance(candidate, dict):
+            return None
+        for key in ("index", "candidateIndex", "candidate_index"):
+            value = candidate.get(key)
+            if isinstance(value, int):
+                return f"candidate:{value}"
+            if isinstance(value, str):
+                try:
+                    return f"candidate:{int(value)}"
+                except ValueError:
+                    continue
+        return None
+
+    def inject_pending_question_supplement(
+        self,
+        message: PipelineInputContent,
+        *,
+        envelope: dict[str, Any] | None = None,
+    ) -> bool:
+        """Inject image/text supplied alongside an active ask_user_question answer."""
+        target = self._candidate_target_from_pending_question_envelope(envelope)
+        verdict = InterruptVerdict(
+            action="supplement",
+            reason="ask_user_question supplemental input",
+            supplement_target=target,
+        )
+        return self._inject_supplement(verdict, message)
+
     @staticmethod
     def _candidate_index_from_target(target: str | None) -> int | None:
         if not target or not (target.startswith("candidate:") or target.startswith("candidate_index:")):
@@ -2104,6 +2646,59 @@ def _candidate_index_from_target(target: str | None) -> int | None:
         except (ValueError, IndexError):
             return None
 
+    def _candidate_execution_state_for_resume(self, candidate_index: int) -> dict[str, Any] | None:
+        execution = getattr(self, "_execution", None)
+        if not isinstance(execution, dict):
+            return None
+        candidates = execution.get("candidates")
+        if not isinstance(candidates, dict):
+            return None
+        for key in (str(candidate_index), candidate_index):
+            state = candidates.get(key)
+            if isinstance(state, dict):
+                return state
+        return None
+
+    def _set_candidate_ask_user_question_resume_state(
+        self,
+        candidate_index: int,
+        *,
+        user_message: PipelineInputContent,
+        resume_messages: list[Message] | None,
+        precompleted_tools: dict[str, dict[str, Any]] | None,
+    ) -> None:
+        execution = self._execution if isinstance(self._execution, dict) else {}
+        candidates = execution.setdefault("candidates", {})
+        if not isinstance(candidates, dict):
+            candidates = {}
+            execution["candidates"] = candidates
+        state = candidates.setdefault(str(candidate_index), {})
+        if not isinstance(state, dict):
+            state = {}
+            candidates[str(candidate_index)] = state
+        state[_PENDING_ASK_USER_QUESTION_RESUME_KEY] = _serialize_ask_user_question_resume_state(
+            user_message=user_message,
+            resume_messages=resume_messages,
+            precompleted_tools=precompleted_tools,
+        )
+        self._execution = execution
+
+    def _candidate_ask_user_question_resume_state(self, candidate_index: int) -> dict[str, Any] | None:
+        restored_ask = getattr(self, "_restored_ask_user_question", None)
+        if isinstance(restored_ask, dict) and restored_ask.get("candidate_index") == candidate_index:
+            return restored_ask
+        active_state = getattr(self, "_active_candidates", {}).get(candidate_index)
+        if isinstance(active_state, dict):
+            restored = _deserialize_ask_user_question_resume_state(
+                active_state.get(_PENDING_ASK_USER_QUESTION_RESUME_KEY)
+            )
+            if restored is not None:
+                return restored
+        state = self._candidate_execution_state_for_resume(candidate_index)
+        if state is None:
+            return None
+        return _deserialize_ask_user_question_resume_state(state.get(_PENDING_ASK_USER_QUESTION_RESUME_KEY))
+
     def _candidate_user_message_for_restored_supplement(
         self,
         candidate_index: int,
@@ -2122,20 +2717,24 @@ def _candidate_user_message_for_restored_ask_user_question(
         self,
         candidate_index: int,
     ) -> list[ContentBlock] | None:
-        restored_ask = getattr(self, "_restored_ask_user_question", None)
-        if not isinstance(restored_ask, dict) or restored_ask.get("candidate_index") != candidate_index:
-            return None
-        user_message = restored_ask.get("user_message")
+        restored_ask = self._candidate_ask_user_question_resume_state(candidate_index)
+        user_message = restored_ask.get("user_message") if restored_ask is not None else None
         return user_message if isinstance(user_message, list) else None
 
+    def _candidate_resume_messages_for_restored_ask_user_question(
+        self,
+        candidate_index: int,
+    ) -> list[Message] | None:
+        restored_ask = self._candidate_ask_user_question_resume_state(candidate_index)
+        resume_messages = restored_ask.get("resume_messages") if restored_ask is not None else None
+        return resume_messages if isinstance(resume_messages, list) else None
+
     def _candidate_precompleted_tools_for_restored_ask_user_question(
         self,
         candidate_index: int,
     ) -> dict[str, dict[str, Any]] | None:
-        restored_ask = getattr(self, "_restored_ask_user_question", None)
-        if not isinstance(restored_ask, dict) or restored_ask.get("candidate_index") != candidate_index:
-            return None
-        precompleted_tools = restored_ask.get("precompleted_tools")
+        restored_ask = self._candidate_ask_user_question_resume_state(candidate_index)
+        precompleted_tools = restored_ask.get("precompleted_tools") if restored_ask is not None else None
         return precompleted_tools if isinstance(precompleted_tools, dict) else None
 
     def _requested_candidate_indices(self, scope: str | None) -> list[int]:
@@ -2191,12 +2790,18 @@ def _candidate_current_sub_step_index(self, state: dict[str, Any], step_ids: lis
 
         return None
 
-    def _schedule_candidate_restart(self, verdict: InterruptVerdict) -> None:
+    def _schedule_candidate_restart(
+        self,
+        verdict: InterruptVerdict,
+        *,
+        source_input: str | list[ContentBlock] | PipelineUserInput | None = None,
+    ) -> None:
         """Cancel specified candidate(s) and schedule restart."""
         target_step = verdict.rollback_target
         indices = self._requested_candidate_indices(verdict.candidate_scope)
         current_step = self.state_machine.current_step
         sub_spec = self._loaded.sub_pipelines.get(current_step.sub_pipeline_name or "")
+        rollback_input = self._input_for_interrupt_verdict(verdict, source_input)
 
         for idx in indices:
             state = self._active_candidates.get(idx)
@@ -2210,7 +2815,10 @@ def _schedule_candidate_restart(self, verdict: InterruptVerdict) -> None:
             self._pending_candidate_restarts[idx] = RestartInfo(
                 start_from_step=target_step,
                 preserved_conclusions=preserved,
-                rollback_context=verdict.rollback_context,
+                rollback_context=rollback_input.display_text
+                if rollback_input is not None
+                else verdict.rollback_context,
+                rollback_input=rollback_input.content if rollback_input is not None else None,
             )
             if target_step and sub_spec:
                 sub_pipeline_id = state.get("sub_pipeline_id") or f"{sub_spec.name}_candidate_{idx}"
@@ -2250,6 +2858,15 @@ def _schedule_candidate_restart(self, verdict: InterruptVerdict) -> None:
                     for stale_step in sub_spec.steps[target_index:]:
                         sub_context.mark_stale(stale_step.conclusion_field)
                     context_snapshot = sub_context.to_snapshot()
+                pending_restart: dict[str, Any] = {
+                    "start_from_step": target_step,
+                    "preserved_conclusions": preserved,
+                    "rollback_context": rollback_input.display_text
+                    if rollback_input is not None
+                    else verdict.rollback_context,
+                }
+                if rollback_input is not None and rollback_input.has_images:
+                    pending_restart["rollback_input"] = _serialize_pipeline_input_content(rollback_input.content)
                 entry = {
                     "status": "running",
                     "candidate": state.get("candidate", state.get("raw_candidate", {})),
@@ -2261,11 +2878,7 @@ def _schedule_candidate_restart(self, verdict: InterruptVerdict) -> None:
                     "active_attempt_id": new_attempt["attempt_id"],
                     "transcript_id": new_attempt["transcript_id"],
                     "conclusions": preserved,
-                    "pending_restart": {
-                        "start_from_step": target_step,
-                        "preserved_conclusions": preserved,
-                        "rollback_context": verdict.rollback_context,
-                    },
+                    "pending_restart": pending_restart,
                 }
                 existing_candidate = self._execution.get("candidates", {}).get(str(idx), {}).get("candidate")
                 if existing_candidate is not None:
@@ -2297,6 +2910,7 @@ async def _continue_from_current(
         self,
         user_input: str | list[ContentBlock] | None = None,
         *,
+        user_input_display_text: str | None = None,
         resume_messages: list[Message] | None = None,
         precompleted_tools: dict[str, dict[str, Any]] | None = None,
         resume_waiting_step: bool = False,
@@ -2306,8 +2920,35 @@ async def _continue_from_current(
         terminal_pipeline_telemetry_emitted = False
         step_result: StepResult | None = None
         restored_step_user_input = self._consume_restored_current_step_user_input() if user_input is None else None
-        first_step_user_input = user_input if user_input is not None else restored_step_user_input
+        restored_resume_messages, restored_precompleted_tools = (
+            self._consume_restored_current_step_resume_state() if user_input is None else (None, None)
+        )
+        first_step_user_input = (
+            user_input
+            if user_input is not None
+            else restored_step_user_input.content
+            if restored_step_user_input is not None
+            else None
+        )
+        first_step_user_input_display_text = (
+            user_input_display_text
+            if user_input is not None
+            else restored_step_user_input.display_text
+            if restored_step_user_input is not None
+            else None
+        )
         first_step_user_input_is_restored = user_input is None and restored_step_user_input is not None
+        first_step_resume_messages = resume_messages if resume_messages is not None else restored_resume_messages
+        first_step_precompleted_tools = (
+            precompleted_tools if precompleted_tools is not None else restored_precompleted_tools
+        )
+        if first_step_resume_messages is not None or first_step_precompleted_tools is not None:
+            self._set_current_step_resume_state(
+                resume_messages=first_step_resume_messages,
+                precompleted_tools=first_step_precompleted_tools,
+            )
+        elif user_input is not None:
+            self._set_current_step_resume_state()
 
         def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
             nonlocal terminal_pipeline_telemetry_emitted
@@ -2323,7 +2964,8 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
         while not self.state_machine.is_complete:
             step = self.state_machine.current_step
             step_user_message = first_step_user_input if is_first_step else None
-            self._set_current_step_user_input(step_user_message)
+            step_user_display_text = first_step_user_input_display_text if is_first_step else None
+            self._set_current_step_user_input(step_user_message, display_text=step_user_display_text)
             step_start = time.time()
             step_started_at = self._observability.now()
             step_index = self.state_machine.current_step_index + 1
@@ -2335,10 +2977,18 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
 
             if resume_current_step:
                 step_attempt = self._current_step_attempt(step.step_id)
-                await self._save_running(step.step_id, reason="resumed from user input")
+                try:
+                    await self._save_running(step.step_id, reason="resumed from user input")
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
             else:
                 step_attempt = self._next_step_attempt(step.step_id)
-                await self._save_running(step.step_id, reason="step started")
+                try:
+                    await self._save_running(step.step_id, reason="step started")
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
                 self._observability.step_started(
                     step_id=step.step_id,
                     step_index=step_index,
@@ -2384,13 +3034,19 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
                             emit_step_completed_event=False,
                         ):
                             yield event
+                            if self._is_persistence_failure_event(event):
+                                return
                 except Exception as exc:
                     failure = public_error(
                         message=str(exc) or type(exc).__name__,
                         error_type="StepFailed",
                         extra_details={"step_id": step.step_id},
                     )
-                    await self._save_failed(step.step_id, str(exc) or type(exc).__name__)
+                    try:
+                        await self._save_failed(step.step_id, str(exc) or type(exc).__name__)
+                    except PipelineStatePersistenceError as persistence_exc:
+                        yield self._persistence_failure_event(persistence_exc)
+                        return
                     self._observability.step_failed(
                         step_id=step.step_id,
                         duration_ms=self._observability.duration_ms(step_started_at),
@@ -2425,6 +3081,14 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
                     break
 
                 duration_ms = self._observability.duration_ms(step_started_at)
+                self._mark_attempt_status(attempt.get("attempt_id"), "completed")
+                completed_step_id = step.step_id
+                self.state_machine.advance()
+                try:
+                    await self._save_after_advance(completed_step_id)
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
                 self._observability.step_completed(
                     step_id=step.step_id,
                     duration_ms=duration_ms,
@@ -2444,7 +3108,6 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
                     ui_mode=step.ui_mode,
                     duration_ms=duration_ms,
                 )
-                self._mark_attempt_status(attempt.get("attempt_id"), "completed")
                 if step.forward is None:
                     emit_pipeline_completed(failed=False, early_exit=False)
                 parallel_result = self.context.get_conclusion(step.conclusion_field)
@@ -2460,9 +3123,6 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
                         "conclusion": parallel_result,
                     },
                 )
-                completed_step_id = step.step_id
-                self.state_machine.advance()
-                await self._save_after_advance(completed_step_id)
                 continue
 
             with self._observability.step_span(
@@ -2474,20 +3134,23 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
             ):
                 first_step = is_first_step
                 is_first_step = False
-                step_resume_messages = resume_messages if first_step else None
-                step_precompleted_tools = precompleted_tools if first_step else None
-                if (
-                    step_resume_messages is None
-                    and self._transcript_storage is not None
-                    and attempt.get("status") == "running"
-                ):
+                step_resume_messages = first_step_resume_messages if first_step else None
+                step_precompleted_tools = first_step_precompleted_tools if first_step else None
+                if self._transcript_storage is not None and attempt.get("status") == "running":
                     loaded = self._transcript_storage.load(self._cwd, attempt["transcript_id"])
-                    step_resume_messages = self._transcript_storage.repair_interrupted(loaded)
+                    repaired_resume_messages = self._transcript_storage.repair_interrupted(loaded)
+                    step_resume_messages = reconcile_resume_messages(
+                        repaired_resume_messages,
+                        step_resume_messages,
+                    )
                 if (
                     first_step
                     and first_step_user_input_is_restored
-                    and isinstance(step_user_message, str)
                     and step_resume_messages
+                    and (
+                        isinstance(step_user_message, str)
+                        or user_message_already_in_resume(step_user_message, step_resume_messages)
+                    )
                 ):
                     step_user_message = None
                 execute_kwargs: dict[str, Any] = {
@@ -2518,6 +3181,17 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
                     if isinstance(event, StepResult):
                         step_result = event
                     else:
+                        if isinstance(event, ResourceObservedEvent):
+                            try:
+                                for warning_event in self._handle_resource_observed(
+                                    step,
+                                    event,
+                                    attempt_id=attempt.get("attempt_id"),
+                                ):
+                                    yield warning_event
+                            except PipelineStatePersistenceError as exc:
+                                yield self._persistence_failure_event(exc)
+                                return
                         yield event
 
             if (
@@ -2535,7 +3209,11 @@ def emit_pipeline_completed(*, failed: bool, early_exit: bool) -> None:
                     extra_details={"step_id": step.step_id},
                 )
                 error_summary = failure.summary
-                await self._save_failed(step.step_id, reason)
+                try:
+                    await self._save_failed(step.step_id, reason)
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
                 self._observability.step_failed(
                     step_id=step.step_id,
                     duration_ms=self._observability.duration_ms(step_started_at),
@@ -2598,8 +3276,9 @@ def emit_step_success_observability(funnel_status: str | None = "completed") ->
                         ui_mode=step.ui_mode,
                         duration_ms=duration_ms,
                     )
-                self._session_storage.append_meta(
-                    self._cwd, self._session_id, {"type": "pipeline_step_complete", "step_id": step.step_id}
+                self._append_pipeline_session_meta_best_effort(
+                    {"type": "pipeline_step_complete", "step_id": step.step_id},
+                    operation="pipeline_step_complete",
                 )
                 step_success_observed = True
 
@@ -2621,8 +3300,12 @@ def emit_step_success_observability(funnel_status: str | None = "completed") ->
                 matched = actual is ec_value if isinstance(ec_value, bool) else actual == ec_value
                 if matched:
                     logger.info("Exit condition met for step %s: %s=%r", step.step_id, ec_field, ec_value)
+                    try:
+                        await self._save_completed(step.step_id, reason="exit condition met")
+                    except PipelineStatePersistenceError as exc:
+                        yield self._persistence_failure_event(exc)
+                        return
                     emit_step_success_observability()
-                    await self._save_completed(step.step_id, reason="exit condition met")
                     emit_pipeline_completed(failed=False, early_exit=True)
                     yield step_completed_event
                     yield PipelineEvent(
@@ -2637,7 +3320,7 @@ def emit_step_success_observability(funnel_status: str | None = "completed") ->
                 target, reason = step_result.rollback_request
                 current_attempt_id = attempt.get("attempt_id")
                 try:
-                    self.state_machine.rollback(target, reason, allow_completed_non_future=True)
+                    self.state_machine.rollback(target, reason)
                 except ValueError as exc:
                     valid_targets = self.state_machine.completed_non_future_rollback_targets()
                     error_message = f"Invalid rollback target {target!r}. Valid targets: {valid_targets}. ({exc})"
@@ -2656,7 +3339,11 @@ def emit_step_success_observability(funnel_status: str | None = "completed") ->
                         step.step_id,
                         valid_targets,
                     )
-                    await self._save_failed(step.step_id, str(exc))
+                    try:
+                        await self._save_failed(step.step_id, str(exc))
+                    except PipelineStatePersistenceError as persistence_exc:
+                        yield self._persistence_failure_event(persistence_exc)
+                        return
                     self._observability.step_failed(
                         step_id=step.step_id,
                         duration_ms=self._observability.duration_ms(step_started_at),
@@ -2707,9 +3394,24 @@ def emit_step_success_observability(funnel_status: str | None = "completed") ->
                 self._create_parent_attempt(target)
                 target_field = next((s.conclusion_field for s in self._loaded.steps if s.step_id == target), None)
                 stale = self.context.mark_stale(target_field) if target_field else []
-                emit_step_success_observability()
                 self._set_current_step_user_input(None)
-                await self._save_rollback(step.step_id, target, reason)
+                try:
+                    for warning_event in self._mark_rollback_cleanup_required(
+                        step,
+                        target,
+                        reason,
+                        from_attempt_id=current_attempt_id if isinstance(current_attempt_id, str) else None,
+                    ):
+                        yield warning_event
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
+                try:
+                    await self._save_rollback(step.step_id, target, reason)
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
+                emit_step_success_observability()
                 self._observability.rollback(
                     from_step=step.step_id,
                     to_step=target,
@@ -2717,10 +3419,9 @@ def emit_step_success_observability(funnel_status: str | None = "completed") ->
                     rollback_scope="parent",
                     stale_fields=stale,
                 )
-                self._session_storage.append_meta(
-                    self._cwd,
-                    self._session_id,
+                self._append_pipeline_session_meta_best_effort(
                     {"type": "pipeline_rollback", "from": step.step_id, "to": target, "reason": reason},
+                    operation="pipeline_rollback",
                 )
                 yield step_completed_event
                 yield PipelineEvent(
@@ -2737,18 +3438,26 @@ def emit_step_success_observability(funnel_status: str | None = "completed") ->
                 continue
 
             if step.auto_advance or resume_current_step:
+                completed_step_id = step.step_id
+                self.state_machine.advance()
+                try:
+                    await self._save_after_advance(completed_step_id)
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
                 emit_step_success_observability()
                 if step.forward is None:
                     emit_pipeline_completed(failed=False, early_exit=False)
                 yield step_completed_event
-                completed_step_id = step.step_id
-                self.state_machine.advance()
-                await self._save_after_advance(completed_step_id)
             else:
+                self._set_current_step_user_input(None)
+                try:
+                    await self._save_waiting_input(step.step_id)
+                except PipelineStatePersistenceError as exc:
+                    yield self._persistence_failure_event(exc)
+                    return
                 emit_step_success_observability(funnel_status=None)
                 yield step_completed_event
-                self._set_current_step_user_input(None)
-                await self._save_waiting_input(step.step_id)
                 conclusion = step_result.conclusion or {}
                 prompt = conclusion.get("user_prompt", "")
                 options = conclusion.get("options", [])
@@ -2845,6 +3554,7 @@ async def _execute_parallel_sub_pipeline(
                 permission_context_getter=self._permission_context_getter,
                 memory_content_getter=self._memory_content_getter,
                 auto_trigger_skills=self._auto_trigger_skills,
+                surface=self._surface,
             )
             for _ in candidates
         ]
@@ -2902,6 +3612,12 @@ async def save_candidate_execution_state(
             conclusions = payload.get("conclusions")
             if conclusions is not None:
                 entry["conclusions"] = conclusions
+            active_state = self._active_candidates.get(i)
+            pending_ask_resume = (
+                active_state.get(_PENDING_ASK_USER_QUESTION_RESUME_KEY) if isinstance(active_state, dict) else None
+            )
+            if pending_ask_resume is not None and entry["status"] == "running":
+                entry[_PENDING_ASK_USER_QUESTION_RESUME_KEY] = pending_ask_resume
             self._execution.setdefault("candidates", {})[str(i)] = entry
             await self._save_running(step.step_id, reason=reason or "parallel sub-pipeline running")
 
@@ -2965,6 +3681,9 @@ async def run_candidate(
                 "active_attempt_id": (resume_state or {}).get("active_attempt_id"),
                 "transcript_id": (resume_state or {}).get("transcript_id"),
             }
+            pending_ask_resume = (resume_state or {}).get(_PENDING_ASK_USER_QUESTION_RESUME_KEY)
+            if pending_ask_resume is not None:
+                state[_PENDING_ASK_USER_QUESTION_RESUME_KEY] = pending_ask_resume
             self._active_candidates[i] = state
 
             def allocate_sub_step_attempt(request: dict[str, Any]) -> dict[str, Any]:
@@ -3009,11 +3728,14 @@ async def record_sub_step_state(payload: dict[str, Any]) -> None:
                 start_from_step = restart_info.start_from_step if restart_info else None
                 preserved_conclusions = restart_info.preserved_conclusions if restart_info else None
                 candidate_user_message = (
-                    restart_info.rollback_context
+                    restart_info.rollback_input
+                    if restart_info and restart_info.rollback_input is not None
+                    else restart_info.rollback_context
                     if restart_info
                     else self._candidate_user_message_for_restored_supplement(i, user_message)
                 )
                 ask_user_message = self._candidate_user_message_for_restored_ask_user_question(i)
+                candidate_resume_messages = self._candidate_resume_messages_for_restored_ask_user_question(i)
                 candidate_precompleted_tools = self._candidate_precompleted_tools_for_restored_ask_user_question(i)
                 if ask_user_message is not None:
                     candidate_user_message = ask_user_message
@@ -3030,6 +3752,8 @@ async def record_sub_step_state(payload: dict[str, Any]) -> None:
                     }
                     if "precompleted_tools" in parameters or has_var_keyword:
                         recovery_kwargs["precompleted_tools"] = candidate_precompleted_tools
+                    if "resume_messages" in parameters or has_var_keyword:
+                        recovery_kwargs["resume_messages"] = candidate_resume_messages
                     event_stream = execute_streaming(
                         sub_spec=sub_spec,
                         candidate=candidate,
@@ -3062,7 +3786,6 @@ async def record_sub_step_state(payload: dict[str, Any]) -> None:
                     state["agent_loop"] = sub_executors[i].current_step_executor_agent_loop
                     if isinstance(event, PipelineEvent):
                         _normalize_failed_sub_pipeline_completed_event(event)
-                    await event_queue.put(event)
                     if (
                         isinstance(event, PipelineEvent)
                         and event.type == PipelineEventType.SUB_PIPELINE_COMPLETED
@@ -3079,8 +3802,11 @@ async def record_sub_step_state(payload: dict[str, Any]) -> None:
                         state["error"] = event.data.get("error")
                         state["error_details"] = event.data.get("error_details")
                         await save_candidate_failed(i, state)
+                    await event_queue.put(event)
             except asyncio.CancelledError:
                 logger.debug("Candidate %d cancelled", i)
+            except PipelineStatePersistenceError as exc:
+                await event_queue.put(exc)
             except Exception as exc:
                 failure = public_error_from_exception(exc)
                 error_summary = failure.summary
@@ -3128,6 +3854,11 @@ async def record_sub_step_state(payload: dict[str, Any]) -> None:
                 )
                 state["error"] = error_summary
                 state["error_details"] = failure.details
+                try:
+                    await save_candidate_failed(i, state)
+                except PipelineStatePersistenceError as persistence_exc:
+                    await event_queue.put(persistence_exc)
+                    return
                 await event_queue.put(
                     PipelineEvent(
                         type=PipelineEventType.SUB_PIPELINE_COMPLETED,
@@ -3145,7 +3876,6 @@ async def record_sub_step_state(payload: dict[str, Any]) -> None:
                         },
                     )
                 )
-                await save_candidate_failed(i, state)
             finally:
                 self._active_candidates.pop(i, None)
                 await event_queue.put(CandidateSentinel(candidate_index=i))
@@ -3187,6 +3917,9 @@ async def record_sub_step_state(payload: dict[str, Any]) -> None:
             total = len(candidates)
             while done_count < total:
                 event = await event_queue.get()
+                if isinstance(event, PipelineStatePersistenceError):
+                    yield self._persistence_failure_event(event)
+                    return
                 if isinstance(event, CandidateSentinel):
                     idx = event.candidate_index
                     if idx in self._pending_candidate_restarts:
diff --git a/src/iac_code/pipeline/engine/recovery.py b/src/iac_code/pipeline/engine/recovery.py
index ce657a45..e5b8f3b4 100644
--- a/src/iac_code/pipeline/engine/recovery.py
+++ b/src/iac_code/pipeline/engine/recovery.py
@@ -2,10 +2,13 @@
 
 from __future__ import annotations
 
-import json
 from typing import Any
 
 from iac_code.agent.message import Message, ToolResultBlock, ToolUseBlock
+from iac_code.pipeline.engine.completion_guard_state import (
+    ensure_completion_guard_state,
+    record_completion_guard_tool_result,
+)
 from iac_code.pipeline.engine.types import StepResult, StepStatus
 
 
@@ -59,26 +62,21 @@ def reconstruct_step_result(messages: list[Message], step_id: str) -> StepResult
 
 def reconstruct_completion_guard_state(messages: list[Message]) -> dict[str, Any]:
     tool_uses = _tool_uses_by_id(messages)
-    successful_tools: set[str] = set()
-    tool_results: dict[str, Any] = {}
+    state = ensure_completion_guard_state({})  # begin from an empty mapping run through the shared helper
     for message in messages:
         if message.role != "user" or isinstance(message.content, str):
             continue
         for block in message.content:
-            if not isinstance(block, ToolResultBlock) or block.is_error:
+            if not isinstance(block, ToolResultBlock):  # error results are kept; is_error is forwarded below
                 continue
             tool_use = tool_uses.get(block.tool_use_id)
             if tool_use is None:
                 continue
-            if tool_use.name != "ask_user_question":
-                continue
-            successful_tools.add("ask_user_question")
-            try:
-                tool_results["ask_user_question"] = json.loads(block.content)
-            except json.JSONDecodeError:
-                tool_results["ask_user_question"] = {
-                    "selected_id": "",
-                    "selected_label": "",
-                    "free_text": block.content,
-                }
-    return {"successful_tools": successful_tools, "tool_results": tool_results}
+            record_completion_guard_tool_result(  # all tool names are forwarded, not only ask_user_question
+                state,
+                tool_name=tool_use.name,
+                tool_input=tool_use.input,
+                content=block.content,
+                is_error=block.is_error,
+            )
+    return state  # NOTE(review): presumably updated in place by the helper above; confirm
diff --git a/src/iac_code/pipeline/engine/resume_recovery.py b/src/iac_code/pipeline/engine/resume_recovery.py
new file mode 100644
index 00000000..526d2aea
--- /dev/null
+++ b/src/iac_code/pipeline/engine/resume_recovery.py
@@ -0,0 +1,95 @@
+"""Helpers for reconciling durable transcript recovery with sidecar resume state."""
+
+from __future__ import annotations
+
+import json
+
+from iac_code.agent.message import ContentBlock, Message, ToolResultBlock
+
+
+def _message_key(message: Message) -> str:
+    """Return a canonical JSON string for ``message``, used to compare messages for equality."""
+    return json.dumps(message.to_dict(), ensure_ascii=False, sort_keys=True)
+
+
+def _tool_result_ids(message: Message) -> set[str]:
+    """Return the non-empty ``tool_use_id`` values of the tool-result blocks in ``message``."""
+    if not isinstance(message.content, list):
+        return set()
+    return {block.tool_use_id for block in message.content if isinstance(block, ToolResultBlock) and block.tool_use_id}
+
+
+def _without_seen_tool_results(message: Message, seen_tool_result_ids: set[str]) -> Message | None:
+    """Drop tool-result blocks whose ``tool_use_id`` is in ``seen_tool_result_ids``.
+
+    Returns ``message`` itself when its content is not a list or nothing was
+    dropped, a copy holding only the remaining blocks when some were dropped,
+    and ``None`` when no block is left.
+    """
+    if not isinstance(message.content, list):
+        return message
+    content = [
+        block
+        for block in message.content
+        if not isinstance(block, ToolResultBlock) or block.tool_use_id not in seen_tool_result_ids
+    ]
+    if not content:
+        return None
+    if len(content) == len(message.content):
+        return message
+    return message.model_copy(update={"content": content})
+
+
+def reconcile_resume_messages(
+    transcript_messages: list[Message] | None,
+    sidecar_messages: list[Message] | None,
+) -> list[Message] | None:
+    """Merge sidecar resume messages into repaired transcript messages without duplicating tool results.
+
+    Transcript messages come first, in their original order. When there are no
+    transcript messages the sidecar messages are returned as a new, unfiltered
+    list. Otherwise each sidecar message is appended unless an identical message
+    was already seen, after stripping tool-result blocks whose ``tool_use_id``
+    was already seen. Returns ``None`` when both inputs are empty or ``None``.
+    """
+    merged = list(transcript_messages or [])
+    if not sidecar_messages:
+        return merged or None
+    if not merged:
+        return list(sidecar_messages)
+
+    seen_keys = {_message_key(message) for message in merged}
+    seen_tool_result_ids: set[str] = set()
+    for message in merged:
+        seen_tool_result_ids.update(_tool_result_ids(message))
+
+    for message in sidecar_messages:
+        key = _message_key(message)
+        if key in seen_keys:
+            continue
+        # Remember the unfiltered form too: otherwise a repeated sidecar message that
+        # loses blocks to filtering is never recognised and gets appended again.
+        seen_keys.add(key)
+        filtered = _without_seen_tool_results(message, seen_tool_result_ids)
+        if filtered is None:
+            continue
+        if filtered is not message:
+            filtered_key = _message_key(filtered)
+            if filtered_key in seen_keys:
+                continue
+            seen_keys.add(filtered_key)
+        merged.append(filtered)
+        seen_tool_result_ids.update(_tool_result_ids(filtered))
+    return merged or None
+
+
+def user_message_already_in_resume(
+    user_message: str | list[ContentBlock] | None,
+    resume_messages: list[Message] | None,
+) -> bool:
+    """Return whether a user message carrying ``user_message`` is already in ``resume_messages``."""
+    if user_message is None or not resume_messages:
+        return False
+    candidate = Message(role="user", content=user_message)
+    candidate_key = _message_key(candidate)
+    return any(_message_key(message) == candidate_key for message in resume_messages)
diff --git a/src/iac_code/pipeline/engine/session.py b/src/iac_code/pipeline/engine/session.py
index 5b8f9b0f..961a7e7c 100644
--- a/src/iac_code/pipeline/engine/session.py
+++ b/src/iac_code/pipeline/engine/session.py
@@ -4,8 +4,6 @@
 
 import json
 import logging
-import os
-import tempfile
 import time
 from dataclasses import dataclass
 from pathlib import Path
@@ -14,6 +12,7 @@
 import yaml
 
 from iac_code.pipeline.engine.types import StepStatus
+from iac_code.utils.state_io import atomic_write_text
 
 PipelineStatus = Literal["running", "waiting_input", "completed", "user_aborted", "failed", "discarded"]
 RESUMABLE_STATUSES: set[PipelineStatus] = {"running", "waiting_input"}
@@ -373,9 +372,6 @@ def save_rollback_sync(
         normal_handoff: _MetadataValue = _PRESERVE_METADATA,
     ) -> None:
         self.session_dir.mkdir(parents=True, exist_ok=True)
-        self._append_event(
-            {"type": "rollback", "from": from_step, "to": to_step, "reason": reason, "timestamp": time.time()}
-        )
         self.save_running_sync(
             to_step,
             state_machine_snapshot,
@@ -386,6 +382,9 @@ def save_rollback_sync(
             attempts=attempts,
             normal_handoff=normal_handoff,
         )
+        self._append_event(
+            {"type": "rollback", "from": from_step, "to": to_step, "reason": reason, "timestamp": time.time()}
+        )
 
     def mark_discarded(self, reason: str | None = None) -> None:
         self.session_dir.mkdir(parents=True, exist_ok=True)
@@ -781,19 +780,6 @@ def _valid_positive_int(self, value: Any) -> bool:
         return isinstance(value, int) and not isinstance(value, bool) and value >= 1
 
     def _atomic_write_yaml(self, path: Path, data: dict) -> None:
-        tmp_path = None
-        try:
-            with tempfile.NamedTemporaryFile(
-                "w",
-                dir=self.session_dir,
-                prefix=f".{path.name}.",
-                suffix=".tmp",
-                encoding="utf-8",
-                delete=False,
-            ) as tmp_file:
-                tmp_path = Path(tmp_file.name)
-                yaml.dump(data, tmp_file, allow_unicode=True)
-            os.replace(tmp_path, path)
-        finally:
-            if tmp_path is not None:
-                tmp_path.unlink(missing_ok=True)
+        self.session_dir.mkdir(parents=True, exist_ok=True)  # make sure the session directory exists first
+        content = yaml.safe_dump(data, allow_unicode=True, sort_keys=False)  # keep the dict's key order
+        atomic_write_text(path, content, durable=True)  # presumably fsyncs (durable=True); confirm in state_io
diff --git a/src/iac_code/pipeline/engine/state_machine.py b/src/iac_code/pipeline/engine/state_machine.py
index efb65c65..ccfae86b 100644
--- a/src/iac_code/pipeline/engine/state_machine.py
+++ b/src/iac_code/pipeline/engine/state_machine.py
@@ -14,8 +14,8 @@ class StateMachine:
     """Generic pipeline state machine.
 
     Steps are ordered linearly. Each step's config defines its forward
-    target and rollback rules. The state machine tracks the current
-    position, step statuses, and rollback count.
+    target. The state machine tracks the current position, step statuses,
+    and rollback count.
     """
 
     def __init__(self, steps: list[StepSpec], max_rollbacks: int = 3, max_interrupt_rollbacks: int = 10) -> None:
@@ -63,9 +63,9 @@ def advance(self) -> StepSpec | None:
         self._step_statuses[step.forward] = StepStatus.RUNNING
         return self.current_step
 
-    def rollback(self, target_step_id: str, reason: str, *, allow_completed_non_future: bool = False) -> StepSpec:
+    def rollback(self, target_step_id: str, reason: str) -> StepSpec:
         """Roll back to target step, marking intermediates as stale."""
-        if not self.can_rollback_to(target_step_id, allow_completed_non_future=allow_completed_non_future):
+        if not self.can_rollback_to(target_step_id):
             raise ValueError(f"Cannot rollback from {self.current_step.step_id} to {target_step_id}")
         if self._rollback_count >= self._max_rollbacks:
             raise ValueError(f"Max rollbacks ({self._max_rollbacks}) exceeded")
@@ -81,14 +81,8 @@ def rollback(self, target_step_id: str, reason: str, *, allow_completed_non_futu
         self._step_statuses[target_step_id] = StepStatus.RUNNING
         return self.current_step
 
-    def can_rollback_to(self, target_step_id: str, *, allow_completed_non_future: bool = False) -> bool:
-        if allow_completed_non_future:
-            return target_step_id in self.completed_non_future_rollback_targets()
-        step = self.current_step
-        return any(r.target_step == target_step_id for r in step.rollback_rules)
-
-    def get_rollback_options(self) -> list:
-        return self.current_step.rollback_rules
+    def can_rollback_to(self, target_step_id: str) -> bool:  # per-step rollback_rules are no longer consulted
+        return target_step_id in self.completed_non_future_rollback_targets()
 
     def completed_non_future_rollback_targets(self) -> list[str]:
         """Return completed rollback targets at or before the current position."""
@@ -114,7 +108,7 @@ def can_interrupt_rollback_to(self, target_step_id: str) -> tuple[bool, str | No
         return True, None
 
     def interrupt_rollback(self, target_step_id: str, reason: str) -> StepSpec:
-        """User-interrupt rollback. Not constrained by rollback_rules but has its own limit."""
+        """User-interrupt rollback to current or prior steps with its own limit."""
         ok, error = self.can_interrupt_rollback_to(target_step_id)
         if not ok:
             if error == "unknown_step":
diff --git a/src/iac_code/pipeline/engine/step_executor.py b/src/iac_code/pipeline/engine/step_executor.py
index 6804faec..64e78055 100644
--- a/src/iac_code/pipeline/engine/step_executor.py
+++ b/src/iac_code/pipeline/engine/step_executor.py
@@ -15,6 +15,10 @@
 from iac_code.agent.message import ContentBlock, Message
 from iac_code.agent.system_prompt import SECTION_BUILDERS, build_base_sections
 from iac_code.pipeline.engine.complete_step_tool import CompleteStepTool
+from iac_code.pipeline.engine.completion_guard_state import (
+    ensure_completion_guard_state,
+    record_completion_guard_tool_result,
+)
 from iac_code.pipeline.engine.context import PipelineContext
 from iac_code.pipeline.engine.events import PipelineEvent
 from iac_code.pipeline.engine.observability import PipelineObservability
@@ -49,6 +53,7 @@ class StepAgentLoopContext:
     agent_loop: Any | None
     initial_prompt: str | list[ContentBlock]
     resume_messages: list[Message]
+    completion_guard_state: dict[str, Any]
     restored_step_result: StepResult | None = None
 
 
@@ -67,6 +72,7 @@ def __init__(
         permission_context_getter: Callable[[], Any] | None = None,
         memory_content_getter: Callable[[], str] | None = None,
         auto_trigger_skills: list[Any] | None = None,
+        surface: str = "repl",
     ) -> None:
         self._provider_manager = provider_manager
         self._base_tool_registry = base_tool_registry
@@ -78,6 +84,7 @@ def __init__(
         self._permission_context_getter = permission_context_getter
         self._memory_content_getter = memory_content_getter
         self._auto_trigger_skills = auto_trigger_skills or []
+        self._surface = surface
         self._current_agent_loop = None
         pipeline_name = getattr(pipeline, "name", "")
         if not isinstance(pipeline_name, str):
@@ -152,8 +159,10 @@ async def execute(
         agent_loop = agent_context.agent_loop
         assert agent_loop is not None
         self._current_agent_loop = agent_loop
+        completion_guard_state = agent_context.completion_guard_state
 
         complete_step_ids: set[str] = set()
+        pending_tool_inputs: dict[str, dict[str, Any]] = {}
         pending_complete_input: dict[str, dict] = {}
         complete_step_input: dict | None = None
         terminal_failed_step_result: StepResult | None = None
@@ -171,17 +180,31 @@ async def consume_complete_step_events(
             async for event in stream:
                 if isinstance(event, ToolUseStartEvent) and event.name == "complete_step":
                     complete_step_ids.add(event.tool_use_id)
-                elif isinstance(event, ToolUseEndEvent) and event.tool_use_id in complete_step_ids:
-                    pending_complete_input[event.tool_use_id] = event.input
-                elif isinstance(event, ToolResultEvent) and event.tool_use_id in complete_step_ids:
-                    step_result = (event.metadata or {}).get("step_result")
-                    if isinstance(step_result, StepResult) and step_result.status == StepStatus.FAILED:
-                        terminal_failed_step_result = step_result
-                    if not event.is_error:
-                        complete_step_input = pending_complete_input.get(event.tool_use_id)
-                    else:
-                        last_complete_step_error = event.result
-                        last_complete_step_input = pending_complete_input.get(event.tool_use_id)
+                elif isinstance(event, ToolUseEndEvent):
+                    pending_tool_inputs[event.tool_use_id] = {"tool_name": event.name, "input": dict(event.input)}
+                    if event.tool_use_id in complete_step_ids:
+                        pending_complete_input[event.tool_use_id] = event.input
+                elif isinstance(event, ToolResultEvent):
+                    tool_record = pending_tool_inputs.get(event.tool_use_id)
+                    if isinstance(tool_record, dict):
+                        tool_input_raw = tool_record.get("input")
+                        tool_input: dict[str, Any] = tool_input_raw if isinstance(tool_input_raw, dict) else {}
+                        record_completion_guard_tool_result(
+                            completion_guard_state,
+                            tool_name=str(tool_record.get("tool_name") or event.tool_name),
+                            tool_input=tool_input,
+                            content=event.result,
+                            is_error=event.is_error,
+                        )
+                    if event.tool_use_id in complete_step_ids:
+                        step_result = (event.metadata or {}).get("step_result")
+                        if isinstance(step_result, StepResult) and step_result.status == StepStatus.FAILED:
+                            terminal_failed_step_result = step_result
+                        if not event.is_error:
+                            complete_step_input = pending_complete_input.get(event.tool_use_id)
+                        else:
+                            last_complete_step_error = event.result
+                            last_complete_step_input = pending_complete_input.get(event.tool_use_id)
                 yield event
 
         try:
@@ -247,6 +270,7 @@ async def consume_complete_step_events(
                     transcript_id=transcript_id,
                     resume_messages=None,
                     precompleted_tools=None,
+                    completion_guard_state_seed=completion_guard_state,
                     rollback_targets=rollback_targets,
                     rollback_count=rollback_count,
                     max_rollbacks=max_rollbacks,
@@ -299,6 +323,7 @@ def build_agent_loop_context(
         transcript_id: str | None = None,
         resume_messages: list | None = None,
         precompleted_tools: dict[str, dict[str, Any]] | None = None,
+        completion_guard_state_seed: dict[str, Any] | None = None,
         rollback_targets: list[str] | None = None,
         rollback_count: int = 0,
         max_rollbacks: int = 5,
@@ -307,12 +332,17 @@ def build_agent_loop_context(
         initial_prompt = user_message or f"请完成当前步骤：{step.step_id}。"
 
         repaired_messages = list(resume_messages or [])
-        completion_guard_state: dict[str, Any] = reconstruct_completion_guard_state(repaired_messages)
-        completion_guard_state.setdefault("successful_tools", set())
-        completion_guard_state.setdefault("tool_results", {})
+        completion_guard_state: dict[str, Any] = ensure_completion_guard_state(
+            reconstruct_completion_guard_state(repaired_messages)
+        )
         if precompleted_tools:
-            completion_guard_state["successful_tools"].update(precompleted_tools)
+            completion_guard_state["successful_tools"].update(precompleted_tools.keys())
             completion_guard_state["tool_results"].update(precompleted_tools)
+        if completion_guard_state_seed:
+            seed = ensure_completion_guard_state(completion_guard_state_seed)
+            completion_guard_state["successful_tools"].update(seed.get("successful_tools", set()))
+            completion_guard_state["tool_results"].update(seed.get("tool_results", {}))
+            completion_guard_state["tool_result_records"].extend(seed.get("tool_result_records", []))
 
         build_tool_kwargs: dict[str, Any] = {
             "rollback_targets": rollback_targets,
@@ -338,6 +368,7 @@ def build_agent_loop_context(
                 agent_loop=None,
                 initial_prompt=initial_prompt,
                 resume_messages=repaired_messages,
+                completion_guard_state=completion_guard_state,
                 restored_step_result=restored_step_result,
             )
 
@@ -346,6 +377,7 @@ def build_agent_loop_context(
         from iac_code.agent.agent_loop import AgentLoop
 
         agent_session_id = transcript_id or session_id
+        step_skill_roots = self._resolve_step_skill_roots(step)
         agent_loop = AgentLoop(
             provider_manager=self._provider_manager,
             system_prompt=system_prompt,
@@ -358,11 +390,15 @@ def build_agent_loop_context(
             pause_event=self._pause_event,
             permission_context_getter=self._permission_context_getter,
             auto_trigger_skills=self._resolve_auto_trigger_skills(step),
+            tool_context_trusted_read_directories=step_skill_roots,
+            tool_context_relative_read_directories=step_skill_roots,
+            pipeline_mode=True,
         )
         return StepAgentLoopContext(
             agent_loop=agent_loop,
             initial_prompt=initial_prompt,
             resume_messages=repaired_messages,
+            completion_guard_state=completion_guard_state,
         )
 
     @staticmethod
@@ -377,7 +413,10 @@ def _restore_completed_step_result(
 
         normalized_input = copy.deepcopy(complete_step_input)
         complete_step_tool = tool_registry.get("complete_step")
-        if complete_step_tool is not None:
+        if isinstance(complete_step_tool, CompleteStepTool):
+            if complete_step_tool.validate_completion_input(normalized_input) is not None:
+                return None
+        elif complete_step_tool is not None:
             complete_step_tool.normalize_input(normalized_input)
 
         conclusion = normalized_input.get("conclusion", {})
@@ -403,8 +442,9 @@ def _build_full_system_prompt(self, step: StepSpec, context: PipelineContext) ->
             memory_content=memory_content,
         )
 
-        prompt_path = self._pipeline_dir / step.prompt_file
-        step_prompt = prompt_path.read_text(encoding="utf-8") if step.prompt_file else ""
+        prompt_file = step.prompt_file_for_surface(self._surface)
+        prompt_path = self._pipeline_dir / prompt_file
+        step_prompt = prompt_path.read_text(encoding="utf-8") if prompt_file else ""
         rendered_step_prompt = render_prompt(step_prompt, context, step.context_fields)
 
         skill_content = ""
@@ -586,6 +626,28 @@ def _resolve_skill_prompt(self, skill_name: str) -> str | None:
 
         return None
 
+    def _resolve_step_skill_roots(self, step: StepSpec) -> list[str]:
+        """Return the step skill's root directory as a list; empty if none resolves."""
+        skill_name = step.skill
+        skill_root = self._resolve_skill_root(skill_name) if skill_name else ""
+        return [skill_root] if skill_root else []
+
+    def _resolve_skill_root(self, skill_name: str) -> str:
+        """Find a skill's root: pipeline-declared roots first, then bundled skills."""
+        declared_root = self._pipeline.skill_roots.get(skill_name, "")
+        if declared_root:
+            return declared_root
+
+        try:
+            from iac_code.skills.bundled import get_bundled_skills
+
+            bundled_roots = (
+                skill.skill_root for skill in get_bundled_skills() if skill.name == skill_name
+            )
+            return next(bundled_roots, "")
+        except ImportError:
+            return ""
+
     @staticmethod
     def _with_skill_base_directory(content: str, skill_root: str) -> str:
         if not skill_root:
@@ -621,18 +683,17 @@ def _build_step_tools(
             step_id=step.step_id,
             conclusion_field=step.conclusion_field,
             forward=step.forward,
-            rollback_rules=step.rollback_rules,
             auto_advance=step.auto_advance,
             max_agent_turns=step.max_agent_turns,
             conclusion_schema=step.conclusion_schema,
-            rollback_targets=rollback_targets
-            if rollback_targets is not None
-            else [r.target_step for r in step.rollback_rules],
+            rollback_targets=rollback_targets if rollback_targets is not None else [],
             max_conclusion_retries=step.max_conclusion_retries,
             rollback_count=rollback_count,
             max_rollbacks=max_rollbacks,
         )
-        guard_state = completion_guard_state if completion_guard_state is not None else {"successful_tools": set()}
+        guard_state = ensure_completion_guard_state(
+            completion_guard_state if completion_guard_state is not None else {}
+        )
         registry.register(
             CompleteStepTool(
                 step_config,
@@ -642,8 +703,9 @@ def _build_step_tools(
             )
         )
 
-        if step.inject_tools:
-            self._register_injectable_tools(registry, step.inject_tools, guard_state)
+        inject_tools = step.inject_tools_for_surface(self._surface)
+        if inject_tools:
+            self._register_injectable_tools(registry, inject_tools, guard_state)
 
         return registry
 
diff --git a/src/iac_code/pipeline/engine/step_spec.py b/src/iac_code/pipeline/engine/step_spec.py
index e7271781..85ded9ff 100644
--- a/src/iac_code/pipeline/engine/step_spec.py
+++ b/src/iac_code/pipeline/engine/step_spec.py
@@ -7,7 +7,6 @@
 from dataclasses import dataclass, field
 
 from iac_code.pipeline.engine.context import PipelineContext
-from iac_code.pipeline.engine.types import RollbackRule
 
 
 @dataclass
@@ -27,6 +26,14 @@ class A2AArtifactSpec:
     media_type: str = "auto"
 
 
+@dataclass(frozen=True)
+class StepSurfaceOverride:
+    """Optional per-surface replacements for a step's prompt file and injected tools."""
+
+    prompt_file: str | None = None  # None keeps the step's own prompt_file
+    inject_tools: list[str] | None = None  # None keeps the step's own inject_tools
+
+
 @dataclass
 class HandoffContextConfig:
     """Context fields to include when handing off from pipeline to normal chat."""
@@ -55,7 +62,6 @@ class StepSpec:
     step_type: str = "normal"
     sub_pipeline_name: str | None = None
     tools: IncludeExcludeConfig | None = None
-    rollback_rules: list[RollbackRule] = field(default_factory=list)
     auto_advance: bool = True
     max_agent_turns: int = 50
     context_fields: list[str] = field(default_factory=list)
@@ -63,6 +69,8 @@ class StepSpec:
     hooks_file: str | None = None
     on_enter: Callable[[PipelineContext], None] | None = None
     on_exit: Callable[[PipelineContext, dict], None] | None = None
+    on_resource_observed: Callable[..., object] | None = None
+    on_rollback_cleanup_required: Callable[..., object] | None = None
     base_prompt_sections: IncludeExcludeConfig | None = None
     inject_tools: list[str] = field(default_factory=list)
     ui_mode: str | None = None
@@ -73,6 +81,19 @@ class StepSpec:
     description: str = ""
     exit_condition: dict | None = None
     a2a_artifacts: list[A2AArtifactSpec] = field(default_factory=list)
+    surface_overrides: dict[str, StepSurfaceOverride] = field(default_factory=dict)
+
+    def prompt_file_for_surface(self, surface: str | None) -> str:
+        """Return the prompt file for ``surface``: its override if set, else the step default."""
+        surface_spec = self.surface_overrides.get(surface or "")
+        overridden = None if surface_spec is None else surface_spec.prompt_file
+        return self.prompt_file if overridden is None else overridden
+
+    def inject_tools_for_surface(self, surface: str | None) -> list[str]:
+        """Return a fresh list of tools to inject for ``surface``, honoring any override."""
+        surface_spec = self.surface_overrides.get(surface or "")
+        overridden = None if surface_spec is None else surface_spec.inject_tools
+        return list(self.inject_tools if overridden is None else overridden)
 
 
 @dataclass
diff --git a/src/iac_code/pipeline/engine/sub_pipeline_executor.py b/src/iac_code/pipeline/engine/sub_pipeline_executor.py
index 81098275..bbeab523 100644
--- a/src/iac_code/pipeline/engine/sub_pipeline_executor.py
+++ b/src/iac_code/pipeline/engine/sub_pipeline_executor.py
@@ -12,12 +12,13 @@
 from pathlib import Path
 from typing import Any
 
-from iac_code.agent.message import ContentBlock
+from iac_code.agent.message import ContentBlock, Message
 from iac_code.i18n import _
 from iac_code.pipeline.engine.context import PipelineContext
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
 from iac_code.pipeline.engine.observability import PipelineObservability
 from iac_code.pipeline.engine.public_errors import public_error, public_error_from_exception
+from iac_code.pipeline.engine.resume_recovery import reconcile_resume_messages, user_message_already_in_resume
 from iac_code.pipeline.engine.state_machine import StateMachine
 from iac_code.pipeline.engine.step_executor import StepExecutor
 from iac_code.pipeline.engine.step_spec import LoadedPipeline, SubPipelineSpec
@@ -71,6 +72,7 @@ def __init__(
         permission_context_getter: Callable[[], Any] | None = None,
         memory_content_getter: Callable[[], str] | None = None,
         auto_trigger_skills: list[Any] | None = None,
+        surface: str = "repl",
     ) -> None:
         self._provider_manager = provider_manager
         self._base_tool_registry = base_tool_registry
@@ -82,6 +84,7 @@ def __init__(
         self._permission_context_getter = permission_context_getter
         self._memory_content_getter = memory_content_getter
         self._auto_trigger_skills = auto_trigger_skills or []
+        self._surface = surface
         self._active_step_executor = None
         self._telemetry_correlation: dict[str, str] = {}
         pipeline_name = getattr(pipeline, "name", "")
@@ -159,6 +162,7 @@ async def execute(
             permission_context_getter=self._permission_context_getter,
             memory_content_getter=self._memory_content_getter,
             auto_trigger_skills=self._auto_trigger_skills,
+            surface=self._surface,
         )
         self._apply_telemetry_correlation(step_executor)
 
@@ -262,7 +266,7 @@ async def execute(
                 if step_result.rollback_request:
                     target, reason = step_result.rollback_request
                     try:
-                        state_machine.rollback(target, reason, allow_completed_non_future=True)
+                        state_machine.rollback(target, reason)
                         conclusions = self._conclusions_before_step(sub_spec, target, conclusions)
                         self._mark_rolled_back_fields_stale(sub_context, sub_spec, target)
                     except ValueError as e:
@@ -332,6 +336,7 @@ def _make_step_executor(self) -> StepExecutor:
             permission_context_getter=self._permission_context_getter,
             memory_content_getter=self._memory_content_getter,
             auto_trigger_skills=self._auto_trigger_skills,
+            surface=self._surface,
         )
         self._apply_telemetry_correlation(executor)
         return executor
@@ -347,6 +352,7 @@ async def execute_streaming(
         start_from_step: str | None = None,
         preserved_conclusions: dict[str, Any] | None = None,
         user_message: str | list[ContentBlock] | None = None,
+        resume_messages: list[Message] | None = None,
         parent_step_id: str | None = None,
         resume_state: dict[str, Any] | None = None,
         sub_step_attempt_allocator: Callable[[dict[str, Any]], dict[str, Any]] | None = None,
@@ -578,7 +584,19 @@ def sub_step_attrs_for_current(step, step_index: int) -> dict[str, Any]:
 
                         step_msg = user_message if is_first_step else None
                         step_precompleted_tools = precompleted_tools if is_first_step else None
-                        if isinstance(step_msg, str) and attempt_info.get("resume_messages"):
+                        attempt_resume_messages = attempt_info.get("resume_messages")
+                        if not isinstance(attempt_resume_messages, list):
+                            attempt_resume_messages = []
+                        explicit_resume_messages = (
+                            resume_messages if is_first_step and resume_messages is not None else []
+                        )
+                        step_resume_messages = reconcile_resume_messages(
+                            attempt_resume_messages,
+                            explicit_resume_messages,
+                        )
+                        if step_resume_messages and (
+                            isinstance(step_msg, str) or user_message_already_in_resume(step_msg, step_resume_messages)
+                        ):
                             step_msg = None
                         is_first_step = False
                         step_result: StepResult | None = None
@@ -587,7 +605,7 @@ def sub_step_attrs_for_current(step, step_index: int) -> dict[str, Any]:
                                 "user_message": step_msg,
                                 "attempt_id": attempt_info.get("attempt_id"),
                                 "transcript_id": attempt_info.get("transcript_id"),
-                                "resume_messages": attempt_info.get("resume_messages"),
+                                "resume_messages": step_resume_messages,
                                 "precompleted_tools": step_precompleted_tools,
                                 "rollback_targets": state_machine.completed_non_future_rollback_targets(),
                                 "rollback_count": state_machine.rollback_count,
@@ -679,7 +697,7 @@ def sub_step_attrs_for_current(step, step_index: int) -> dict[str, Any]:
                         if step_result.rollback_request:
                             target, reason = step_result.rollback_request
                             try:
-                                state_machine.rollback(target, reason, allow_completed_non_future=True)
+                                state_machine.rollback(target, reason)
                                 conclusions = self._conclusions_before_step(sub_spec, target, conclusions)
                                 self._observability.sub_step_completed(
                                     duration_ms=self._observability.duration_ms(sub_step_started_at),
diff --git a/src/iac_code/pipeline/engine/types.py b/src/iac_code/pipeline/engine/types.py
index 99b54a31..aa3f7d31 100644
--- a/src/iac_code/pipeline/engine/types.py
+++ b/src/iac_code/pipeline/engine/types.py
@@ -14,15 +14,6 @@ class StepStatus(str, Enum):
     FAILED = "failed"
 
 
-@dataclass
-class RollbackRule:
-    """Configurable rollback rule for a step."""
-
-    target_step: str
-    condition: str
-    invalidates: list[str] = field(default_factory=list)
-
-
 @dataclass
 class StepConfig:
     """Static configuration for a pipeline step."""
@@ -30,7 +21,6 @@ class StepConfig:
     step_id: str
     conclusion_field: str
     forward: str | None
-    rollback_rules: list[RollbackRule] = field(default_factory=list)
     auto_advance: bool = True
     max_agent_turns: int = 50
     conclusion_schema: dict | None = None
diff --git a/src/iac_code/pipeline/engine/ui_contract.py b/src/iac_code/pipeline/engine/ui_contract.py
index 459dcc9d..c40e9d99 100644
--- a/src/iac_code/pipeline/engine/ui_contract.py
+++ b/src/iac_code/pipeline/engine/ui_contract.py
@@ -4,7 +4,7 @@
 
 import json
 import re
-from dataclasses import dataclass
+from dataclasses import dataclass, field
 from enum import Enum
 from typing import Any
 
@@ -33,22 +33,28 @@ class SelectedCandidate:
 
     selected_candidate_name: str
     selected_candidate_index: int | None = None
+    parameter_overrides: dict[str, Any] = field(default_factory=dict)
 
 
-def encode_selected_candidate(candidate_name: str, candidate_index: int | None) -> str:
-    return json.dumps(
-        {
-            "selected_candidate_name": candidate_name,
-            "selected_candidate_index": candidate_index,
-        },
-        ensure_ascii=False,
-    )
+def encode_selected_candidate(
+    candidate_name: str,
+    candidate_index: int | None,
+    parameter_overrides: dict[str, Any] | None = None,
+) -> str:
+    """Serialize a candidate selection to JSON; empty or missing overrides are omitted."""
+    selection: dict[str, Any] = dict(
+        selected_candidate_name=candidate_name,
+        selected_candidate_index=candidate_index,
+    )
+    extras = {"parameter_overrides": parameter_overrides} if parameter_overrides else {}
+    return json.dumps({**selection, **extras}, ensure_ascii=False)
 
 
 def parse_selected_candidate(value: Any) -> SelectedCandidate | None:
     if isinstance(value, dict):
         name = value.get("selected_candidate_name")
         index = value.get("selected_candidate_index")
+        parameter_overrides = _parse_parameter_overrides(value)
     elif isinstance(value, str):
         stripped = value.strip()
         if not stripped:
@@ -64,9 +70,12 @@ def parse_selected_candidate(value: Any) -> SelectedCandidate | None:
             return None
         name = decoded.get("selected_candidate_name")
         index = decoded.get("selected_candidate_index")
+        parameter_overrides = _parse_parameter_overrides(decoded)
     else:
         return None
 
+    if parameter_overrides is None:
+        return None
     if index is not None and not isinstance(index, int):
         return None
     if isinstance(name, str) and name.strip():
@@ -75,7 +84,11 @@ def parse_selected_candidate(value: Any) -> SelectedCandidate | None:
         candidate_name = ""
     else:
         return None
-    return SelectedCandidate(selected_candidate_name=candidate_name, selected_candidate_index=index)
+    return SelectedCandidate(
+        selected_candidate_name=candidate_name,
+        selected_candidate_index=index,
+        parameter_overrides=parameter_overrides,
+    )
 
 
 def _parse_candidate_index_hint(value: str) -> int | None:
@@ -88,3 +101,27 @@ def _parse_candidate_index_hint(value: str) -> int | None:
         except ValueError:
             return None
     return None
+
+
+def _parse_parameter_overrides(payload: dict[str, Any]) -> dict[str, Any] | None:
+    """Extract parameter overrides from a selection payload.
+
+    Only the first alias key present in ``payload`` is consulted. Returns ``{}`` when
+    no alias is present or its value is ``None``, and ``None`` when the value is not a
+    dict or any key is not a non-blank string. ``None`` values are dropped.
+    """
+    aliases = ("parameter_overrides", "deployment_parameters", "parameters")
+    present = next((alias for alias in aliases if alias in payload), None)
+    raw = payload.get(present) if present is not None else None
+    if raw is None:
+        return {}
+    if not isinstance(raw, dict):
+        return None
+
+    cleaned: dict[str, Any] = {}
+    for name, value in raw.items():
+        if not (isinstance(name, str) and name.strip()):
+            return None
+        if value is not None:
+            cleaned[name.strip()] = value
+    return cleaned
diff --git a/src/iac_code/pipeline/engine/user_input.py b/src/iac_code/pipeline/engine/user_input.py
new file mode 100644
index 00000000..5d8b21e9
--- /dev/null
+++ b/src/iac_code/pipeline/engine/user_input.py
@@ -0,0 +1,91 @@
+"""User input wrapper for pipeline entry points.
+
+Pipeline execution needs the original content blocks for model calls, while
+UI, A2A status, telemetry, and sidecar metadata need text-only display data.
+"""
+
+from __future__ import annotations
+
+from dataclasses import dataclass
+
+from iac_code.agent.message import ContentBlock, ImageBlock, TextBlock, ToolResultBlock
+from iac_code.i18n import _
+
+PipelineInputContent = str | list[ContentBlock]  # plain text, or a list of content blocks
+IMAGE_INPUT_PLACEHOLDER = _("[Image input]")  # NOTE(review): translated at import time - confirm
+
+
+def content_has_images(content: PipelineInputContent | None) -> bool:
+    """Return True when ``content`` is a block list holding at least one image block."""
+    blocks = content if isinstance(content, list) else ()
+    return any(isinstance(item, ImageBlock) or getattr(item, "type", None) == "image" for item in blocks)
+
+
+def content_display_text(content: PipelineInputContent | None) -> str:
+    """Build the text-only display form of pipeline input.
+
+    Text and tool-result blocks are joined with newlines; when that yields only
+    whitespace, the image placeholder is returned if any image block was seen.
+    """
+    if content is None or isinstance(content, str):
+        return "" if content is None else content
+    fragments: list[str] = []
+    saw_image = False
+    for item in content:
+        if isinstance(item, TextBlock):
+            fragments.append(item.text)
+        elif isinstance(item, ToolResultBlock):
+            fragments.append(item.content)
+        elif isinstance(item, ImageBlock) or getattr(item, "type", None) == "image":
+            saw_image = True
+    joined = "\n".join(fragment for fragment in fragments if fragment)
+    fallback = IMAGE_INPUT_PLACEHOLDER if saw_image else ""
+    return joined if joined.strip() else fallback
+
+
+@dataclass(frozen=True)
+class PipelineUserInput:
+    """Pipeline input pairing the model-facing content with its text-only display form."""
+
+    content: PipelineInputContent
+    display_text: str
+    has_images: bool
+
+    @property
+    def is_empty(self) -> bool:
+        """True when there is neither non-blank display text nor any image."""
+        return not (self.display_text.strip() or self.has_images)
+
+    def with_prepended_text(self, text: str) -> "PipelineUserInput":
+        """Return a copy with stripped ``text`` placed first; blank ``text`` returns self."""
+        lead = text.strip()
+        if not lead:
+            return self
+        if isinstance(self.content, str):
+            merged: PipelineInputContent = f"{lead}\n\n{self.content}" if self.content else lead
+        else:
+            merged = [TextBlock(text=lead), *self.content]
+        shown = f"{lead}\n\n{self.display_text}" if self.display_text.strip() else lead
+        return PipelineUserInput(content=merged, display_text=shown, has_images=content_has_images(merged))
+
+
+def normalize_pipeline_user_input(
+    user_input: str | list[ContentBlock] | PipelineUserInput | None,
+    *,
+    display_text: str | None = None,
+) -> PipelineUserInput:
+    """Coerce raw pipeline input into a ``PipelineUserInput``.
+
+    An existing wrapper is returned as-is unless ``display_text`` is given; an empty
+    ``display_text`` then falls back to text derived from the wrapper's content.
+    For raw input, ``None`` becomes ``""`` and any non-None ``display_text`` wins.
+    """
+    if not isinstance(user_input, PipelineUserInput):
+        raw: PipelineInputContent = user_input if user_input is not None else ""
+        shown = content_display_text(raw) if display_text is None else display_text
+        return PipelineUserInput(content=raw, display_text=shown, has_images=content_has_images(raw))
+    if display_text is None:
+        return user_input
+    wrapped = user_input.content
+    shown = display_text or content_display_text(wrapped)
+    return PipelineUserInput(content=wrapped, display_text=shown, has_images=user_input.has_images)
diff --git a/src/iac_code/pipeline/selling/hooks/deploying.py b/src/iac_code/pipeline/selling/hooks/deploying.py
index 43a8b3b8..2ccc3c80 100644
--- a/src/iac_code/pipeline/selling/hooks/deploying.py
+++ b/src/iac_code/pipeline/selling/hooks/deploying.py
@@ -1,10 +1,17 @@
 """Hook for the deploying step."""
 
-from dataclasses import asdict, dataclass
+import logging
+import time
+from dataclasses import dataclass
 from typing import Any
 
+from iac_code.pipeline.engine.cleanup import CleanupLedger, CleanupResource, ObservedResource
 from iac_code.pipeline.engine.context import PipelineContext
 from iac_code.pipeline.engine.ui_contract import SelectedCandidate, parse_selected_candidate
+from iac_code.types.stream_events import ResourceObservedEvent
+
+_DEPLOYING_STEP_ID = "deploying"  # the only step id the resource/cleanup hooks below act on
+logger = logging.getLogger(__name__)
 
 
 @dataclass(frozen=True)
@@ -74,7 +81,7 @@ def normalize_selected_plan(
 
     candidates = evaluated_candidates or []
     resolution = resolve_selected_candidate(selected, candidates)
-    plan["selection"] = asdict(selected)
+    plan["selection"] = _selection_dict(selected)
     if resolution.error:
         plan["selection_valid"] = False
         plan["selection_error"] = resolution.error
@@ -83,18 +90,53 @@ def normalize_selected_plan(
     plan["selection_valid"] = True
     plan["selected_candidate"] = resolution.candidate
     plan["selected_candidate_result"] = resolution.result
+    plan["parameter_overrides"] = dict(selected.parameter_overrides)
+    effective_parameters = _effective_deployment_parameters(resolution.result, selected.parameter_overrides)
+    if effective_parameters:
+        plan["effective_deployment_parameters"] = effective_parameters
+    plan["cost_estimate_parameter_overridden"] = bool(selected.parameter_overrides)
     return plan
 
 
 def _selection_payload(plan: dict[str, Any]) -> Any:
     if "selected_candidate_index" in plan or "selected_candidate_name" in plan:
-        return {
+        payload = {  # structured selection fields copied from the plan
             "selected_candidate_name": plan.get("selected_candidate_name", ""),
             "selected_candidate_index": plan.get("selected_candidate_index"),
         }
+        if "parameter_overrides" in plan:  # checked first; "parameters" is forwarded only if absent
+            payload["parameter_overrides"] = plan.get("parameter_overrides")
+        elif "parameters" in plan:
+            payload["parameters"] = plan.get("parameters")
+        return payload
     return plan.get("user_input")
 
 
+def _selection_dict(selected: SelectedCandidate) -> dict[str, Any]:
+    """Convert a selection to a plain dict, including overrides only when non-empty."""
+    result: dict[str, Any] = dict(
+        selected_candidate_name=selected.selected_candidate_name,
+        selected_candidate_index=selected.selected_candidate_index,
+    )
+    overrides = selected.parameter_overrides
+    return {**result, "parameter_overrides": dict(overrides)} if overrides else result
+
+
+def _effective_deployment_parameters(
+    selected_candidate_result: dict[str, Any] | None,
+    parameter_overrides: dict[str, Any],
+) -> dict[str, Any]:
+    """Merge the candidate's ``cost.deployment_parameters`` with overrides; overrides win."""
+    node: Any = selected_candidate_result
+    for key in ("cost", "deployment_parameters"):
+        # Any non-dict along the path means there are no base parameters.
+        node = node.get(key) if isinstance(node, dict) else None
+    base: dict[str, Any] = dict(node) if isinstance(node, dict) else {}
+    # Applied last so overrides replace same-named base parameters.
+    base.update(parameter_overrides)
+    return base
+
+
 def on_enter(ctx: PipelineContext) -> None:
     """Resolve the structured selected candidate before rendering the deploying prompt."""
     selected_plan = ctx.get_conclusion("selected_plan")
@@ -104,3 +146,66 @@ def on_enter(ctx: PipelineContext) -> None:
         evaluated_candidates if isinstance(evaluated_candidates, list) else [],
     )
     ctx.set_conclusion("selected_plan", normalized)
+
+
+def on_resource_observed(
+    ctx: PipelineContext,
+    event: ResourceObservedEvent,
+    *,
+    ledger: CleanupLedger,  # not read or written in this function body
+    step_id: str,
+    attempt_id: str | None,
+) -> ObservedResource | None:
+    """Persist only ROS stacks created by the deploying step."""
+    _ = ctx  # ctx is not used by this hook
+    if step_id != _DEPLOYING_STEP_ID:
+        return None
+    if event.provider.lower() != "ros" or event.resource_type.lower() != "stack":
+        return None
+    if event.action != "CreateStack" or not event.resource_id:  # exact-case action; id required
+        return None
+
+    observed = ObservedResource(
+        provider="ros",  # normalized lowercase literal, not the raw event value
+        resource_type="stack",  # normalized lowercase literal, not the raw event value
+        resource_id=event.resource_id,
+        resource_name=event.resource_name,
+        region_id=event.region_id,
+        source_step_id=step_id,
+        source_attempt_id=attempt_id,  # may be None
+        observed_action=event.action,
+        observed_at=time.time(),  # epoch seconds at the moment this hook runs
+        metadata={
+            "tool_name": event.tool_name,
+            "tool_use_id": event.tool_use_id,
+        },
+    )
+    return observed  # only returned here; persistence is presumably done by the caller
+
+
+def on_rollback_cleanup_required(
+    ctx: PipelineContext,
+    *,
+    ledger: CleanupLedger,
+    from_step: str,
+    from_attempt_id: str | None,
+    to_step: str,
+    reason: str,
+) -> list[CleanupResource]:
+    """Mark deploying-created ROS stacks for cleanup when deploying rolls back."""
+    _ = (ctx, to_step)  # neither value is used by this hook
+    if from_step != _DEPLOYING_STEP_ID:
+        return []
+    if not from_attempt_id:  # the filter below matches on attempt id, so none can match
+        logger.warning("Skipping deploying cleanup hook because from_attempt_id is missing")
+        return []
+    resources = [
+        CleanupResource.from_observed(resource, reason=reason)
+        for resource in ledger.observed_resources()
+        if resource.source_step_id == _DEPLOYING_STEP_ID
+        and resource.source_attempt_id == from_attempt_id  # only the attempt rolled back
+        and resource.provider.lower() == "ros"
+        and resource.resource_type.lower() == "stack"
+        and resource.observed_action == "CreateStack"  # exact-case match
+    ]
+    return resources  # empty list when nothing in the ledger matches
diff --git a/src/iac_code/pipeline/selling/pipeline.yaml b/src/iac_code/pipeline/selling/pipeline.yaml
index 116d68a8..acb5962d 100644
--- a/src/iac_code/pipeline/selling/pipeline.yaml
+++ b/src/iac_code/pipeline/selling/pipeline.yaml
@@ -44,7 +44,7 @@ context_dependencies:
   architecture: [intent]
   evaluated_candidates: [architecture]
   selected_plan: [evaluated_candidates]
-  deployment: [selected_plan]
+  deployment: [intent, selected_plan]
 
 max_rollbacks: 3
 
@@ -71,6 +71,9 @@ sub_pipelines:
         skill: iac-aliyun-template-generating
         prompt: prompts/template_generating.md
         context_fields: [candidate]
+        tools:
+          include: []
+          exclude: [write_memory]
 
       - id: reviewing
         description: "审查模板的安全性和最佳实践"
@@ -83,9 +86,6 @@ sub_pipelines:
         tools:
           include: [-]
           exclude: []
-        rollback:
-          - target: template_generating
-            condition: template_issue
 
       - id: cost_estimating
         description: "评估模板的资源成本"
@@ -100,7 +100,7 @@ sub_pipelines:
         context_fields: [template]
         tools:
           include: []
-          exclude: [bash]
+          exclude: [bash, write_memory]
 
 steps:
   - id: intent_parsing
@@ -113,7 +113,7 @@ steps:
       field: is_infra_intent
       value: false
     tools:
-      include: [-]
+      include: [read_memory]
       exclude: []
     inject_tools: [ask_user_question]
     completion_guards:
@@ -181,11 +181,8 @@ steps:
     prompt: prompts/architecture_planning.md
     context_fields: [intent]
     tools:
-      include: [read_file, list_files, glob, grep, web_fetch, aliyun_doc_search]
+      include: [read_memory, read_file, list_files, glob, grep, web_fetch, aliyun_doc_search]
       exclude: []
-    rollback:
-      - target: intent_parsing
-        condition: intent_unclear
 
   - id: evaluate_candidates
     description: "并行生成各候选方案的 IaC 模板并评估成本"
@@ -204,6 +201,10 @@ steps:
     auto_advance: false
     ui_mode: candidate_selection
     inject_tools: [show_architecture_diagram, show_candidate_detail]
+    surface_overrides:
+      a2a:
+        prompt: prompts/confirm_and_select.a2a.md
+        inject_tools: []
     tools:
       include: [read_file]
       exclude: []
@@ -238,9 +239,9 @@ steps:
         selected_candidate_index:
           type: integer
           description: 用户最终选择的候选方案在 evaluated_candidates 中的 0 基下标；首次展示方案时可省略
-    rollback:
-      - target: architecture_planning
-        condition: want_different_plans
+        parameter_overrides:
+          type: object
+          description: 用户选择方案时传入的部署参数覆盖字典；键为 ROS Parameters 名称，值为用户指定的部署参数值；首次展示方案时可省略
 
   - id: deploying
     description: "执行用户选定方案的部署"
@@ -249,10 +250,19 @@ steps:
     skill: iac-aliyun-deploying
     prompt: prompts/deploying.md
     interrupt_judge_failure: pause
-    context_fields: [selected_plan, evaluated_candidates]
+    context_fields: [intent, selected_plan, evaluated_candidates]
     hooks_file: hooks/deploying.py
-    rollback:
-      - target: confirm_and_select
-        condition: invalid_selection
-      - target: architecture_planning
-        condition: need_different_architecture
+    completion_guards:
+      - when_conclusion_field_equals:
+          status: success
+        required_conclusion_field: stack_id
+        require_tool_result:
+          tool: ros_stack
+          action_in: [CreateStack, ContinueCreateStack]
+          is_success: true
+          status_in: [CREATE_COMPLETE]
+          match_conclusion_field: stack_id
+        message: "部署成功必须等待 ros_stack CreateStack 返回 CREATE_COMPLETE。"
+    tools:
+      include: []
+      exclude: [write_memory]
diff --git a/src/iac_code/pipeline/selling/prompts/architecture_planning.md b/src/iac_code/pipeline/selling/prompts/architecture_planning.md
index b8af59bb..0c993896 100644
--- a/src/iac_code/pipeline/selling/prompts/architecture_planning.md
+++ b/src/iac_code/pipeline/selling/prompts/architecture_planning.md
@@ -22,6 +22,8 @@
 - 示例：`templates/1-simple-nginx.yml`、`templates/2-high-availability-slb.yml`
 
 ## 注意事项
-- 不要读取项目文件或记忆，所需的上下文已在上方提供。
+- 不要读取项目文件，所需的主要上下文已在上方提供。
+- 你可以按需自主使用 `read_memory` 补充规划上下文：在生成方案前，如用户意图涉及已有资源、默认地域、已有 VPC/Zone、网段约束、成本偏好、高可用偏好、架构偏好、命名规范或历史项目约束，先调用 `read_memory({})` 查看索引，再读取相关 name。
+- 记忆只用于补充方案设计背景；若记忆与当前用户意图冲突，以当前用户意图为准。
 - 直接根据已知意图设计架构方案。
 - 如果意图信息不足以设计架构，可在 rollback_request 中请求回退到 intent_parsing。
diff --git a/src/iac_code/pipeline/selling/prompts/confirm_and_select.a2a.md b/src/iac_code/pipeline/selling/prompts/confirm_and_select.a2a.md
new file mode 100644
index 00000000..226378e1
--- /dev/null
+++ b/src/iac_code/pipeline/selling/prompts/confirm_and_select.a2a.md
@@ -0,0 +1,63 @@
+# 步骤：方案确认与选择
+
+你正在执行 AI 售卖流程的方案确认步骤。
+
+## 任务
+基于候选方案评估结果生成可选择方案列表，并在用户选择后提交最终选择结果。
+
+## 评估结果
+```json
+{evaluated_candidates}
+```
+
+## 首次执行
+
+如果当前没有用户选择消息，直接调用 `complete_step` 提交待选择结论，随后流程会等待用户输入。
+
+仅包含 `failed` 为 `false` 的方案；失败方案不要加入 `options`。
+
+### 待选择结论
+
+`complete_step.conclusion.options` 中每个可选方案必须包含：
+- `options[].name`：候选方案名称，取 `candidate.name`
+- `options[].summary`：候选方案摘要
+- `options[].candidate_index`：候选方案在 `evaluated_candidates` 数组中的 0 基下标
+
+`complete_step.conclusion.user_prompt` 必须是展示给用户的选择提示，例如“请选择要部署的方案：”。
+
+## 收到用户选择
+
+如果当前用户消息是在选择方案（例如包含“选择方案0”、“方案1”、候选方案名称，或表达“选便宜/高可用/已有VPC”等偏好），请直接根据用户输入和上方 `evaluated_candidates` 判断最终选择，并调用 `complete_step` 提交最终结论。
+
+如果当前用户消息是结构化 JSON 选择消息，例如：
+```json
+{
+  "selected_candidate_index": 0,
+  "parameter_overrides": {
+    "ZoneId": "cn-hangzhou-k",
+    "InstanceType": "ecs.g7.large"
+  }
+}
+```
+
+必须按以下规则处理：
+- `selected_candidate_index`：按 0 基下标选择对应候选方案
+- `selected_candidate_name`：如果用户提供名称，则按候选方案名称匹配
+- `parameter_overrides`：用户传入的部署参数覆盖字典，必须原样整理为 `parameter_overrides`
+- `parameters`：兼容字段，若用户传入 `parameters`，也必须整理为 `parameter_overrides`
+
+收到用户选择后再次调用 `complete_step` 提交最终结论，结论必须保留 `options`，并额外包含：
+- `user_input`：用户本次选择的原始文本
+- `selected_candidate_name`：最终选择的候选方案名称，必须取 `candidate.name`
+- `selected_candidate_index`：最终选择的候选方案在 `evaluated_candidates` 数组中的 0 基下标
+- `parameter_overrides`：用户选择方案时传入的部署参数覆盖字典；没有传入时可省略
+
+如果用户输入可以明确映射到某个方案编号（例如“方案0”），按 0 基下标选择对应方案。
+如果用户输入匹配某个候选方案名称，选择该方案。
+如果用户用偏好描述选择方案，请根据候选方案摘要、架构特点、成本和用户偏好选择最匹配的方案。
+
+## 约束
+- 不要读取项目文件或记忆，所需上下文已在上方提供。
+- 不要在本步骤重新询价。
+- 不要修改模板 Default。
+- 不要把 `parameter_overrides` 写入模板；后续部署步骤会基于最终选择结果处理部署参数。
diff --git a/src/iac_code/pipeline/selling/prompts/confirm_and_select.md b/src/iac_code/pipeline/selling/prompts/confirm_and_select.md
index 5b351f86..db56acef 100644
--- a/src/iac_code/pipeline/selling/prompts/confirm_and_select.md
+++ b/src/iac_code/pipeline/selling/prompts/confirm_and_select.md
@@ -3,28 +3,30 @@
 你正在执行 AI 售卖流程的方案确认步骤。
 
 ## 任务
-向用户展示所有候选方案的评估结果，帮助用户选择最终部署方案。
+基于候选方案评估结果生成可选择方案列表，并在用户选择后提交最终选择结果。
 
 ## 评估结果
 ```json
 {evaluated_candidates}
 ```
 
-## 展示流程
+## 首次执行
 
-如果当前用户消息是在选择方案（例如包含“选择方案0”、“方案1”、候选方案名称，或表达“选便宜/高可用/已有VPC”等偏好），不要再次展示所有方案，也不要再次调用展示工具；请直接根据用户输入和上方 `evaluated_candidates` 判断最终选择，并调用 `complete_step` 提交最终结论。
+如果当前没有用户选择消息，按以下流程展示候选方案，并在展示完成后调用 `complete_step` 提交待选择结论，随后流程会等待用户输入。
 
-如果当前没有用户选择消息，按以下流程展示候选方案并等待用户选择。
+仅展示 `failed` 为 `false` 的方案；失败方案不要调用展示工具，也不要加入 `options`。
+
+### 展示候选方案
 
 对每个 `failed` 为 `false` 的方案，依次调用以下两个工具：
 
-### 1. 生成架构图
+#### 1. 生成架构图
 调用 `show_architecture_diagram` 工具：
 - `file_path`：取 `candidate.output_path`
 - `candidate_name`：取 `candidate.name`
 - `candidate_index`：该方案在 `evaluated_candidates` 数组中的 0 基下标
 
-### 2. 展示方案详情
+#### 2. 展示方案详情
 调用 `show_candidate_detail` 工具：
 - `candidate_name`：取 `candidate.name`（必须与架构图的 candidate_name 一致）
 - `candidate_index`：该方案在 `evaluated_candidates` 数组中的 0 基下标
@@ -35,27 +37,51 @@
   - `monthly_cost`：月费用（如 "¥200/月"）
 - `total_monthly_cost`：月度总费用（如 "¥1,234/月"）
 
-## 注意事项
 - 先为所有方案调用 `show_architecture_diagram`，再为所有方案调用 `show_candidate_detail`
 - 不要用文字输出对比表格或方案信息 — 所有展示数据通过上述工具传递
-- 失败的方案跳过，不调用工具
 
-## 输出
-首次展示完成后调用 `complete_step` 提交待选择结论，随后流程会等待用户输入。
+### 待选择结论
 
 `complete_step.conclusion.options` 中每个可选方案必须包含：
 - `options[].name`：候选方案名称，取 `candidate.name`
 - `options[].summary`：候选方案摘要
-- `options[].candidate_index`：该方案在 `evaluated_candidates` 数组中的 0 基下标
+- `options[].candidate_index`：候选方案在 `evaluated_candidates` 数组中的 0 基下标
+
+`complete_step.conclusion.user_prompt` 必须是展示给用户的选择提示，例如“请选择要部署的方案：”。
+
+## 收到用户选择
+
+如果当前用户消息是在选择方案（例如包含“选择方案0”、“方案1”、候选方案名称，或表达“选便宜/高可用/已有VPC”等偏好），请直接根据用户输入和上方 `evaluated_candidates` 判断最终选择，并调用 `complete_step` 提交最终结论。
+
+如果当前用户消息是结构化 JSON 选择消息，例如：
+```json
+{
+  "selected_candidate_index": 0,
+  "parameter_overrides": {
+    "ZoneId": "cn-hangzhou-k",
+    "InstanceType": "ecs.g7.large"
+  }
+}
+```
+
+必须按以下规则处理：
+- `selected_candidate_index`：按 0 基下标选择对应候选方案
+- `selected_candidate_name`：如果用户提供名称，则按候选方案名称匹配
+- `parameter_overrides`：用户传入的部署参数覆盖字典，必须原样整理为 `parameter_overrides`
+- `parameters`：兼容字段，若用户传入 `parameters`，也必须整理为 `parameter_overrides`
 
 收到用户选择后再次调用 `complete_step` 提交最终结论，结论必须保留 `options`，并额外包含：
 - `user_input`：用户本次选择的原始文本
 - `selected_candidate_name`：最终选择的候选方案名称，必须取 `candidate.name`
 - `selected_candidate_index`：最终选择的候选方案在 `evaluated_candidates` 数组中的 0 基下标
+- `parameter_overrides`：用户选择方案时传入的部署参数覆盖字典；没有传入时可省略
 
 如果用户输入可以明确映射到某个方案编号（例如“方案0”），按 0 基下标选择对应方案。
 如果用户输入匹配某个候选方案名称，选择该方案。
 如果用户用偏好描述选择方案，请根据候选方案摘要、架构特点、成本和用户偏好选择最匹配的方案。
 
-## 其他
-- 不要读取项目文件或记忆，所需的上下文已在上方提供。
+## 约束
+- 不要读取项目文件或记忆，所需上下文已在上方提供。
+- 不要在本步骤重新询价。
+- 不要修改模板 Default。
+- 不要把 `parameter_overrides` 写入模板；后续部署步骤会基于最终选择结果处理部署参数。
diff --git a/src/iac_code/pipeline/selling/prompts/cost_estimating.md b/src/iac_code/pipeline/selling/prompts/cost_estimating.md
index 78408a86..5e3f142f 100644
--- a/src/iac_code/pipeline/selling/prompts/cost_estimating.md
+++ b/src/iac_code/pipeline/selling/prompts/cost_estimating.md
@@ -1,6 +1,6 @@
 # 步骤：成本预估
 
-你正在为候选方案预估部署费用。使用 ROS `GetTemplateEstimateCost` API 获取费用预估。
+你正在为候选方案预估部署费用。优先通过 `aliyun_api(product="ros", action="PreviewStack")` 形成 Preview-Validated Pricing Parameter Set，不要使用 `ros_stack` 执行 `PreviewStack`；PreviewStack 不是硬门禁，若完整部署参数暂时无法自动补齐，记录参数缺口后可用当前已选参数调用 ROS `GetTemplateEstimateCost` API 获取费用预估。
 
 ## 模板信息
 - 文件路径：`{template.file_path}`
@@ -14,10 +14,5 @@
 ## 输出
 API 调用完成后调用 `complete_step` 提交费用预估。
 
-补充说明：
-- `cost` 字段为字符串，包含金额和计费周期（如 "¥800/月"）
-- 若修复了模板，设置 `template_fixed: true` 并在 `fix_summary` 中说明
-- 询价失败时 `monthly_estimate` 填 "询价失败"，`error` 说明原因
-
 ## 注意事项
 - 不要读取项目文件或记忆，所需的上下文已在上方提供。
diff --git a/src/iac_code/pipeline/selling/prompts/deploying.md b/src/iac_code/pipeline/selling/prompts/deploying.md
index 89efabdf..710cf399 100644
--- a/src/iac_code/pipeline/selling/prompts/deploying.md
+++ b/src/iac_code/pipeline/selling/prompts/deploying.md
@@ -3,7 +3,21 @@
 你正在执行 AI 售卖流程的最终步骤：将用户选择的方案模板部署到阿里云。
 
 ## 部署执行
-用户已在上一步确认选择了该方案，该选择等价于本步骤的部署确认。不要再次询问是否确认部署，也不要询问是否确认部署参数。完成模板校验、可用性查询和参数选择后，直接调用 `ros_stack` 执行部署。
+用户已在上一步确认选择了该方案，该选择等价于本步骤的部署确认。不要再次询问是否确认部署，也不要询问是否确认部署参数。完成模板校验、可用性查询和参数装配后，直接调用 `ros_stack` 执行部署。
+
+上述确认只适用于部署执行，不适用于删除已有 Stack。删除请求本身不等于删除确认；只有用户明确回复“确认删除”“我确认删除”等删除确认语句，或上下文显式提供 `delete_confirmed: true` 时，才可执行删除。未收到明确删除确认前，不得调用 `ros_stack` 的 `DeleteStack`。
+
+## 原始用户需求与约束
+部署时必须继续遵守原始用户需求中的地域、资源命名、StackName、是否复用已有资源等约束。如果这些约束与候选方案、模板文件名或默认参数冲突，以原始用户需求为准。
+
+调用 `ros_stack` 的 `CreateStack` 前必须逐项核对工具参数：
+- 如果原始用户需求、`intent.non_functional.stack_name`、`intent.user_message_summary` 或 `intent.additional_notes` 中明确指定了资源栈名称，`params.StackName` 必须精确等于该名称。
+- 不要把模板文件名、候选方案名或默认名称误当成用户指定的 StackName。
+- 用户未明确指定 StackName 时，按部署工具和产品既有命名策略处理。
+
+```json
+{intent}
+```
 
 ## 用户选择的方案
 ```json
@@ -14,6 +28,8 @@
 `selected_plan.selection_valid` 为 `true` 时，使用 `selected_plan.selected_candidate` 和
 `selected_plan.selected_candidate_result` 中的模板、费用、审查信息进行部署。
 
+部署参数装配规则见技能。部署步骤不计算费用。
+
 如果 `selected_plan.selection_valid` 为 `false`，不要部署。调用 `rollback_request` 回到
 `confirm_and_select`，reason 使用 `selected_plan.selection_error`。
 
@@ -23,12 +39,8 @@
 
 ## 输出
 部署完成后调用 `complete_step` 提交部署结果。
-- 不得用 status: cancelled 表示等待用户确认。
-- 只有用户明确取消部署时，才可以提交 `status: cancelled`。
-- 如果因为权限、配额、参数或云产品限制导致无法部署，提交 `status: failed` 并说明原因；需要架构变更时使用 rollback_request。
 
 ## 错误处理
-- 可用区不可用 → 自动更换可用区重试
 - 模板校验失败 → 就地修复模板后重试（最多 5 轮）
 - 架构层面必须变更（如产品组合不可行）→ rollback_request 到 `architecture_planning`
 
diff --git a/src/iac_code/pipeline/selling/prompts/intent_parsing.md b/src/iac_code/pipeline/selling/prompts/intent_parsing.md
index 7ffafe66..acb756d9 100644
--- a/src/iac_code/pipeline/selling/prompts/intent_parsing.md
+++ b/src/iac_code/pipeline/selling/prompts/intent_parsing.md
@@ -14,7 +14,10 @@
 - **阿里云基础设施需求**：信息足够时直接调用 `complete_step`，不需要额外文字输出。
 
 ## 注意事项
-- 不要读取项目文件或记忆，用户的需求已经在下一条消息中。
+- 不要读取项目文件，用户的需求已经在下一条消息中。
+- 你可以按需自主使用 `read_memory` 辅助理解用户上下文：当用户提到已有资源、资源命名、VPC/网络、地域、预算、可用性偏好、历史项目或“沿用之前配置”等线索时，先调用 `read_memory({})` 查看索引，再按相关 name 读取具体记忆。
+- 记忆只作为辅助上下文，不能替代当前用户输入和必要澄清；若记忆与当前用户输入冲突，以当前用户输入为准。
+- 不要因为没有相关记忆而阻塞，也不要为了读记忆而跳过必须的 `ask_user_question` 澄清。
 - 直接根据用户描述进行分析；如遇 low 置信度或非基础设施但可引导的输入，必须先调用 `ask_user_question` 让用户补充或选择方向。
 - 对“帮我做个网站”“我有个项目想上线”“做个小程序/应用”这类没有明确阿里云资源，且缺少足够部署约束、规模、预算或可用性信息的输入，直接调用 `complete_step` 视为错误；必须先调用 `ask_user_question`。
 - 不要询问用户是否要使用 IaC，也不要问“是否转成 IaC”。这个 pipeline 默认处理部署/云资源方案；提问应帮助用户把模糊意图变清晰。
@@ -28,4 +31,5 @@
 - 若 `free_text` 包含阿里云部署目标，基于补充文本重新提取意图，并将 `free_text` 写入 `clarification_text`。
 - 若用户选择的选项表示“暂不处理”“不是部署需求”或“仍使用非阿里云平台”，填写 `is_infra_intent: false`，说明原因，并将 `selected_id` 写入 `clarification_choice`。
 - 调用 `complete_step` 的参数必须是 `{"conclusion": {...}}`。不要把 `is_infra_intent`、`confidence` 等结论字段放在工具参数顶层，全部放进 `conclusion` 内。
+- 如用户指定“资源栈名称”“StackName”或 ROS 资源栈名称，必须将精确名称写入 `non_functional.stack_name`；如用户指定 VPC ID、ZoneId、CidrBlock、已有网络资源或多个网段关系，写入 `non_functional.network_constraints`。
 - 不要回退或重启 step 来做澄清；也不要在没有明确澄清需要时额外确认。
diff --git a/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/SKILL.md b/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/SKILL.md
index 7ad6a078..fcedac4e 100644
--- a/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/SKILL.md
+++ b/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/SKILL.md
@@ -5,7 +5,7 @@ when_to_use: 当需要对阿里云 ROS 模板进行费用预估时
 user_invocable: false
 conclusion_schema:
   type: object
-  required: [monthly_estimate, currency, resources, template_fixed]
+  required: [monthly_estimate, currency, resources, template_fixed, deployment_parameters]
   additionalProperties: false
   properties:
     monthly_estimate:
@@ -26,6 +26,22 @@ conclusion_schema:
             type: string
     template_fixed:
       type: boolean
+    deployment_parameters:
+      type: object
+      description: 当前已选、已验证或已用于询价并传递给 deploying 的模板参数字典；可由后续选择阶段补充覆盖
+    missing_deployment_parameters:
+      type: array
+      description: PreviewStack 或最终部署仍缺少、需要用户在后续选择阶段补充的参数
+      items:
+        type: object
+        required: [name, reason]
+        properties:
+          name:
+            type: string
+          reason:
+            type: string
+    parameter_set_summary:
+      type: string
     fix_summary:
       type: string
     error:
@@ -38,16 +54,18 @@ conclusion_schema:
 
 使用阿里云 ROS `GetTemplateEstimateCost` API 预估部署费用。
 
-前一步已完成模板校验；本步骤先直接询价，避免在成本预估前重复校验。只有在修复或改写模板后，才调用 `ValidateTemplate` 校验改动。
+前一步已完成模板校验；本步骤避免在成本预估前重复校验模板。首次询价前优先按参数推荐流程形成 Preview-Validated Pricing Parameter Set，再调用询价 API。PreviewStack 不是硬门禁；完整部署参数暂时无法自动形成时，仍可用当前已选参数调用询价 API，并把缺口留给后续选择阶段补充。只有在修复或改写模板后，才调用 `ValidateTemplate` 校验改动。
 
 ## 执行流程
 
 1. **解析模板** — 从上下文的 `template` 字段获取模板内容和文件路径
 2. **提取参数** — 从模板 Parameters 中提取所有参数及其默认值
-3. **调用询价 API** — 使用 `GetTemplateEstimateCost` 获取费用预估
-4. **按需修复问题** — 仅当询价失败且错误指向模板问题，或你必须修复/改写模板时，修改模板并写回原文件路径
-5. **修改后校验并重新询价** — 调用 `ValidateTemplate` 校验改动；通过后调用 `GetTemplateEstimateCost` 重新询价；失败则修复重试（最多 7 轮）
-6. **输出结果** — 汇总费用并调用 `complete_step`
+3. **推荐并预览验证询价参数** — 按「询价参数推荐与传递」优先形成 Preview-Validated Pricing Parameter Set，不得跳过约束求解直接编造库存值
+4. **调用询价 API** — 优先使用 Preview-Validated Pricing Parameter Set；若 PreviewStack 因完整部署参数缺口无法通过，可用当前已选或可用于询价的参数调用 `GetTemplateEstimateCost`
+5. **按需修复问题** — 仅当询价失败且错误指向模板问题，或你必须修复/改写模板时，修改模板并写回原文件路径
+6. **修改后校验并重新询价** — 调用 `ValidateTemplate` 校验改动；通过后调用 `GetTemplateEstimateCost` 重新询价；失败则修复重试（最多 7 轮）
+7. **结构化传递参数** — 在 `complete_step.conclusion.deployment_parameters` 输出当前已选或已用于询价的参数字典；在 `missing_deployment_parameters` 输出仍需用户补充的完整部署参数缺口
+8. **输出结果** — 汇总费用并调用 `complete_step`
 
 ## 按需校验模板
 
@@ -75,9 +93,25 @@ aliyun_api(
 
 > **TemplateURL 支持本地文件路径**：`TemplateURL` 可传本地路径（如 `/tmp/template.yml`），工具会自动读取文件内容。避免将大模板内容直接作为参数传递。
 
+## 询价参数推荐与传递
+
+缺少 Default 或上下文值时，按 [references/template-parameter-recommendation.md](references/template-parameter-recommendation.md) 的参数推荐规则求解，并优先通过 `aliyun_api(product="ros", action="PreviewStack")` 形成 **Preview-Validated Pricing Parameter Set**。不要使用 `ros_stack` 执行 `PreviewStack`；本步骤只验证参数与模板可预览，不执行部署确认或 `CreateStack`。
+
+PreviewStack 必须传 StackName；调用 PreviewStack 前，必须先确定唯一 `StackName` 并传入 `PreviewStack` 参数。`StackName` 使用候选方案或服务简名作为前缀，并追加时间或 6 位小写字母/数字随机串后缀（如 `ai-app-20260623-a1b2c3`），避免重名。该 `StackName` 是 ROS API 参数，不写入模板 `Parameters`，不放入 `deployment_parameters`。
+
+PreviewStack 不是硬门禁。它要求完整部署参数，常比 `GetTemplateEstimateCost` 需要更多外部输入；如果完整部署参数无法自动补齐、或 PreviewStack 因外部参数缺口失败，但已有参数足以询价，则可以调用 `GetTemplateEstimateCost` 估算费用。此时必须在 `parameter_set_summary` 说明 PreviewStack 状态，在 `missing_deployment_parameters` 列出缺口，后续选择阶段可通过 `parameter_overrides` 补齐，deploying 再做最终部署校验。
+
+本步骤的裁剪规则：
+- 优先使用上下文已有值和模板 Default；库存相关参数缺值时，先通过 `GetTemplateParameterConstraints` 获取合法 `AllowedValues`，必要时再按 [references/cloud-products/](references/cloud-products/) 的可用性 API 与选型策略补足。
+- VpcId、VSwitchId、SecurityGroupId、KeyPairName 等已有资源参数：先查询约束或只读资源候选；API 返回候选不是编造，可作为参数候选参与回溯与 PreviewStack。没有上下文值、模板 Default、用户提供值或 API 返回候选时，才按外部输入缺失处理。
+- 只能在合法候选内筛选或排序，不得编造 API 未返回的库存值；LicenseKey、Token、证书、真实域名等外部输入不得编造。不要仅因参数名是 VpcId、VSwitchId、SecurityGroupId 或 KeyPairName 就跳过参数推荐并直接停止询价。
+- `PreviewStack` 因候选组合不可行失败时，按 reference 的回溯规则更换候选；因外部输入缺失失败时，记录缺口，不用占位值伪造，并按上方软门禁规则决定是否继续询价。
+- 最终得到的参数集不写入模板 `Default`；将当前已选、已验证或已用于询价的参数作为结构化数据放入 `complete_step.conclusion.deployment_parameters`，传递给 deploying。模板 Default 只是参数求解的输入来源之一，不是跨步骤传参介质。
+- PreviewStack 成功但询价失败时，不要丢弃 Preview-Validated Pricing Parameter Set；仍在 `deployment_parameters` 输出该参数集，同时如实报告询价失败原因。
+
 ## 调用询价 API
 
-通过 `TemplateURL` 传递模板文件路径（不要用 `TemplateBody` 内联模板内容，模板可能很大）。模板参数必须按 `Parameters.<N>.ParameterKey` / `Parameters.<N>.ParameterValue` 平铺（下标从 1 起），不要把参数名作为顶层 key 传入：
+通过 `TemplateURL` 传递模板文件路径（不要用 `TemplateBody` 内联模板内容，模板可能很大）。ROS API 的 `Parameters` 直接传字典格式，工具会自动展开为 API 所需的平铺参数；不要手动展开：
 
 ```python
 aliyun_api(
@@ -85,22 +119,22 @@ aliyun_api(
     action="GetTemplateEstimateCost",
     params={
         "TemplateURL": "/tmp/ros-template.yml",
-        "Parameters.1.ParameterKey": "ZoneId",
-        "Parameters.1.ParameterValue": "cn-hangzhou-k",
-        "Parameters.2.ParameterKey": "InstanceType",
-        "Parameters.2.ParameterValue": "ecs.g7.large",
-        "Parameters.3.ParameterKey": "ImageId",
-        "Parameters.3.ParameterValue": "centos_stream_9_x64_20G_alibase_20260414.vhd",
-        "Parameters.4.ParameterKey": "SystemDiskCategory",
-        "Parameters.4.ParameterValue": "cloud_essd",
+        "Parameters": {
+            "ZoneId": "cn-hangzhou-k",
+            "InstanceType": "ecs.g7.large",
+            "ImageId": "centos_stream_9_x64_20G_alibase_20260414.vhd",
+            "SystemDiskCategory": "cloud_essd",
+        },
     },
     region_id="cn-hangzhou",
 )
 ```
 
 参数值来源：
-- 模板 Parameters 中有 Default 值的 → 使用默认值
-- 没有默认值的库存相关参数（ZoneId、InstanceType 等）→ 使用上下文中提供的值或合理默认值
+- 上下文中已有部署/可用性选择结果的 → 使用上下文值
+- 模板 Parameters 中有 Default 值且上下文未覆盖的 → 使用默认值
+- 没有 Default 的库存相关参数（ZoneId、InstanceType 等）→ 按「询价参数推荐与传递」求解，不要直接编造
+- PreviewStack 成功时，最终用于询价的参数集必须与 PreviewStack 验证通过的参数集一致；PreviewStack 未通过但继续询价时，`deployment_parameters` 填当前已用于询价的参数，`missing_deployment_parameters` 填完整部署参数缺口
 
 ## ROS 模板修复参考
 
@@ -112,27 +146,6 @@ aliyun_api(
 | [references/template-parameters.md](references/template-parameters.md) | 模板参数规范：AssociationProperty、Label、分组 | 修复 Parameters 定义（缺少 AssociationProperty、Label 等）时 |
 | [references/ros-template.md](references/ros-template.md) | ROS 模板最佳实践：RunCommand、嵌套栈、条件部署 | 修复资源定义、内置函数用法等模板结构问题时 |
 
-### 参数化规则
-
-以下属性必须定义为 Parameters：
-
-| 产品 | 须参数化的属性 |
-|------|---------------|
-| ECS | ZoneId, InstanceType, ImageId, SystemDiskCategory, DataDiskCategory |
-| RDS | ZoneId, DBInstanceClass, DBInstanceStorageType |
-| Redis | ZoneId, InstanceClass |
-| SLB/ALB | ZoneId |
-
-### 常用资源类型
-
-- ALIYUN::ECS::VPC — 专有网络
-- ALIYUN::ECS::VSwitch — 交换机
-- ALIYUN::ECS::SecurityGroup — 安全组
-- ALIYUN::ECS::InstanceGroup — ECS 实例（通过 MaxAmount 指定数量）
-- ALIYUN::RDS::DBInstance — RDS 数据库实例
-- ALIYUN::REDIS::Instance — Redis 缓存实例
-- ALIYUN::SLB::LoadBalancer — 负载均衡
-
 ### 查询资源属性 Schema
 
 不确定资源属性时：
@@ -154,5 +167,8 @@ aliyun_api(product="ros", action="GetResourceType", params={"ResourceType": "<
 
 补充说明：
 - `cost` 字段为字符串，包含金额和计费周期（如 "¥800/月"、"¥0.5/小时"、"¥0"）
-- 若修复了模板，设置 `template_fixed: true` 并在 `fix_summary` 中说明修复内容
+- 若修复了模板，设置 `template_fixed: true` 并在 `fix_summary` 中说明修复内容；仅形成或输出 `deployment_parameters` 不算模板修复
+- `deployment_parameters` 填当前已选、已验证或已用于 `GetTemplateEstimateCost` 的参数字典；PreviewStack 成功但询价失败时仍填该参数集；没有任何可用参数时填 `{}`
+- `missing_deployment_parameters` 填完整部署或 PreviewStack 仍缺少的参数及原因；没有缺口时可省略或填 `[]`
+- `parameter_set_summary` 可简要说明参数来源、可用性筛选、PreviewStack 验证结果以及是否使用软门禁继续询价
 - 询价失败时 `monthly_estimate` 填 "询价失败"，`resources` 为空数组，`error` 说明原因
diff --git a/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/evals.json b/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/evals.json
index 09af2187..cd40c1a0 100644
--- a/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/evals.json
+++ b/src/iac_code/pipeline/selling/skills/iac-aliyun-cost/evals.json
@@ -1,6 +1,6 @@
 {
   "skill_name": "iac-aliyun-cost",
-  "description": "验证成本预估技能：正确调用 GetTemplateEstimateCost API、参数平铺格式、模板校验修复、错误处理",
+  "description": "验证成本预估技能：正确调用 GetTemplateEstimateCost API、Parameters 字典格式、参数推荐传递、模板按需校验修复、错误处理",
   "evals": [
     {
       "id": 1,
@@ -11,12 +11,14 @@
         "file_path": "templates/1-simple-ecs.yml",
         "region": "cn-hangzhou"
       },
-      "expected_behavior": "直接调用 GetTemplateEstimateCost，参数按 Parameters.<N>.ParameterKey/ParameterValue 平铺传递",
+      "expected_behavior": "先形成 Preview-Validated Pricing Parameter Set，再调用 GetTemplateEstimateCost，Parameters 以字典形式传递，并在 conclusion.deployment_parameters 输出同一参数集",
       "assertions": [
+        {"name": "uses_preview_stack_api", "check": "PreviewStack 通过 aliyun_api(product=\"ros\", action=\"PreviewStack\") 调用，不使用 ros_stack"},
         {"name": "uses_estimate_cost_api", "check": "调用了 GetTemplateEstimateCost API"},
-        {"name": "params_flattened", "check": "参数使用 Parameters.1.ParameterKey / Parameters.1.ParameterValue 格式平铺"},
+        {"name": "params_dictionary", "check": "参数使用 Parameters 字典格式传递，由工具展开 API 参数"},
         {"name": "uses_template_url", "check": "通过 TemplateURL 传递模板文件路径而非内联模板内容"},
         {"name": "outputs_monthly_estimate", "check": "conclusion 中包含 monthly_estimate 和 resources 费用明细"},
+        {"name": "outputs_deployment_parameters", "check": "conclusion.deployment_parameters 包含最终用于询价的参数字典，供 deploying 使用"},
         {"name": "no_doc_search", "check": "不调用 aliyun_doc_search 或搜索定价文档"}
       ]
     },
@@ -29,11 +31,13 @@
         "file_path": "templates/2-ecs-rds.yml",
         "region": "cn-beijing"
       },
-      "expected_behavior": "ECS 和 RDS 的参数都通过平铺格式传入询价 API，费用明细分别列出",
+      "expected_behavior": "ECS 和 RDS 的参数都通过 Parameters 字典传入询价 API，费用明细分别列出，并输出 deployment_parameters",
       "assertions": [
+        {"name": "uses_preview_stack_api", "check": "PreviewStack 通过 aliyun_api(product=\"ros\", action=\"PreviewStack\") 调用，不使用 ros_stack"},
         {"name": "uses_estimate_cost_api", "check": "调用了 GetTemplateEstimateCost API"},
         {"name": "all_params_included", "check": "所有 6 个参数（ZoneId、InstanceType、ImageId、SystemDiskCategory、DBInstanceClass、DBInstanceStorageType）都传入 API"},
         {"name": "multi_resource_breakdown", "check": "费用明细中分别列出了 ECS 和 RDS 的费用"},
+        {"name": "outputs_deployment_parameters", "check": "conclusion.deployment_parameters 包含最终用于询价的完整参数字典"},
         {"name": "no_self_estimate", "check": "不自行估算费用数字，完全基于 API 返回"}
       ]
     },
@@ -47,12 +51,13 @@
         "region": "cn-hangzhou",
         "description": "VSwitch 缺少 CidrBlock，ImageId 引用了不存在的参数"
       },
-      "expected_behavior": "先校验发现模板问题，修复（补 CidrBlock、修正 ImageId 参数引用），再询价",
+      "expected_behavior": "先形成 Preview-Validated Pricing Parameter Set 并调用询价；当询价失败且错误指向模板问题时，修复（补 CidrBlock、修正 ImageId 参数引用），再校验改动并重新询价",
       "assertions": [
-        {"name": "validates_first", "check": "先调用 ValidateTemplate 校验模板"},
+        {"name": "uses_preview_stack_api", "check": "PreviewStack 通过 aliyun_api(product=\"ros\", action=\"PreviewStack\") 调用，不使用 ros_stack"},
+        {"name": "validates_after_template_change", "check": "仅在修复或改写模板后调用 ValidateTemplate 校验改动"},
         {"name": "fixes_template", "check": "修复了模板中的错误（VSwitch CidrBlock、ImageId 参数引用）"},
         {"name": "writes_back", "check": "修复后将模板写回文件"},
-        {"name": "retries_after_fix", "check": "修复后重新校验或直接询价"},
+        {"name": "retries_after_fix", "check": "修复并校验通过后重新询价"},
         {"name": "template_fixed_true", "check": "conclusion 中 template_fixed 为 true 且包含 fix_summary"}
       ]
     },
@@ -66,25 +71,66 @@
         "region": "cn-shanghai",
         "description": "仅 VPC+OSS 的模板，OSS 可能不支持询价"
       },
-      "expected_behavior": "询价 API 可能返回错误（OSS 不支持询价），应报告错误而不编造费用",
+      "expected_behavior": "PreviewStack 成功但询价失败（如 OSS 不支持询价）时，应报告错误而不编造费用，同时不丢弃已验证的 deployment_parameters",
       "assertions": [
+        {"name": "uses_preview_stack_api", "check": "PreviewStack 通过 aliyun_api(product=\"ros\", action=\"PreviewStack\") 调用，不使用 ros_stack"},
         {"name": "attempts_pricing", "check": "尝试调用了 GetTemplateEstimateCost API"},
         {"name": "reports_error_honestly", "check": "如果 API 返回错误，如实报告错误原因"},
         {"name": "no_fabricated_cost", "check": "不编造费用数据"},
+        {"name": "keeps_preview_parameters", "check": "PreviewStack 成功但询价失败时不丢弃 deployment_parameters"},
         {"name": "error_in_conclusion", "check": "conclusion 中包含 error 字段说明失败原因"}
       ]
     },
     {
       "id": 5,
+      "name": "existing-vpc-vswitch-cost",
+      "prompt": "预估在已有 VPC 中创建 VSwitch 的费用",
+      "template_context": {
+        "template": "ROSTemplateFormatVersion: '2015-09-01'\nParameters:\n  VpcId:\n    Type: String\n    AssociationProperty: ALIYUN::ECS::VPC::VPCId\n    AssociationPropertyMetadata:\n      RegionId: ${ALIYUN::Region}\n  ZoneId:\n    Type: String\n    AssociationProperty: ALIYUN::ECS::ZoneId\n    AssociationPropertyMetadata:\n      RegionId: ${ALIYUN::Region}\nResources:\n  VSwitch:\n    Type: ALIYUN::ECS::VSwitch\n    Properties:\n      VpcId: !Ref VpcId\n      ZoneId: !Ref ZoneId\n      CidrBlock: 192.168.1.0/24",
+        "file_path": "templates/5-existing-vpc-vswitch.yml",
+        "region": "cn-hangzhou",
+        "description": "VpcId 和 ZoneId 都没有 Default，VpcId 是已有资源参数"
+      },
+      "expected_behavior": "先通过 GetTemplateParameterConstraints 或只读资源候选求解 VpcId/ZoneId；API 返回候选不是编造，可用于 PreviewStack。不要仅因 VpcId 是已有资源参数就直接停止询价；PreviewStack 成功后调用 GetTemplateEstimateCost，并输出 deployment_parameters",
+      "assertions": [
+        {"name": "queries_parameter_constraints", "check": "调用 GetTemplateParameterConstraints 或等价只读查询获取 VpcId/ZoneId 候选"},
+        {"name": "api_candidates_not_fabricated", "check": "明确区分 API 返回候选不是编造，不把 VpcId 名称本身当作停止条件"},
+        {"name": "uses_preview_stack_api", "check": "PreviewStack 通过 aliyun_api(product=\"ros\", action=\"PreviewStack\") 调用，不使用 ros_stack"},
+        {"name": "attempts_pricing", "check": "PreviewStack 成功后调用 GetTemplateEstimateCost API"},
+        {"name": "outputs_deployment_parameters", "check": "conclusion.deployment_parameters 包含最终用于 PreviewStack 的 VpcId 和 ZoneId"}
+      ]
+    },
+    {
+      "id": 6,
+      "name": "preview-soft-gate-partial-pricing",
+      "prompt": "预估使用已有网络部署一台 ECS 的费用，网络参数可以稍后由用户补充",
+      "template_context": {
+        "template": "ROSTemplateFormatVersion: '2015-09-01'\nParameters:\n  VpcId:\n    Type: String\n    AssociationProperty: ALIYUN::ECS::VPC::VPCId\n  VSwitchId:\n    Type: String\n    AssociationProperty: ALIYUN::VPC::VSwitch::VSwitchId\n  SecurityGroupId:\n    Type: String\n    AssociationProperty: ALIYUN::ECS::SecurityGroup::SecurityGroupId\n  ZoneId:\n    Type: String\n    Default: cn-hangzhou-k\n  InstanceType:\n    Type: String\n    Default: ecs.g7.large\n  ImageId:\n    Type: String\n    Default: centos_stream_9_x64_20G_alibase_20260414.vhd\n  SystemDiskCategory:\n    Type: String\n    Default: cloud_essd\nResources:\n  Ecs:\n    Type: ALIYUN::ECS::InstanceGroup\n    Properties:\n      VpcId: !Ref VpcId\n      VSwitchId: !Ref VSwitchId\n      SecurityGroupId: !Ref SecurityGroupId\n      ZoneId: !Ref ZoneId\n      InstanceType: !Ref InstanceType\n      ImageId: !Ref ImageId\n      SystemDiskCategory: !Ref SystemDiskCategory\n      MaxAmount: 1",
+        "file_path": "templates/6-existing-network-ecs.yml",
+        "region": "cn-hangzhou",
+        "description": "PreviewStack 需要完整的已有网络参数，但 ECS 费用可先基于规格和磁盘参数估算"
+      },
+      "expected_behavior": "优先尝试参数推荐和 PreviewStack；如果 VpcId/VSwitchId/SecurityGroupId 无法自动补齐，PreviewStack 不是硬门禁，不要直接终止。可用 ZoneId、InstanceType、ImageId、SystemDiskCategory 等当前可询价参数调用 GetTemplateEstimateCost，并在 conclusion.missing_deployment_parameters 中列出仍需用户通过选择阶段 parameter_overrides 补充的完整部署参数缺口",
+      "assertions": [
+        {"name": "preview_is_soft_gate", "check": "明确说明 PreviewStack 不是硬门禁，不能仅因完整部署参数暂缺就停止询价"},
+        {"name": "attempts_pricing_with_available_params", "check": "调用 GetTemplateEstimateCost，用当前已选或可用于询价的参数估算费用"},
+        {"name": "reports_missing_deployment_parameters", "check": "conclusion.missing_deployment_parameters 包含 VpcId、VSwitchId、SecurityGroupId 等缺口"},
+        {"name": "outputs_partial_deployment_parameters", "check": "conclusion.deployment_parameters 保留已用于询价的 ZoneId、InstanceType、ImageId、SystemDiskCategory"},
+        {"name": "mentions_later_overrides", "check": "说明用户后续可在选择阶段通过 parameter_overrides 补充缺失参数"}
+      ]
+    },
+    {
+      "id": 7,
       "name": "ha-slb-ecs-cost",
       "prompt": "预估高可用方案（SLB + 2台 ECS）的费用",
       "template_context": {
         "template": "ROSTemplateFormatVersion: '2015-09-01'\nParameters:\n  ZoneId:\n    Type: String\n    Default: cn-hangzhou-i\n  InstanceType:\n    Type: String\n    Default: ecs.c7.xlarge\n  ImageId:\n    Type: String\n    Default: centos_stream_9_x64_20G_alibase_20260414.vhd\n  SystemDiskCategory:\n    Type: String\n    Default: cloud_essd\nResources:\n  Vpc:\n    Type: ALIYUN::ECS::VPC\n    Properties:\n      CidrBlock: 10.0.0.0/16\n  VSwitch:\n    Type: ALIYUN::ECS::VSwitch\n    Properties:\n      VpcId: !Ref Vpc\n      ZoneId: !Ref ZoneId\n      CidrBlock: 10.0.1.0/24\n  SecurityGroup:\n    Type: ALIYUN::ECS::SecurityGroup\n    Properties:\n      VpcId: !Ref Vpc\n  EcsGroup:\n    Type: ALIYUN::ECS::InstanceGroup\n    Properties:\n      VpcId: !Ref Vpc\n      VSwitchId: !Ref VSwitch\n      SecurityGroupId: !Ref SecurityGroup\n      ZoneId: !Ref ZoneId\n      InstanceType: !Ref InstanceType\n      ImageId: !Ref ImageId\n      SystemDiskCategory: !Ref SystemDiskCategory\n      MaxAmount: 2\n  Slb:\n    Type: ALIYUN::SLB::LoadBalancer\n    Properties:\n      VpcId: !Ref Vpc\n      VSwitchId: !Ref VSwitch\n      LoadBalancerSpec: slb.s1.small\n      PayType: PayOnDemand",
-        "file_path": "templates/5-ha-slb-ecs.yml",
+        "file_path": "templates/7-ha-slb-ecs.yml",
         "region": "cn-hangzhou"
       },
       "expected_behavior": "正确处理多资源模板，费用明细包含 ECS（x2）和 SLB",
       "assertions": [
+        {"name": "uses_preview_stack_api", "check": "PreviewStack 通过 aliyun_api(product=\"ros\", action=\"PreviewStack\") 调用，不使用 ros_stack"},
         {"name": "uses_estimate_cost_api", "check": "调用了 GetTemplateEstimateCost API"},
         {"name": "includes_ecs_and_slb", "check": "费用明细中包含 ECS 和 SLB 的费用"},
         {"name": "ecs_count_reflected", "check": "ECS 费用描述中体现了 2 台实例（MaxAmount=2）"},
diff --git a/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/SKILL.md b/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/SKILL.md
index ae418e1c..08b0c649 100644
--- a/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/SKILL.md
+++ b/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/SKILL.md
@@ -24,6 +24,21 @@ conclusion_schema:
     error:
       type: string
       description: 失败原因（status 为 failed 时必填）
+  allOf:
+    - if:
+        properties:
+          status:
+            const: success
+        required: [status]
+      then:
+        required: [stack_id]
+    - if:
+        properties:
+          status:
+            const: failed
+        required: [status]
+      then:
+        required: [error]
 ---
 
 # 阿里云 ROS 部署技能
@@ -45,6 +60,7 @@ conclusion_schema:
 - 当 pipeline prompt 明确说明用户已确认选择/部署时，表示 pipeline 已完成部署确认，不要再次请求用户确认。
 - 在已确认的 pipeline 部署步骤中，可展示将使用的 VPC、可用区、网段、Stack 名等参数摘要，但展示后必须继续执行部署，不要询问“是否确认部署”或“是否确认部署参数”。
 - 仅当本技能被用户直接触发，或删除/更新等高风险操作没有上层确认时，才需要先询问用户确认；删除/更新操作使用 ⚠️ 警告措辞。
+- 删除请求本身不等于删除确认。只有用户明确回复“确认删除”“我确认删除”等删除确认语句，或上下文显式提供 `delete_confirmed: true` 时，才可执行删除；未收到明确删除确认前，不得调用 `ros_stack` 的 `DeleteStack`。
 - `status: cancelled` 只表示用户明确取消部署，不得用 status: cancelled 表示等待用户确认。
 
 ## 模板校验
@@ -64,16 +80,33 @@ conclusion_schema:
 查询步骤：
 1. 解析模板 Parameters，识别库存相关参数及对应产品
 2. 调用各产品可用性 API（具体 API 见 [references/cloud-products/](references/cloud-products/) 各产品文件的「可用性查询」节）
-3. 找出公共可用区（所有资源都有库存的可用区）
-4. 按 cloud-products 中的推荐规格优先匹配，不可用时选最接近的替代
-5. 得到选定参数；若上层 pipeline 已确认部署，展示选定结果后继续执行，不要再次请求用户确认。
+3. 核对最终部署参数中的可用区和规格是否可用
+4. 参数不可用时先报告冲突详情并尝试调整非用户指定参数；仍无法成功创建资源栈时，才可调整用户指定参数
 
 无法找到公共可用区时，告知用户冲突详情，建议换规格系列或换地域。
 
+## 部署参数装配
+
+CreateStack 前按以下优先级确定 `Parameters`：
+
+1. `selected_plan.effective_deployment_parameters` 非空时，直接作为最终部署参数集。
+2. 否则使用 `selected_plan.selected_candidate_result.cost.deployment_parameters`。
+3. 仍缺少模板必填参数时，使用模板 Default 或上下文已有值补足；无法补足时返回 `status: failed` 或通过 rollback_request 回到 `confirm_and_select`。
+
+装配参数时不得改写模板 `Default`，不得编造缺失的外部输入（LicenseKey、Token、证书、真实域名、已有资源 ID、VpcId、VSwitchId、SecurityGroupId、KeyPairName 等）。参数不可用或 CreateStack 无法成功时，优先调整非用户指定参数；仍无法成功创建资源栈时，才可调整用户指定参数。部署步骤不计算费用。
+
+## StackName
+
+新建 Stack 时，在调用 `CreateStack` 之前就确定唯一的 `StackName`，并将其传给 `CreateStack`。`StackName` 以方案或服务简名作为前缀，并追加日期时间和/或 6 位小写字母/数字随机串作为后缀（如 `ai-app-20260623-a1b2c3`），避免重名。
+
+- CreateStack 必须传 StackName，不要省略，不要使用容易重复的固定名称。
+- `UpdateStack`、`ContinueCreateStack`、`DeleteStack` 面向已有 Stack 时，使用上下文中的现有 Stack 标识，不要生成新的 StackName。
+
 ## 执行部署
 
 - 使用 ros_stack 工具执行 CreateStack/UpdateStack/ContinueCreateStack/DeleteStack，禁止用 Bash
 - CreateStack 必须传 `DisableRollback: true`
+- CreateStack 使用装配后的 `Parameters` 字典；不要手动展开为 `Parameters.N.ParameterKey`
 
 > **TemplateURL 支持本地文件路径**：ros_stack 中 TemplateURL 可传本地文件路径（如 `/tmp/template.yml`），工具会自动读取文件内容。避免将大模板内容直接作为参数传递。
 
diff --git a/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/evals.json b/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/evals.json
index bdfa50cf..ce3b9525 100644
--- a/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/evals.json
+++ b/src/iac_code/pipeline/selling/skills/iac-aliyun-deploying/evals.json
@@ -98,11 +98,11 @@
         "region": "cn-hangzhou",
         "stack_id": "stack-to-delete-456"
       },
-      "expected_behavior": "使用 ⚠️ 警告措辞强调删除不可逆，确认后使用 ros_stack DeleteStack",
+      "expected_behavior": "使用 ⚠️ 警告措辞强调删除不可逆，等待用户明确确认；未确认前不调用 ros_stack DeleteStack",
       "assertions": [
         {"name": "deletion_warning", "check": "使用了 ⚠️ 警告措辞强调删除操作不可逆"},
         {"name": "user_confirmation", "check": "等待用户明确确认后才执行删除"},
-        {"name": "uses_delete_stack", "check": "调用 ros_stack 的 DeleteStack 操作"}
+        {"name": "no_delete_without_confirmation", "check": "未收到明确确认前不调用 ros_stack 的 DeleteStack 操作"}
       ]
     },
     {
@@ -169,6 +169,23 @@
         {"name": "re_validates_after_fix", "check": "修复后重新调用 ValidateTemplate 确认通过"},
         {"name": "deploys_after_validation", "check": "校验通过后才继续执行部署流程"}
       ]
+    },
+    {
+      "id": 9,
+      "name": "delete-stack-confirmed",
+      "prompt": "确认删除这个 Stack",
+      "selected_plan": {
+        "candidate_id": "plan-a",
+        "region": "cn-hangzhou",
+        "stack_id": "stack-to-delete-456",
+        "delete_confirmed": true
+      },
+      "expected_behavior": "用户已明确确认删除后，使用 ros_stack DeleteStack 执行删除，并报告删除请求已提交",
+      "assertions": [
+        {"name": "deletion_warning", "check": "使用了 ⚠️ 警告措辞强调删除操作不可逆"},
+        {"name": "uses_delete_stack", "check": "调用 ros_stack 的 DeleteStack 操作"},
+        {"name": "completed_success", "check": "调用 complete_step 且 status 为 success"}
+      ]
     }
   ]
 }
diff --git a/src/iac_code/pipeline/selling/skills/iac-aliyun-intent/SKILL.md b/src/iac_code/pipeline/selling/skills/iac-aliyun-intent/SKILL.md
index 121904f0..dbff56f6 100644
--- a/src/iac_code/pipeline/selling/skills/iac-aliyun-intent/SKILL.md
+++ b/src/iac_code/pipeline/selling/skills/iac-aliyun-intent/SKILL.md
@@ -54,6 +54,21 @@ conclusion_schema:
       description: 逐资源生命周期意图；后续步骤必须优先使用此字段判断新建、复用、引用或禁止
     non_functional:
       type: object
+      properties:
+        region_preference:
+          type: string
+          description: 用户指定或默认的阿里云地域，如 cn-hangzhou
+        stack_name:
+          type: string
+          description: 用户明确指定的 ROS 资源栈名称或 StackName，必须原样保留
+        naming_constraints:
+          type: array
+          items:
+            type: string
+          description: 其它资源命名或禁止使用默认名称的约束
+        network_constraints:
+          type: object
+          description: 用户指定的 VPC、可用区、CIDR 等网络参数约束
     scale_hint:
       type: string
     budget_constraint:
@@ -165,6 +180,8 @@ conclusion_schema:
 - `scale_hint`：根据上下文推断的业务规模，影响后续规格选择
 - `budget_constraint`：如用户提到预算则填写（如 "月预算500以内"），否则为 null
 - `region_preference`（在 `non_functional` 中）：如用户有地域偏好则填写，否则默认 "cn-hangzhou"
+- `stack_name`（在 `non_functional` 中）：如用户指定“资源栈名称”“StackName”或 ROS 资源栈名称，必须把精确名称原样写入该字段；不得用模板名、候选方案名或默认名称替代用户指定的名称
+- `network_constraints`（在 `non_functional` 中）：如用户指定 VPC ID、ZoneId、CidrBlock、已有网络资源或多个网段关系，必须原样保留
 
 ### 资源生命周期提取规则
 
diff --git a/src/iac_code/pipeline/selling/skills/iac-aliyun-template-generating/SKILL.md b/src/iac_code/pipeline/selling/skills/iac-aliyun-template-generating/SKILL.md
index a6ace80f..2e3d8f44 100644
--- a/src/iac_code/pipeline/selling/skills/iac-aliyun-template-generating/SKILL.md
+++ b/src/iac_code/pipeline/selling/skills/iac-aliyun-template-generating/SKILL.md
@@ -39,10 +39,11 @@ conclusion_schema:
 
 1. 分析架构方案，确定资源列表
 2. 查阅 [references/cloud-products/](references/cloud-products/) 下对应产品文件，了解选型策略和库存相关属性
-3. 生成 ROS YAML 模板（库存相关属性按「参数化规则」定义为 Parameters，所有 Parameters 必须添加 AssociationProperty）并写入文件
-4. 调用 aliyun_api(product="ros", action="ValidateTemplate", params={"TemplateURL": <模板文件路径>}) 校验
-5. 校验失败 → 分析错误 → 修复 → 重试（最多 5 轮）
-6. 校验通过 → 完成
+3. **必须**阅读 [references/ros-template.md](references/ros-template.md)，了解 ROS 模板最佳实践，未阅读不得生成模板
+4. 生成 ROS YAML 模板（库存相关属性按 [references/cloud-products/](references/cloud-products/) 与 [references/template-parameters.md](references/template-parameters.md) 定义为 Parameters，所有 Parameters 必须添加 AssociationProperty）并写入文件
+5. 调用 aliyun_api(product="ros", action="ValidateTemplate", params={"TemplateURL": <模板文件路径>}) 校验
+6. 校验失败 → 分析错误 → 修复 → 重试（最多 5 轮）
+7. 校验通过 → 完成
 
 > **TemplateURL 支持本地文件路径**：aliyun_api（product=ros）中，TemplateURL 可传本地文件路径（如 `/tmp/template.yml`），工具会自动读取文件内容。避免将大模板内容直接作为参数传递。
 
@@ -59,14 +60,7 @@ conclusion_schema:
 
 ## 参数化规则
 
-生成模板时，以下属性**必须**定义为 Parameters（部署前通过 API 查询确定实际值）：
-
-| 产品 | 须参数化的属性 |
-|------|---------------|
-| ECS | ZoneId, InstanceType, ImageId, SystemDiskCategory, DataDiskCategory |
-| RDS | ZoneId, DBInstanceClass, DBInstanceStorageType |
-| Redis | ZoneId, InstanceClass |
-| SLB/ALB | ZoneId |
+生成模板时，库存相关属性**必须**定义为 Parameters（部署前通过 API 查询确定实际值）。具体字段按 [references/cloud-products/](references/cloud-products/) 的产品文件和 [references/template-parameters.md](references/template-parameters.md) 执行，不在本技能重复维护产品字段清单。
 
 以下属性**不需要**参数化，直接使用合理默认值：
 - 网络：VPC CIDR、VSwitch CIDR
@@ -88,22 +82,6 @@ conclusion_schema:
 - 使用 `!Ref`、`!GetAtt` 等内置函数引用参数和资源属性，避免硬编码
 - Outputs 中所有输出变量必须定义 Label
 
-## 常用资源类型
-
-- ALIYUN::ECS::VPC: 创建专有网络
-- ALIYUN::ECS::VSwitch: 创建交换机
-- ALIYUN::ECS::SecurityGroup: 创建安全组
-- ALIYUN::ECS::InstanceGroup: 创建 N 个 ECS 实例（通过 `MaxAmount` 指定数量）
-- ALIYUN::ECS::RunCommand: 在实例中执行自定义命令
-- ALIYUN::ECS::Invocation: 执行公共命令
-
-## 在实例中执行命令
-
-**不要使用 UserData + WaitCondition**。根据场景选择：
-
-- **自定义命令** → `ALIYUN::ECS::RunCommand` + `CommandContent`
-- **公共命令** → `ALIYUN::ECS::Invocation` + `CommandName`
-
 ## 资源和文档搜索
 
 - 不确定的资源属性或 Schema → aliyun_api(product="ros", action="GetResourceType", params={"ResourceType": "<类型>"})
diff --git a/src/iac_code/services/context_manager.py b/src/iac_code/services/context_manager.py
index 3d771d60..a10dab06 100644
--- a/src/iac_code/services/context_manager.py
+++ b/src/iac_code/services/context_manager.py
@@ -132,7 +132,8 @@ def add_raw_message(self, raw_msg: dict[str, Any]) -> Message:
         """Add a raw message dict (e.g. from ToolResult.new_messages) to the conversation."""
         role = raw_msg.get("role", "user")
         content = raw_msg.get("content", "")
-        msg = Message(role=role, content=content)
+        metadata = raw_msg.get("metadata")
+        msg = Message(role=role, content=content, metadata=dict(metadata) if isinstance(metadata, dict) else {})
         self._conversation.messages.append(msg)
         msg.token_count = self._token_counter.count_message(msg.to_api_format())
         return msg
@@ -147,6 +148,15 @@ def load_messages(self, messages: list[Message]) -> None:
     def get_messages(self) -> list[Message]:
         return self._conversation.messages
 
+    def remove_cleanup_prompt_messages(self) -> int:
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+
+        kept = [message for message in self._conversation.messages if not is_cleanup_prompt_message(message)]
+        removed = len(self._conversation.messages) - len(kept)
+        if removed:
+            self._conversation.replace_messages(kept)
+        return removed
+
     def get_api_messages(self) -> list[dict[str, Any]]:
         return self._conversation.to_api_messages()
 
@@ -248,13 +258,15 @@ def _split_messages_for_compaction(self) -> tuple[list[Message], list[Message]]:
 
     def build_compaction_prompt(self) -> str:
         """Build compaction prompt from old messages only (recent are preserved)."""
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+
         old_messages, _recent = self._split_messages_for_compaction()
         if not old_messages:
             return ""
 
         conversation_text = []
         for msg in old_messages:
-            if is_recalled_memory_message(msg):
+            if is_recalled_memory_message(msg) or is_cleanup_prompt_message(msg):
                 continue
             role = msg.role.upper()
             text = msg.get_text()
@@ -278,14 +290,17 @@ def build_compaction_prompt(self) -> str:
 
     def apply_compaction(self, summary: str) -> tuple[int, int]:
         """Replace old messages with summary, keep recent messages intact."""
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+
         original_tokens = self._conversation.get_total_tokens()
 
-        _old, recent = self._split_messages_for_compaction()
+        old, recent = self._split_messages_for_compaction()
+        preserved_hidden = [msg for msg in old if is_cleanup_prompt_message(msg)]
 
         summary_msg = Message(role="user", content=f"[Conversation Summary]\n{summary}")
         summary_msg.token_count = self._token_counter.count_message(summary_msg.to_api_format())
 
-        self._conversation.replace_messages([summary_msg] + recent)
+        self._conversation.replace_messages([summary_msg] + preserved_hidden + recent)
         new_tokens = self._conversation.get_total_tokens()
         logger.info(f"Compaction: {original_tokens} -> {new_tokens} tokens")
         return (original_tokens, new_tokens)
diff --git a/src/iac_code/services/session_index.py b/src/iac_code/services/session_index.py
index 6daba1df..a639aa2c 100644
--- a/src/iac_code/services/session_index.py
+++ b/src/iac_code/services/session_index.py
@@ -15,6 +15,7 @@
 from pathlib import Path
 
 from iac_code.agent.message import RECALLED_MEMORY_MARKER, RECALLED_MEMORY_METADATA_TYPE
+from iac_code.pipeline.constants import CLEANUP_PROMPT_METADATA_TYPE
 from iac_code.services.session_metadata import SESSION_JSONL_FILENAME, read_session_metadata
 from iac_code.utils.project_paths import (
     get_project_dir,
@@ -24,6 +25,16 @@
 )
 
 LITE_READ_BUF_SIZE = 64 * 1024
+_LEGACY_CLEANUP_CHINESE_PREFIX = "检测到 pipeline rollback 后仍需要清理的云资源"
+_LEGACY_CLEANUP_ROLLBACK_PHRASES = ("rollback cleanup required",)
+_LEGACY_CLEANUP_RESOURCE_PHRASES = (
+    "leftover resource",
+    "stack-",
+    "delete_complete",
+    "仍需要清理",
+    "待清理资源",
+    "回滚残留资源",
+)
 
 
 @dataclass
@@ -161,12 +172,25 @@ def _is_recalled_memory_text(text: str | None) -> bool:
     return bool(text and RECALLED_MEMORY_MARKER in text)
 
 
-def _is_recalled_memory_row(obj: dict) -> bool:
+def _is_cleanup_prompt_text(text: str | None) -> bool:
+    if not text:
+        return False
+    if _LEGACY_CLEANUP_CHINESE_PREFIX in text and "DELETE_COMPLETE" in text:
+        return True
+    lowered = text.lower()
+    has_rollback_context = any(phrase in lowered for phrase in _LEGACY_CLEANUP_ROLLBACK_PHRASES)
+    has_cleanup_resource_context = any(phrase in lowered for phrase in _LEGACY_CLEANUP_RESOURCE_PHRASES)
+    return has_rollback_context and has_cleanup_resource_context
+
+
+def _is_hidden_prompt_row(obj: dict) -> bool:
     metadata = obj.get("metadata")
     if isinstance(metadata, dict) and metadata.get("type") == RECALLED_MEMORY_METADATA_TYPE:
         return True
+    if isinstance(metadata, dict) and metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE:
+        return True
     content = obj.get("content")
-    return isinstance(content, str) and _is_recalled_memory_text(content)
+    return isinstance(content, str) and (_is_recalled_memory_text(content) or _is_cleanup_prompt_text(content))
 
 
 def _extract_first_user_text(head: str) -> str | None:
@@ -187,7 +211,7 @@ def _extract_first_user_text(head: str) -> str | None:
             continue
         if not isinstance(obj, dict) or obj.get("role") != "user":
             continue
-        if _is_recalled_memory_row(obj):
+        if _is_hidden_prompt_row(obj):
             continue
         content = obj.get("content")
         if isinstance(content, str) and content.strip():
@@ -227,7 +251,7 @@ def read_lite_metadata(path: Path) -> LiteMetadata:
         head, "git_branch"
     )
     last_prompt = extract_last_json_string_field(tail, "last_prompt")
-    if _is_recalled_memory_text(last_prompt):
+    if _is_recalled_memory_text(last_prompt) or _is_cleanup_prompt_text(last_prompt):
         last_prompt = None
     first_prompt = _extract_first_user_text(head)
     return LiteMetadata(
diff --git a/src/iac_code/services/session_storage.py b/src/iac_code/services/session_storage.py
index 1dc1662d..a8e3555d 100644
--- a/src/iac_code/services/session_storage.py
+++ b/src/iac_code/services/session_storage.py
@@ -25,12 +25,12 @@
 import json
 from datetime import datetime, timezone
 from pathlib import Path
-from shutil import move
 from typing import Any
 
 from iac_code import __version__
 from iac_code.agent.message import ContentBlock, Message, ToolResultBlock
 from iac_code.i18n import _
+from iac_code.pipeline.constants import CLEANUP_PROMPT_METADATA_TYPE
 from iac_code.services.session_metadata import (
     SESSION_JSONL_FILENAME,
     SessionMetadata,
@@ -45,12 +45,32 @@
     get_session_path,
     is_conversation_session_file,
 )
+from iac_code.utils.state_io import append_jsonl_locked, atomic_write_text, safe_replace
 
 
 def _utc_now() -> str:
     return datetime.now(timezone.utc).isoformat().replace("+00:00", "Z")
 
 
+def _cleanup_prompt_identity(message: Message) -> str:
+    metadata = message.metadata
+    if metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE:
+        metadata = {
+            "type": metadata.get("type"),
+            "source": metadata.get("source"),
+            "cleanupLedgerPath": metadata.get("cleanupLedgerPath") or metadata.get("cleanup_ledger_path"),
+        }
+    return json.dumps(
+        {
+            "role": message.role,
+            "content": message.to_dict().get("content"),
+            "metadata": metadata,
+        },
+        ensure_ascii=False,
+        sort_keys=True,
+    )
+
+
 class SessionStorage:
     """Persist conversation sessions partitioned by working directory."""
 
@@ -132,8 +152,7 @@ def append(
         path = self._session_path(cwd, session_id)
         ensure_private_dir(path.parent)
         data = self._stamp(message.to_dict(), cwd, session_id, git_branch)
-        with open(path, "a", encoding="utf-8") as f:
-            f.write(json.dumps(data, ensure_ascii=False) + "\n")
+        append_jsonl_locked(path, [data])
         ensure_private_file(path)
 
     def append_meta(self, cwd: str, session_id: str, meta_entry: dict[str, Any]) -> None:
@@ -144,8 +163,7 @@ def append_meta(self, cwd: str, session_id: str, meta_entry: dict[str, Any]) ->
         ensure_private_dir(path.parent)
         entry = dict(meta_entry)
         entry["session_id"] = session_id
-        with open(path, "a", encoding="utf-8") as f:
-            f.write(json.dumps(entry, ensure_ascii=False) + "\n")
+        append_jsonl_locked(path, [entry])
         ensure_private_file(path)
 
     def save(
@@ -155,16 +173,44 @@ def save(
         messages: list[Message],
         *,
         git_branch: str | None = None,
+        preserve_cleanup_prompts: bool = False,
     ) -> None:
         """Overwrite the session file with the given messages."""
+        if preserve_cleanup_prompts:
+            messages = self._merge_preserved_cleanup_prompts(cwd, session_id, messages)
         path = self._session_path(cwd, session_id)
         ensure_private_dir(path.parent)
-        with open(path, "w", encoding="utf-8") as f:
-            for msg in messages:
-                data = self._stamp(msg.to_dict(), cwd, session_id, git_branch)
-                f.write(json.dumps(data, ensure_ascii=False) + "\n")
+        lines = []
+        for msg in messages:
+            data = self._stamp(msg.to_dict(), cwd, session_id, git_branch)
+            lines.append(json.dumps(data, ensure_ascii=False) + "\n")
+        atomic_write_text(path, "".join(lines), durable=True)
         ensure_private_file(path)
 
+    def _merge_preserved_cleanup_prompts(
+        self,
+        cwd: str,
+        session_id: str,
+        messages: list[Message],
+    ) -> list[Message]:
+        try:
+            from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+        except Exception:
+            return messages
+
+        path = self._session_path(cwd, session_id)
+        if not path.exists():
+            return messages
+        existing = self.load(cwd, session_id)
+        preserved = [message for message in existing if is_cleanup_prompt_message(message)]
+        if not preserved:
+            return messages
+        existing_keys = {
+            _cleanup_prompt_identity(message) for message in messages if is_cleanup_prompt_message(message)
+        }
+        missing = [message for message in preserved if _cleanup_prompt_identity(message) not in existing_keys]
+        return [*messages, *missing] if missing else messages
+
     # ------------------------------------------------------------------
     # Read
     # ------------------------------------------------------------------
@@ -227,7 +273,7 @@ def _ensure_directory_format(self, cwd: str, session_id: str) -> Path:
             ensure_private_file(directory_path)
             return session_dir
         ensure_private_dir(session_dir)
-        move(str(legacy_path), str(directory_path))
+        safe_replace(str(legacy_path), str(directory_path))
         ensure_private_file(directory_path)
         return session_dir
 
diff --git a/src/iac_code/tools/base.py b/src/iac_code/tools/base.py
index 794afd0b..c7bfaf38 100644
--- a/src/iac_code/tools/base.py
+++ b/src/iac_code/tools/base.py
@@ -7,7 +7,7 @@
 from abc import ABC, abstractmethod
 from collections.abc import Callable
 from dataclasses import dataclass, field
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, cast
 
 from iac_code.i18n import _
 
@@ -15,7 +15,10 @@
     from iac_code.types.permissions import PermissionResult
 
 
-@dataclass
+_DEFAULT_CWD = object()
+
+
+@dataclass(init=False)
 class ToolContext:
     """Execution context passed to tools."""
 
@@ -26,6 +29,40 @@ class ToolContext:
     # downstream (e.g. in the renderer's per-tab accumulator). Populated by the
     # ToolExecutor on each call.
     tool_use_id: str | None = None
+    additional_directories: list[str] = field(default_factory=list)
+    trusted_read_directories: list[str] = field(default_factory=list)
+    relative_read_directories: list[str] = field(default_factory=list)
+    # True when this tool call is being executed as part of a pipeline step.
+    pipeline_mode: bool = False
+
+    def __init__(
+        self,
+        cwd: str | object = _DEFAULT_CWD,
+        event_queue: asyncio.Queue | None = None,
+        tool_use_id: str | list[str] | None = None,
+        additional_directories: list[str] | None = None,
+        trusted_read_directories: list[str] | str | None = None,
+        relative_read_directories: list[str] | None = None,
+        pipeline_mode: bool = False,
+    ) -> None:
+        if isinstance(tool_use_id, list) and isinstance(additional_directories, list):
+            old_additional_directories = tool_use_id
+            old_trusted_read_directories = additional_directories
+            old_tool_use_id = trusted_read_directories
+
+            tool_use_id = old_tool_use_id if isinstance(old_tool_use_id, str) else None
+            additional_directories = old_additional_directories
+            trusted_read_directories = old_trusted_read_directories
+
+        self.cwd = os.getcwd() if cwd is _DEFAULT_CWD else cast(str, cwd)
+        self.event_queue = event_queue
+        self.tool_use_id = tool_use_id if isinstance(tool_use_id, str) else None
+        self.additional_directories = list(additional_directories or [])
+        self.trusted_read_directories = (
+            list(trusted_read_directories or []) if isinstance(trusted_read_directories, list) else []
+        )
+        self.relative_read_directories = list(relative_read_directories or [])
+        self.pipeline_mode = pipeline_mode
 
 
 @dataclass
diff --git a/src/iac_code/tools/cloud/aliyun/aliyun_api.py b/src/iac_code/tools/cloud/aliyun/aliyun_api.py
index 1ae7b0db..6fd40bb9 100644
--- a/src/iac_code/tools/cloud/aliyun/aliyun_api.py
+++ b/src/iac_code/tools/cloud/aliyun/aliyun_api.py
@@ -21,8 +21,10 @@
 from iac_code.services.telemetry.names import Events, Metrics
 from iac_code.services.telemetry.sanitize import sanitize_error_message
 from iac_code.tools.base import ToolContext, ToolResult
+from iac_code.tools.cloud.aliyun.template_source import reject_template_body_param
 from iac_code.tools.cloud.aliyun.user_agent import build_user_agent
 from iac_code.tools.cloud.base_api import BaseCloudApi
+from iac_code.types.stream_events import ResourceObservedEvent
 
 logger = logging.getLogger(__name__)
 
@@ -144,6 +146,10 @@ def _emit_validate_template_event(response_body: dict | Any, duration_ms: int) -
     )
 
 
+def _string_value(value: Any) -> str | None:
+    return value if isinstance(value, str) and value else None
+
+
 class AliyunApi(BaseCloudApi):
     """Generic Alibaba Cloud API tool.
 
@@ -408,6 +414,8 @@ async def execute(self, *, tool_input: dict[str, Any], context: ToolContext) ->
 
         # ROS: TemplateURL as local file path → read into TemplateBody
         if product == "ros":
+            if error := reject_template_body_param(params, pipeline_mode=context.pipeline_mode):
+                return ToolResult.error(error)
             template_url = params.get("TemplateURL", "")
             if template_url and not template_url.startswith(("http://", "https://", "oss://")):
                 params["TemplateBody"] = Path(template_url).read_text(encoding="utf-8")
@@ -518,6 +526,22 @@ async def execute(self, *, tool_input: dict[str, Any], context: ToolContext) ->
             if api_service == "ROS" and action == "ValidateTemplate":
                 _emit_validate_template_event(body, duration_ms)
 
+            if context.event_queue is not None and product == "ros" and action == "CreateStack":
+                stack_id = _string_value(body.get("StackId")) if isinstance(body, dict) else None
+                if stack_id:
+                    await context.event_queue.put(
+                        ResourceObservedEvent(
+                            provider="ros",
+                            resource_type="stack",
+                            resource_id=stack_id,
+                            resource_name=str(params.get("StackName") or params.get("stack_name") or ""),
+                            region_id=region,
+                            action=action,
+                            tool_name=self.name,
+                            tool_use_id=context.tool_use_id,
+                        )
+                    )
+
             return ToolResult.success(json.dumps(body, ensure_ascii=False, indent=2))
         except Exception as e:
             self._last_action = ""
diff --git a/src/iac_code/tools/cloud/aliyun/ros_stack.py b/src/iac_code/tools/cloud/aliyun/ros_stack.py
index add19250..0b04c7d8 100644
--- a/src/iac_code/tools/cloud/aliyun/ros_stack.py
+++ b/src/iac_code/tools/cloud/aliyun/ros_stack.py
@@ -22,7 +22,9 @@
     sanitize_resource_type,
     sanitize_terraform_provider,
 )
+from iac_code.tools.base import ToolContext
 from iac_code.tools.cloud.aliyun.ros_client import RosClientFactory
+from iac_code.tools.cloud.aliyun.template_source import reject_template_body_param
 from iac_code.tools.cloud.base_stack import BaseCloudStack
 from iac_code.tools.cloud.types import ResourceStatus, StackStatus
 
@@ -472,7 +474,12 @@ def _get_client(self, region: str) -> Any:
         cred = credentials.get_provider("aliyun")
         return RosClientFactory.create(cred, region_id=region)
 
-    async def call_action(self, action: str, params: dict, region: str) -> str:
+    def _call_action_kwargs(self, context: ToolContext) -> dict[str, Any]:
+        return {"pipeline_mode": context.pipeline_mode}
+
+    async def call_action(self, action: str, params: dict, region: str, *, pipeline_mode: bool = False) -> str:
+        if error := reject_template_body_param(params, pipeline_mode=pipeline_mode):
+            raise ValueError(error)
         client = self._get_client(region)
         # Ensure RegionId is always in params for the API request
         if region:
@@ -482,7 +489,7 @@ async def call_action(self, action: str, params: dict, region: str) -> str:
         if template_url and not template_url.startswith(_URL_SCHEMES):
             params["TemplateBody"] = Path(template_url).read_text(encoding="utf-8")
             del params["TemplateURL"]
-        # TemplateBody must be a JSON string; models may pass a dict
+        # TemplateBody must be a JSON string; non-pipeline callers may still pass a dict.
         if isinstance(params.get("TemplateBody"), dict):
             params["TemplateBody"] = json.dumps(params["TemplateBody"], ensure_ascii=False)
 
diff --git a/src/iac_code/tools/cloud/aliyun/template_source.py b/src/iac_code/tools/cloud/aliyun/template_source.py
new file mode 100644
index 00000000..54b82fb5
--- /dev/null
+++ b/src/iac_code/tools/cloud/aliyun/template_source.py
@@ -0,0 +1,17 @@
+"""ROS template source parameter helpers."""
+
+from __future__ import annotations
+
+from typing import Any
+
+from iac_code.i18n import _
+
+
+def reject_template_body_param(params: dict[str, Any], *, pipeline_mode: bool) -> str | None:
+    """Return an error message when a caller provides TemplateBody directly."""
+    if not pipeline_mode or "TemplateBody" not in params:
+        return None
+    return _(
+        "ROS template calls must use TemplateURL instead of TemplateBody. "
+        "Save the template to a file and pass params.TemplateURL, for example a local file path or OSS/HTTP URL."
+    )
diff --git a/src/iac_code/tools/cloud/base_stack.py b/src/iac_code/tools/cloud/base_stack.py
index dc4c75cb..59cefb82 100644
--- a/src/iac_code/tools/cloud/base_stack.py
+++ b/src/iac_code/tools/cloud/base_stack.py
@@ -11,7 +11,7 @@
 from iac_code.i18n import _
 from iac_code.tools.base import Tool, ToolContext, ToolResult
 from iac_code.tools.cloud.types import ResourceStatus, StackStatus, translate_status
-from iac_code.types.stream_events import StackProgressEvent
+from iac_code.types.stream_events import ResourceObservedEvent, StackProgressEvent
 
 POLL_INTERVAL = 5
 
@@ -138,6 +138,9 @@ def user_facing_name(self, input: dict | None = None) -> str:
     def _resolve_region(self, input: dict) -> str:
         return input.get("region_id") or self._get_default_region()
 
+    def _call_action_kwargs(self, context: ToolContext) -> dict[str, Any]:
+        return {}
+
     def render_tool_use_message(self, input: dict, *, verbose: bool = False) -> str | None:
         action = input.get("action", "")
         region = self._resolve_region(input)
@@ -223,10 +226,24 @@ async def execute(self, *, tool_input: dict[str, Any], context: ToolContext) ->
         region = self._resolve_region(tool_input)
 
         try:
-            stack_id = await self.call_action(action, params, region)
+            stack_id = await self.call_action(action, params, region, **self._call_action_kwargs(context))
         except Exception as e:
             return ToolResult.error(f"[{action}] {e}")
 
+        if context.event_queue is not None and action == "CreateStack" and stack_id:
+            await context.event_queue.put(
+                ResourceObservedEvent(
+                    provider=self.provider_name,
+                    resource_type="stack",
+                    resource_id=stack_id,
+                    resource_name=str(params.get("StackName") or params.get("stack_name") or ""),
+                    region_id=region,
+                    action=action,
+                    tool_name=self.name,
+                    tool_use_id=context.tool_use_id,
+                )
+            )
+
         start_time = time.monotonic()
 
         try:
diff --git a/src/iac_code/tools/path_safety.py b/src/iac_code/tools/path_safety.py
index 85104822..8270f3ba 100644
--- a/src/iac_code/tools/path_safety.py
+++ b/src/iac_code/tools/path_safety.py
@@ -4,6 +4,7 @@
 
 import os
 import sys
+import tempfile
 from collections.abc import Iterator, Sequence
 from dataclasses import dataclass
 from pathlib import Path
@@ -79,7 +80,7 @@ def _normalize_for_platform(path: str, *, case_insensitive: bool | None = None)
     if case_insensitive is None:
         case_insensitive = sys.platform == "win32"
     if case_insensitive:
-        return normalized.lower()
+        return normalized.casefold()
     return normalized
 
 
@@ -158,13 +159,52 @@ def get_iac_code_application_root() -> Path:
 
 
 def _path_is_under(path: str, root: str) -> bool:
+    """Return True when ``path`` is ``root`` itself or is located beneath it.
+
+    Both arguments are passed through ``os.path.realpath`` before they are compared.
+    """
-    path_r = _normalize_for_platform(os.path.realpath(path))
-    root_r = _normalize_for_platform(os.path.realpath(root))
+    root_real_raw = os.path.realpath(root)
+    # The case-folding decision is made once, from the resolved root, and applied to both sides.
+    case_insensitive = _should_casefold_for_under_check(root_real_raw)
+    path_r = _normalize_for_platform(os.path.realpath(path), case_insensitive=case_insensitive)
+    root_r = _normalize_for_platform(root_real_raw, case_insensitive=case_insensitive)
     if path_r == root_r:
         return True
+    # Compare against root plus a trailing "/" so a sibling such as "/a/bc" is not treated as inside "/a".
     return path_r.startswith(root_r.rstrip("/") + "/")
 
 
+def _should_casefold_for_under_check(root: str) -> bool:
+    """Decide whether the containment check for ``root`` should ignore letter case.
+
+    Always True on Windows. On macOS it is True only when the probe for ``root``
+    reports a case-insensitive location. False on every other platform.
+    """
+    platform = sys.platform
+    if platform == "win32":
+        return True
+    return platform == "darwin" and not _path_case_sensitive(root)
+
+
+def _path_case_sensitive(root: str) -> bool:
+    """Probe whether the location holding ``root`` distinguishes letter case.
+
+    A temporary file is created in the nearest existing directory and then
+    looked up under its case-swapped name. Returns True (case-sensitive)
+    whenever no directory can be found or the probe file cannot be created.
+    """
+    directory = _existing_probe_dir(root)
+    if directory is None:
+        return True
+    try:
+        handle, created = tempfile.mkstemp(prefix=".iac-code-case-", dir=directory)
+    except OSError:
+        return True
+    os.close(handle)
+    swapped = os.path.join(directory, os.path.basename(created).swapcase())
+    try:
+        found_under_other_case = os.path.exists(swapped)
+        return not found_under_other_case
+    finally:
+        # Best-effort removal of the probe file; a failure here is ignored.
+        try:
+            os.unlink(created)
+        except OSError:
+            pass
+
+
+def _existing_probe_dir(path: str) -> str | None:
+    """Return ``path`` if it is a directory, else its nearest existing ancestor directory.
+
+    Returns None when the walk upwards runs out of path components (an empty
+    string) or stops making progress before an existing directory is found.
+    """
+    current = path
+    if not os.path.isdir(current):
+        current = os.path.dirname(current)
+    while True:
+        if not current:
+            return None
+        if os.path.isdir(current):
+            return current
+        above = os.path.dirname(current)
+        if above == current:
+            return None
+        current = above
+
+
 def _is_in_allowed_roots(path: str, roots: list[str]) -> bool:
     return any(_path_is_under(path, root) for root in roots if root)
 
diff --git a/src/iac_code/tools/read_file.py b/src/iac_code/tools/read_file.py
index 64a42ed6..51ba7a68 100644
--- a/src/iac_code/tools/read_file.py
+++ b/src/iac_code/tools/read_file.py
@@ -8,15 +8,28 @@
 
 from iac_code.i18n import _
 from iac_code.tools.base import Tool, ToolContext, ToolResult
-from iac_code.tools.path_safety import check_read_path, resolve_candidate
+from iac_code.tools.path_safety import _path_is_under, check_read_path, resolve_candidate
 from iac_code.types.permissions import PermissionDecisionReason, PermissionResult, ToolPermissionContext
 
 MAX_READ_BYTES = 10 * 1024 * 1024
 MAX_READ_LINES = 50_000
 
 
-def _resolve_input_path(path: str, cwd: str) -> str:
-    return resolve_candidate(path, cwd)
+def _resolve_input_path(
+    path: str,
+    cwd: str,
+    *,
+    relative_read_directories: list[str] | None = None,
+) -> str:
+    """Resolve ``path`` against ``cwd``, falling back to additional read roots.
+
+    The ``cwd``-based resolution is returned when the input is absolute (after
+    ``~`` expansion) or when the resolved file exists. Otherwise each entry of
+    ``relative_read_directories`` is tried in order, and the first candidate
+    that stays under its root and exists is returned. If nothing matches, the
+    ``cwd``-based resolution is returned.
+    """
+    primary = resolve_candidate(path, cwd)
+    is_absolute_input = os.path.isabs(os.path.expanduser(path))
+    if is_absolute_input or os.path.exists(primary):
+        return primary
+
+    fallback_roots = relative_read_directories if relative_read_directories else []
+    for root in fallback_roots:
+        candidate = resolve_candidate(path, root)
+        if not _path_is_under(candidate, root):
+            continue
+        if os.path.exists(candidate):
+            return candidate
+    return primary
 
 
 class ReadFileTool(Tool):
@@ -85,7 +98,11 @@ async def check_permissions(self, input: dict, context=None) -> PermissionResult
         return decision.to_permission_result()
 
     async def execute(self, *, tool_input: dict[str, Any], context: ToolContext) -> ToolResult:
-        path = _resolve_input_path(tool_input["path"], context.cwd)
+        path = _resolve_input_path(
+            tool_input["path"],
+            context.cwd,
+            relative_read_directories=context.relative_read_directories,
+        )
         start_line = tool_input.get("start_line")
         end_line = tool_input.get("end_line")
 
diff --git a/src/iac_code/tools/tool_executor.py b/src/iac_code/tools/tool_executor.py
index 0708f3ce..dd29fb05 100644
--- a/src/iac_code/tools/tool_executor.py
+++ b/src/iac_code/tools/tool_executor.py
@@ -69,7 +69,11 @@ async def _validate_and_execute(self, call: ToolCallRequest, context: ToolContex
         context = ToolContext(
             cwd=context.cwd,
             event_queue=call.event_queue if call.event_queue is not None else context.event_queue,
+            additional_directories=list(context.additional_directories),
+            trusted_read_directories=list(context.trusted_read_directories),
+            relative_read_directories=list(context.relative_read_directories),
             tool_use_id=call.id,
+            pipeline_mode=context.pipeline_mode,
         )
 
         timeout = tool.timeout if tool.timeout is not None else self._tool_timeout
diff --git a/src/iac_code/types/stream_events.py b/src/iac_code/types/stream_events.py
index e0b20cc4..db2879cd 100644
--- a/src/iac_code/types/stream_events.py
+++ b/src/iac_code/types/stream_events.py
@@ -189,6 +189,22 @@ class ToolEmittedEvent:
     pass
 
 
+@dataclass
+class ResourceObservedEvent(ToolEmittedEvent):
+    """A cloud resource id became known before the lifecycle tool completed."""
+
+    # Required identification of the observed resource.
+    provider: str
+    resource_type: str
+    resource_id: str
+    # Optional descriptive fields; each defaults to an empty string.
+    resource_name: str = ""
+    region_id: str = ""
+    action: str = ""
+    tool_name: str = ""
+    # Id of the tool call that produced the event, when one is available.
+    tool_use_id: str | None = None
+    # Free-form extra data; each instance gets its own dict via default_factory.
+    metadata: dict[str, Any] = field(default_factory=dict)
+    # Fixed literal tag for this event class.
+    type: Literal["resource_observed"] = "resource_observed"
+
+
 @dataclass
 class StackProgressEvent(ToolEmittedEvent):
     """Real-time progress from a stack lifecycle operation."""
@@ -295,6 +311,7 @@ class AskUserQuestionEvent(ToolEmittedEvent):
     TaskNotificationEvent,
     QueuedInputSubmittedEvent,
     SubAgentToolEvent,
+    ResourceObservedEvent,
     StackProgressEvent,
     StackInstancesProgressEvent,
     PlanEvent,
diff --git a/src/iac_code/ui/core/prompt_input.py b/src/iac_code/ui/core/prompt_input.py
index 5d1d8de8..fc86199b 100644
--- a/src/iac_code/ui/core/prompt_input.py
+++ b/src/iac_code/ui/core/prompt_input.py
@@ -643,7 +643,7 @@ def _input_loop(self, prompt: str, *, initial_text: str = "", transient: bool =
         self._buffer = list(initial_text)
         self._cursor = len(self._buffer)
         self._pasted_contents = {}
-        self._next_paste_id = 1
+        self._next_paste_id = self._initial_paste_id()
         self._submitted = False
         self._cancelled = False
         self._esc_pressed = False
@@ -742,3 +742,13 @@ def _input_loop(self, prompt: str, *, initial_text: str = "", transient: bool =
         if self._cancelled:
             return None
         return self._get_text()
+
+    def _initial_paste_id(self) -> int:
+        """Return the paste id that a fresh input loop starts counting from.
+
+        Uses the image store's ``next_image_id`` callable when it exists. Falls
+        back to 1 when it is missing, not callable, raises, or yields a value
+        that is not a positive integer.
+        """
+        provider = getattr(self._image_store, "next_image_id", None)
+        if callable(provider):
+            try:
+                candidate = int(provider())
+            except Exception:
+                candidate = 0
+            if candidate > 0:
+                return candidate
+        return 1
diff --git a/src/iac_code/ui/dialogs/resume_picker.py b/src/iac_code/ui/dialogs/resume_picker.py
index c8bc484c..39e727df 100644
--- a/src/iac_code/ui/dialogs/resume_picker.py
+++ b/src/iac_code/ui/dialogs/resume_picker.py
@@ -28,6 +28,7 @@
 
 from iac_code.agent.message import Message, ToolResultBlock, is_recalled_memory_message
 from iac_code.i18n import _, ngettext
+from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
 from iac_code.services.session_index import SessionEntry, SessionIndex
 from iac_code.ui.components.fuzzy_picker import fuzzy_match
 from iac_code.ui.components.search_box import SearchBox
@@ -676,7 +677,7 @@ def _fallback_render(console: Console, messages: list[Message]) -> None:
         """Minimal renderer used in tests / when no live renderer is provided."""
         first = True
         for msg in messages:
-            if is_recalled_memory_message(msg):
+            if is_recalled_memory_message(msg) or is_cleanup_prompt_message(msg):
                 continue
             if not first:
                 console.print()
diff --git a/src/iac_code/ui/renderer.py b/src/iac_code/ui/renderer.py
index d25d3984..b034c927 100644
--- a/src/iac_code/ui/renderer.py
+++ b/src/iac_code/ui/renderer.py
@@ -18,6 +18,7 @@
 import threading
 import time
 from dataclasses import dataclass, field
+from pathlib import Path
 from typing import TYPE_CHECKING, Any, AsyncGenerator, Awaitable, Callable
 
 if sys.platform != "win32":
@@ -32,6 +33,7 @@
 from rich.markdown import ListItem, Markdown
 from rich.rule import Rule
 from rich.segment import Segment
+from rich.style import Style
 from rich.table import Table
 from rich.text import Text
 
@@ -270,10 +272,15 @@ def __init__(
         tool_registry: "ToolRegistry",
         status_callback: Callable[[], str] | None = None,
         app_state_store: "AppStateStore | None" = None,
+        *,
+        image_path_resolver: Callable[[int], str | None] | None = None,
+        image_block_path_resolver: Callable[[Any], str | None] | None = None,
     ) -> None:
         self.console = console
         self._tool_registry = tool_registry
         self._status_callback = status_callback
+        self._image_path_resolver = image_path_resolver
+        self._image_block_path_resolver = image_block_path_resolver
         self._verbose = False
         self._text_flushed = False  # tracks whether current text block was partially flushed
         self._message_history: list[RenderedTurn] = []
@@ -331,6 +338,37 @@ def print_user_message(self, text: str) -> None:
         t.append(text)
         self.console.print(t)
 
+    def _image_ref_style(self, image_id: int) -> Style | None:
+        """Return a cyan hyperlink style pointing at the file for ``image_id``.
+
+        Returns None when no id-based resolver is configured, the resolver
+        yields nothing, or anything raises while resolving or building the link.
+        """
+        resolver = self._image_path_resolver
+        if resolver is None:
+            return None
+        try:
+            located = resolver(image_id)
+            if located:
+                return Style(color="cyan", link=self._file_url(located))
+        except Exception:
+            pass
+        return None
+
+    @staticmethod
+    def _file_url(path: str) -> str:
+        """Convert a filesystem path into a ``file://`` URI.
+
+        ``~`` is expanded first; a path that is still relative is resolved
+        (non-strictly) before conversion.
+        """
+        expanded = Path(path).expanduser()
+        absolute = expanded if expanded.is_absolute() else expanded.resolve(strict=False)
+        return absolute.as_uri()
+
+    def _image_block_style(self, block: Any) -> Style | None:
+        """Return a hyperlink style for an image block, or None when no path is known.
+
+        The block-based resolver is tried first and any error from it is
+        swallowed. If it gives no path, an integer ``ref_id`` on the block is
+        passed to the id-based lookup instead.
+        """
+        block_resolver = self._image_block_path_resolver
+        if block_resolver is not None:
+            try:
+                located = block_resolver(block)
+                if located:
+                    return Style(color="cyan", link=self._file_url(located))
+            except Exception:
+                pass
+        ref_id = getattr(block, "ref_id", None)
+        return self._image_ref_style(ref_id) if isinstance(ref_id, int) else None
+
     def print_command_result(self, command: str, result: str) -> None:
         t = Text()
         t.append("  └ ", style="dim")
@@ -1795,12 +1833,19 @@ def _format_token_count(count: int, label: str) -> str:
 
     def replay_history(self, messages: list) -> None:
         """Replay saved Message objects to scrollback with 1:1 visual fidelity."""
-        from iac_code.agent.message import TextBlock, ToolResultBlock, ToolUseBlock, is_recalled_memory_message
+        from iac_code.agent.message import (
+            ImageBlock,
+            TextBlock,
+            ToolResultBlock,
+            ToolUseBlock,
+            is_recalled_memory_message,
+        )
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
 
         # Build a lookup of tool_use_id → ToolResultBlock from all user messages
         tool_results: dict[str, ToolResultBlock] = {}
         for msg in messages:
-            if is_recalled_memory_message(msg):
+            if is_recalled_memory_message(msg) or is_cleanup_prompt_message(msg):
                 continue
             if msg.role == "user" and isinstance(msg.content, list):
                 for block in msg.content:
@@ -1809,7 +1854,7 @@ def replay_history(self, messages: list) -> None:
 
         first_turn = True
         for msg in messages:
-            if is_recalled_memory_message(msg):
+            if is_recalled_memory_message(msg) or is_cleanup_prompt_message(msg):
                 continue
             if msg.role == "user":
                 if self.is_internal_skill_context_message(msg):
@@ -1822,12 +1867,13 @@ def replay_history(self, messages: list) -> None:
                 if not first_turn:
                     self.console.print()
                 first_turn = False
-                if isinstance(msg.content, str):
-                    self.print_user_message(msg.content)
-                else:
-                    text = msg.get_text()
-                    if text:
-                        self.print_user_message(text)
+                rendered = self._render_user_content(
+                    msg.content,
+                    text_block_type=TextBlock,
+                    image_block_type=ImageBlock,
+                )
+                if rendered.plain.strip():
+                    self.console.print(rendered)
                 self.console.print()  # blank line between user input and agent response
             elif msg.role == "assistant":
                 segments: list[_Segment] = []
@@ -1858,6 +1904,25 @@ def replay_history(self, messages: list) -> None:
                         Text(f"✻ {random_completion_verb()} {_format_elapsed(msg.elapsed_seconds)}", style="dim italic")
                     )
 
+    def _render_user_content(self, content: Any, *, text_block_type: type, image_block_type: type) -> Text:
+        """Build the prompt-prefixed ``Text`` line for a user message.
+
+        String content is appended verbatim. List content contributes the text
+        of each text block and an ``[Image #N]`` label for each image block,
+        where N is the block's integer ``ref_id`` or, failing that, the running
+        image count. Other block types and other content types add nothing.
+        """
+        rendered = Text()
+        rendered.append("❯ ", style="bold cyan")
+        if isinstance(content, str):
+            rendered.append(content)
+        elif isinstance(content, list):
+            images_seen = 0
+            for item in content:
+                if isinstance(item, text_block_type):
+                    rendered.append(item.text)
+                    continue
+                if not isinstance(item, image_block_type):
+                    continue
+                images_seen += 1
+                ref = getattr(item, "ref_id", None)
+                shown = ref if isinstance(ref, int) else images_seen
+                rendered.append(f"[Image #{shown}]", style=self._image_block_style(item))
+        return rendered
+
     @staticmethod
     def is_internal_skill_context_message(message: Any) -> bool:
         content = getattr(message, "content", None)
diff --git a/src/iac_code/ui/repl.py b/src/iac_code/ui/repl.py
index d6d60da5..f5e7630c 100644
--- a/src/iac_code/ui/repl.py
+++ b/src/iac_code/ui/repl.py
@@ -91,6 +91,7 @@
     from iac_code.pipeline import PipelineRunner
     from iac_code.pipeline.config import RunMode
     from iac_code.pipeline.engine.events import PipelineEvent
+    from iac_code.pipeline.engine.user_input import PipelineUserInput
 
 termios: ModuleType | None
 try:
@@ -105,7 +106,7 @@
 # pipeline's allow_user_escapes.command setting (problem 5). Permanent whitelist
 # so users are never locked out of the basics while a pipeline is running.
 _PIPELINE_SAFE_COMMANDS: frozenset[str] = frozenset({"/exit", "/help", "/status", "/prompt", "/resume"})
-PipelineHandoffResult = Literal["not_applicable", "succeeded", "failed"]
+PipelineHandoffResult = Literal["not_applicable", "succeeded", "failed", "persistence_failed"]
 
 
 class ExitREPLError(Exception):
@@ -261,6 +262,8 @@ def __init__(
             self.tool_registry,
             status_callback=self._status_text,
             app_state_store=self.store,
+            image_path_resolver=self._image_store.get_path,
+            image_block_path_resolver=self._image_store.store_block,
         )
 
         self._pipeline: PipelineRunner | None = None
@@ -268,6 +271,8 @@ def __init__(
         self._pipeline_restored_status: str | None = None
         self._pipeline_display_recorder = None
         self._pipeline_display_current_step_id: str | None = None
+        self._pipeline_state_persistence_failed: bool = False
+        self._pipeline_state_persistence_warning_rendered: bool = False
 
         # Keybinding manager
         self._keybinding_manager = KeybindingManager()
@@ -455,11 +460,13 @@ def _on_sigint() -> None:
         try:
             loop.add_signal_handler(signal.SIGINT, _on_sigint)
             _has_sigint_handler = True
-        except (NotImplementedError, OSError):
+        except (NotImplementedError, OSError, RuntimeError):
             pass  # Windows or restricted environment
 
         if initial_prompt is None:
-            await self._resume_pipeline_sidecar_on_startup()
+            resumed_pipeline = await self._resume_pipeline_sidecar_on_startup()
+            if not resumed_pipeline:
+                await self._maybe_start_normal_chat_cleanup_on_startup()
 
         first_turn = True
         last_ctrl_c_time: float = 0.0
@@ -774,6 +781,7 @@ def _open_history_search(self) -> bool:
     def _history_search_messages(self) -> list[dict[str, str]]:
         """Build searchable user-history rows from prompt history and conversation context."""
         from iac_code.agent.message import RECALLED_MEMORY_MARKER, is_recalled_memory_message
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
 
         entries: list[str] = []
         seen: set[str] = set()
@@ -802,7 +810,11 @@ def add_text(text: str) -> None:
         for msg in context_messages:
             if getattr(msg, "role", None) != "user":
                 continue
-            if is_recalled_memory_message(msg) or Renderer.is_internal_skill_context_message(msg):
+            if (
+                is_recalled_memory_message(msg)
+                or is_cleanup_prompt_message(msg)
+                or Renderer.is_internal_skill_context_message(msg)
+            ):
                 continue
             get_text = getattr(msg, "get_text", None)
             if callable(get_text):
@@ -927,6 +939,16 @@ def _is_pipeline_safe_command(self, user_input: str) -> bool:
         first = user_input.split(None, 1)[0] if user_input else ""
         return first in _PIPELINE_SAFE_COMMANDS
 
+    def _pipeline_memory_content_getter(self) -> None:
+        """Return the memory provider used for pipeline prompts, which is always None.
+
+        Pipeline steps are intentionally not given every auto-memory topic body
+        in the system prompt, and they are not given MemoryRecallService, so no
+        side recall is triggered. A step can still reach relevant topic memories
+        through the explicit read_memory tool when its tool policy allows it.
+        """
+        provider = None
+        return provider
+
     def _maybe_block_user_escape(self, user_input: str) -> bool:
         """Return True if the input is a gated escape and we should NOT process it.
 
@@ -1188,7 +1210,13 @@ def _pipeline_display_replay_insert_index(cls, messages: list[Message]) -> int |
 
     @classmethod
     def _pipeline_visible_resume_messages(cls, messages: list[Message]) -> list[Message]:
-        return [message for message in messages if not cls._is_pipeline_handoff_context_message(message)]
+        """Return ``messages`` without pipeline handoff-context and cleanup-prompt entries."""
+        # Imported inside the method rather than at module level.
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
+
+        # Order is preserved; a message is kept only when neither filter matches it.
+        return [
+            message
+            for message in messages
+            if not cls._is_pipeline_handoff_context_message(message) and not is_cleanup_prompt_message(message)
+        ]
 
     @staticmethod
     def _is_pipeline_handoff_context_message(message: Message) -> bool:
@@ -1263,6 +1291,8 @@ def _render_pipeline_display_transcript_window(self, messages: list[Message]) ->
             self.tool_registry,
             status_callback=self._status_text,
             app_state_store=self.store,
+            image_path_resolver=self._image_store.get_path,
+            image_block_path_resolver=self._image_store.store_block,
         )
         temp_renderer.replay_history(messages)
         rendered = stream.getvalue().rstrip()
@@ -1305,12 +1335,17 @@ async def _handle_chat_continue(self) -> list[str]:
             logger.error("_handle_chat_continue called in pipeline mode; this is a bug")
             return []
 
+        if self._block_if_cleanup_ledger_unreadable():
+            return []
+
         self.store.set_state(is_busy=True)
         try:
             streaming_input = StreamingInputBuffer()
-            events = self._agent_loop.run_streaming(
-                "",
-                queued_input_provider=lambda: streaming_input.drain_queued_inputs(self._should_submit_mid_turn),
+            events = self._wrap_cleanup_observer(
+                self._agent_loop.run_streaming(
+                    "",
+                    queued_input_provider=lambda: streaming_input.drain_queued_inputs(self._should_submit_mid_turn),
+                )
             )
             result = await self.renderer.run_streaming_output(
                 events,
@@ -1327,24 +1362,784 @@ async def _handle_chat_continue(self) -> list[str]:
                     self._streaming_error_log.append((err, msg_count))
             return queued_inputs
         finally:
+            self._prune_cleanup_prompts_if_no_pending_cleanup()
             self.store.set_state(is_busy=False)
 
+    def _cleanup_ledger_for_pipeline(self, pipeline: object | None):
+        """Return the ``CleanupLedger`` exposed by ``pipeline``, or None.
+
+        None is returned when there is no pipeline, it has no callable
+        ``cleanup_ledger`` attribute, the call raises (logged as a warning), or
+        the result is not a ``CleanupLedger``.
+        """
+        if pipeline is None:
+            return None
+        from iac_code.pipeline.engine.cleanup import CleanupLedger
+
+        factory = getattr(pipeline, "cleanup_ledger", None)
+        if not callable(factory):
+            return None
+        try:
+            candidate = factory()
+        except Exception:
+            logger.warning("Failed to load pipeline cleanup ledger", exc_info=True)
+            return None
+        if isinstance(candidate, CleanupLedger):
+            return candidate
+        return None
+
+    def _cleanup_ledger_for_normal_chat(self):
+        """Locate the cleanup ledger that applies to a normal chat turn, or return None.
+
+        Lookup order:
+
+        1. A ledger path recorded in an active cleanup prompt.
+        2. The remembered ``_pipeline_cleanup_ledger_path`` attribute. It is used
+           when a cleanup prompt exists anywhere, when the ledger failed to load,
+           or when it still has pending resources. Otherwise the attribute is
+           cleared and None is returned.
+        3. ``<session dir>/pipeline/cleanup.yaml`` under the pipeline working
+           directory and the original cwd. The first ledger with pending
+           resources wins. If none has any but a cleanup prompt exists, the
+           first readable ledger found is returned.
+        """
+        from pathlib import Path
+
+        from iac_code.pipeline.engine.cleanup import CleanupLedger
+
+        # 1. An active cleanup prompt names its ledger directly.
+        prompt_path = self._cleanup_ledger_path_from_active_prompt()
+        if prompt_path is not None:
+            return CleanupLedger(prompt_path)
+
+        # 2. Fall back to the ledger path remembered on this instance, if any.
+        explicit_path = getattr(self, "_pipeline_cleanup_ledger_path", None)
+        if explicit_path:
+            ledger = CleanupLedger(Path(explicit_path))
+            has_active_prompt = self._cleanup_prompt_exists_anywhere()
+            if has_active_prompt:
+                return ledger
+            if not ledger.path.exists():
+                # The file is gone, so forget the remembered path.
+                self._clear_pipeline_cleanup_ledger_path(ledger.path)
+                return None
+            if ledger.load_failed():
+                # An unreadable ledger is still returned so the caller can react to it.
+                return ledger
+            if ledger.pending_resources():
+                return ledger
+            # Readable and nothing pending: the remembered path is no longer needed.
+            self._clear_pipeline_cleanup_ledger_path(ledger.path)
+            return None
+
+        has_active_prompt = self._cleanup_prompt_exists_anywhere()
+
+        # 3. Collect directories whose session storage may hold a ledger file.
+        candidate_cwds: list[str] = []
+        try:
+            from iac_code.pipeline.config import get_working_directory
+
+            pipeline_cwd = get_working_directory()
+            if pipeline_cwd:
+                candidate_cwds.append(pipeline_cwd)
+        except Exception:
+            # Best effort: any failure here just means no pipeline cwd candidate.
+            pass
+        original_cwd = getattr(self, "_original_cwd", None)
+        if original_cwd:
+            candidate_cwds.append(original_cwd)
+
+        session_storage = getattr(self, "_session_storage", None)
+        session_id = getattr(self, "_session_id", None)
+        if session_storage is None or not isinstance(session_id, str) or not session_id:
+            return None
+
+        seen: set[str] = set()
+        completed_prompt_ledger = None
+        for cwd in candidate_cwds:
+            # Skip directories already checked.
+            if cwd in seen:
+                continue
+            seen.add(cwd)
+            try:
+                path = Path(session_storage.session_dir(cwd, session_id)) / "pipeline" / "cleanup.yaml"
+            except Exception:
+                continue
+            if path.exists():
+                ledger = CleanupLedger(path)
+                # In this scan an unreadable ledger is skipped rather than returned.
+                if ledger.load_failed():
+                    continue
+                if ledger.pending_resources():
+                    return ledger
+                # Remember the first fully processed ledger while a cleanup prompt still exists.
+                if has_active_prompt and completed_prompt_ledger is None:
+                    completed_prompt_ledger = ledger
+        return completed_prompt_ledger
+
+    def _cleanup_ledger_for_resume_summary(self):
+        """Return the ledger to summarise on resume, or None when no path is known.
+
+        A path recorded in any cleanup prompt takes precedence over the
+        remembered ``_pipeline_cleanup_ledger_path`` attribute.
+        """
+        from pathlib import Path
+
+        from iac_code.pipeline.engine.cleanup import CleanupLedger
+
+        ledger_path = self._cleanup_ledger_path_from_any_cleanup_prompt()
+        if ledger_path is None:
+            remembered = getattr(self, "_pipeline_cleanup_ledger_path", None)
+            if not remembered:
+                return None
+            ledger_path = Path(remembered)
+        return CleanupLedger(ledger_path)
+
+    def _clear_pipeline_cleanup_ledger_path(self, path=None) -> None:
+        """Forget the remembered cleanup ledger path.
+
+        When ``path`` is given, the attribute is removed only if it refers to
+        the same path. Values that cannot be turned into a ``Path`` leave it
+        untouched. A missing attribute is not an error.
+        """
+        from pathlib import Path
+
+        remembered = getattr(self, "_pipeline_cleanup_ledger_path", None)
+        if remembered is None:
+            return
+        if path is not None:
+            try:
+                same_target = Path(remembered) == Path(path)
+            except TypeError:
+                same_target = False
+            if not same_target:
+                return
+        try:
+            del self._pipeline_cleanup_ledger_path
+        except AttributeError:
+            pass
+
+    def _cleanup_ledger_path_from_active_prompt(self):
+        """Return the ledger path named by the first active cleanup prompt, or None.
+
+        Context messages are examined before session messages. Active prompts
+        that carry no ledger path are skipped.
+        """
+        from pathlib import Path
+
+        from iac_code.pipeline.engine.cleanup import cleanup_prompt_ledger_path, is_active_cleanup_prompt_message
+
+        candidates = [*self._cleanup_prompt_messages_from_context(), *self._cleanup_prompt_messages_from_session()]
+        for message in candidates:
+            if is_active_cleanup_prompt_message(message):
+                recorded = cleanup_prompt_ledger_path(message)
+                if recorded:
+                    return Path(recorded)
+        return None
+
+    def _cleanup_ledger_path_from_any_cleanup_prompt(self):
+        """Return the ledger path named by the first cleanup prompt of any kind, or None.
+
+        Context messages are examined before session messages. Cleanup prompts
+        that carry no ledger path are skipped.
+        """
+        from pathlib import Path
+
+        from iac_code.pipeline.engine.cleanup import cleanup_prompt_ledger_path, is_cleanup_prompt_message
+
+        candidates = [*self._cleanup_prompt_messages_from_context(), *self._cleanup_prompt_messages_from_session()]
+        for message in candidates:
+            if is_cleanup_prompt_message(message):
+                recorded = cleanup_prompt_ledger_path(message)
+                if recorded:
+                    return Path(recorded)
+        return None
+
+    def _wrap_cleanup_observer(self, events, *, ledger=None):
+        """Wrap an event stream so cleanup progress is recorded and announced.
+
+        ``events`` is returned unchanged when no usable ``CleanupLedger`` is
+        available or the ledger failed to load. Otherwise the result is an async
+        generator. Before yielding each event it passes the event to a
+        ``CleanupObserver`` and prints any resource status changes.
+        """
+        from iac_code.pipeline.engine.cleanup import CleanupLedger, CleanupObserver
+
+        active_ledger = ledger or self._cleanup_ledger_for_normal_chat()
+        if not isinstance(active_ledger, CleanupLedger) or active_ledger.load_failed():
+            return events
+
+        async def observed_stream():
+            watcher = CleanupObserver(active_ledger)
+            last_seen = self._cleanup_resource_state_map(active_ledger)
+            async for item in events:
+                watcher.observe(item)
+                last_seen = self._print_cleanup_status_changes(active_ledger, last_seen)
+                yield item
+
+        return observed_stream()
+
+    @staticmethod
+    def _cleanup_resource_state(resource) -> tuple[object, ...]:
+        """Snapshot the attributes of ``resource`` that are used to detect a status change.
+
+        Missing attributes are reported as None.
+        """
+        tracked = (
+            "cleanup_status",
+            "progress_status",
+            "progress_percentage",
+            "cleanup_tool_use_id",
+            "last_error",
+        )
+        return tuple(getattr(resource, name, None) for name in tracked)
+
+    def _cleanup_resource_state_map(self, ledger) -> dict[str, tuple[object, ...]]:
+        """Map each cleanup resource key in ``ledger`` to its current state snapshot.
+
+        Returns an empty dict when the ledger cannot list its resources.
+        """
+        try:
+            listed = ledger.cleanup_resources()
+        except Exception:
+            return {}
+        else:
+            return {entry.key: self._cleanup_resource_state(entry) for entry in listed}
+
+    def _print_cleanup_status_changes(
+        self,
+        ledger,
+        previous: dict[str, tuple[object, ...]],
+    ) -> dict[str, tuple[object, ...]]:
+        """Print a status line for every resource whose state differs from ``previous``.
+
+        Returns the new state map. ``previous`` is returned unchanged when the
+        ledger cannot list its resources. When the renderer has no callable
+        ``print_system_message`` the new map is returned without printing.
+        """
+        try:
+            listed = ledger.cleanup_resources()
+        except Exception:
+            return previous
+        latest = {entry.key: self._cleanup_resource_state(entry) for entry in listed}
+        emit = getattr(getattr(self, "renderer", None), "print_system_message", None)
+        if not callable(emit):
+            return latest
+        for entry in listed:
+            snapshot = latest.get(entry.key)
+            unchanged = snapshot is None or previous.get(entry.key) == snapshot
+            if unchanged:
+                continue
+            text = self._cleanup_resource_status_message(entry)
+            if text:
+                emit(text, style=self._cleanup_status_style(getattr(entry, "cleanup_status", "")))
+        return latest
+
+    @staticmethod
+    def _cleanup_status_style(status: str) -> str:
+        """Pick the display colour for a cleanup status.
+
+        Red for failure, green for completed or skipped, yellow for anything else.
+        """
+        colours = {"failed": "red", "completed": "green", "skipped": "green"}
+        return colours.get(status, "yellow")
+
+    @staticmethod
+    def _cleanup_resource_status_message(resource) -> str:
+        """Format the one-line rollback-cleanup status message for ``resource``.
+
+        The line joins badge and label, resource kind and shortened id, region,
+        a status detail, and (when present) the sanitized last error, separated
+        by " · ". Empty parts are left out.
+        """
+
+        def text_of(name: str, fallback: str = "") -> str:
+            # Read an attribute as text, substituting ``fallback`` for missing or falsy values.
+            return str(getattr(resource, name, "") or fallback)
+
+        status = text_of("cleanup_status", "pending")
+        resource_id = text_of("resource_id")
+        label = text_of("resource_name", resource_id)
+        region = text_of("region_id", "unknown")
+        progress = text_of("progress_status", status)
+        last_error = text_of("last_error")
+
+        headline = _("↺ Rollback cleanup [{badge}] {label}").format(
+            badge=InlineREPL._cleanup_status_badge(status, progress),
+            label=label,
+        )
+        identity = _("{kind} {resource_id}").format(
+            kind=InlineREPL._cleanup_resource_kind_label(resource),
+            resource_id=InlineREPL._short_cleanup_resource_id(resource_id),
+        )
+        parts = [headline, identity, region, InlineREPL._cleanup_status_detail(status, progress)]
+        if last_error:
+            parts.append(_("Error: {error}").format(error=InlineREPL._safe_cleanup_error(last_error)))
+        return " · ".join(filter(None, parts))
+
+    @staticmethod
+    def _cleanup_status_badge(status: str, progress: str) -> str:
+        """Return the short translated badge for a cleanup status.
+
+        Known statuses map directly to a badge. For any other status the badge
+        is derived from ``progress``: "Checking" for a non-DELETE progress value,
+        "Deleting" for an in-flight DELETE value, "Progress" otherwise.
+        """
+        if status == "started":
+            badge = _("Deleting")
+        elif status == "completed":
+            badge = _("Completed")
+        elif status == "failed":
+            badge = _("Failed")
+        elif status == "skipped":
+            badge = _("Skipped")
+        elif status == "pending":
+            badge = _("Pending")
+        elif progress and not progress.startswith("DELETE"):
+            badge = _("Checking")
+        elif progress in {"DELETE_REQUESTED", "DELETE_STARTED", "DELETE_IN_PROGRESS"}:
+            badge = _("Deleting")
+        else:
+            badge = _("Progress")
+        return badge
+
+    @staticmethod
+    def _cleanup_status_detail(status: str, progress: str) -> str:
+        """Return the longer status detail shown after the region in a cleanup message.
+
+        ``status`` is checked first. When it is not one of the known values the
+        text is derived from ``progress``, and as a last resort the raw
+        ``progress`` or ``status`` value is returned.
+        """
+        submitted_states = {"DELETE_REQUESTED", "DELETE_STARTED"}
+        if status == "started":
+            detail = (
+                _("DeleteStack submitted; waiting for deletion to complete ({progress})").format(progress=progress)
+                if progress
+                else _("DeleteStack submitted; waiting for deletion to complete")
+            )
+        elif status == "completed":
+            detail = progress or "completed"
+        elif status == "failed":
+            detail = progress or "failed"
+        elif status == "skipped":
+            detail = _("Skipped")
+        elif progress == "DELETE_IN_PROGRESS":
+            detail = _("Deleting ({progress})").format(progress=progress)
+        elif progress in submitted_states:
+            detail = _("DeleteStack submitted; waiting for deletion to complete ({progress})").format(progress=progress)
+        elif progress and not progress.startswith("DELETE"):
+            detail = _("{progress}; deletion required").format(progress=progress)
+        else:
+            detail = progress or status
+        return detail
+
+    @staticmethod
+    def _cleanup_resource_kind_label(resource) -> str:
+        """Return the translated noun for a resource: "stack" for ROS stacks, else "resource"."""
+        kind = tuple(str(getattr(resource, name, "") or "").lower() for name in ("provider", "resource_type"))
+        if kind == ("ros", "stack"):
+            return _("stack")
+        return _("resource")
+
+    @staticmethod
+    def _short_cleanup_resource_id(resource_id: str) -> str:
+        """Abbreviate IDs longer than 18 characters to their first 8 and last 4 characters."""
+        head, tail = resource_id[:8], resource_id[-4:]
+        return resource_id if len(resource_id) <= 18 else f"{head}…{tail}"
+
+    @staticmethod
+    def _safe_cleanup_error(error: str) -> str:
+        """Sanitize an error for display, truncating it to 1000 characters plus "..."."""
+        from iac_code.utils.public_errors import sanitize_public_text
+        text = sanitize_public_text(error)
+        return text if len(text) <= 1000 else text[:1000] + "..."
+
+    def _remove_cleanup_prompts_from_context(self) -> int:
+        """Call the context manager's prompt remover; return its integer result, or 0 otherwise."""
+        agent_loop = getattr(self, "_agent_loop", None)
+        remover = getattr(getattr(agent_loop, "context_manager", None), "remove_cleanup_prompt_messages", None)
+        removed = 0
+        if callable(remover):
+            try:
+                removed = remover()
+            except Exception:
+                logger.warning("Failed to remove pipeline cleanup prompt from context", exc_info=True)
+        return removed if isinstance(removed, int) else 0
+
+    def _warn_cleanup_ledger_load_failed(self, ledger) -> None:
+        """Log why the cleanup ledger is unusable and tell the user; only the first call acts."""
+        if getattr(self, "_cleanup_ledger_load_failed_warning_printed", False):
+            return
+        self._cleanup_ledger_load_failed_warning_printed = True
+        reason = ""
+        read_reason = getattr(ledger, "load_error", None)
+        if callable(read_reason):
+            try:
+                reason = read_reason() or ""
+            except Exception:
+                reason = ""  # a failing load_error() is treated as "no reason available"
+        # Prefer the ledger's own error text; otherwise log its path when it has one.
+        if reason:
+            logger.warning("Pipeline cleanup ledger is unreadable: %s", reason)
+        elif ledger_path := getattr(ledger, "path", None):
+            logger.warning("Pipeline cleanup ledger is unavailable: %s", ledger_path)
+        self.renderer.print_system_message(
+            _("Could not read rollback cleanup records. The cleanup prompt was kept; retry later or inspect manually."),
+            style="yellow",
+        )
+
+    def _prune_cleanup_prompts_if_no_pending_cleanup(self, ledger=None) -> None:
+        """Remove cleanup prompts once the ledger is readable and reports nothing pending."""
+        cleanup_ledger = ledger or self._cleanup_ledger_for_normal_chat()
+        load_failed = getattr(cleanup_ledger, "load_failed", None)
+        if self._cleanup_ledger_unavailable_with_prompt(cleanup_ledger) or (callable(load_failed) and load_failed()):
+            # The prompt is left in place while the records cannot be read.
+            self._warn_cleanup_ledger_load_failed(cleanup_ledger)
+            return
+        if cleanup_ledger is not None:
+            if cleanup_ledger.pending_resources():
+                return
+            # Nothing pending: mark the prompts completed and clear the recorded ledger path.
+            self._mark_cleanup_prompts_completed(cleanup_ledger)
+            self._clear_pipeline_cleanup_ledger_path(getattr(cleanup_ledger, "path", None))
+        self._remove_cleanup_prompts_from_context()
+
+    def _print_cleanup_resume_summary(self) -> None:
+        """Print a summary of rollback cleanup records, once per ledger path.
+
+        Shows an overall status line followed by at most five of the trailing
+        records that are neither completed nor skipped.
+        """
+        max_detail_lines = 5
+        ledger = self._cleanup_ledger_for_resume_summary()
+        if ledger is None:
+            return
+        load_failed = getattr(ledger, "load_failed", None)
+        if callable(load_failed) and load_failed():
+            return
+        ledger_path = str(getattr(ledger, "path", "") or "")
+        printed_paths = getattr(self, "_cleanup_resume_summary_printed_paths", set())
+        if ledger_path and ledger_path in printed_paths:
+            return
+        try:
+            resume_resources = self._cleanup_resume_resources(ledger)
+        except Exception:
+            # Best-effort: the summary is informational, but leave a trace for debugging.
+            logger.debug("Failed to build rollback cleanup resume summary", exc_info=True)
+            return
+        printer = getattr(getattr(self, "renderer", None), "print_system_message", None)
+        if not resume_resources or not callable(printer):
+            return
+        printer(
+            self._cleanup_resume_summary_message(resume_resources),
+            style=self._cleanup_resume_summary_style(resume_resources),
+        )
+        detail_resources = [r for r in resume_resources if self._cleanup_resume_should_show_detail(r)]
+        for resource in detail_resources[-max_detail_lines:]:
+            printer(
+                self._cleanup_resume_resource_line(resource),
+                style=self._cleanup_status_style(str(getattr(resource, "cleanup_status", "") or "")),
+            )
+        hidden = len(detail_resources) - max_detail_lines
+        if hidden > 0:
+            printer(
+                _("{count} additional resources needing attention were not shown.").format(count=hidden),
+                style="yellow",
+            )
+        if ledger_path:
+            self._cleanup_resume_summary_printed_paths = {*printed_paths, ledger_path}
+
+    @staticmethod
+    def _cleanup_resume_resources(ledger) -> list[Any]:
+        """Merge the ledger's cleanup resources with those rebuilt from its history.
+
+        A history record replaces the ledger record sharing its key; history-only
+        records are appended after the ledger ones, in history order.
+        """
+        ledger_resources = ledger.cleanup_resources()
+        history = InlineREPL._cleanup_resume_history_resources(ledger)
+        if not history:
+            return ledger_resources
+        # Later history records overwrite earlier ones with the same key.
+        latest = {item.key: item for item in history}
+        merged: list[Any] = [latest.get(item.key, item) for item in ledger_resources]
+        ledger_keys = {item.key for item in ledger_resources}
+        # Append history records whose key the ledger list does not contain.
+        merged.extend(item for item in history if item.key not in ledger_keys)
+        return merged
+
+    @staticmethod
+    def _cleanup_resume_summary_message(resources: list[Any]) -> str:
+        """Build the translated headline summarising cleanup records by status."""
+        total = len(resources)
+        counts = InlineREPL._cleanup_resume_status_counts(resources)
+        if total > 0 and counts["completed"] == total:
+            return _("↺ Rollback cleanup resume: all {count} records are completed.").format(count=total)
+        # Buckets are listed in this fixed order; empty buckets are left out.
+        labelled = (
+            ("failed", _("failed")),
+            ("pending", _("pending")),
+            ("active", _("in progress")),
+            ("completed", _("completed")),
+            ("skipped", _("skipped")),
+        )
+        parts = [
+            _("{count} {label}").format(count=counts[key], label=label) for key, label in labelled if counts[key]
+        ]
+        if not parts:
+            return _("↺ Rollback cleanup resume: {count} records.").format(count=total)
+        return _("↺ Rollback cleanup resume: {count} records, {summary}.").format(
+            count=total,
+            summary=", ".join(parts),
+        )
+
+    @staticmethod
+    def _cleanup_resume_status_counts(resources: list[Any]) -> dict[str, int]:
+        """Tally resources into pending/active/completed/failed/skipped buckets.
+
+        "started" and "in_progress" count as active; a missing or unrecognised
+        cleanup_status counts as pending.
+        """
+        counts = dict.fromkeys(("pending", "active", "completed", "failed", "skipped"), 0)
+        for resource in resources:
+            status = str(getattr(resource, "cleanup_status", "") or "pending")
+            if status in {"started", "in_progress"}:
+                bucket = "active"
+            elif status in counts:
+                bucket = status
+            else:
+                bucket = "pending"
+            counts[bucket] += 1
+        return counts
+
+    @staticmethod
+    def _cleanup_resume_summary_style(resources: list[Any]) -> str:
+        """Return "green" when every record is completed or skipped, otherwise "yellow"."""
+        if not resources:
+            return "yellow"
+        statuses = {str(getattr(resource, "cleanup_status", "") or "pending") for resource in resources}
+        # Green only if no status falls outside the finished set.
+        return "green" if statuses <= {"completed", "skipped"} else "yellow"
+
+    @staticmethod
+    def _cleanup_resume_should_show_detail(resource) -> bool:
+        """Return True unless the resource's cleanup_status is "completed" or "skipped"."""
+        return str(getattr(resource, "cleanup_status", "") or "pending") not in ("completed", "skipped")
+
+    @staticmethod
+    def _cleanup_resume_history_resources(ledger) -> list[Any]:
+        """Rebuild the latest CleanupResource per key from the ledger's history entries.
+
+        Returns an empty list when the ledger has no callable ``history_entries``.
+        Resources are ordered by the position of their most recent history entry.
+        """
+        from iac_code.pipeline.constants import (
+            PIPELINE_EVENT_CLEANUP_COMPLETED,
+            PIPELINE_EVENT_CLEANUP_FAILED,
+            PIPELINE_EVENT_CLEANUP_PROGRESS,
+            PIPELINE_EVENT_CLEANUP_STARTED,
+        )
+        from iac_code.pipeline.engine.cleanup import CleanupResource
+
+        read_history = getattr(ledger, "history_entries", None)
+        if not callable(read_history):
+            return []
+        cleanup_event_types = {
+            PIPELINE_EVENT_CLEANUP_STARTED,
+            PIPELINE_EVENT_CLEANUP_PROGRESS,
+            PIPELINE_EVENT_CLEANUP_COMPLETED,
+            PIPELINE_EVENT_CLEANUP_FAILED,
+            "cleanup_skipped",
+            "cleanup_pending",
+        }
+        overlay_fields = ("cleanup_status", "cleanup_tool_use_id", "cleanup_action")
+        overlay_fields += ("progress_status", "progress_percentage", "last_error")
+        latest_by_key = {}
+        for entry in read_history():
+            if str(entry.get("type") or "") not in cleanup_event_types:
+                continue
+            payload = dict(entry.get("resource") or {})
+            if not payload:
+                continue
+            # Entry-level fields override whatever the embedded resource snapshot says.
+            payload.update({name: entry[name] for name in overlay_fields if entry.get(name) is not None})
+            if entry.get("timestamp") is not None:
+                payload["updated_at"] = entry["timestamp"]
+            resource = CleanupResource.from_dict(payload)
+            if resource.resource_id:
+                # Re-insert so dict order follows each key's most recent entry.
+                latest_by_key.pop(resource.key, None)
+                latest_by_key[resource.key] = resource
+        return list(latest_by_key.values())
+
+    @staticmethod
+    def _cleanup_resume_resource_line(resource) -> str:
+        """Format one resource as a " · "-separated status line for the resume summary."""
+        status = str(getattr(resource, "cleanup_status", "") or "pending")
+        resource_id = str(getattr(resource, "resource_id", "") or "")
+        progress = str(getattr(resource, "progress_status", "") or status)
+        failure = str(getattr(resource, "last_error", "") or "")
+        headline = _("  [{badge}] {label}").format(
+            badge=InlineREPL._cleanup_status_badge(status, progress),
+            label=str(getattr(resource, "resource_name", "") or resource_id),
+        )
+        identity = _("{kind} {resource_id}").format(
+            kind=InlineREPL._cleanup_resource_kind_label(resource),
+            resource_id=InlineREPL._short_cleanup_resource_id(resource_id),
+        )
+        region = str(getattr(resource, "region_id", "") or "unknown")
+        segments = [headline, identity, region, InlineREPL._cleanup_status_detail(status, progress)]
+        if failure:
+            # The error text goes through _safe_cleanup_error before it is shown.
+            segments.append(_("Error: {error}").format(error=InlineREPL._safe_cleanup_error(failure)))
+        # Empty segments are dropped so the separator never doubles up.
+        return " · ".join(filter(None, segments))
+
+    async def _maybe_start_normal_chat_cleanup_on_startup(self) -> bool:
+        """In normal run mode, resume pending rollback cleanup; return whether a cleanup turn started."""
+        from iac_code.pipeline.config import RunMode
+
+        if self._get_runtime_mode() != RunMode.NORMAL:
+            return False
+        self._print_cleanup_resume_summary()
+        ledger = self._cleanup_ledger_for_normal_chat()
+        unreadable = self._cleanup_ledger_unavailable_with_prompt(ledger)
+        if unreadable or (ledger is not None and ledger.load_failed()):
+            self._warn_cleanup_ledger_load_failed(ledger)
+            return False
+        if ledger is None:
+            # No ledger and no blocking prompt: drop any cleanup prompt left in the context.
+            self._remove_cleanup_prompts_from_context()
+        elif not ledger.pending_resources():
+            self._prune_cleanup_prompts_if_no_pending_cleanup(ledger)
+        else:
+            return await self._start_pipeline_cleanup_from_ledger(ledger)
+        return False
+
+    async def _maybe_start_pipeline_cleanup(self, pipeline: object | None) -> bool:
+        """Start rollback cleanup for a pipeline's ledger when running in normal mode."""
+        from iac_code.pipeline.config import RunMode
+
+        in_normal_mode = pipeline is not None and self._get_runtime_mode() == RunMode.NORMAL
+        ledger = self._cleanup_ledger_for_pipeline(pipeline) if in_normal_mode else None
+        if ledger is None:
+            return False
+        return await self._start_pipeline_cleanup_from_ledger(ledger)
+
+    async def _start_pipeline_cleanup_from_ledger(self, ledger) -> bool:  # True after the streamed turn finishes
+        from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
+        # Queue the ledger's pending-cleanup prompt, inject it into the context, then stream one agent turn.
+        load_failed = getattr(ledger, "load_failed", None)
+        if callable(load_failed) and load_failed():
+            self._warn_cleanup_ledger_load_failed(ledger)
+            return False
+        cleanup_prompt = ledger.build_pending_prompt()
+        if cleanup_prompt is None:  # the ledger produced no prompt, so no turn is started
+            return False
+        # The ledger path is stored on the REPL before the prompt is recorded as queued.
+        self._pipeline_cleanup_ledger_path = ledger.path
+        ledger.record_prompt_queued(cleanup_prompt, ui_surface="repl")
+        self.renderer.print_system_message("\n" + cleanup_prompt.status_message, style="yellow")
+        session_prompt_exists = self._cleanup_prompt_exists_in_session(cleanup_prompt.prompt)  # gates the append below
+        self._remove_cleanup_prompts_from_context()  # existing prompts are removed before the new one is added
+        message = create_cleanup_prompt_message(
+            cleanup_prompt.prompt,
+            cleanup_ledger_path=ledger.path,
+            cleanup_status="pending",
+        )
+        try:
+            injected = self._agent_loop.context_manager.add_raw_message(message.to_dict())
+            if not session_prompt_exists:  # persist only when the session lacks an identical active prompt
+                self._session_storage.append(
+                    self._original_cwd,
+                    self._session_id,
+                    injected,
+                    git_branch=self.current_git_branch(),
+                )
+        except Exception as exc:  # covers both the context injection and the session append
+            logger.warning("Failed to inject pipeline cleanup prompt: %s", exc)
+            self.renderer.print_system_message(
+                _("Detected rollback cleanup resources, but cleanup prompt injection failed."),
+                style="yellow",
+            )
+            return False
+        # From here on the REPL is marked busy until the finally block below resets it.
+        self.store.set_state(is_busy=True)
+        try:
+            streaming_input = StreamingInputBuffer()
+            events = self._wrap_cleanup_observer(self._agent_loop.continue_streaming(), ledger=ledger)
+            result = await self.renderer.run_streaming_output(
+                events,
+                permission_handler=self.renderer.prompt_permission,
+                streaming_input=streaming_input,
+            )
+            elapsed, queued_inputs, draft_input = self._normalize_streaming_output_result(result)
+            self._streaming_draft_input = draft_input
+            if elapsed >= 1.0:  # turns shorter than one second are not stamped
+                self._agent_loop.stamp_last_turn_elapsed(elapsed)
+            if queued_inputs:  # queued lines are joined ahead of the draft, one per line
+                self._streaming_draft_input = "\n".join([*queued_inputs, draft_input]).strip()
+            if self.renderer._last_streaming_errors:
+                msg_count = len(self._agent_loop.context_manager.get_messages())
+                for err in self.renderer._last_streaming_errors:  # each error is logged with the message count
+                    self._streaming_error_log.append((err, msg_count))
+        finally:  # runs whether the streamed turn returned or raised
+            self._prune_cleanup_prompts_if_no_pending_cleanup(ledger)
+            self.store.set_state(is_busy=False)
+        return True
+
+    def _cleanup_prompt_messages_from_context(self):
+        """Return the agent context's message list, or [] when it is missing or unreadable."""
+        agent_loop = getattr(self, "_agent_loop", None)
+        get_messages = getattr(getattr(agent_loop, "context_manager", None), "get_messages", None)
+        try:
+            messages = get_messages() if callable(get_messages) else []
+        except Exception:
+            # Best-effort lookup: a failing get_messages() yields an empty list.
+            messages = []
+        return messages if isinstance(messages, list) else []
+
+    def _cleanup_prompt_messages_from_session(self):
+        """Return the stored session's message list, or [] when it cannot be loaded."""
+        load = getattr(getattr(self, "_session_storage", None), "load", None)
+        original_cwd = getattr(self, "_original_cwd", None)
+        session_id = getattr(self, "_session_id", None)
+        # A loader and two string identifiers are all required before storage is consulted.
+        if not (callable(load) and isinstance(original_cwd, str) and isinstance(session_id, str)):
+            return []
+        try:
+            messages = load(original_cwd, session_id)
+        except Exception:
+            # Best-effort lookup: a failing load() yields an empty list.
+            return []
+        return messages if isinstance(messages, list) else []
+
+    def _mark_cleanup_prompts_completed(self, ledger) -> None:
+        """Run ``mark_cleanup_prompt_message_completed`` over context and stored-session messages.
+
+        The stored session is saved again only when at least one call returned a truthy value.
+        """
+        from iac_code.pipeline.engine.cleanup import mark_cleanup_prompt_message_completed
+
+        ledger_path = getattr(ledger, "path", None)
+        for message in self._cleanup_prompt_messages_from_context():
+            mark_cleanup_prompt_message_completed(message, cleanup_ledger_path=ledger_path)
+
+        save = getattr(getattr(self, "_session_storage", None), "save", None)
+        if not callable(save):
+            return
+        stored_messages = self._cleanup_prompt_messages_from_session()
+        # A list (not a generator) so every stored message is visited before any() runs.
+        results = [
+            mark_cleanup_prompt_message_completed(message, cleanup_ledger_path=ledger_path)
+            for message in stored_messages
+        ]
+        if not any(results):
+            return
+        original_cwd = getattr(self, "_original_cwd", None)
+        session_id = getattr(self, "_session_id", None)
+        if not isinstance(original_cwd, str) or not isinstance(session_id, str):
+            return
+        try:
+            save(original_cwd, session_id, stored_messages, git_branch=self.current_git_branch())
+        except Exception:
+            logger.warning("Failed to mark pipeline cleanup prompt completed in session", exc_info=True)
+
+    def _cleanup_prompt_exists_in_context(self, prompt: str) -> bool:
+        """Return True if the context has an active cleanup prompt whose content equals ``prompt``."""
+        from iac_code.pipeline.engine.cleanup import is_active_cleanup_prompt_message
+
+        # filter() is lazy, so ``content`` is only read from messages that pass the check.
+        candidates = filter(is_active_cleanup_prompt_message, self._cleanup_prompt_messages_from_context())
+        return any(message.content == prompt for message in candidates)
+
+    def _cleanup_prompt_exists_in_session(self, prompt: str) -> bool:
+        """Return True if the session has an active cleanup prompt whose content equals ``prompt``."""
+        from iac_code.pipeline.engine.cleanup import is_active_cleanup_prompt_message
+
+        # filter() is lazy, so ``content`` is only read from messages that pass the check.
+        candidates = filter(is_active_cleanup_prompt_message, self._cleanup_prompt_messages_from_session())
+        return any(message.content == prompt for message in candidates)
+
+    def _context_has_cleanup_prompt(self) -> bool:
+        """Return True if any message in the agent context is an active cleanup prompt."""
+        from iac_code.pipeline.engine.cleanup import is_active_cleanup_prompt_message
+
+        context_messages = self._cleanup_prompt_messages_from_context()
+        return any(map(is_active_cleanup_prompt_message, context_messages))
+
+    def _session_has_cleanup_prompt(self) -> bool:
+        """Return True if any message in the stored session is an active cleanup prompt."""
+        from iac_code.pipeline.engine.cleanup import is_active_cleanup_prompt_message
+
+        session_messages = self._cleanup_prompt_messages_from_session()
+        return any(map(is_active_cleanup_prompt_message, session_messages))
+
+    def _cleanup_prompt_exists_anywhere(self) -> bool:  # active prompt in the context or the stored session
+        return any(check() for check in (self._context_has_cleanup_prompt, self._session_has_cleanup_prompt))
+
+    def _cleanup_ledger_unavailable_with_prompt(self, ledger) -> bool:
+        """Return True when a cleanup prompt exists but its ledger is missing or unreadable."""
+        if not self._cleanup_prompt_exists_anywhere():
+            return False
+        if ledger is None:
+            return True
+        ledger_file = getattr(ledger, "path", None)
+        try:
+            missing = ledger_file is not None and not ledger_file.exists()
+        except Exception:
+            missing = True  # a path whose existence check raises is treated as missing
+        load_failed = getattr(ledger, "load_failed", None)
+        return missing or bool(callable(load_failed) and load_failed())
+
+    def _block_if_cleanup_ledger_unreadable(self) -> bool:
+        """Warn and return True when a cleanup prompt exists but its ledger cannot be used."""
+        ledger = self._cleanup_ledger_for_normal_chat()
+        if blocked := self._cleanup_ledger_unavailable_with_prompt(ledger):
+            self._warn_cleanup_ledger_load_failed(ledger)
+        return blocked
+
+    async def _run_pending_cleanup_before_normal_turn(self, *, draft_text: str) -> bool:
+        """Run pending rollback cleanup first; return True when the normal turn may proceed.
+
+        Whenever False is returned, ``draft_text`` is stored in ``_streaming_draft_input``.
+        """
+        ledger = self._cleanup_ledger_for_normal_chat()
+        if self._cleanup_ledger_unavailable_with_prompt(ledger):
+            self._warn_cleanup_ledger_load_failed(ledger)
+        elif ledger is None:
+            return True
+        elif ledger.load_failed():
+            if not self._context_has_cleanup_prompt():
+                return True
+            self._warn_cleanup_ledger_load_failed(ledger)
+        elif not ledger.pending_resources():
+            self._mark_cleanup_prompts_completed(ledger)
+            self._remove_cleanup_prompts_from_context()
+            return True
+        elif await self._start_pipeline_cleanup_from_ledger(ledger):
+            if not (ledger.load_failed() or ledger.pending_resources()):
+                return True
+            self._streaming_draft_input = draft_text
+            self.renderer.print_system_message(
+                _("Rollback cleanup is still in progress. Please continue after cleanup completes."),
+                style="yellow",
+            )
+            return False
+        # Blocked without a finished cleanup turn: keep the user's text as the next draft.
+        self._streaming_draft_input = draft_text
+        return False
+
     async def _handle_chat(self, user_input: PromptInputResult | str) -> list[str]:
         """Send the user message to the agent loop and stream output."""
         from iac_code.pipeline.config import RunMode
 
         if self._get_runtime_mode() == RunMode.PIPELINE:
-            # Pipeline mode doesn't accept multimodal input — flatten to text.
-            text = user_input.text if isinstance(user_input, PromptInputResult) else user_input
-            # U-I4: warn user if we're about to drop pasted image content.
-            if isinstance(user_input, PromptInputResult) and user_input.pasted_contents:
-                has_image = any(pc.type == "image" for pc in user_input.pasted_contents.values())
-                if has_image:
-                    self.renderer.print_system_message(
-                        _("Note: images are not supported in pipeline mode and will be ignored."),
-                        style="yellow",
-                    )
-            await self._handle_pipeline_chat(text)
+            await self._handle_pipeline_chat(self._pipeline_user_input_from_repl_input(user_input))
+            return []
+
+        draft_text = user_input.text if isinstance(user_input, PromptInputResult) else user_input
+        if not await self._run_pending_cleanup_before_normal_turn(draft_text=draft_text):
             return []
 
         from iac_code.utils.image.processor import process_user_input
@@ -1367,9 +2162,11 @@ async def _handle_chat(self, user_input: PromptInputResult | str) -> list[str]:
         self.renderer.record_user_turn(record_text)
         try:
             streaming_input = StreamingInputBuffer()
-            events = self._agent_loop.run_streaming(
-                payload,
-                queued_input_provider=lambda: streaming_input.drain_queued_inputs(self._should_submit_mid_turn),
+            events = self._wrap_cleanup_observer(
+                self._agent_loop.run_streaming(
+                    payload,
+                    queued_input_provider=lambda: streaming_input.drain_queued_inputs(self._should_submit_mid_turn),
+                )
             )
             result = await self.renderer.run_streaming_output(
                 events,
@@ -1386,6 +2183,7 @@ async def _handle_chat(self, user_input: PromptInputResult | str) -> list[str]:
                     self._streaming_error_log.append((err, msg_count))
             return queued_inputs
         finally:
+            self._prune_cleanup_prompts_if_no_pending_cleanup()
             self.store.set_state(is_busy=False)
 
     async def _flush_pipeline_telemetry(self) -> None:
@@ -1413,6 +2211,8 @@ def _refresh_pipeline_display_recorder(self) -> None:
             self._pipeline_display_recorder = None
 
     def _record_pipeline_display_event(self, event) -> None:
+        if self._is_pipeline_state_persistence_failure_event(event):
+            self._pipeline_state_persistence_failed = True
         recorder = getattr(self, "_pipeline_display_recorder", None)
         if recorder is None:
             return
@@ -1516,7 +2316,7 @@ async def ensure_pipeline_restored_for_prompt(self) -> bool:
             session_id=self._session_id,
             cwd=pipeline_cwd,
             permission_context_getter=lambda: self.store.get_state().permission_context,
-            memory_content_getter=(lambda: self._memory_manager.get_prompt_content() if self._memory_manager else ""),
+            memory_content_getter=self._pipeline_memory_content_getter(),
             auto_trigger_skills=self.command_registry.get_model_invocable_skills(),
             resume_from_sidecar=True,
         )
@@ -1540,12 +2340,47 @@ async def ensure_pipeline_restored_for_prompt(self) -> bool:
         self._pipeline_waiting_input = restored.status == "waiting_input"
         return True
 
-    async def _handle_pipeline_chat(self, user_input: str) -> None:
+    def _pipeline_user_input_from_repl_input(
+        self, user_input: "PromptInputResult | str | PipelineUserInput | None"
+    ) -> "PipelineUserInput":
+        """Convert REPL input to the pipeline wrapper used by model-facing entry points."""
+        # The parameter annotation is one string: a quoted forward reference cannot be
+        # combined with ``|`` if annotations are evaluated eagerly at definition time.
+        from iac_code.pipeline.engine.user_input import normalize_pipeline_user_input
+        from iac_code.utils.image.processor import process_user_input
+
+        if not isinstance(user_input, PromptInputResult):
+            return normalize_pipeline_user_input(user_input)
+        blocks = process_user_input(user_input.text, pasted_contents=user_input.pasted_contents)
+        # Keep the structured blocks only when an image is present; otherwise send plain text.
+        has_image = any(isinstance(block, ImageBlock) for block in blocks)
+        content: str | list[ContentBlock] = blocks if has_image else user_input.text
+        return normalize_pipeline_user_input(content, display_text=user_input.text)
+
+    async def _read_pipeline_interrupt_input(self) -> "PipelineUserInput":
+        """Prompt for interrupt input and wrap it, preferring ``make_result()`` when it is offered."""
+        raw_input = await self._prompt_input.get_input(prompt="✎ ", transient=True)
+        make_result = getattr(self._prompt_input, "make_result", None)
+        # make_result() is only consulted when the prompt actually returned something.
+        rich_result = make_result() if raw_input is not None and callable(make_result) else None
+        # Fall back to the raw value (possibly None) when no PromptInputResult is available.
+        chosen = rich_result if isinstance(rich_result, PromptInputResult) else raw_input
+        return self._pipeline_user_input_from_repl_input(chosen)
+
+    async def _handle_pipeline_chat(self, user_input: str | "PipelineUserInput") -> None:
         """Drive the pipeline and render output."""
         from iac_code.pipeline import create_pipeline
         from iac_code.pipeline.config import get_pipeline_name, get_working_directory
+        from iac_code.pipeline.engine.user_input import normalize_pipeline_user_input
 
-        self.renderer.record_user_turn(user_input)
+        pipeline_input = normalize_pipeline_user_input(user_input)
+        self.renderer.record_user_turn(pipeline_input.display_text)
+        if self._pipeline is not None and getattr(self, "_pipeline_state_persistence_failed", False):
+            self.renderer.print_system_message(
+                _("Pipeline state persistence failed. The pipeline is paused; do not continue until state is durable."),
+                style="yellow",
+            )
+            return
 
         if self._pipeline is None:
             pipeline_cwd = get_working_directory() or self._original_cwd
@@ -1557,9 +2392,7 @@ async def _handle_pipeline_chat(self, user_input: str) -> None:
                 session_id=self._session_id,
                 cwd=pipeline_cwd,
                 permission_context_getter=lambda: self.store.get_state().permission_context,
-                memory_content_getter=(
-                    lambda: self._memory_manager.get_prompt_content() if self._memory_manager else ""
-                ),
+                memory_content_getter=self._pipeline_memory_content_getter(),
                 auto_trigger_skills=self.command_registry.get_model_invocable_skills(),
             )
             self._refresh_pipeline_display_recorder()
@@ -1580,13 +2413,13 @@ async def _handle_pipeline_chat(self, user_input: str) -> None:
                 if self._pipeline_current_step_is_candidate_selection() is True:
                     resume_waiting_candidate_selection = True
                 else:
-                    event_stream = self._pipeline.resume(user_input)
+                    event_stream = cast(Any, self._pipeline).resume(pipeline_input)
             elif restored and restored.ok and restored.status == "running":
                 self._pipeline_waiting_input = False
-                event_stream = self._pipeline.continue_from_sidecar(user_input=user_input)
+                event_stream = cast(Any, self._pipeline).continue_from_sidecar(user_input=pipeline_input)
             else:
-                self._persist_pipeline_visible_user_turn(user_input)
-                event_stream = self._pipeline.run(user_input)
+                self._persist_pipeline_visible_user_turn(pipeline_input)
+                event_stream = cast(Any, self._pipeline).run(pipeline_input)
         else:
             self._refresh_pipeline_display_recorder()
             self._pipeline_waiting_input = False
@@ -1595,14 +2428,14 @@ async def _handle_pipeline_chat(self, user_input: str) -> None:
             resume_waiting_candidate_selection = False
             event_stream = None
             if restored_status == "running":
-                event_stream = self._pipeline.continue_from_sidecar(user_input=user_input)
+                event_stream = cast(Any, self._pipeline).continue_from_sidecar(user_input=pipeline_input)
             elif restored_status == "waiting_input":
                 if self._pipeline_current_step_is_candidate_selection() is True:
                     resume_waiting_candidate_selection = True
                 else:
-                    event_stream = self._pipeline.resume(user_input)
+                    event_stream = cast(Any, self._pipeline).resume(pipeline_input)
             else:
-                event_stream = self._pipeline.resume(user_input)
+                event_stream = cast(Any, self._pipeline).resume(pipeline_input)
 
         # No except for CancelledError/KeyboardInterrupt here: Ctrl+C must
         # propagate to the run() loop's single handler (which keeps the REPL
@@ -1625,6 +2458,7 @@ async def _handle_pipeline_chat(self, user_input: str) -> None:
             self._finalize_pipeline_after_render(terminal_event)
             if pipeline_for_flush is not None:
                 await self._flush_pipeline_telemetry()
+                await self._maybe_start_pipeline_cleanup(pipeline_for_flush)
 
     def _pipeline_current_step_is_candidate_selection(self) -> bool:
         pipeline = getattr(self, "_pipeline", None)
@@ -1658,7 +2492,11 @@ async def _resume_pipeline_sidecar_on_startup(self) -> bool:
                 self._pipeline_waiting_input = True
         finally:
             self.store.set_state(is_busy=False)
+            pipeline_for_flush = self._pipeline
             self._finalize_pipeline_after_render(terminal_event)
+            if pipeline_for_flush is not None:
+                await self._flush_pipeline_telemetry()
+                await self._maybe_start_pipeline_cleanup(pipeline_for_flush)
         return True
 
     def _render_pipeline_display_replay_on_startup(self) -> None:
@@ -1810,11 +2648,28 @@ def _clear_pipeline_runtime_state(self) -> None:
         self._pipeline_restored_status = None
         self._pipeline_display_recorder = None
         self._pipeline_display_current_step_id = None
+        self._pipeline_state_persistence_failed = False
+        self._pipeline_state_persistence_warning_rendered = False
 
     def _finalize_pipeline_after_render(self, terminal_event: PipelineEvent | None) -> None:
         # Keep terminal sidecars on disk for debugging. Terminal metadata
         # controls whether they are resumable.
+        if getattr(self, "_pipeline_state_persistence_failed", False):
+            if self._pipeline is not None:
+                pause_agent_loops = getattr(self._pipeline, "pause_agent_loops", None)
+                if callable(pause_agent_loops):
+                    pause_agent_loops()
+            self._pipeline_waiting_input = False
+            self._warn_pipeline_state_persistence_failed_once()
+            return
         handoff_result = self._handoff_pipeline_to_normal(terminal_event)
+        if handoff_result == "persistence_failed":
+            if self._pipeline is not None:
+                pause_agent_loops = getattr(self._pipeline, "pause_agent_loops", None)
+                if callable(pause_agent_loops):
+                    pause_agent_loops()
+            self._pipeline_waiting_input = False
+            return
         if handoff_result in {"succeeded", "failed"}:
             self._clear_pipeline_runtime_state()
         elif self._pipeline is not None and self._pipeline.sidecar_status == "failed":
@@ -1822,7 +2677,13 @@ def _finalize_pipeline_after_render(self, terminal_event: PipelineEvent | None)
         elif self._pipeline is not None and self._pipeline.state_machine.is_complete:
             self._clear_pipeline_runtime_state()
         elif self._pipeline is not None and not self._pipeline_waiting_input:
-            self._pipeline.mark_user_aborted("pipeline interrupted by user or renderer cancellation")
+            from iac_code.pipeline.engine.pipeline_runner import PipelineStatePersistenceError
+
+            try:
+                self._pipeline.mark_user_aborted("pipeline interrupted by user or renderer cancellation")
+            except PipelineStatePersistenceError as exc:
+                self._handle_pipeline_state_persistence_failure(exc)
+                return
             self._switch_user_aborted_pipeline_to_normal()
             self._clear_pipeline_runtime_state()
 
@@ -1838,7 +2699,17 @@ def _handoff_pipeline_to_normal(self, terminal_event: PipelineEvent | None) -> P
         if not pipeline.should_switch_to_normal(terminal_event.data):
             return "not_applicable"
 
-        self._set_runtime_mode(RunMode.NORMAL)
+        try:
+            pipeline.mark_normal_handoff(status="pending", failed_reason=None)
+        except Exception as exc:
+            self._pipeline_state_persistence_failed = True
+            logger.opt(exception=True).warning("Pipeline handoff metadata persistence failed: {}", exc)
+            self.renderer.print_system_message(
+                _("Pipeline state persistence failed. Normal chat handoff was not marked durable."),
+                style="yellow",
+            )
+            return "persistence_failed"
+
         try:
             summary = pipeline.build_normal_handoff_summary(terminal_event.data)
             injected = self._agent_loop.context_manager.add_raw_message({"role": "user", "content": summary})
@@ -1852,22 +2723,65 @@ def _handoff_pipeline_to_normal(self, terminal_event: PipelineEvent | None) -> P
                 git_branch=self.current_git_branch(),
             )
         except Exception as exc:
-            pipeline.mark_normal_handoff(status="failed", failed_reason=str(exc))
+            try:
+                pipeline.mark_normal_handoff(status="failed", failed_reason=str(exc))
+            except Exception as persistence_exc:
+                self._pipeline_state_persistence_failed = True
+                logger.opt(exception=True).warning(
+                    "Pipeline handoff failure metadata persistence failed: {}",
+                    persistence_exc,
+                )
+                self.renderer.print_system_message(
+                    _("Pipeline state persistence failed. Normal chat handoff was not marked durable."),
+                    style="yellow",
+                )
+                return "persistence_failed"
             logger.opt(exception=True).warning("Pipeline-to-normal handoff injection failed: {}", exc)
             self.renderer.print_system_message(
-                _("Pipeline completed. Normal chat is active, but the handoff context could not be injected or saved."),
+                _("Pipeline completed, but the handoff context could not be injected or saved."),
                 style="yellow",
             )
+            self._set_runtime_mode(RunMode.NORMAL)
             return "failed"
-        else:
+        try:
             pipeline.mark_normal_handoff(status="succeeded", failed_reason=None)
+        except Exception as exc:
+            self._pipeline_state_persistence_failed = True
+            logger.opt(exception=True).warning("Pipeline handoff metadata persistence failed: {}", exc)
             self.renderer.print_system_message(
-                _("Pipeline completed. Normal chat is now active."),
-                style="green",
+                _("Pipeline state persistence failed. Normal chat handoff was not marked durable."),
+                style="yellow",
             )
+            return "persistence_failed"
+        self._set_runtime_mode(RunMode.NORMAL)
+        self.renderer.print_system_message(
+            _("Pipeline completed. Normal chat is now active."),
+            style="green",
+        )
         return "succeeded"
 
-    async def _handle_mid_pipeline_message(self, msg: str, suppress_render: bool = False) -> tuple[bool, str]:
+    def _handle_pipeline_state_persistence_failure(self, exc: Exception) -> None:
+        logger.opt(exception=True).warning("Pipeline state persistence failed during interrupt handling: {}", exc)
+        self._pipeline_state_persistence_failed = True  # checked by _finalize_pipeline_after_render
+        self._last_interrupt_paused = True  # interrupt handlers skip resume_agent_loops() while this is set
+        self._pipeline_waiting_input = False
+        pause_agent_loops = getattr(self._pipeline, "pause_agent_loops", None)  # None when pipeline/method is absent
+        if callable(pause_agent_loops):
+            pause_agent_loops()
+        self._warn_pipeline_state_persistence_failed_once()  # no-op if the warning was already rendered
+
+    def _warn_pipeline_state_persistence_failed_once(self) -> None:
+        if getattr(self, "_pipeline_state_persistence_warning_rendered", False):  # default covers an unset flag
+            return  # warning already rendered
+        self._pipeline_state_persistence_warning_rendered = True  # latch before printing
+        self.renderer.print_system_message(
+            _("Pipeline state persistence failed. The pipeline is paused; do not continue until state is durable."),
+            style="yellow",
+        )
+
+    async def _handle_mid_pipeline_message(
+        self, msg: PromptInputResult | str | "PipelineUserInput", suppress_render: bool = False
+    ) -> tuple[bool, str]:
         """Process a user message received during pipeline execution via judge.
 
         Returns (needs_restart, feedback_text). When suppress_render is True,
@@ -1876,6 +2790,12 @@ async def _handle_mid_pipeline_message(self, msg: str, suppress_render: bool = F
         """
         if self._pipeline is None:
             return False, ""
+        from iac_code.pipeline.engine.pipeline_runner import PipelineStatePersistenceError
+
+        pipeline_input = self._pipeline_user_input_from_repl_input(msg)
+        if pipeline_input.is_empty:
+            return False, ""
+        display_text = pipeline_input.display_text
 
         from rich.spinner import Spinner
 
@@ -1885,15 +2805,19 @@ async def _handle_mid_pipeline_message(self, msg: str, suppress_render: bool = F
             refresh_per_second=10,
             transient=True,
         ):
-            verdict = await self._pipeline.handle_user_interrupt(msg)
+            verdict = await cast(Any, self._pipeline).handle_user_interrupt(pipeline_input)
 
         self._last_interrupt_paused = bool(getattr(verdict, "paused", False))
         if verdict.action == "continue":
-            feedback = self._format_interrupt_feedback("continue", msg, verdict)
+            feedback = self._format_interrupt_feedback("continue", display_text, verdict)
             if getattr(verdict, "paused", False):
                 save_interrupt_pause = getattr(self._pipeline, "save_interrupt_pause", None)
                 if callable(save_interrupt_pause):
-                    await save_interrupt_pause(verdict)
+                    try:
+                        await save_interrupt_pause(verdict)
+                    except PipelineStatePersistenceError as exc:
+                        self._handle_pipeline_state_persistence_failure(exc)
+                        return False, ""
                 self._pipeline_waiting_input = True
             # P-I18: surface ambiguous continue verdicts so users see their input wasn't understood
             if verdict.reason and verdict.reason.startswith("[ambiguous]"):
@@ -1905,27 +2829,34 @@ async def _handle_mid_pipeline_message(self, msg: str, suppress_render: bool = F
                     style="yellow",
                 )
             if not suppress_render:
-                self._render_interrupt_feedback("continue", msg, verdict)
+                self._render_interrupt_feedback("continue", display_text, verdict)
             return False, feedback
         if verdict.action == "supplement":
-            feedback = self._format_interrupt_feedback("supplement", msg, verdict)
+            feedback = self._format_interrupt_feedback("supplement", display_text, verdict)
             if not suppress_render:
-                self._render_interrupt_feedback("supplement", msg, verdict)
+                self._render_interrupt_feedback("supplement", display_text, verdict)
             return False, feedback
         if verdict.action == "hard_interrupt":
-            is_parent_rollback = self._pipeline.apply_hard_interrupt(verdict)
+            try:
+                if pipeline_input.has_images:
+                    is_parent_rollback = self._pipeline.apply_hard_interrupt(verdict, source_input=pipeline_input)
+                else:
+                    is_parent_rollback = self._pipeline.apply_hard_interrupt(verdict)
+            except PipelineStatePersistenceError as exc:
+                self._handle_pipeline_state_persistence_failure(exc)
+                return False, ""
             applied_verdict = getattr(self._pipeline, "last_applied_interrupt_verdict", None)
             feedback_verdict = (
                 applied_verdict if getattr(applied_verdict, "action", None) == "hard_interrupt" else verdict
             )
             if not is_parent_rollback:
-                feedback = self._format_interrupt_feedback("hard_interrupt_candidate", msg, feedback_verdict)
+                feedback = self._format_interrupt_feedback("hard_interrupt_candidate", display_text, feedback_verdict)
                 if not suppress_render:
-                    self._render_interrupt_feedback("hard_interrupt_candidate", msg, feedback_verdict)
+                    self._render_interrupt_feedback("hard_interrupt_candidate", display_text, feedback_verdict)
                 return False, feedback
-            feedback = self._format_interrupt_feedback("hard_interrupt_parent", msg, feedback_verdict)
+            feedback = self._format_interrupt_feedback("hard_interrupt_parent", display_text, feedback_verdict)
             if not suppress_render:
-                self._render_interrupt_feedback("hard_interrupt_parent", msg, feedback_verdict)
+                self._render_interrupt_feedback("hard_interrupt_parent", display_text, feedback_verdict)
             return True, feedback
         return False, ""
 
@@ -2146,10 +3077,10 @@ async def _stop_renderer() -> bool:
                             self._pipeline.pause_agent_loops()
                         try:
                             had_renderer = await _stop_renderer()
-                            user_input = await self._prompt_input.get_input(prompt="✎ ", transient=True)
-                            if user_input and user_input.strip():
+                            user_input = await self._read_pipeline_interrupt_input()
+                            if not user_input.is_empty:
                                 needs_restart, feedback = await self._handle_mid_pipeline_message(
-                                    user_input.strip(), suppress_render=True
+                                    user_input, suppress_render=True
                                 )
                                 if needs_restart and self._pipeline:
                                     event_stream = await self._restart_pipeline_stream_after_interrupt(
@@ -2223,6 +3154,10 @@ async def _stop_renderer() -> bool:
                                 and selection_result.type == PipelineEventType.PIPELINE_COMPLETED
                             ):
                                 return selection_result
+                            if isinstance(
+                                selection_result, PipelineEvent
+                            ) and self._is_pipeline_state_persistence_failure_event(selection_result):
+                                return selection_result
                             if self._pipeline_waiting_input:
                                 return None
                             if selection_result is True and self._pipeline:
@@ -2251,6 +3186,10 @@ async def _stop_renderer() -> bool:
                                 and tabs_interrupted.type == PipelineEventType.PIPELINE_COMPLETED
                             ):
                                 return tabs_interrupted
+                            if isinstance(
+                                tabs_interrupted, PipelineEvent
+                            ) and self._is_pipeline_state_persistence_failure_event(tabs_interrupted):
+                                return tabs_interrupted
                             if self._pipeline_waiting_input:
                                 return None
                             if tabs_interrupted is True and self._pipeline:
@@ -2408,9 +3347,6 @@ def _live_update(content):
 
         stop_keys = asyncio.Event()
         interrupt_requested = asyncio.Event()
-        input_mode = False
-        input_chars: list[str] = []
-        input_done = asyncio.Event()
         parent_task = asyncio.current_task()
 
         def _request_pipeline_cancel() -> None:
@@ -2420,7 +3356,6 @@ def _request_pipeline_cancel() -> None:
                 parent_task.cancel()
 
         async def key_reader():
-            nonlocal input_mode
             loop = asyncio.get_running_loop()
             try:
                 with RawInputCapture(use_cbreak=True) as cap:
@@ -2433,26 +3368,6 @@ async def key_reader():
                             _request_pipeline_cancel()
                             return
 
-                        if input_mode:
-                            if key_event.key == "enter":
-                                input_done.set()
-                                return
-                            if key_event.key == "escape":
-                                input_chars.clear()
-                                input_done.set()
-                                return
-                            if key_event.key == "backspace":
-                                if input_chars:
-                                    input_chars.pop()
-                            elif key_event.key == "paste":
-                                if key_event.char:
-                                    input_chars.extend(key_event.char)
-                            elif key_event.char and key_event.char.isprintable():
-                                input_chars.append(key_event.char)
-                            tabs.set_status_message(f"✎ {''.join(input_chars)}█")
-                            _live_update(tabs.render())
-                            continue
-
                         if key_event.key == "escape":
                             interrupt_requested.set()
                             if self._pipeline:
@@ -2471,26 +3386,24 @@ async def key_reader():
                 pass
 
         async def _handle_esc_interrupt() -> bool:
-            """Handle ESC interrupt inline (no live.stop). Returns True if pipeline restarted."""
-            nonlocal input_mode, interrupt_feedback
+            """Handle ESC interrupt prompt. Returns True if pipeline restarted."""
+            nonlocal interrupt_feedback
             if self._pipeline:
                 self._last_interrupt_paused = False
                 self._pipeline.pause_agent_loops()
+            live_stopped = False
             try:
-                input_mode = True
-                input_chars.clear()
-                input_done.clear()
-                tabs.set_status_message("✎ █")
+                await _cancel_key_task()
+                tabs.set_status_message("✎")
                 _live_update(tabs.render())
 
-                nonlocal key_task
-                key_task = asyncio.create_task(key_reader())
-                await input_done.wait()
-
-                user_input = "".join(input_chars).strip()
-                input_mode = False
+                live.stop()
+                live_stopped = True
+                user_input = await self._read_pipeline_interrupt_input()
+                live.start()
+                live_stopped = False
 
-                if user_input:
+                if not user_input.is_empty:
                     tabs.set_status_message(_("Judging your input..."))
                     _live_update(tabs.render())
                     needs_restart, feedback = await self._handle_mid_pipeline_message(user_input, suppress_render=True)
@@ -2504,6 +3417,8 @@ async def _handle_esc_interrupt() -> bool:
                 else:
                     tabs.set_status_message("")
             finally:
+                if live_stopped:
+                    live.start()
                 if self._pipeline and not getattr(self, "_last_interrupt_paused", False):
                     self._pipeline.resume_agent_loops()
             interrupt_requested.clear()
@@ -2595,7 +3510,10 @@ async def _stop_key_reader() -> None:
                         PipelineEventType.PIPELINE_COMPLETED,
                         PipelineEventType.ROLLBACK_TRIGGERED,
                     ):
-                        if event.type == PipelineEventType.PIPELINE_COMPLETED:
+                        if (
+                            event.type == PipelineEventType.PIPELINE_COMPLETED
+                            or self._is_pipeline_state_persistence_failure_event(event)
+                        ):
                             terminal_event = event
                         break
 
@@ -2675,6 +3593,7 @@ async def _stop_key_reader() -> None:
             return terminal_event
 
         if selected and self._pipeline is not None:
+            self._pipeline_waiting_input = False
             selected_name = selected.selected_candidate_name
             selected_label = selected.display_label or selected_name
             self._record_pipeline_display_candidate_selected(
@@ -2745,9 +3664,6 @@ async def _render_parallel_tabs(self, event_stream, progress_bar_fn=None) -> boo
 
         stop_keys = asyncio.Event()
         interrupt_requested = asyncio.Event()
-        input_mode = False
-        input_chars: list[str] = []
-        input_done = asyncio.Event()
         parent_task = asyncio.current_task()
 
         def _request_pipeline_cancel() -> None:
@@ -2757,7 +3673,6 @@ def _request_pipeline_cancel() -> None:
                 parent_task.cancel()
 
         async def key_reader():
-            nonlocal input_mode
             loop = asyncio.get_running_loop()
             try:
                 with RawInputCapture(use_cbreak=True) as cap:
@@ -2770,27 +3685,6 @@ async def key_reader():
                             _request_pipeline_cancel()
                             return
 
-                        if input_mode:
-                            if key_event.key == "enter":
-                                input_done.set()
-                                return
-                            if key_event.key == "escape":
-                                input_chars.clear()
-                                input_done.set()
-                                return
-                            if key_event.key == "backspace":
-                                if input_chars:
-                                    input_chars.pop()
-                            elif key_event.key == "paste":
-                                if key_event.char:
-                                    input_chars.extend(key_event.char)
-                            elif key_event.char and key_event.char.isprintable():
-                                input_chars.append(key_event.char)
-                            if tabs_renderer:
-                                tabs_renderer.set_input_line("".join(input_chars))
-                            _update_live()
-                            continue
-
                         if key_event.key == "escape":
                             interrupt_requested.set()
                             if self._pipeline:
@@ -2847,7 +3741,7 @@ def _update_live():
         key_task: asyncio.Task | None = None
 
         async def _prompt_child_permission(sub_id: str, inner: PermissionRequestEvent) -> None:
-            nonlocal input_mode, key_task, live
+            nonlocal key_task, live
             response_future = inner.response_future
             if response_future is None or response_future.done():
                 return
@@ -2855,9 +3749,6 @@ async def _prompt_child_permission(sub_id: str, inner: PermissionRequestEvent) -
             allowed = False
             try:
                 await _stop_key_reader()
-                input_mode = False
-                input_chars.clear()
-                input_done.clear()
                 if tabs_renderer:
                     tabs_renderer.set_input_line(None)
                 live.stop()
@@ -2887,22 +3778,22 @@ async def _prompt_child_permission(sub_id: str, inner: PermissionRequestEvent) -
                     if self._pipeline:
                         self._last_interrupt_paused = False
                         self._pipeline.pause_agent_loops()
+                    live_stopped = False
                     try:
-                        input_mode = True
-                        input_chars.clear()
-                        input_done.clear()
+                        await _cancel_key_task()
                         if tabs_renderer:
-                            tabs_renderer.set_input_line("")
+                            tabs_renderer.set_input_line("✎")
                         _update_live()
-                        key_task = asyncio.create_task(key_reader())
-                        await input_done.wait()
 
-                        user_input = "".join(input_chars).strip()
-                        input_mode = False
+                        live.stop()
+                        live_stopped = True
+                        user_input = await self._read_pipeline_interrupt_input()
+                        live.start()
+                        live_stopped = False
                         if tabs_renderer:
                             tabs_renderer.set_input_line(None)
 
-                        if user_input:
+                        if not user_input.is_empty:
                             if tabs_renderer:
                                 tabs_renderer.set_input_line(_("Judging your input..."))
                             _update_live()
@@ -2929,6 +3820,8 @@ async def _prompt_child_permission(sub_id: str, inner: PermissionRequestEvent) -
                                 for acc in accumulators.values():
                                     acc.text_buffer += "\n" + feedback + "\n"
                     finally:
+                        if live_stopped:
+                            live.start()
                         if self._pipeline and not getattr(self, "_last_interrupt_paused", False):
                             self._pipeline.resume_agent_loops()
                     interrupt_requested.clear()
@@ -2995,7 +3888,10 @@ async def _prompt_child_permission(sub_id: str, inner: PermissionRequestEvent) -
                         PipelineEventType.PIPELINE_COMPLETED,
                         PipelineEventType.STEP_FAILED,
                     ):
-                        if event.type == PipelineEventType.PIPELINE_COMPLETED:
+                        if (
+                            event.type == PipelineEventType.PIPELINE_COMPLETED
+                            or self._is_pipeline_state_persistence_failure_event(event)
+                        ):
                             terminal_event = event
                         break
 
@@ -3072,11 +3968,25 @@ def _update_pipeline_state_from_event(self, event):
         """
         from iac_code.pipeline.engine.events import PipelineEventType
 
+        if self._is_pipeline_state_persistence_failure_event(event):
+            self._pipeline_state_persistence_failed = True
         if event.type == PipelineEventType.PIPELINE_STARTED:
             self._pipeline_step_names = event.data.get("step_names", [])
             self._pipeline_start_time = time.time()
             self._pipeline_completed_indices = set()
 
+    @staticmethod
+    def _is_pipeline_state_persistence_failure_event(event) -> bool:
+        from iac_code.pipeline.engine.events import PipelineEventType
+
+        if getattr(event, "type", None) != PipelineEventType.STEP_FAILED:  # also rejects objects without .type
+            return False
+        data = getattr(event, "data", {})  # a missing .data is treated as empty
+        if not isinstance(data, dict):
+            return False
+        error_details = data.get("error_details", {})  # its "type" entry is compared to the error name below
+        return isinstance(error_details, dict) and error_details.get("type") == "PipelineStatePersistenceError"
+
     def _render_pipeline_event(self, event):
         from rich.panel import Panel
 
@@ -3105,6 +4015,10 @@ def _render_pipeline_event(self, event):
                 err = event.data.get("error", "")
                 step_id = event.step_id or ""
                 con.print(f"  [red]✗ {display_step_name(step_id)}[/] [dim]── {err}[/]")
+            case PipelineEventType.PIPELINE_WARNING:
+                reason = str(event.data.get("reason") or "warning")
+                message = str(event.data.get("message") or _("Pipeline warning: {reason}").format(reason=reason))
+                con.print(f"  [yellow]⚠[/] [yellow]{message}[/]")
             case PipelineEventType.USER_INPUT_REQUIRED:
                 options = event.data.get("options", [])
                 prompt_text = event.data.get("prompt", "")
@@ -3454,12 +4368,16 @@ def _terminal_pipeline_status(self, pipeline_cwd: str, session_id: str) -> str |
             logger.warning("Failed to inspect terminal pipeline sidecar: {}", exc)
             return None
 
-    def _persist_pipeline_visible_user_turn(self, user_input: str) -> None:
+    def _persist_pipeline_visible_user_turn(self, user_input: str | "PipelineUserInput") -> None:
         """Persist the user-visible pipeline prompt into the root session."""
-        if not isinstance(user_input, str) or not user_input.strip():
+        from iac_code.pipeline.engine.user_input import normalize_pipeline_user_input
+
+        pipeline_input = normalize_pipeline_user_input(user_input)
+        if pipeline_input.is_empty:
             return
+        visible_input = pipeline_input.content if pipeline_input.has_images else pipeline_input.display_text
         try:
-            injected = self._agent_loop.context_manager.add_raw_message({"role": "user", "content": user_input})
+            injected = self._agent_loop.context_manager.add_raw_message({"role": "user", "content": visible_input})
             self._session_storage.append(
                 self._original_cwd,
                 self._session_id,
@@ -3698,12 +4616,13 @@ def _status_region() -> str:
     @staticmethod
     def _count_user_turns(messages: list) -> int:
         from iac_code.agent.message import ToolResultBlock, is_recalled_memory_message
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
 
         turns = 0
         for message in messages:
             if getattr(message, "role", None) != "user":
                 continue
-            if is_recalled_memory_message(message):
+            if is_recalled_memory_message(message) or is_cleanup_prompt_message(message):
                 continue
             content = getattr(message, "content", "")
             if isinstance(content, list) and any(isinstance(block, ToolResultBlock) for block in content):
@@ -3729,6 +4648,7 @@ def swap_session(self, new_session_id: str) -> None:
         new_messages = self._with_terminal_pipeline_abort_notice(new_messages, pipeline_cwd, new_session_id)
         self._agent_loop.replace_session(new_session_id, new_messages or None)
         self._session_id = new_session_id
+        self._clear_pipeline_cleanup_ledger_path()
         self._was_resumed = True
         self._session_name = self._load_current_session_name()
 
@@ -3752,6 +4672,8 @@ def swap_session(self, new_session_id: str) -> None:
                 session_name=self._session_name,
             )
         )
+        self._print_cleanup_resume_summary()
+        self._prune_cleanup_prompts_if_no_pending_cleanup()
         if new_messages:
             self._replay_resume_messages(new_messages)
             self.console.print()
@@ -3812,9 +4734,7 @@ async def swap_session_async(self, new_session_id: str) -> None:
                 session_id=new_session_id,
                 cwd=pipeline_cwd,
                 permission_context_getter=lambda: self.store.get_state().permission_context,
-                memory_content_getter=(
-                    lambda: self._memory_manager.get_prompt_content() if self._memory_manager else ""
-                ),
+                memory_content_getter=self._pipeline_memory_content_getter(),
                 auto_trigger_skills=self.command_registry.get_model_invocable_skills(),
                 resume_from_sidecar=True,
             )
@@ -3850,7 +4770,23 @@ async def _confirm_pipeline_resume(self, meta_path) -> str:
         from iac_code.pipeline.display_names import display_step_name
         from iac_code.ui.components.select import InputOption, Select, SelectLayout, TextOption
 
-        meta = _yaml.safe_load(meta_path.read_text(encoding="utf-8")) or {}
+        try:
+            loaded = _yaml.safe_load(meta_path.read_text(encoding="utf-8"))
+        except (FileNotFoundError, OSError, UnicodeDecodeError, _yaml.YAMLError) as exc:
+            self.renderer.print_system_message(
+                _("Could not read pipeline state metadata: {reason}").format(reason=str(exc) or type(exc).__name__),
+                style="yellow",
+            )
+            return "discard"
+        if loaded is None:
+            loaded = {}
+        if not isinstance(loaded, dict):
+            self.renderer.print_system_message(
+                _("Pipeline state metadata is invalid; continuing as normal chat."),
+                style="yellow",
+            )
+            return "discard"
+        meta = loaded
         current_step = display_step_name(str(meta.get("current_step", "?")))
 
         title = _("Found pipeline state in this session (paused at: {step}).").format(step=current_step)
@@ -3945,11 +4881,12 @@ def _write_last_prompt_meta(self) -> None:
     def _extract_last_user_text(messages: list) -> str:
         """Walk messages from newest to oldest, return first plain user text."""
         from iac_code.agent.message import RECALLED_MEMORY_MARKER, TextBlock, is_recalled_memory_message
+        from iac_code.pipeline.engine.cleanup import is_cleanup_prompt_message
 
         for msg in reversed(messages):
             if msg.role != "user":
                 continue
-            if is_recalled_memory_message(msg):
+            if is_recalled_memory_message(msg) or is_cleanup_prompt_message(msg):
                 continue
             content = msg.content
             if isinstance(content, str):
diff --git a/src/iac_code/utils/file_security.py b/src/iac_code/utils/file_security.py
index db4bb7aa..625cf982 100644
--- a/src/iac_code/utils/file_security.py
+++ b/src/iac_code/utils/file_security.py
@@ -6,40 +6,24 @@
 import subprocess
 import sys
 import tempfile
-import time
 from pathlib import Path
 
+from iac_code.utils.state_io import atomic_write_text as durable_atomic_write_text
+from iac_code.utils.state_io import safe_replace as durable_safe_replace
+
 _IS_WINDOWS = sys.platform == "win32"
+# Kept as a module attribute for callers that patch atomic_write_text internals.
+_TEMPFILE_FOR_COMPAT = tempfile
 
 
-def safe_replace(src: str, dst: str) -> None:
+def safe_replace(src: str | Path, dst: str | Path) -> None:
     """os.replace with retry for Windows file locking."""
-    for attempt in range(3):
-        try:
-            os.replace(src, dst)
-            return
-        except PermissionError:
-            if attempt == 2:
-                raise
-            time.sleep(0.1 * (attempt + 1))
+    durable_safe_replace(src, dst)
 
 
 def atomic_write_text(path: Path, content: str, *, encoding: str = "utf-8") -> None:
     """Atomically replace *path* with text content."""
-    fd, temp_name = tempfile.mkstemp(prefix=f".{path.name}.", suffix=".tmp", dir=path.parent)
-    temp_path = Path(temp_name)
-    try:
-        with os.fdopen(fd, "w", encoding=encoding) as file:
-            file.write(content)
-            file.flush()
-            os.fsync(file.fileno())
-        safe_replace(str(temp_path), str(path))
-    except Exception:
-        try:
-            temp_path.unlink()
-        except FileNotFoundError:
-            pass
-        raise
+    durable_atomic_write_text(path, content, encoding=encoding, durable=True, _safe_replace=safe_replace)
 
 
 def restrict_file_permissions(path: Path, *, directory: bool) -> None:
diff --git a/src/iac_code/utils/image/processor.py b/src/iac_code/utils/image/processor.py
index fa26ac63..5a9267cc 100644
--- a/src/iac_code/utils/image/processor.py
+++ b/src/iac_code/utils/image/processor.py
@@ -31,6 +31,7 @@ def process_user_input(
             ImageBlock(
                 media_type=pc.media_type or "image/png",
                 data=pc.content,
+                ref_id=pc.id,
             )
         )
         cursor = ref.end
diff --git a/src/iac_code/utils/image/store.py b/src/iac_code/utils/image/store.py
index 75e06372..c9fe89da 100644
--- a/src/iac_code/utils/image/store.py
+++ b/src/iac_code/utils/image/store.py
@@ -1,6 +1,7 @@
 from __future__ import annotations
 
 import base64
+import hashlib
 import os
 import shutil
 import time
@@ -13,6 +14,7 @@
 
 IMAGE_STORE_DIR_NAME = "image-cache"
 MAX_STORED_IMAGE_PATHS = 200
+KNOWN_IMAGE_SUFFIXES = (".png", ".jpeg", ".jpg", ".gif", ".webp")
 # Concurrent REPL sessions each schedule background cleanup. To avoid
 # wiping a sibling session's still-in-use cache, only delete dirs whose
 # mtime is older than this threshold. Storing an image refreshes the
@@ -57,6 +59,31 @@ def store(self, pc: PastedContent) -> str | None:
         self.cache_path(pc.id, str(path))
         return str(path)
 
+    def store_block(self, block: object) -> str | None:
+        """Save *block*'s base64 ``data`` under a hash-derived name; return the path, or None on failure."""
+        data = getattr(block, "data", "")
+        if not data:
+            return None
+        ensure_private_dir(_get_base_dir())
+        d = ensure_private_dir(self._session_dir())
+        ext = (getattr(block, "media_type", None) or "image/png").split("/")[-1]
+        path = d / f"block-{hashlib.sha256(str(data).encode()).hexdigest()[:32]}.{ext}"
+        if path.is_file():
+            return str(path)
+        try:
+            fd = os.open(str(path), os.O_WRONLY | os.O_CREAT | os.O_EXCL, 0o600)
+            try:
+                with os.fdopen(fd, "wb") as handle:
+                    handle.write(base64.b64decode(data))
+            except Exception:
+                path.unlink(missing_ok=True)  # a truncated file would satisfy the is_file() fast path
+                raise
+        except FileExistsError:
+            return str(path)
+        except Exception:
+            return None
+        return str(path)
+
     def cache_path(self, image_id: int, path: str) -> None:
         if image_id in self._paths:
             self._paths.move_to_end(image_id)
@@ -65,7 +92,39 @@ def cache_path(self, image_id: int, path: str) -> None:
             self._paths.popitem(last=False)
 
     def get_path(self, image_id: int) -> str | None:
-        return self._paths.get(image_id)
+        cached = self._paths.get(image_id)
+        if cached:
+            return cached
+        discovered = self._discover_cached_path(image_id)
+        if discovered:
+            self.cache_path(image_id, discovered)
+        return discovered
+
+    def _discover_cached_path(self, image_id: int) -> str | None:
+        """Find an on-disk file named ``<image_id>.<ext>`` in the session directory, if there is one."""
+        root = self._session_dir()
+        if not root.exists():
+            return None
+        # Known suffixes are probed first, in KNOWN_IMAGE_SUFFIXES order.
+        preferred = (root / f"{image_id}{suffix}" for suffix in KNOWN_IMAGE_SUFFIXES)
+        found = next((candidate for candidate in preferred if candidate.is_file()), None)
+        if found is None:
+            # Fallback: the first regular file, in sorted order, matching "<image_id>.*".
+            found = next((p for p in sorted(root.glob(f"{image_id}.*")) if p.is_file()), None)
+        return None if found is None else str(found)
+
+    def next_image_id(self) -> int:
+        """Return one more than the largest positive image id seen in memory or on disk (at least 1)."""
+        image_ids = [image_id for image_id in self._paths if image_id > 0]
+        session_dir = self._session_dir()
+        if session_dir.exists():
+            for stem in [path.stem for path in session_dir.iterdir() if path.is_file()]:
+                try:
+                    image_ids.append(int(stem))
+                except ValueError:
+                    continue  # not an id-named file, e.g. the "block-<digest>" files
+        # Include 0 so non-positive ids found on disk cannot push the result below 1.
+        return max([0, *image_ids]) + 1
 
     def clear(self) -> None:
         self._paths.clear()
diff --git a/src/iac_code/utils/path_locks.py b/src/iac_code/utils/path_locks.py
new file mode 100644
index 00000000..4abcca00
--- /dev/null
+++ b/src/iac_code/utils/path_locks.py
@@ -0,0 +1,35 @@
+from __future__ import annotations
+
+import threading
+import weakref
+from collections.abc import Iterator
+from contextlib import contextmanager
+from pathlib import Path
+
+
+class PathLockRegistry:
+    """Hand out one re-entrant lock per resolved path; the registry itself holds the locks weakly."""
+
+    def __init__(self) -> None:
+        self._guard = threading.Lock()
+        self._locks: weakref.WeakValueDictionary[Path, threading.RLock] = weakref.WeakValueDictionary()
+
+    @contextmanager
+    def lock_for(self, path: str | Path) -> Iterator[threading.RLock]:
+        # The local reference keeps the weakly-held lock alive while the caller is inside the block.
+        held = self._get_lock(Path(path))
+        with held:
+            yield held
+
+    def prune(self) -> None:
+        # Touching WeakValueDictionary materializes pending removals.
+        with self._guard:
+            list(self._locks.items())
+
+    def _get_lock(self, path: Path) -> threading.RLock:
+        key = path.resolve()
+        with self._guard:
+            lock = self._locks.get(key)
+            if lock is None:
+                self._locks[key] = lock = threading.RLock()
+            return lock
diff --git a/src/iac_code/utils/state_io.py b/src/iac_code/utils/state_io.py
new file mode 100644
index 00000000..bfcc271c
--- /dev/null
+++ b/src/iac_code/utils/state_io.py
@@ -0,0 +1,200 @@
+"""Durable state-file I/O helpers for recovery-critical files."""
+
+from __future__ import annotations
+
+import json
+import os
+import shutil
+import sys
+import tempfile
+import time
+from collections.abc import Callable, Iterable
+from contextlib import contextmanager, suppress
+from pathlib import Path
+from typing import Any, Iterator
+
+from iac_code.utils.path_locks import PathLockRegistry
+
+_PATH_LOCKS = PathLockRegistry()
+
+
+def _path_lock(path: Path):  # context manager from the module-wide PathLockRegistry
+    return _PATH_LOCKS.lock_for(path)
+
+
+def safe_replace(src: str | Path, dst: str | Path, *, attempts: int = 3, delay: float = 0.05) -> None:
+    if attempts < 1:  # at least one os.replace call has to be made
+        raise ValueError("attempts must be >= 1")
+    for attempt in range(attempts):
+        try:
+            os.replace(src, dst)
+            return
+        except PermissionError:  # retried; the sleep grows linearly with the attempt number
+            if attempt >= attempts - 1:  # retries exhausted: let the PermissionError propagate
+                raise
+            time.sleep(delay * (attempt + 1))
+        except OSError as exc:  # anything but a cross-device error is re-raised unchanged
+            if exc.errno != getattr(os, "EXDEV", 18):  # NOTE(review): os appears to lack EXDEV (errno has it)
+                raise
+            _copy_replace_across_devices(Path(src), Path(dst), attempts=attempts, delay=delay)
+            return
+
+
+def _copy_replace_across_devices(src: Path, dst: Path, *, attempts: int, delay: float) -> None:
+    """Emulate a rename across filesystems: stage a copy next to *dst*, swap it in, delete *src*.
+
+    The staged copy is removed again if any step raises an Exception.
+    """
+    dst.parent.mkdir(parents=True, exist_ok=True)
+    # Reserve a unique sibling name; shutil.copy2 then overwrites the empty placeholder.
+    with tempfile.NamedTemporaryFile(
+        prefix=f".{dst.name}.", suffix=".tmp", dir=dst.parent, delete=False
+    ) as placeholder:
+        staged = Path(placeholder.name)
+    try:
+        shutil.copy2(src, staged)
+        # Best-effort flush of the copied bytes; an OSError here is deliberately ignored.
+        with suppress(OSError), staged.open("rb") as copied:
+            os.fsync(copied.fileno())
+        safe_replace(staged, dst, attempts=attempts, delay=delay)
+        fsync_parent_dir(dst)
+        # The source is deleted last, only after the swap has succeeded.
+        src.unlink()
+    except Exception:
+        with suppress(OSError):
+            staged.unlink()
+        raise
+
+
+def fsync_parent_dir(path: Path) -> None:
+    """Best-effort fsync of the directory that contains *path*; does nothing on Windows."""
+    if sys.platform == "win32":
+        return
+    try:
+        dir_fd = os.open(str(path.parent), os.O_RDONLY)
+    except OSError:
+        return
+    try:
+        # An fsync failure is ignored; the descriptor is closed either way.
+        with suppress(OSError):
+            os.fsync(dir_fd)
+    finally:
+        os.close(dir_fd)
+
+
+def atomic_write_bytes(
+    path: str | Path,
+    content: bytes,
+    *,
+    durable: bool = True,
+    replace_attempts: int = 3,
+    _safe_replace: Callable[[str | Path, str | Path], None] | None = None,
+) -> None:
+    """Replace *path* with *content* via a sibling temp file; fsync file and directory when *durable*."""
+    target = Path(path)
+    target.parent.mkdir(parents=True, exist_ok=True)
+    fd, tmp_name = tempfile.mkstemp(prefix=f".{target.name}.", suffix=".tmp", dir=target.parent)
+    tmp_path = Path(tmp_name)
+    try:
+        with os.fdopen(fd, "wb") as handle:
+            handle.write(content)
+            handle.flush()
+            if durable:
+                os.fsync(handle.fileno())
+        if _safe_replace is None:
+            safe_replace(tmp_path, target, attempts=replace_attempts)
+        else:
+            _safe_replace(tmp_path, target)
+        if durable:
+            fsync_parent_dir(target)
+    except Exception:
+        # Cleanup is best effort: a failing unlink must not replace the error being reported.
+        with suppress(OSError):
+            tmp_path.unlink()
+        raise
+
+
+def atomic_write_text(
+    path: str | Path,
+    content: str,
+    *,
+    encoding: str = "utf-8",
+    durable: bool = True,
+    replace_attempts: int = 3,
+    _safe_replace: Callable[[str | Path, str | Path], None] | None = None,
+) -> None:
+    """Atomically replace *path* with *content* encoded using *encoding*.
+
+    The remaining keyword arguments are passed through unchanged to atomic_write_bytes.
+    """
+    # The text is encoded before atomic_write_bytes runs, i.e. before any file is created.
+    payload = content.encode(encoding)
+    atomic_write_bytes(path, payload, durable=durable, replace_attempts=replace_attempts, _safe_replace=_safe_replace)
+
+
+def atomic_write_json(path: str | Path, value: Any, *, durable: bool = True, replace_attempts: int = 3) -> None:
+    """Write *value* to *path* atomically as indented, key-sorted JSON ending in a newline.
+
+    Non-ASCII characters are written unescaped. Because allow_nan is False, json.dumps raises
+    ValueError for NaN and infinities.
+    """
+    serialized = json.dumps(value, ensure_ascii=False, indent=2, sort_keys=True, allow_nan=False)
+    # No encoding is passed, so atomic_write_text applies its own default.
+    atomic_write_text(path, serialized + "\n", durable=durable, replace_attempts=replace_attempts)
+
+
+@contextmanager
+def _cross_process_append_lock(path: Path) -> Iterator[None]:  # hold an OS-level lock while the body runs
+    lock_path = path.with_name(f".{path.name}.lock")  # sidecar lock file: ".<name>.lock" beside *path*
+    lock_path.parent.mkdir(parents=True, exist_ok=True)
+    with lock_path.open("a+b") as lock_file:  # append mode creates the file without truncating it
+        if sys.platform == "win32":
+            import msvcrt
+
+            try:
+                lock_file.seek(0)  # msvcrt.locking locks bytes starting at the current file position
+                msvcrt.locking(lock_file.fileno(), msvcrt.LK_LOCK, 1)
+            except OSError as exc:
+                raise RuntimeError(f"could not acquire append lock for {path}") from exc
+            try:
+                yield
+            finally:
+                lock_file.seek(0)  # unlock the same byte that was locked above
+                msvcrt.locking(lock_file.fileno(), msvcrt.LK_UNLCK, 1)
+        else:
+            import fcntl
+
+            try:
+                fcntl.flock(lock_file.fileno(), fcntl.LOCK_EX)  # exclusive lock; waits until it is granted
+            except OSError as exc:
+                raise RuntimeError(f"could not acquire append lock for {path}") from exc
+            try:
+                yield
+            finally:
+                fcntl.flock(lock_file.fileno(), fcntl.LOCK_UN)
+
+
+def append_jsonl_locked(
+    path: str | Path,
+    records: Iterable[dict[str, Any]],
+    *,
+    durable: bool = False,
+) -> None:
+    """Append *records* to *path* as compact JSON lines under the in-process and cross-process locks."""
+    target = Path(path)
+    target.parent.mkdir(parents=True, exist_ok=True)
+    payload = b"".join(  # encoded before any write so a bad record cannot leave a partial batch behind
+        (json.dumps(record, ensure_ascii=False, separators=(",", ":"), allow_nan=False) + "\n").encode("utf-8")
+        for record in records
+    )
+    if not payload:
+        return
+    with _path_lock(target), _cross_process_append_lock(target):
+        created = not target.exists()
+        with target.open("ab") as handle:
+            handle.write(payload)
+            handle.flush()
+            if durable:
+                os.fsync(handle.fileno())
+        if durable and created:
+            fsync_parent_dir(target)
diff --git a/tests/a2a/test_app.py b/tests/a2a/test_app.py
index 0451f3bc..df1bbef5 100644
--- a/tests/a2a/test_app.py
+++ b/tests/a2a/test_app.py
@@ -37,6 +37,7 @@
 from iac_code.a2a.pipeline_journal import A2APipelineJournal
 from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore, reduce_pipeline_events
 from iac_code.a2a.transports.dispatcher import create_runtime_components
+from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
 from iac_code.services.session_storage import SessionStorage
 from iac_code.types.stream_events import TextDeltaEvent, ToolResultEvent
 
@@ -486,6 +487,14 @@ def _pipeline_event(sequence: int, event_id: str) -> dict:
     }
 
 
+def _sse_json_events(body: str) -> list[dict]:
+    """Return the decoded JSON payload of every ``data: `` line in an SSE response body."""
+    prefix = "data: "
+    # Lines that do not start with the prefix are skipped.
+    data_lines = (line for line in body.splitlines() if line.startswith(prefix))
+    return [json.loads(line[len(prefix) :]) for line in data_lines]
+
+
 def _pipeline_pending_ask_event() -> dict:
     event = _pipeline_event(1, "evt-ask")
     event["eventType"] = "input_required"
@@ -789,6 +798,188 @@ def test_streaming_v03_method_with_v10_header_returns_sse(monkeypatch, tmp_path)
     assert loop.prompts == ["hello mixed"]
 
 
+def test_streaming_v03_active_sidecar_mismatch_preserves_recoverable_error_data(
+    monkeypatch,
+    tmp_path: Path,
+) -> None:  # a request for a non-owner task must get an error that names the recoverable task
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    persistence_dir = tmp_path / "a2a"
+    session_id = "session-ctx-1"
+    persistence = A2APersistenceStore(persistence_dir)
+    persistence.save_context(A2AContextSnapshot(context_id="ctx-1", session_id=session_id, cwd=str(tmp_path)))
+    persistence.save_task(A2ATaskSnapshot(task_id="task-owner", context_id="ctx-1", state="working"))
+    persistence.save_task(A2ATaskSnapshot(task_id="task-new", context_id="ctx-1", state="input-required"))
+
+    pipeline_dir = SessionStorage().session_dir(str(tmp_path), session_id) / "a2a" / "pipeline"
+    owner_event = _pipeline_event(1, "evt-owner")
+    owner_event["taskId"] = "task-owner"  # journal and snapshot are written on behalf of task-owner
+    A2APipelineJournal(pipeline_dir).append(owner_event)
+    A2APipelineSnapshotStore(pipeline_dir).save(reduce_pipeline_events([owner_event]))
+
+    class RunningPipeline:
+        pipeline_name = "selling"
+        sidecar_status = "running"  # the fake reports a sidecar that is still running
+        handoff_enabled = False
+
+        def __init__(self) -> None:
+            self.session = SimpleNamespace(
+                session_dir=SessionStorage().session_dir(str(tmp_path), session_id) / "pipeline"
+            )
+
+        async def run(self, prompt: str):  # pragma: no cover - regression asserts this is not reached
+            yield TextDeltaEvent(text=f"unexpected {prompt}")
+
+        def clear_sidecar(self) -> None:  # pragma: no cover - regression asserts this is not reached
+            raise AssertionError("active sidecar should not be cleared")
+
+    fake_runtime = SimpleNamespace(provider_manager=object(), tool_registry=object())
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_agent_runtime", lambda options: fake_runtime)
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_pipeline", lambda *args, **kwargs: RunningPipeline())
+
+    app = create_app(
+        host="127.0.0.1",
+        port=41242,
+        token=None,
+        model="qwen3.6-plus",
+        persistence_dir=persistence_dir,
+    )
+
+    with TestClient(app) as client:
+        with client.stream(
+            "POST",
+            "/",
+            headers={"A2A-Version": "1.0"},
+            json={
+                "jsonrpc": "2.0",
+                "id": "1",
+                "method": "message/stream",
+                "params": {
+                    "message": {
+                        "messageId": "msg-new",
+                        "taskId": "task-new",  # not the task that owns the journaled pipeline event
+                        "contextId": "ctx-1",
+                        "role": "user",
+                        "parts": [{"kind": "text", "text": "new request"}],
+                        "metadata": {"iac_code": {"cwd": str(tmp_path)}},
+                    },
+                    "configuration": {"acceptedOutputModes": ["text/plain"]},
+                },
+            },
+        ) as response:
+            body = response.read().decode()
+
+    events = _sse_json_events(body)
+    assert response.status_code == 200
+    assert events
+    error = events[-1]["error"]  # the JSON-RPC error is expected in the last SSE event
+    assert error["code"] == -32602
+    assert error["data"] == {
+        "recoverableTaskId": "task-owner",
+        "contextId": "ctx-1",
+        "sidecarStatus": "running",
+    }
+
+
+def test_pipeline_streaming_starts_with_task_before_status_update(monkeypatch, tmp_path: Path) -> None:
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+
+    class StreamingPipeline:  # fake pipeline: records prompts, yields one pipeline event and one text delta
+        pipeline_name = "selling"
+        sidecar_status = None
+
+        def __init__(self) -> None:
+            self.prompts: list[str] = []
+            self.session = SimpleNamespace(session_dir=tmp_path / "pipeline-sidecar")
+            self.handoff_enabled = False
+
+        async def run(self, prompt: str):
+            self.prompts.append(prompt)
+            yield PipelineEvent(  # a pipeline event is emitted before any text output
+                type=PipelineEventType.PIPELINE_STARTED,
+                step_id=None,
+                timestamp=1717821600.0,
+                data={"total_steps": 1, "step_names": ["intent_parsing"]},
+            )
+            yield TextDeltaEvent(text="pipeline streaming output")
+
+        def should_switch_to_normal(self, data: dict) -> bool:  # noqa: ARG002
+            return False
+
+    fake_pipeline = StreamingPipeline()
+    fake_runtime = SimpleNamespace(provider_manager=object(), tool_registry=object())
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_agent_runtime", lambda options: fake_runtime)
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_pipeline", lambda *args, **kwargs: fake_pipeline)
+
+    app = create_app(host="127.0.0.1", port=41242, token=None, model="qwen3.6-plus")
+
+    with TestClient(app) as client:
+        with client.stream(
+            "POST",
+            "/",
+            headers={"A2A-Version": "1.0"},
+            json={
+                "jsonrpc": "2.0",
+                "id": "1",
+                "method": "SendStreamingMessage",
+                "params": {
+                    "message": {
+                        "messageId": "msg-1",
+                        "role": "ROLE_USER",
+                        "parts": [{"text": "选择一个已有vpc，创建一个vswitch"}],
+                        "metadata": {"iac_code": {"cwd": str(tmp_path)}},
+                    },
+                    "configuration": {"acceptedOutputModes": ["text/plain"]},
+                },
+            },
+        ) as response:
+            body = response.read().decode()
+
+    assert response.status_code == 200
+    assert "Agent should enqueue Task before TaskStatusUpdateEvent event" not in body  # ordering error absent
+    assert "pipeline streaming output" in body
+    assert fake_pipeline.prompts == ["选择一个已有vpc，创建一个vswitch"]  # prompt reached the pipeline unchanged
+
+
+def test_pipeline_streaming_workspace_error_returns_request_error(monkeypatch, tmp_path: Path) -> None:
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    allowed = tmp_path / "allowed"
+    outside = tmp_path / "outside"
+    allowed.mkdir()
+    outside.mkdir()
+    monkeypatch.setenv("IACCODE_A2A_ALLOWED_CWDS", str(allowed))  # presumably the cwd allow-list; confirm
+
+    app = create_app(host="127.0.0.1", port=41242, token=None, model="qwen3.6-plus")
+
+    with TestClient(app) as client:
+        with client.stream(
+            "POST",
+            "/",
+            headers={"A2A-Version": "1.0"},
+            json={
+                "jsonrpc": "2.0",
+                "id": "1",
+                "method": "SendStreamingMessage",
+                "params": {
+                    "message": {
+                        "messageId": "msg-1",
+                        "role": "ROLE_USER",
+                        "parts": [{"text": "选择一个已有vpc，创建一个vswitch"}],
+                        "metadata": {"iac_code": {"cwd": str(outside)}},  # the directory not listed above
+                    },
+                    "configuration": {"acceptedOutputModes": ["text/plain"]},
+                },
+            },
+        ) as response:
+            body = response.read().decode()
+
+    assert response.status_code == 200
+    assert "Agent should enqueue Task before TaskStatusUpdateEvent event" not in body
+    data = response.json()  # the whole body is parsed as one JSON document here
+    assert data["error"]["code"] == -32602
+    assert data["error"]["message"] == "Invalid A2A workspace metadata."
+    assert data["error"]["data"][0]["reason"] == "INVALID_PARAMS"
+
+
 def test_follow_up_message_through_sdk_route_updates_existing_task(monkeypatch, tmp_path) -> None:
     class EchoAgentLoop:
         def __init__(self) -> None:
@@ -1686,7 +1877,12 @@ async def test_cancel_input_required_pipeline_task_after_restart_marks_canceled(
         assert persistence.load_task("task-1").state == "canceled"
         snapshot = A2APipelineSnapshotStore(pipeline_dir).load()
         assert snapshot["status"] == "canceled"
-        assert A2APipelineJournal(pipeline_dir).read_all_repairing_tail()[-1]["eventType"] == "pipeline_canceled"
+        assert snapshot["normalHandoff"]["action"] == "switch_to_normal"
+        assert snapshot["normalHandoff"]["targetMode"] == "normal"
+        assert snapshot["normalHandoff"]["outcome"] == "canceled"
+        assert "Outcome: canceled" in snapshot["normalHandoff"]["summary"]
+        events = A2APipelineJournal(pipeline_dir).read_all_repairing_tail()
+        assert [event["eventType"] for event in events[-2:]] == ["pipeline_canceled", "pipeline_handoff_ready"]
     finally:
         await components.aclose()
 
diff --git a/tests/a2a/test_executor.py b/tests/a2a/test_executor.py
index 2193c6c8..4ca31db0 100644
--- a/tests/a2a/test_executor.py
+++ b/tests/a2a/test_executor.py
@@ -4,6 +4,7 @@
 
 import pytest
 from a2a.types import TaskStatusUpdateEvent
+from a2a.utils.errors import InvalidParamsError
 from google.protobuf.json_format import MessageToDict
 
 from iac_code.a2a.executor import IacCodeA2AExecutor
@@ -13,6 +14,8 @@
 from iac_code.a2a.pipeline_journal import A2APipelineJournal
 from iac_code.a2a.pipeline_paths import a2a_pipeline_dir_for_session
 from iac_code.a2a.task_store import A2ATaskStore
+from iac_code.agent.message import ImageBlock
+from iac_code.pipeline.engine.user_input import PipelineUserInput
 from iac_code.types.stream_events import PermissionRequestEvent, TextDeltaEvent, ToolResultEvent
 
 from .fakes import FakeAgentLoop, FakeEventQueue, FakeRequestContext, FakeRuntime, pending_future
@@ -22,6 +25,14 @@ def dump(event):
     return MessageToDict(event, preserving_proto_field_name=False)
 
 
+def _image_only_pipeline_input() -> PipelineUserInput:  # shared fixture: one PNG image block, no text
+    return PipelineUserInput(
+        content=[ImageBlock(media_type="image/png", data="aGVsbG8=")],  # base64 of b"hello"
+        display_text="[Image input]",
+        has_images=True,
+    )
+
+
 @pytest.fixture(autouse=True)
 def default_normal_mode(monkeypatch: pytest.MonkeyPatch) -> None:
     monkeypatch.delenv("IAC_CODE_MODE", raising=False)
@@ -388,8 +399,18 @@ class SpyPipelineExecutor:
         def __init__(self, **kwargs):
             calls.append(("init", kwargs))
 
-        async def execute(self, *, context, event_queue, task, task_id, context_id, cwd, prompt):
-            calls.append(("execute", {"task_id": task_id, "context_id": context_id, "cwd": cwd, "prompt": prompt}))
+        async def execute(self, *, context, event_queue, task, task_id, context_id, cwd, pipeline_input):
+            calls.append(
+                (
+                    "execute",
+                    {
+                        "task_id": task_id,
+                        "context_id": context_id,
+                        "cwd": cwd,
+                        "pipeline_input": pipeline_input,
+                    },
+                )
+            )
 
     monkeypatch.setattr("iac_code.a2a.executor.IacCodeA2APipelineExecutor", SpyPipelineExecutor)
 
@@ -400,7 +421,12 @@ async def execute(self, *, context, event_queue, task, task_id, context_id, cwd,
 
     assert calls[-1] == (
         "execute",
-        {"task_id": "task-1", "context_id": "ctx-1", "cwd": str(tmp_path), "prompt": "hello"},
+        {
+            "task_id": "task-1",
+            "context_id": "ctx-1",
+            "cwd": str(tmp_path),
+            "pipeline_input": PipelineUserInput(content="hello", display_text="hello", has_images=False),
+        },
     )
 
 
@@ -435,8 +461,18 @@ class SpyPipelineExecutor:
         def __init__(self, **kwargs):
             calls.append(("init", kwargs))
 
-        async def execute(self, *, context, event_queue, task, task_id, context_id, cwd, prompt):
-            calls.append(("execute", {"task_id": task_id, "context_id": context_id, "cwd": cwd, "prompt": prompt}))
+        async def execute(self, *, context, event_queue, task, task_id, context_id, cwd, pipeline_input):
+            calls.append(
+                (
+                    "execute",
+                    {
+                        "task_id": task_id,
+                        "context_id": context_id,
+                        "cwd": cwd,
+                        "pipeline_input": pipeline_input,
+                    },
+                )
+            )
 
     monkeypatch.setattr("iac_code.a2a.executor.IacCodeA2APipelineExecutor", SpyPipelineExecutor)
 
@@ -455,10 +491,103 @@ async def execute(self, *, context, event_queue, task, task_id, context_id, cwd,
 
     assert calls[-1] == (
         "execute",
-        {"task_id": "task-1", "context_id": "ctx-1", "cwd": str(tmp_path), "prompt": "继续"},
+        {
+            "task_id": "task-1",
+            "context_id": "ctx-1",
+            "cwd": str(tmp_path),
+            "pipeline_input": PipelineUserInput(content="继续", display_text="继续", has_images=False),
+        },
     )
 
 
+@pytest.mark.asyncio
+async def test_pipeline_mode_accepts_image_only_input(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> None:
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    pipeline_input = _image_only_pipeline_input()
+    calls = []
+
+    class CapturingPipelineExecutor:  # stand-in that only records the kwargs passed to execute()
+        def __init__(self, **kwargs):
+            pass
+
+        async def execute(self, **kwargs):
+            calls.append(kwargs)
+
+    monkeypatch.setattr("iac_code.a2a.executor.IacCodeA2APipelineExecutor", CapturingPipelineExecutor)
+    monkeypatch.setattr(  # bypass request parsing and inject the image-only input directly
+        IacCodeA2AExecutor,
+        "_pipeline_input_from_context",
+        lambda self, context, *, cwd: pipeline_input,
+    )
+    monkeypatch.setattr("iac_code.a2a.executor.is_model_multimodal", lambda *args, **kwargs: True)
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics())
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+    queue = FakeEventQueue()
+
+    await executor.execute(FakeRequestContext(metadata={"iac_code": {"cwd": str(tmp_path)}}), queue)
+
+    assert calls
+    assert calls[0]["pipeline_input"] == pipeline_input  # the input was handed over unchanged
+    states = [dump(event)["status"]["state"] for event in queue.events if isinstance(event, TaskStatusUpdateEvent)]
+    assert "TASK_STATE_FAILED" not in states  # no failure status was emitted
+
+
+@pytest.mark.asyncio
+async def test_pipeline_mode_image_input_checks_provider_context(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Path
+) -> None:
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    monkeypatch.setattr(  # every request is turned into the image-only input
+        IacCodeA2AExecutor,
+        "_pipeline_input_from_context",
+        lambda self, context, *, cwd: _image_only_pipeline_input(),
+    )
+    seen = {}
+
+    def fake_is_model_multimodal(model, *, provider_key=None, base_url=None, api_key=None):
+        seen.update(  # capture the arguments for the assertion at the end of the test
+            {
+                "model": model,
+                "provider_key": provider_key,
+                "base_url": base_url,
+                "api_key": api_key,
+            }
+        )
+        return False  # report the model as not multimodal
+
+    monkeypatch.setattr("iac_code.a2a.executor.get_active_provider_key", lambda: "openai_compatible")
+    monkeypatch.setattr(
+        "iac_code.a2a.executor.get_provider_config",
+        lambda provider_key: {"keyName": provider_key, "apiBase": "https://example.test/v1"},
+    )
+    monkeypatch.setattr(
+        "iac_code.a2a.executor.load_credentials",
+        lambda model=None: {"openai_compatible": "test-key"},
+    )
+    monkeypatch.setattr("iac_code.a2a.executor.is_model_multimodal", fake_is_model_multimodal)
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics())
+    executor = IacCodeA2AExecutor(task_store=store, model="custom-vl")
+
+    queue = FakeEventQueue()
+    with pytest.raises(InvalidParamsError, match="Current model custom-vl does not support image input"):
+        await executor.execute(
+            FakeRequestContext(metadata={"iac_code": {"cwd": str(tmp_path)}}),
+            queue,
+        )
+
+    assert seen == {  # values come from the patched provider key, provider config and credentials
+        "model": "custom-vl",
+        "provider_key": "openai_compatible",
+        "base_url": "https://example.test/v1",
+        "api_key": "test-key",
+    }
+    assert not [event for event in queue.events if isinstance(event, TaskStatusUpdateEvent)]
+    with pytest.raises(ValueError, match="A2A task not found"):  # the rejected request left no task record
+        await store.get_task_record("task-1")
+
+
 @pytest.mark.asyncio
 async def test_executor_empty_prompt_takes_precedence_over_pipeline_mode(
     monkeypatch: pytest.MonkeyPatch, tmp_path: Path
@@ -475,11 +604,11 @@ def fail_if_called(options):  # noqa: ARG001
     queue = FakeEventQueue()
     context = FakeRequestContext(text="   ", metadata={"iac_code": {"cwd": str(tmp_path)}})
 
-    await executor.execute(context, queue)
-
-    dumped = dump(queue.events[-1])
-    assert dumped["status"]["state"] == "TASK_STATE_FAILED"
-    assert dumped["status"]["message"]["parts"][0]["text"] == "A2A server currently accepts text input only."
+    with pytest.raises(InvalidParamsError, match="A2A server received empty input"):
+        await executor.execute(context, queue)
+    assert not [event for event in queue.events if isinstance(event, TaskStatusUpdateEvent)]
+    with pytest.raises(ValueError, match="A2A task not found"):
+        await store.get_task_record("task-1")
 
 
 @pytest.mark.asyncio
@@ -846,6 +975,80 @@ async def execute(self, **kwargs) -> None:
     assert any(getattr(message, "content", "") == "[Pipeline Handoff Context]" for message in seen_resume[0])
 
 
+@pytest.mark.asyncio  # image-only follow-up after a recorded normal handoff
+async def test_pipeline_handoff_image_request_uses_normal_manifest_prompt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    from a2a.types import Message, Part, Role
+
+    from iac_code.a2a.pipeline_paths import a2a_pipeline_dir_for_session
+    from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
+    from iac_code.agent.message import Message as AgentMessage
+    from iac_code.services.session_storage import SessionStorage
+
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")  # pipeline mode is selected via env
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))
+
+    cwd = tmp_path / "ws"
+    cwd.mkdir()
+    session_id = "session-handoff"
+    context_id = "ctx-handoff"
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    A2APipelineSnapshotStore(a2a_pipeline_dir_for_session(cwd=str(cwd), session_id=session_id)).save(
+        {"normalHandoff": {"action": "switch_to_normal", "targetMode": "normal", "summary": "handoff"}}
+    )  # the saved snapshot already records a switch_to_normal handoff
+    SessionStorage().append(str(cwd), session_id, AgentMessage(role="user", content="handoff"))
+
+    def fail_pipeline_input(*args, **kwargs):  # guard: any call fails the test
+        raise AssertionError("normal handoff must not build PipelineUserInput")
+
+    monkeypatch.setattr(IacCodeA2AExecutor, "_pipeline_input_from_context", fail_pipeline_input)
+    loop = FakeAgentLoop([TextDeltaEvent(text="normal-ok")])
+    monkeypatch.setattr(
+        "iac_code.a2a.executor.create_agent_runtime",
+        lambda options: FakeRuntime(agent_loop=loop, session_id=options.session_id),
+    )
+
+    class FailingPipelineExecutor:  # stand-in whose execute() always fails the test
+        def __init__(self, **kwargs) -> None:
+            pass
+
+        async def execute(self, **kwargs) -> None:
+            raise AssertionError("pipeline executor should not be used after normal handoff")
+
+    monkeypatch.setattr("iac_code.a2a.executor.IacCodeA2APipelineExecutor", FailingPipelineExecutor)
+
+    context = FakeRequestContext(
+        task_id="task-followup",
+        context_id=context_id,
+        text="",
+        metadata={"iac_code": {"cwd": str(cwd)}},
+    )
+    context.message = Message(  # overwrite the message with a single PNG part, no text
+        role=Role.ROLE_USER,
+        parts=[Part(raw=b"\x89PNG\r\n\x1a\nimage", media_type="image/png", filename="diagram.png")],
+        message_id="msg-1",
+    )
+
+    executor = IacCodeA2AExecutor(
+        task_store=A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence),
+        model="qwen3.6-plus",
+    )
+    await executor.execute(
+        context,
+        FakeEventQueue(),
+    )
+
+    assert loop.prompts  # the fake agent loop received at least one prompt
+    assert "A2A multimodal attachment:" in loop.prompts[0]  # attachment is described in text
+    assert "mediaType=image/png" in loop.prompts[0]
+    assert "[Image input]" not in loop.prompts[0]  # this marker must not appear in the prompt
+
+
 @pytest.mark.asyncio
 async def test_pipeline_handoff_context_is_backfilled_from_snapshot_when_session_missing(
     monkeypatch: pytest.MonkeyPatch,
@@ -914,6 +1117,112 @@ async def execute(self, **kwargs) -> None:
     assert any(getattr(message, "content", "") == summary for message in loaded)
 
 
+@pytest.mark.asyncio  # snapshot file is unreadable; the journal holds the handoff event
+async def test_pipeline_handoff_context_routes_and_backfills_public_summary_from_journal_when_snapshot_corrupt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    from iac_code.a2a.pipeline_paths import a2a_pipeline_dir_for_session
+    from iac_code.pipeline.engine.cleanup import CleanupLedger, CleanupResource
+    from iac_code.services.session_storage import SessionStorage
+
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")  # pipeline mode is selected via env
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))
+
+    cwd = tmp_path / "ws"
+    cwd.mkdir()
+    session_id = "session-handoff"
+    context_id = "ctx-handoff"
+    summary = "[Pipeline Handoff Context]\nPipeline: selling"
+    cleanup_prompt = "cleanup prompt for stack-123"
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    pipeline_dir = a2a_pipeline_dir_for_session(cwd=str(cwd), session_id=session_id)
+    pipeline_dir.mkdir(parents=True, exist_ok=True)
+    (pipeline_dir / "a2a-snapshot.json").write_text("{broken", encoding="utf-8")  # invalid JSON on purpose
+    A2APipelineJournal(pipeline_dir).append(
+        {
+            "schemaVersion": "1.0",
+            "eventId": "evt-handoff",
+            "sequence": 1,
+            "createdAt": "2026-01-01T00:00:00Z",
+            "eventType": "pipeline_handoff_ready",
+            "scope": "pipeline",
+            "pipelineRunId": context_id,
+            "taskId": "task-pipeline",
+            "contextId": context_id,
+            "pipelineName": "selling",
+            "status": "completed",
+            "data": {
+                "action": "switch_to_normal",
+                "targetMode": "normal",
+                "summary": summary,
+                "cleanup": {  # journal event also carries a cleanup prompt
+                    "status": "pending",
+                    "resourceCount": 1,
+                    "prompt": cleanup_prompt,
+                    "resources": [{"resourceId": "stack-123", "regionId": "cn-hangzhou"}],
+                },
+            },
+        }
+    )
+    ledger = CleanupLedger(SessionStorage().session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                cleanup_status="completed",  # ledger entry is created already completed
+                progress_status="DELETE_COMPLETE",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+
+    loop = FakeAgentLoop([TextDeltaEvent(text="normal-ok")])
+    seen_resume: list[object | None] = []  # resume_messages captured per runtime creation
+
+    def fake_factory(options):
+        seen_resume.append(options.resume_messages)
+        return FakeRuntime(agent_loop=loop, session_id=options.session_id)
+
+    class FailingPipelineExecutor:  # stand-in whose execute() always fails the test
+        def __init__(self, **kwargs) -> None:
+            pass
+
+        async def execute(self, **kwargs) -> None:
+            raise AssertionError("pipeline executor should not be used after normal handoff")
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", fake_factory)
+    monkeypatch.setattr("iac_code.a2a.executor.IacCodeA2APipelineExecutor", FailingPipelineExecutor)
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+    await executor.execute(
+        FakeRequestContext(
+            task_id="task-followup",
+            context_id=context_id,
+            text="继续解释一下",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    assert loop.prompts == ["继续解释一下"]  # user text reaches the agent loop unchanged
+    assert seen_resume and seen_resume[0] is not None
+    assert any(getattr(message, "content", "") == summary for message in seen_resume[0])
+    assert not any(getattr(message, "content", "") == cleanup_prompt for message in seen_resume[0])
+    loaded = SessionStorage().load(str(cwd), session_id)  # same checks on the stored session
+    assert loaded is not None
+    assert any(getattr(message, "content", "") == summary for message in loaded)
+    assert not any(getattr(message, "content", "") == cleanup_prompt for message in loaded)
+
+
 @pytest.mark.asyncio
 async def test_auth_error_is_sanitized(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> None:
     def raise_auth_error(options):
diff --git a/tests/a2a/test_executor_cleanup.py b/tests/a2a/test_executor_cleanup.py
new file mode 100644
index 00000000..f2873600
--- /dev/null
+++ b/tests/a2a/test_executor_cleanup.py
@@ -0,0 +1,1204 @@
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+from unittest.mock import MagicMock
+
+import pytest
+from a2a.types import TaskStatusUpdateEvent
+from google.protobuf.json_format import MessageToDict
+
+from iac_code.a2a.executor import (
+    IacCodeA2AExecutor,
+    _a2a_deferred_cleanup_prompts_path,
+    _append_a2a_deferred_cleanup_prompt,
+    _cleanup_ledger_for_a2a_normal_chat,
+    _cleanup_payload_from_private_ledger_or_unavailable,
+    _cleanup_publisher_for_a2a_normal_chat,
+    _cleanup_resource_states,
+    _load_a2a_deferred_cleanup_prompts,
+    _observe_cleanup_stream,
+    _prune_completed_cleanup_prompt_from_runtime,
+    _publish_cleanup_resource_changes,
+)
+from iac_code.a2a.metrics import NoOpA2AMetrics
+from iac_code.a2a.persistence import A2AContextSnapshot, A2APersistenceStore
+from iac_code.a2a.pipeline_journal import A2APipelineJournal
+from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
+from iac_code.a2a.task_store import A2ATaskStore
+from iac_code.agent.message import Message
+from iac_code.pipeline.engine.cleanup import (
+    CLEANUP_PROMPT_METADATA_TYPE,
+    CleanupLedger,
+    CleanupResource,
+    ObservedResource,
+    create_cleanup_prompt_message,
+)
+from iac_code.services.session_storage import SessionStorage
+from iac_code.types.stream_events import TextDeltaEvent, ToolResultEvent, ToolUseEndEvent
+
+from .fakes import FakeAgentLoop, FakeEventQueue, FakeRequestContext, FakeRuntime
+
+
+def _dump(event):  # convert a protobuf event into a plain dict for assertions
+    return MessageToDict(event, preserving_proto_field_name=False)  # keys use JSON (lowerCamelCase) names
+
+
+class _TaskStore:  # minimal task-store stand-in exposing only get_context_record
+    def __init__(self, *, cwd: str, session_id: str) -> None:
+        self._record = SimpleNamespace(cwd=cwd, session_id=session_id)  # the single canned record
+
+    async def get_context_record(self, context_id: str) -> SimpleNamespace:
+        return self._record  # context_id is ignored; every lookup gets the same record
+
+
+def test_a2a_handoff_does_not_reconstruct_cleanup_prompt_from_public_snapshot(tmp_path: Path) -> None:
+    import inspect  # used below to inspect the helper's parameter names
+
+    assert "public_snapshot" not in inspect.signature(_cleanup_payload_from_private_ledger_or_unavailable).parameters
+
+    cleanup = _cleanup_payload_from_private_ledger_or_unavailable(
+        ledger_path=tmp_path / "missing-cleanup.yaml",  # this file is never created
+    )
+
+    assert cleanup["status"] == "unavailable"
+    assert "statusMessage" in cleanup
+    assert "prompt" not in cleanup  # payload must carry no prompt text
+    assert "resources" not in cleanup  # and no resource list
+
+
+def test_normal_chat_cleanup_ledger_ignores_observed_only_ledger(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # ledger has an observed resource but nothing marked for cleanup
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-observed-only"
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.record_observed(  # only record_observed is called; mark_cleanup_required never is
+        ObservedResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-success",
+            region_id="cn-hangzhou",
+            observed_action="CreateStack",
+            source_step_id="deploying",
+        )
+    )
+
+    class StorageFactory:  # callable replacement for the SessionStorage name
+        repair_interrupted = staticmethod(SessionStorage.repair_interrupted)  # forwarded from the real class
+
+        def __call__(self):
+            return storage  # every SessionStorage() call yields the tmp-backed instance
+
+    monkeypatch.setattr("iac_code.a2a.executor.SessionStorage", StorageFactory())
+
+    assert _cleanup_ledger_for_a2a_normal_chat(cwd=str(cwd), session_id=session_id) is None
+
+
+def test_normal_chat_cleanup_ledger_recovers_pending_cleanup_without_prompt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # ledger has a cleanup-required resource; no prompt message is stored
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup-required"
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-leftover",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+
+    class StorageFactory:  # callable replacement for the SessionStorage name
+        repair_interrupted = staticmethod(SessionStorage.repair_interrupted)  # forwarded from the real class
+
+        def __call__(self):
+            return storage  # every SessionStorage() call yields the tmp-backed instance
+
+    monkeypatch.setattr("iac_code.a2a.executor.SessionStorage", StorageFactory())
+
+    recovered = _cleanup_ledger_for_a2a_normal_chat(cwd=str(cwd), session_id=session_id)
+
+    assert recovered is not None
+    assert recovered.path == ledger.path  # the recovered ledger points at the same file
+
+
+def test_normal_chat_cleanup_ledger_recovers_completed_cleanup_for_legacy_prompt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # completed ledger plus a stored prompt created without a ledger path
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup-completed"
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-deleted",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    ledger.update_resource(  # then flip the same resource to completed
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-deleted",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+    storage.append(str(cwd), session_id, create_cleanup_prompt_message("legacy cleanup prompt without ledger path"))
+
+    class StorageFactory:  # callable replacement for the SessionStorage name
+        repair_interrupted = staticmethod(SessionStorage.repair_interrupted)  # forwarded from the real class
+
+        def __call__(self):
+            return storage  # every SessionStorage() call yields the tmp-backed instance
+
+    monkeypatch.setattr("iac_code.a2a.executor.SessionStorage", StorageFactory())
+
+    recovered = _cleanup_ledger_for_a2a_normal_chat(cwd=str(cwd), session_id=session_id)
+
+    assert recovered is not None
+    assert recovered.path == ledger.path  # the recovered ledger points at the same file
+
+
+@pytest.mark.asyncio  # backfill stores the handoff summary only, never the cleanup prompt
+async def test_pipeline_handoff_context_backfills_summary_without_cleanup_prompt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    pipeline_dir = tmp_path / "pipeline"
+    ledger_path = tmp_path / "cleanup.yaml"  # referenced by the snapshot; never written here
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    prompt = "cleanup prompt for stack-123"
+
+    A2APipelineSnapshotStore(pipeline_dir).save(
+        {
+            "normalHandoff": {
+                "action": "switch_to_normal",
+                "targetMode": "normal",
+                "summary": "[Pipeline Handoff Context]\nPipeline: selling",
+                "data": {
+                    "cleanup": {  # snapshot embeds a prompt that must not reach the session
+                        "status": "pending",
+                        "resourceCount": 1,
+                        "statusMessage": "检测到 1 个回滚残留资源，开始清理流程。",
+                        "prompt": prompt,
+                        "ledgerPath": str(ledger_path),
+                    }
+                },
+            }
+        }
+    )
+
+    class StorageFactory:  # callable replacement for the SessionStorage name
+        repair_interrupted = staticmethod(SessionStorage.repair_interrupted)  # forwarded from the real class
+
+        def __call__(self):
+            return storage  # every SessionStorage() call yields the tmp-backed instance
+
+    monkeypatch.setattr("iac_code.a2a.executor.SessionStorage", StorageFactory())
+    monkeypatch.setattr("iac_code.a2a.executor.existing_a2a_pipeline_dir_for_session", lambda **kwargs: pipeline_dir)
+
+    executor = IacCodeA2AExecutor.__new__(IacCodeA2AExecutor)  # bypass __init__
+    executor._task_store = _TaskStore(cwd=str(cwd), session_id=session_id)
+
+    await executor._ensure_pipeline_handoff_context_in_session(context_id=context_id, cwd=str(cwd))
+    await executor._ensure_pipeline_handoff_context_in_session(context_id=context_id, cwd=str(cwd))
+
+    messages = storage.load(str(cwd), session_id)
+    assert [message.content for message in messages] == [  # two calls, exactly one stored message
+        "[Pipeline Handoff Context]\nPipeline: selling",
+    ]
+    assert not any(message.content == prompt for message in messages)
+    assert not any(message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE for message in messages)
+
+
+@pytest.mark.asyncio  # a normal-chat turn performing stack deletion updates ledger and snapshot
+async def test_normal_a2a_turn_updates_pipeline_cleanup_ledger(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    pipeline_task_id = "task-pipeline"  # task id stored in the pipeline snapshot
+    normal_task_id = "task-normal-cleanup"  # task id of the follow-up request under test
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    pipeline_dir = storage.session_dir(str(cwd), session_id) / "a2a" / "pipeline"
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None  # precondition: the ledger yields a pending prompt
+    storage.append(
+        str(cwd),
+        session_id,
+        create_cleanup_prompt_message(
+            cleanup_prompt.prompt,
+            cleanup_ledger_path=ledger.path,
+            cleanup_status="pending",
+        ),
+    )
+    A2APipelineSnapshotStore(pipeline_dir).save(
+        {
+            "pipelineRunId": context_id,
+            "taskId": pipeline_task_id,
+            "contextId": context_id,
+            "pipelineName": "selling",
+            "cleanup": {  # snapshot starts with cleanup still pending
+                "status": "pending",
+                "resourceCount": 1,
+                "resources": [{"resourceId": "stack-123", "regionId": "cn-hangzhou"}],
+                "history": [],
+            },
+        }
+    )
+    loop = FakeAgentLoop(
+        [
+            ToolUseEndEvent(  # scripted DeleteStack call for stack-123
+                tool_use_id="tool-delete",
+                name="aliyun_api",
+                input={
+                    "product": "ROS",
+                    "action": "DeleteStack",
+                    "params": {"StackId": "stack-123", "RegionId": "cn-hangzhou"},
+                },
+            ),
+            ToolResultEvent(
+                tool_use_id="tool-delete",
+                tool_name="aliyun_api",
+                result={"StackId": "stack-123"},
+                is_error=False,
+            ),
+            ToolUseEndEvent(  # scripted GetStack call for the same stack
+                tool_use_id="tool-get",
+                name="aliyun_api",
+                input={
+                    "product": "ROS",
+                    "action": "GetStack",
+                    "params": {"StackId": "stack-123", "RegionId": "cn-hangzhou"},
+                },
+            ),
+            ToolResultEvent(  # its result reports DELETE_COMPLETE
+                tool_use_id="tool-get",
+                tool_name="aliyun_api",
+                result={"Stack": {"StackId": "stack-123", "StackStatus": "DELETE_COMPLETE"}},
+                is_error=False,
+            ),
+            TextDeltaEvent(text="cleanup done"),
+        ]
+    )
+
+    async def continue_streaming():  # replays the same scripted events
+        for event in loop.events:
+            yield event
+
+    loop.continue_streaming = continue_streaming
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+
+    class StorageFactory:  # callable replacement for the SessionStorage name
+        repair_interrupted = staticmethod(SessionStorage.repair_interrupted)  # forwarded from the real class
+
+        def __call__(self):
+            return storage  # every SessionStorage() call yields the tmp-backed instance
+
+    monkeypatch.setattr("iac_code.a2a.executor.SessionStorage", StorageFactory())
+    monkeypatch.setattr("iac_code.a2a.executor.existing_a2a_pipeline_dir_for_session", lambda **kwargs: pipeline_dir)
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+    queue = FakeEventQueue()
+
+    await executor.execute(
+        FakeRequestContext(
+            task_id=normal_task_id,
+            context_id=context_id,
+            text="continue",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        queue,
+    )
+
+    resource = ledger.cleanup_resources()[0]
+    assert resource.cleanup_status == "completed"
+    assert resource.cleanup_tool_use_id == "tool-get"  # id of the scripted GetStack call
+    assert resource.progress_status == "DELETE_COMPLETE"
+    pipeline_updates = [  # status updates whose iac_code metadata has a "pipeline" entry
+        _dump(event)
+        for event in queue.events
+        if isinstance(event, TaskStatusUpdateEvent)
+        and "pipeline" in _dump(event).get("metadata", {}).get("iac_code", {})
+    ]
+    pipeline_events = [update["metadata"]["iac_code"]["pipeline"] for update in pipeline_updates]
+    assert [event["eventType"] for event in pipeline_events] == [
+        "cleanup_started",
+        "cleanup_progress",
+        "cleanup_completed",
+    ]
+    assert {update["taskId"] for update in pipeline_updates} == {normal_task_id}  # outer update: follow-up task
+    assert {event["taskId"] for event in pipeline_events} == {pipeline_task_id}  # payload: pipeline task
+    assert {event["deliveryTaskId"] for event in pipeline_events} == {normal_task_id}
+    snapshot = A2APipelineSnapshotStore(pipeline_dir).load()
+    assert snapshot is not None
+    assert snapshot["cleanup"]["status"] == "completed"
+    assert snapshot["cleanup"]["resources"][0]["stackStatus"] == "DELETE_COMPLETE"
+    messages = storage.load(str(cwd), session_id)
+    cleanup_messages = [message for message in messages if message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE]
+    assert len(cleanup_messages) == 1  # still exactly one stored cleanup prompt message
+    assert cleanup_messages[0].metadata["cleanupLedgerPath"] == str(ledger.path)
+    assert cleanup_messages[0].metadata["cleanupStatus"] == "completed"  # was "pending" when appended
+
+
+class _FlakyCleanupPublisher:  # publisher double whose first publish_manual call returns None
+    def __init__(self) -> None:
+        self.calls: list[dict] = []  # one dict of arguments per publish_manual call
+        self.fail_next = True  # cleared after the first call
+
+    async def publish_manual(
+        self,
+        event_type,
+        scope,
+        *,
+        status="working",
+        data=None,
+        coordinates=None,
+        require_durable_metadata=False,
+    ):
+        self.calls.append(  # record the call before deciding what to return
+            {
+                "event_type": event_type,
+                "scope": scope,
+                "status": status,
+                "data": data,
+                "coordinates": coordinates,
+                "require_durable_metadata": require_durable_metadata,
+            }
+        )
+        if self.fail_next:
+            self.fail_next = False
+            return None  # one-shot None result
+        return {"eventType": event_type}  # all later calls return a small dict
+
+
+class _CatchUpCleanupPublisher:  # publisher double exposing a fixed snapshot via snapshot_store
+    def __init__(self, snapshot: dict) -> None:
+        self.snapshot_store = SimpleNamespace(load=lambda: snapshot)  # load() always returns `snapshot`
+        self.calls: list[dict] = []  # one dict of arguments per publish_manual call
+
+    async def publish_manual(
+        self,
+        event_type,
+        scope,
+        *,
+        status="working",
+        data=None,
+        coordinates=None,
+        require_durable_metadata=False,
+    ):
+        self.calls.append(  # record every call; this double never returns None
+            {
+                "event_type": event_type,
+                "scope": scope,
+                "status": status,
+                "data": data,
+                "coordinates": coordinates,
+                "require_durable_metadata": require_durable_metadata,
+            }
+        )
+        return {"eventType": event_type}
+
+
+class _CleanupContinuationLoop:  # agent-loop double that records calls and context snapshots
+    def __init__(self, *, cleanup_stack_id: str = "stack-123") -> None:
+        self.run_prompts: list[str] = []  # prompts passed to run_streaming, in order
+        self.continue_calls = 0  # number of continue_streaming invocations
+        self.cleanup_stack_id = cleanup_stack_id  # StackId used in the scripted tool events
+        self._run_events: list[object] = [TextDeltaEvent(text="user prompt handled")]
+        self.context_manager = _CleanupContextManager()
+        self.run_context_snapshots: list[list[Message]] = []  # context copy at each run_streaming
+        self.continue_context_snapshots: list[list[Message]] = []  # context copy at each continue_streaming
+
+    async def run_streaming(self, prompt: str):
+        self.run_prompts.append(prompt)
+        self.run_context_snapshots.append(list(self.context_manager.get_messages()))  # shallow copy
+        for event in self._run_events:
+            yield event
+
+    async def continue_streaming(self):
+        self.continue_calls += 1
+        self.continue_context_snapshots.append(list(self.context_manager.get_messages()))  # shallow copy
+        yield ToolUseEndEvent(  # scripted DeleteStack call for the configured stack
+            tool_use_id="tool-delete",
+            name="aliyun_api",
+            input={
+                "product": "ROS",
+                "action": "DeleteStack",
+                "params": {"StackId": self.cleanup_stack_id, "RegionId": "cn-hangzhou"},
+            },
+        )
+        yield ToolResultEvent(  # non-error result with Status DELETE_COMPLETE
+            tool_use_id="tool-delete",
+            tool_name="aliyun_api",
+            result={"StackId": self.cleanup_stack_id, "Status": "DELETE_COMPLETE"},
+            is_error=False,
+        )
+
+
+class _TwoStepCleanupContinuationLoop(_CleanupContinuationLoop):  # first continuation is empty
+    async def continue_streaming(self):
+        self.continue_calls += 1
+        self.continue_context_snapshots.append(list(self.context_manager.get_messages()))
+        if self.continue_calls == 1:  # first call: finish without yielding any event
+            if False:  # never runs; the yields further down already make this a generator
+                yield None
+            return
+        yield ToolUseEndEvent(  # later calls: scripted DeleteStack call
+            tool_use_id="tool-delete",
+            name="aliyun_api",
+            input={
+                "product": "ROS",
+                "action": "DeleteStack",
+                "params": {"StackId": self.cleanup_stack_id, "RegionId": "cn-hangzhou"},
+            },
+        )
+        yield ToolResultEvent(  # non-error result with Status DELETE_COMPLETE
+            tool_use_id="tool-delete",
+            tool_name="aliyun_api",
+            result={"StackId": self.cleanup_stack_id, "Status": "DELETE_COMPLETE"},
+            is_error=False,
+        )
+
+
+class _CleanupContextManager:  # in-memory context-manager double backed by a plain list
+    def __init__(self) -> None:
+        self._messages: list[Message] = []
+
+    def add_raw_message(self, raw_msg):  # raw_msg is a dict with role, content, optional metadata
+        message = Message(role=raw_msg["role"], content=raw_msg["content"], metadata=raw_msg.get("metadata", {}))
+        self._messages.append(message)
+        return message
+
+    def get_messages(self):
+        return self._messages  # the live list, not a copy
+
+    def remove_cleanup_prompt_messages(self):  # returns how many messages were dropped
+        kept = [message for message in self._messages if message.metadata.get("type") != CLEANUP_PROMPT_METADATA_TYPE]
+        removed = len(self._messages) - len(kept)
+        self._messages = kept  # rebinds to a new list; earlier get_messages() results are untouched
+        return removed
+
+
+@pytest.mark.asyncio  # a None publish result must leave the previous state unchanged
+async def test_cleanup_progress_publish_retries_after_none_result(tmp_path: Path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    previous = _cleanup_resource_states(ledger)  # states captured before the update below
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="in_progress",
+        progress_status="DELETE_IN_PROGRESS",
+        progress_percentage=45,
+    )
+    publisher = _FlakyCleanupPublisher()  # returns None on its first publish_manual call
+
+    still_previous = await _publish_cleanup_resource_changes(publisher, ledger, previous)
+    advanced = await _publish_cleanup_resource_changes(publisher, ledger, still_previous)
+
+    assert still_previous == previous  # first attempt (None result) did not advance
+    assert advanced != previous  # second attempt did
+    assert [call["event_type"] for call in publisher.calls] == ["cleanup_progress", "cleanup_progress"]
+    assert [call["require_durable_metadata"] for call in publisher.calls] == [True, True]
+    assert publisher.calls[1]["data"]["progressPercentage"] == 45
+
+
+@pytest.mark.asyncio  # ledger is ahead of the publisher's snapshot before any event streams
+async def test_cleanup_observer_catches_up_snapshot_after_restart(tmp_path: Path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    ledger.update_resource(  # ledger says in_progress at 45%
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="in_progress",
+        progress_status="DELETE_IN_PROGRESS",
+        progress_percentage=45,
+    )
+    publisher = _CatchUpCleanupPublisher(
+        {
+            "cleanup": {
+                "resources": [
+                    {
+                        "provider": "ros",
+                        "resourceType": "stack",
+                        "resourceId": "stack-123",
+                        "regionId": "cn-hangzhou",
+                        "cleanupStatus": "pending",  # snapshot still says pending
+                    }
+                ]
+            }
+        }
+    )
+
+    async def empty_stream():  # async generator that yields nothing
+        if False:  # never runs; the yield only makes this function a generator
+            yield None
+
+    async for _event in _observe_cleanup_stream(empty_stream(), ledger, publisher=publisher):
+        pass  # drain the observer; the events themselves are not inspected
+
+    assert [call["event_type"] for call in publisher.calls] == ["cleanup_progress"]
+    assert publisher.calls[0]["data"]["progressPercentage"] == 45
+
+
+def test_a2a_cleanup_prune_keeps_prompt_when_cleanup_ledger_is_corrupt(tmp_path: Path) -> None:
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated list: deliberately unparsable
+    ledger = CleanupLedger(path)
+    remover = MagicMock()  # stands in for remove_cleanup_prompt_messages
+    runtime = SimpleNamespace(
+        agent_loop=SimpleNamespace(
+            context_manager=SimpleNamespace(remove_cleanup_prompt_messages=remover),
+        )
+    )
+
+    _prune_completed_cleanup_prompt_from_runtime(runtime, ledger)
+
+    remover.assert_not_called()  # nothing may be pruned in this case
+
+
+def test_a2a_cleanup_prune_keeps_prompt_when_cleanup_ledger_is_missing() -> None:
+    cleanup_message = create_cleanup_prompt_message("cleanup prompt for stack-123")
+    context_manager = _CleanupContextManager()
+    context_manager.add_raw_message(cleanup_message.to_dict())  # context holds one cleanup prompt
+    context_manager.remove_cleanup_prompt_messages = MagicMock(wraps=context_manager.remove_cleanup_prompt_messages)
+    runtime = SimpleNamespace(agent_loop=SimpleNamespace(context_manager=context_manager))
+
+    _prune_completed_cleanup_prompt_from_runtime(runtime, None)  # None passed in place of a ledger
+
+    context_manager.remove_cleanup_prompt_messages.assert_not_called()  # the wrapped remover was never invoked
+
+
+def test_a2a_deferred_cleanup_prompts_keep_latest_meaningful_turn(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Path
+) -> None:  # after 25 distinct appends only the last prompt is loaded back
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    prompts = [f"blocked prompt {index}" for index in range(25)]  # 25 distinct prompts
+
+    for prompt in prompts:
+        _append_a2a_deferred_cleanup_prompt(cwd=str(cwd), session_id=session_id, prompt=prompt)
+
+    assert _load_a2a_deferred_cleanup_prompts(cwd=str(cwd), session_id=session_id) == [prompts[-1]]
+
+
+def test_a2a_deferred_cleanup_prompts_do_not_accumulate_repeated_continue_turns(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Path
+) -> None:  # Two identical "continue" appends both succeed but are stored once.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+
+    assert _append_a2a_deferred_cleanup_prompt(cwd=str(cwd), session_id=session_id, prompt="continue") is True
+    assert _append_a2a_deferred_cleanup_prompt(cwd=str(cwd), session_id=session_id, prompt="continue") is True
+
+    assert _load_a2a_deferred_cleanup_prompts(cwd=str(cwd), session_id=session_id) == ["continue"]
+
+
+def test_a2a_deferred_cleanup_continue_preserves_existing_meaningful_turn(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Path
+) -> None:  # A later "continue" must not replace an earlier stored prompt.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+
+    assert _append_a2a_deferred_cleanup_prompt(cwd=str(cwd), session_id=session_id, prompt="update template") is True
+    assert _append_a2a_deferred_cleanup_prompt(cwd=str(cwd), session_id=session_id, prompt="continue") is True
+
+    assert _load_a2a_deferred_cleanup_prompts(cwd=str(cwd), session_id=session_id) == ["update template"]
+
+
+def test_a2a_deferred_cleanup_prompt_append_does_not_overwrite_corrupt_sidecar(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Path
+) -> None:  # Appending to a malformed sidecar returns False and leaves the file untouched.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    path = _a2a_deferred_cleanup_prompts_path(cwd=str(cwd), session_id=session_id)
+    path.parent.mkdir(parents=True, exist_ok=True)
+    path.write_text("{broken", encoding="utf-8")  # Deliberately malformed sidecar content.
+
+    assert _append_a2a_deferred_cleanup_prompt(cwd=str(cwd), session_id=session_id, prompt="new prompt") is False
+
+    assert path.read_text(encoding="utf-8") == "{broken"  # Bytes on disk are unchanged.
+
+
+@pytest.mark.asyncio
+async def test_a2a_cleanup_observer_does_not_mutate_corrupt_ledger_or_prune_prompt(tmp_path: Path) -> None:
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # Deliberately malformed ledger content.
+    ledger = CleanupLedger(path)
+    remover = MagicMock()  # Records any attempt to remove cleanup prompt messages.
+    runtime = SimpleNamespace(
+        agent_loop=SimpleNamespace(
+            context_manager=SimpleNamespace(remove_cleanup_prompt_messages=remover),
+        )
+    )
+
+    async def events():  # Single-event stream: the end of a DeleteStack tool call for stack-123.
+        yield ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "DeleteStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+
+    async for _event in _observe_cleanup_stream(events(), ledger):
+        pass  # Drain the stream; only the observer's side effects matter here.
+    _prune_completed_cleanup_prompt_from_runtime(runtime, ledger)
+
+    assert path.exists()  # The corrupt ledger file is still present...
+    assert not list(tmp_path.glob("cleanup.yaml.corrupt*"))  # ...and no "cleanup.yaml.corrupt*" file appeared.
+    remover.assert_not_called()  # The cleanup prompt was not pruned.
+
+
+def test_cleanup_publisher_falls_back_to_journal_when_snapshot_is_unreadable(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # A malformed snapshot file must not prevent a publisher from being built.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    pipeline_dir = tmp_path / "pipeline"
+    pipeline_dir.mkdir()
+    (pipeline_dir / "a2a-snapshot.json").write_text("{broken", encoding="utf-8")  # Malformed snapshot.
+    A2APipelineJournal(pipeline_dir).append(  # Journal holds one pipeline_started event.
+        {
+            "schemaVersion": "1.0",
+            "eventId": "evt-start",
+            "sequence": 1,
+            "createdAt": "2026-01-01T00:00:00Z",
+            "eventType": "pipeline_started",
+            "scope": "pipeline",
+            "pipelineRunId": "ctx-cleanup",
+            "taskId": "task-pipeline",
+            "contextId": "ctx-cleanup",
+            "pipelineName": "selling",
+            "status": "working",
+            "data": {"totalSteps": 1, "stepIds": ["deploying"]},
+        }
+    )
+
+    monkeypatch.setattr("iac_code.a2a.executor.existing_a2a_pipeline_dir_for_session", lambda **kwargs: pipeline_dir)
+
+    publisher = _cleanup_publisher_for_a2a_normal_chat(
+        event_queue=FakeEventQueue(),
+        cwd=str(cwd),
+        session_id="session-cleanup",
+        task_id="task-normal",
+        context_id="ctx-cleanup",
+        artifact_store=None,
+        exposure_types=None,
+    )
+
+    assert publisher is not None
+    assert publisher.translator._context.task_id == "task-pipeline"  # Matches the journal event's taskId.
+    assert publisher.delivery_task_id == "task-normal"  # Matches the task_id passed to the factory.
+
+
+@pytest.mark.asyncio
+async def test_normal_a2a_turn_runs_cleanup_prompt_as_continuation_then_processes_user_prompt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # One turn: cleanup is continued once, then the user's text is run.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    storage = SessionStorage()
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(  # Register one ROS stack as needing cleanup.
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None
+    storage.append(str(cwd), session_id, create_cleanup_prompt_message(cleanup_prompt.prompt))
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    loop = _CleanupContinuationLoop()
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)  # Inject the fake.
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+
+    await executor.execute(
+        FakeRequestContext(
+            task_id="task-normal",
+            context_id=context_id,
+            text="user follow-up",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    assert loop.continue_calls == 1  # Exactly one continuation call was made.
+    assert loop.run_prompts == ["user follow-up"]  # The user's text was then run as a prompt.
+    assert not any(  # No cleanup prompt message in the context captured for the first run.
+        message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE for message in loop.run_context_snapshots[0]
+    )
+    assert ledger.cleanup_resources()[0].cleanup_status == "completed"
+
+
+@pytest.mark.asyncio
+async def test_normal_a2a_turn_injects_cleanup_prompt_from_ledger_before_cleanup_continuation(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # The ledger has pending cleanup but no cleanup prompt was stored beforehand.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    storage = SessionStorage()
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(  # Register one ROS stack as needing cleanup.
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    loop = _CleanupContinuationLoop()
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)  # Inject the fake.
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+
+    await executor.execute(
+        FakeRequestContext(
+            task_id="task-normal",
+            context_id=context_id,
+            text="user follow-up",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    messages = storage.load(str(cwd), session_id)  # Re-read what was persisted for the session.
+    assert any(message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE for message in messages)
+    assert loop.continue_calls == 1  # Exactly one continuation call was made.
+    assert loop.run_prompts == ["user follow-up"]  # The user's text was then run as a prompt.
+
+
+@pytest.mark.asyncio
+async def test_normal_a2a_turn_defers_prompt_until_pending_cleanup_completes(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # Turn 1 stores the user's prompt; turn 2 runs it after cleanup completes.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    storage = SessionStorage()
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(  # Register one ROS stack as needing cleanup.
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None
+    storage.append(str(cwd), session_id, create_cleanup_prompt_message(cleanup_prompt.prompt))
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    loop = _TwoStepCleanupContinuationLoop()  # NOTE(review): presumably needs two continuations to finish.
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)  # Inject the fake.
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+
+    await executor.execute(  # First turn.
+        FakeRequestContext(
+            task_id="task-normal-1",
+            context_id=context_id,
+            text="update the template after cleanup",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    assert loop.continue_calls == 1
+    assert loop.run_prompts == []  # The user's prompt has not been run yet...
+    assert _load_a2a_deferred_cleanup_prompts(cwd=str(cwd), session_id=session_id) == [  # ...it was stored.
+        "update the template after cleanup"
+    ]
+
+    await executor.execute(  # Second turn: the user only says "continue".
+        FakeRequestContext(
+            task_id="task-normal-2",
+            context_id=context_id,
+            text="continue",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    assert loop.continue_calls == 2
+    assert loop.run_prompts == ["update the template after cleanup"]  # The stored prompt ran, not "continue".
+    assert _load_a2a_deferred_cleanup_prompts(cwd=str(cwd), session_id=session_id) == []  # Store was drained.
+    assert not any(  # No cleanup prompt message in the context captured for the first run.
+        message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE for message in loop.run_context_snapshots[0]
+    )
+    assert ledger.cleanup_resources()[0].cleanup_status == "completed"
+
+
+@pytest.mark.asyncio
+async def test_normal_a2a_turn_does_not_overwrite_corrupt_deferred_prompt_sidecar(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # A malformed deferred-prompt file is left as-is and the task output reports it.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    storage = SessionStorage()
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(  # Register one ROS stack as needing cleanup.
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None
+    storage.append(str(cwd), session_id, create_cleanup_prompt_message(cleanup_prompt.prompt))
+    deferred_path = _a2a_deferred_cleanup_prompts_path(cwd=str(cwd), session_id=session_id)
+    deferred_path.parent.mkdir(parents=True, exist_ok=True)
+    deferred_path.write_text("{broken", encoding="utf-8")  # Deliberately malformed sidecar content.
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    loop = _TwoStepCleanupContinuationLoop()
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)  # Inject the fake.
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+
+    await executor.execute(
+        FakeRequestContext(
+            task_id="task-normal",
+            context_id=context_id,
+            text="update the template after cleanup",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    assert loop.continue_calls == 1
+    assert loop.run_prompts == []  # The user's prompt was not run.
+    assert deferred_path.read_text(encoding="utf-8") == "{broken"  # Bytes on disk are unchanged.
+    task = await store.get_or_create_task(task_id="task-normal", context_id=context_id)
+    assert "deferred prompt state is unavailable" in "".join(task.output_text)
+
+
+@pytest.mark.asyncio
+async def test_normal_a2a_turn_blocks_agent_execution_when_cleanup_ledger_is_corrupt_with_prompt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # Cleanup prompt exists but the ledger is malformed: the agent loop is never invoked.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    storage = SessionStorage()
+    ledger_path = storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml"
+    ledger_path.parent.mkdir(parents=True, exist_ok=True)
+    ledger_path.write_text("[broken", encoding="utf-8")  # Deliberately malformed ledger content.
+    cleanup_message = create_cleanup_prompt_message("cleanup prompt for stack-123")
+    storage.append(str(cwd), session_id, cleanup_message)
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    loop = _CleanupContinuationLoop()
+    loop.context_manager.add_raw_message(cleanup_message.to_dict())  # Same prompt in the live context.
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)  # Inject the fake.
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+
+    await executor.execute(
+        FakeRequestContext(
+            task_id="task-normal",
+            context_id=context_id,
+            text="user follow-up",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    assert loop.continue_calls == 0  # No continuation was attempted...
+    assert loop.run_prompts == []  # ...and the user's prompt was not run.
+    task = await store.get_or_create_task(task_id="task-normal", context_id=context_id)
+    assert "cleanup state is unavailable" in "".join(task.output_text)
+
+
+@pytest.mark.asyncio
+async def test_normal_a2a_turn_blocks_agent_execution_when_cleanup_ledger_is_missing_with_prompt(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # Cleanup prompt exists but no ledger file is written: the agent loop is never invoked.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    storage = SessionStorage()
+    cleanup_message = create_cleanup_prompt_message("cleanup prompt for stack-123")
+    storage.append(str(cwd), session_id, cleanup_message)  # Prompt is stored; no ledger is created.
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    loop = _CleanupContinuationLoop()
+    loop.context_manager.add_raw_message(cleanup_message.to_dict())  # Same prompt in the live context.
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)  # Inject the fake.
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+
+    await executor.execute(
+        FakeRequestContext(
+            task_id="task-normal",
+            context_id=context_id,
+            text="user follow-up",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    assert loop.continue_calls == 0  # No continuation was attempted...
+    assert loop.run_prompts == []  # ...and the user's prompt was not run.
+    cleanup_messages = [  # Cleanup prompt messages still present in the live context.
+        message
+        for message in loop.context_manager.get_messages()
+        if message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE
+    ]
+    assert cleanup_messages  # The prompt was kept, not pruned.
+    task = await store.get_or_create_task(task_id="task-normal", context_id=context_id)
+    assert "cleanup state is unavailable" in "".join(task.output_text)
+
+
+@pytest.mark.asyncio
+async def test_normal_a2a_turn_replaces_stale_cleanup_prompt_before_partial_cleanup_continuation(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:  # A prompt built before one stack finished must be swapped for an up-to-date one.
+    config_dir = tmp_path / "config"
+    config_dir.mkdir()
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(config_dir))  # Presumably keeps state under tmp_path — confirm.
+    cwd = tmp_path / "workspace"
+    cwd.mkdir()
+    session_id = "session-cleanup"
+    context_id = "ctx-cleanup"
+    storage = SessionStorage()
+    ledger = CleanupLedger(storage.session_dir(str(cwd), session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(  # Register two ROS stacks as needing cleanup.
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-done",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-pending",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            ),
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    stale_prompt = ledger.build_pending_prompt()  # Built while both stacks are still pending.
+    assert stale_prompt is not None
+    stale_message = create_cleanup_prompt_message(stale_prompt.prompt)
+    storage.append(str(cwd), session_id, stale_message)
+    ledger.update_resource(  # Mark stack-done completed after the prompt above was built.
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-done",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_context(A2AContextSnapshot(context_id=context_id, session_id=session_id, cwd=str(cwd)))
+    loop = _CleanupContinuationLoop(cleanup_stack_id="stack-pending")
+    loop.context_manager.add_raw_message(stale_message.to_dict())  # Live context starts with the stale prompt.
+    runtime = FakeRuntime(agent_loop=loop, session_id=session_id)
+
+    monkeypatch.setattr("iac_code.a2a.executor.create_agent_runtime", lambda options: runtime)  # Inject the fake.
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+
+    await executor.execute(
+        FakeRequestContext(
+            task_id="task-normal",
+            context_id=context_id,
+            text="user follow-up",
+            metadata={"iac_code": {"cwd": str(cwd)}},
+        ),
+        FakeEventQueue(),
+    )
+
+    cleanup_messages = [  # Cleanup prompts in the context captured for the first continuation.
+        message
+        for message in loop.continue_context_snapshots[0]
+        if message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE
+    ]
+    assert len(cleanup_messages) == 1  # Exactly one prompt: the stale one is not kept alongside.
+    assert "stack-pending" in cleanup_messages[0].content
+    assert "stack-done" not in cleanup_messages[0].content  # The completed stack is no longer mentioned.
diff --git a/tests/a2a/test_jsonrpc_passthrough.py b/tests/a2a/test_jsonrpc_passthrough.py
new file mode 100644
index 00000000..0d5f0fbe
--- /dev/null
+++ b/tests/a2a/test_jsonrpc_passthrough.py
@@ -0,0 +1,50 @@
+from __future__ import annotations
+
+import importlib
+from typing import Any
+
+
+def test_importing_pipeline_executor_does_not_install_jsonrpc_passthrough(monkeypatch) -> None:
+    from a2a.server.request_handlers import response_helpers
+    from a2a.server.routes import jsonrpc_dispatcher
+
+    def sentinel_build_error_response(request_id: str | int | None, error: Any) -> dict[str, Any]:
+        return {"jsonrpc": "2.0", "id": request_id, "error": {"code": getattr(error, "code", -32603)}}
+
+    monkeypatch.setattr(response_helpers, "build_error_response", sentinel_build_error_response)
+    monkeypatch.setattr(jsonrpc_dispatcher, "build_error_response", sentinel_build_error_response)
+
+    import iac_code.a2a.pipeline_executor as pipeline_executor
+
+    importlib.reload(pipeline_executor)  # Re-run module top-level code even if it was imported earlier.
+
+    assert response_helpers.build_error_response is sentinel_build_error_response  # Sentinel not replaced.
+    assert jsonrpc_dispatcher.build_error_response is sentinel_build_error_response  # Sentinel not replaced.
+
+
+def test_jsonrpc_passthrough_explicit_install_is_idempotent(monkeypatch) -> None:
+    from a2a.server.request_handlers import response_helpers
+    from a2a.server.routes import jsonrpc_dispatcher
+
+    from iac_code.a2a.jsonrpc_passthrough import install_jsonrpc_error_data_passthrough
+
+    def original_build_error_response(request_id: str | int | None, error: Any) -> dict[str, Any]:
+        return {"jsonrpc": "2.0", "id": request_id, "error": {"code": getattr(error, "code", -32603)}}
+
+    class RecoverableError(Exception):  # Error type that opts in to passthrough and carries a data payload.
+        code = -32602
+        jsonrpc_error_data_passthrough = True
+        data = {"recoverableTaskId": "task-owner"}
+
+    monkeypatch.setattr(response_helpers, "build_error_response", original_build_error_response)
+    monkeypatch.setattr(jsonrpc_dispatcher, "build_error_response", original_build_error_response)
+
+    install_jsonrpc_error_data_passthrough()
+    installed = response_helpers.build_error_response  # Builder in place after the first install.
+    install_jsonrpc_error_data_passthrough()  # Second install must not replace it again.
+
+    assert response_helpers.build_error_response is installed
+    assert jsonrpc_dispatcher.build_error_response is installed
+    response = installed("req-1", RecoverableError("Pipeline already running"))
+    assert response["error"]["code"] == -32602
+    assert response["error"]["data"] == {"recoverableTaskId": "task-owner"}  # data reaches the response.
diff --git a/tests/a2a/test_parts.py b/tests/a2a/test_parts.py
index c0f7212f..1d8deeab 100644
--- a/tests/a2a/test_parts.py
+++ b/tests/a2a/test_parts.py
@@ -1,12 +1,17 @@
 from __future__ import annotations
 
 import base64
+import io
+from types import SimpleNamespace
 
 import pytest
 from a2a.types import Part
 from google.protobuf.struct_pb2 import Value
+from PIL import Image
 
 from iac_code.a2a import parts
+from iac_code.a2a.parts import parts_to_pipeline_input
+from iac_code.agent.message import ImageBlock, TextBlock
 
 
 def _data_part(value: dict[str, object]) -> Part:
@@ -192,3 +197,134 @@ def test_message_parts_join_non_empty_values(tmp_path) -> None:
     assert parts.parts_to_prompt([Part(text="first"), Part(text=""), Part(text="second")], cwd=tmp_path) == (
         "first\nsecond"
     )
+
+
+def _resize_spy(monkeypatch, *, output: bytes, media_type: str = "image/webp") -> list[bytes]:
+    calls: list[bytes] = []  # Every payload handed to the fake resizer, in call order.
+
+    def fake_resize(content: bytes):  # Returns fixed output instead of doing real image work.
+        calls.append(content)
+        return SimpleNamespace(data=output, media_type=media_type)
+
+    monkeypatch.setattr("iac_code.a2a.parts.maybe_resize_and_downsample", fake_resize)
+    return calls  # Caller inspects this list after exercising the code under test.
+
+
+def _tiny_bmp_bytes() -> bytes:  # Encoded bytes of a 1x1 red RGB image in BMP format.
+    buf = io.BytesIO()
+    Image.new("RGB", (1, 1), color=(255, 0, 0)).save(buf, format="BMP")
+    return buf.getvalue()
+
+
+def _tiny_png_bytes() -> bytes:  # Encoded bytes of a 1x1 green RGB image in PNG format.
+    buf = io.BytesIO()
+    Image.new("RGB", (1, 1), color=(0, 255, 0)).save(buf, format="PNG")
+    return buf.getvalue()
+
+
+def test_parts_to_pipeline_input_converts_raw_image(monkeypatch, tmp_path) -> None:
+    raw = b"fake png bytes"
+    resized = b"resized raw image"
+    calls = _resize_spy(monkeypatch, output=resized, media_type="image/webp")  # Stub out the resizer.
+
+    value = parts_to_pipeline_input([Part(raw=raw, media_type="image/png")], cwd=tmp_path)
+
+    assert calls == [raw]  # The resizer received the original bytes exactly once.
+    assert value.has_images is True
+    assert value.display_text == "[Image input]"  # Display text used when there is no text part.
+    assert value.content == [ImageBlock(media_type="image/webp", data=base64.b64encode(resized).decode("ascii"))]
+
+
+def test_parts_to_pipeline_input_preserves_text_plus_image_order(monkeypatch, tmp_path) -> None:
+    raw = b"fake jpeg bytes"
+    resized = b"resized jpeg bytes"
+    calls = _resize_spy(monkeypatch, output=resized, media_type="image/jpeg")  # Stub out the resizer.
+
+    value = parts_to_pipeline_input(
+        [
+            Part(text="inspect this", media_type="text/plain"),
+            Part(raw=raw, media_type="image/jpeg"),
+        ],
+        cwd=tmp_path,
+    )
+
+    assert calls == [raw]  # Only the image part went through the resizer.
+    assert value.display_text == "inspect this"
+    assert value.content == [  # Blocks appear in the same order as the input parts.
+        TextBlock(text="inspect this"),
+        ImageBlock(media_type="image/jpeg", data=base64.b64encode(resized).decode("ascii")),
+    ]
+
+
+def test_parts_to_pipeline_input_converts_base64_data_image(monkeypatch, tmp_path) -> None:
+    raw = b"fake data image"
+    resized = b"resized data image"
+    encoded = base64.b64encode(raw).decode("ascii")  # Image supplied as base64 text in a data part.
+    calls = _resize_spy(monkeypatch, output=resized, media_type="image/png")  # Stub out the resizer.
+
+    value = parts_to_pipeline_input([_binary_data_part({"bytes": encoded}, media_type="image/png")], cwd=tmp_path)
+
+    assert calls == [raw]  # The resizer received the decoded bytes, not the base64 text.
+    assert value.content == [ImageBlock(media_type="image/png", data=base64.b64encode(resized).decode("ascii"))]
+
+
+def test_parts_to_pipeline_input_converts_safe_file_url_image(monkeypatch, tmp_path) -> None:
+    raw = b"file image bytes"
+    resized = b"resized file image"
+    source = tmp_path / "diagram.png"  # File lives inside the directory passed as cwd below.
+    source.write_bytes(raw)
+    calls = _resize_spy(monkeypatch, output=resized, media_type="image/png")  # Stub out the resizer.
+
+    value = parts_to_pipeline_input([Part(url=source.as_uri(), media_type="image/png")], cwd=tmp_path)
+
+    assert calls == [raw]  # The file's contents were read and passed to the resizer.
+    assert value.content == [ImageBlock(media_type="image/png", data=base64.b64encode(resized).decode("ascii"))]
+
+
+def test_parts_to_pipeline_input_uses_real_resizer_for_valid_image_bytes(tmp_path) -> None:
+    raw = _tiny_bmp_bytes()  # BMP-encoded bytes, sent below with a declared media type of image/png.
+
+    value = parts_to_pipeline_input([Part(raw=raw, media_type="image/png")], cwd=tmp_path)
+
+    assert isinstance(value.content, list)
+    block = value.content[0]
+    assert isinstance(block, ImageBlock)
+    assert block.media_type == "image/png"
+    assert base64.b64decode(block.data).startswith(b"\x89PNG\r\n\x1a\n")  # Output carries the PNG signature.
+
+
+def test_parts_to_pipeline_input_accepts_tiny_png_without_monkeypatch(tmp_path) -> None:
+    raw = _tiny_png_bytes()  # Real PNG bytes; the resizer is not stubbed in this test.
+
+    value = parts_to_pipeline_input([Part(raw=raw, media_type="image/png")], cwd=tmp_path)
+
+    assert isinstance(value.content, list)
+    block = value.content[0]
+    assert isinstance(block, ImageBlock)
+    assert block.media_type == "image/png"
+    assert base64.b64decode(block.data).startswith(b"\x89PNG\r\n\x1a\n")  # Output carries the PNG signature.
+
+
+def test_parts_to_pipeline_input_rejects_unsafe_file_url_image(tmp_path) -> None:
+    outside = tmp_path.parent / "outside-diagram.png"  # Sibling of tmp_path, i.e. outside the cwd used below.
+    outside.write_bytes(b"outside")  # NOTE(review): written outside tmp_path; no cleanup visible here.
+
+    with pytest.raises(ValueError, match="outside the allowed workspace"):
+        parts_to_pipeline_input([Part(url=outside.as_uri(), media_type="image/png")], cwd=tmp_path)
+
+
+def test_parts_to_pipeline_input_rejects_invalid_base64_data_image(tmp_path) -> None:
+    with pytest.raises(ValueError, match="valid base64"):  # "not-base64!" must be rejected, not decoded.
+        parts_to_pipeline_input([_binary_data_part({"bytes": "not-base64!"}, media_type="image/png")], cwd=tmp_path)
+
+
+def test_parts_to_pipeline_input_rejects_oversized_raw_image(monkeypatch, tmp_path) -> None:
+    monkeypatch.setattr("iac_code.a2a.parts.MAX_BINARY_INLINE_BYTES", 3)  # Shrink the limit below the payload.
+
+    with pytest.raises(ValueError, match="too large"):
+        parts_to_pipeline_input([Part(raw=b"abcd", media_type="image/png")], cwd=tmp_path)  # 4 bytes > 3.
+
+
+def test_parts_to_pipeline_input_rejects_audio_as_true_image(tmp_path) -> None:
+    with pytest.raises(ValueError, match="unsupported image media type"):  # audio/wav is not an image type.
+        parts_to_pipeline_input([Part(raw=b"audio", media_type="audio/wav")], cwd=tmp_path)
diff --git a/tests/a2a/test_pipeline_debugger_script.py b/tests/a2a/test_pipeline_debugger_script.py
index 43336d9a..94e60518 100644
--- a/tests/a2a/test_pipeline_debugger_script.py
+++ b/tests/a2a/test_pipeline_debugger_script.py
@@ -18,6 +18,19 @@
 import pytest
 
 SCRIPT_PATH = Path(__file__).resolve().parents[2] / "scripts" / "a2a" / "debugger.py"
+RECOVERABLE_JSONRPC_ERROR = {  # Sample JSON-RPC 2.0 error response with recovery details in error.data.
+    "jsonrpc": "2.0",
+    "id": "1",
+    "error": {
+        "code": -32602,
+        "message": "Pipeline already running.",
+        "data": {
+            "recoverableTaskId": "task-owner",
+            "contextId": "ctx-1",
+            "sidecarStatus": "running",
+        },
+    },
+}
 
 
 def load_debugger_module():
@@ -75,7 +88,7 @@ def serve_handler(handler_cls: type[BaseHTTPRequestHandler]) -> Iterator[str]:
     thread = threading.Thread(target=server.serve_forever, daemon=True)
     thread.start()
     try:
-        host, port = server.server_address
+        host, port = server.server_address[:2]
         yield f"http://{host}:{port}"
     finally:
         server.shutdown()
@@ -100,7 +113,7 @@ def start_debugger_server(debugger, *, default_cwd: str = "/workspace/demo"):
     server = debugger.create_server(config)
     thread = threading.Thread(target=server.serve_forever, daemon=True)
     thread.start()
-    host, port = server.server_address
+    host, port = server.server_address[:2]
 
     class RunningServer:
         url = f"http://{host}:{port}"
@@ -124,7 +137,7 @@ def start_logged_debugger_server(debugger, *, log_dir: Path, default_cwd: str =
     server = debugger.create_server(config)
     thread = threading.Thread(target=server.serve_forever, daemon=True)
     thread.start()
-    host, port = server.server_address
+    host, port = server.server_address[:2]
 
     class RunningServer:
         url = f"http://{host}:{port}"
@@ -224,6 +237,61 @@ def test_build_message_stream_payload_uses_a2a_v1_method_and_cwd_metadata() -> N
     assert payload["params"]["configuration"] == {"acceptedOutputModes": ["text/plain"]}
 
 
+def test_build_message_stream_payload_adds_image_data_parts() -> None:
+    debugger = load_debugger_module()
+
+    payload = debugger.build_message_stream_payload(
+        cwd="/workspace/demo",
+        prompt="inspect this topology",
+        context_id="ctx-demo",
+        task_id="task-demo",
+        request_id="req-1",
+        message_id="msg-1",
+        images=[
+            {
+                "filename": "topology.png",
+                "mediaType": "image/png",
+                "bytes": "iVBORw0KGgo=",
+            }
+        ],
+    )
+
+    assert payload["params"]["message"]["parts"] == [
+        {"text": "inspect this topology"},
+        {
+            "data": {"filename": "topology.png", "bytes": "iVBORw0KGgo="},
+            "mediaType": "image/png",
+        },
+    ]
+
+
+def test_build_message_stream_payload_allows_image_only_parts() -> None:
+    debugger = load_debugger_module()
+
+    payload = debugger.build_message_stream_payload(
+        cwd="/workspace/demo",
+        prompt="",
+        context_id="ctx-demo",
+        task_id="task-demo",
+        request_id="req-1",
+        message_id="msg-1",
+        images=[
+            {
+                "filename": "topology.png",
+                "mediaType": "image/png",
+                "bytes": "iVBORw0KGgo=",
+            }
+        ],
+    )
+
+    assert payload["params"]["message"]["parts"] == [
+        {
+            "data": {"filename": "topology.png", "bytes": "iVBORw0KGgo="},
+            "mediaType": "image/png",
+        },
+    ]
+
+
 def test_build_message_stream_payload_omits_blank_context_id() -> None:
     debugger = load_debugger_module()
 
@@ -357,6 +425,8 @@ def test_index_html_contains_debugger_controls_and_raw_panels(tmp_path: Path) ->
         'id="context-id"',
         'id="task-id"',
         'id="prompt"',
+        'id="image-input"',
+        'id="image-summary"',
         'id="stream-button"',
         'id="fetch-state-button"',
         'id="cancel-button"',
@@ -1038,6 +1108,23 @@ def test_index_html_cancel_uses_active_task_id() -> None:
         assert expected in html
 
 
+def test_index_html_fetches_pipeline_state_after_cancel() -> None:
+    debugger = load_debugger_module()
+
+    html = debugger.render_index_html(
+        debugger.DebuggerConfig(
+            host="127.0.0.1",
+            port=41880,
+            default_server_url="http://127.0.0.1:41299",
+            default_cwd="/workspace/demo",
+        )
+    )
+    cancel_body = html.split("async function cancelTask()", 1)[1].split("async function streamMessage()", 1)[0]
+
+    assert 'appendRawEvent("sse", {type: "cancel", body});' in cancel_body
+    assert "await fetchStateIfAvailable();" in cancel_body
+
+
 def test_index_html_yields_between_batched_sse_events() -> None:
     debugger = load_debugger_module()
 
@@ -1076,7 +1163,7 @@ def test_index_html_omits_completed_pipeline_task_id_after_normal_handoff() -> N
     for expected in [
         "normalHandoffReady",
         "function streamTaskIdForControls",
-        "state.normalHandoffReady && !controls.activeTaskId",
+        "state.normalHandoffReady || isTerminalPipelineTaskState(state.status)",
         'state.activeTaskId = "";',
         'return "";',
         "updateNormalHandoffState(envelope);",
@@ -1084,6 +1171,71 @@ def test_index_html_omits_completed_pipeline_task_id_after_normal_handoff() -> N
         assert expected in html
 
 
+def test_index_html_omits_terminal_pipeline_task_id_when_streaming_followup(tmp_path: Path) -> None:
+    debugger = load_debugger_module()
+
+    html = debugger.render_index_html(
+        debugger.DebuggerConfig(
+            host="127.0.0.1",
+            port=41880,
+            default_server_url="http://127.0.0.1:41299",
+            default_cwd="/workspace/demo",
+        )
+    )
+    script = html[html.index("<script>") + len("<script>") : html.rindex("</script>")]
+
+    assert "function isTerminalPipelineTaskState" in script
+    assert "isTerminalPipelineTaskState(state.status)" in script
+
+    def extract_function(name: str) -> str:
+        start = script.index(f"function {name}")
+        brace = script.index("{", start)
+        depth = 0
+        for index in range(brace, len(script)):
+            char = script[index]
+            if char == "{":
+                depth += 1
+            elif char == "}":
+                depth -= 1
+                if depth == 0:
+                    return script[start : index + 1]
+        raise AssertionError(f"Could not extract {name}")
+
+    functions = [extract_function("streamTaskIdForControls")]
+    if "function isTerminalPipelineTaskState" in script:
+        functions.insert(0, extract_function("isTerminalPipelineTaskState"))
+
+    js_path = tmp_path / "stream-task-routing.js"
+    js_path.write_text(
+        "\n".join(
+            [
+                'const state = {normalHandoffReady: false, activeTaskId: "", taskId: "task-1", status: ""};',
+                *functions,
+                'state.status = "TASK_STATE_CANCELED";',
+                'if (streamTaskIdForControls({activeTaskId: "", taskId: "task-1"}) !== "") {',
+                '  throw new Error("canceled pipeline taskId should not be reused");',
+                "}",
+                'state.status = "canceled";',
+                'if (streamTaskIdForControls({activeTaskId: "", taskId: "task-1"}) !== "") {',
+                '  throw new Error("snapshot canceled pipeline taskId should not be reused");',
+                "}",
+                'state.status = "waiting_input";',
+                'if (streamTaskIdForControls({activeTaskId: "", taskId: "task-1"}) !== "task-1") {',
+                '  throw new Error("waiting input pipeline taskId should be reused");',
+                "}",
+            ]
+        ),
+        encoding="utf-8",
+    )
+
+    try:
+        result = subprocess.run(["node", str(js_path)], capture_output=True, text=True, check=False)
+    except FileNotFoundError:
+        pytest.skip("node is not installed")
+
+    assert result.returncode == 0, result.stderr
+
+
 def test_index_html_clears_finished_active_task_after_normal_chat_turn() -> None:
     debugger = load_debugger_module()
 
@@ -1190,6 +1342,112 @@ def test_index_html_can_restore_debugger_log_replay_payload(tmp_path: Path) -> N
     ]
 
 
+def test_load_log_dir_replays_state_fetch_cancel_handoff_events(tmp_path: Path) -> None:
+    debugger = load_debugger_module()
+    log_dir = tmp_path / "logs"
+    log_dir.mkdir()
+    (log_dir / "sse-events.jsonl").write_text(
+        json.dumps(
+            {
+                "raw": {
+                    "statusUpdate": {
+                        "taskId": "task-pipeline",
+                        "contextId": "ctx-1",
+                        "status": {"state": "TASK_STATE_INPUT_REQUIRED"},
+                        "metadata": {
+                            "iac_code": {
+                                "pipeline": {
+                                    "eventType": "input_required",
+                                    "sequence": 72.0,
+                                    "taskId": "task-pipeline",
+                                    "contextId": "ctx-1",
+                                    "status": "input_required",
+                                }
+                            }
+                        },
+                    }
+                }
+            }
+        )
+        + "\n",
+        encoding="utf-8",
+    )
+    (log_dir / "snapshots.jsonl").write_text(
+        json.dumps(
+            {
+                "raw": {
+                    "snapshot": {
+                        "status": "canceled",
+                        "taskId": "task-pipeline",
+                        "contextId": "ctx-1",
+                        "lastSequence": 74,
+                        "normalHandoff": {
+                            "action": "switch_to_normal",
+                            "targetMode": "normal",
+                            "outcome": "canceled",
+                        },
+                    },
+                    "events": [
+                        {
+                            "eventType": "pipeline_canceled",
+                            "sequence": 73,
+                            "taskId": "task-pipeline",
+                            "contextId": "ctx-1",
+                            "status": "canceled",
+                        },
+                        {
+                            "eventType": "pipeline_handoff_ready",
+                            "sequence": 74,
+                            "taskId": "task-pipeline",
+                            "contextId": "ctx-1",
+                            "status": "canceled",
+                            "data": {
+                                "action": "switch_to_normal",
+                                "targetMode": "normal",
+                                "outcome": "canceled",
+                            },
+                        },
+                    ],
+                }
+            }
+        )
+        + "\n",
+        encoding="utf-8",
+    )
+
+    replay = debugger.load_debug_log_export(log_dir)
+
+    assert replay["task"]["taskId"] == "task-pipeline"
+    assert replay["task"]["activeTaskId"] == ""
+    assert replay["task"]["contextId"] == "ctx-1"
+    assert replay["task"]["status"] == "canceled"
+    assert replay["task"]["lastSequence"] == 74
+    assert [event["eventType"] for event in replay["sseEvents"][-2:]] == [
+        "pipeline_canceled",
+        "pipeline_handoff_ready",
+    ]
+
+
+def test_index_html_normal_handoff_summary_reads_snapshot_response_wrapper() -> None:
+    debugger = load_debugger_module()
+
+    html = debugger.render_index_html(
+        debugger.DebuggerConfig(
+            host="127.0.0.1",
+            port=41880,
+            default_server_url="http://127.0.0.1:41299",
+            default_cwd="/workspace/demo",
+        )
+    )
+    normal_handoff_body = html.split("function snapshotNormalHandoff(snapshot)", 1)[1].split(
+        "function normalHandoffSummary(snapshot)",
+        1,
+    )[0]
+
+    assert "snapshotEnvelope(snapshot)" in normal_handoff_body
+    assert "snapshotObject(envelope &&" in normal_handoff_body
+
+
 def test_index_html_fills_context_and_task_id_controls_after_capture() -> None:
     debugger = load_debugger_module()
 
@@ -1254,6 +1512,26 @@ def test_index_html_reads_input_required_data_and_clears_stale_permissions() ->
         assert expected in html
 
 
+def test_index_html_highlights_pipeline_canceled_events() -> None:
+    debugger = load_debugger_module()
+
+    html = debugger.render_index_html(
+        debugger.DebuggerConfig(
+            host="127.0.0.1",
+            port=41880,
+            default_server_url="http://127.0.0.1:41299",
+            default_cwd="/workspace/demo",
+        )
+    )
+
+    for expected in [
+        'type === "pipeline_canceled"',
+        'label: "pipeline canceled"',
+        "timeline-canceled",
+    ]:
+        assert expected in html
+
+
 def test_index_html_stops_stream_after_input_required_to_reenable_prompt_submit() -> None:
     debugger = load_debugger_module()
 
@@ -1707,6 +1985,73 @@ def do_POST(self) -> None:
         self.end_headers()
 
 
+class JsonRpcErrorTargetHandler(BaseHTTPRequestHandler):
+    def log_message(self, format: str, *args: object) -> None:
+        return None
+
+    def do_POST(self) -> None:
+        raw_body = self.rfile.read(int(self.headers.get("Content-Length", "0") or "0"))
+        assert raw_body
+        body = json.dumps(
+            {
+                "jsonrpc": "2.0",
+                "id": "1",
+                "error": {
+                    "code": -32602,
+                    "message": "Current model text-only-model does not support image input.",
+                    "data": {
+                        "recoverableTaskId": "task-owner",
+                        "contextId": "ctx-1",
+                        "sidecarStatus": "running",
+                    },
+                },
+            }
+        ).encode("utf-8")
+        self.send_response(200)
+        self.send_header("Content-Type", "application/json")
+        self.send_header("Content-Length", str(len(body)))
+        self.end_headers()
+        self.wfile.write(body)
+
+
+def test_jsonrpc_error_message_includes_recoverable_task_id() -> None:
+    debugger = load_debugger_module()
+
+    message = debugger._jsonrpc_error_message(RECOVERABLE_JSONRPC_ERROR)
+
+    assert message is not None
+    assert "Pipeline already running." in message
+    assert "task-owner" in message
+
+
+def test_index_html_extracts_delivery_task_aliases() -> None:
+    script = SCRIPT_PATH.read_text(encoding="utf-8")
+
+    assert "statusUpdate.deliveryTaskId" in script
+    assert "statusUpdate.deliveryContextId" in script
+    assert "task.deliveryTaskId" in script
+    assert "envelope.deliveryTaskId" in script
+
+
+def test_jsonrpc_error_message_does_not_duplicate_resume_guidance() -> None:
+    debugger = load_debugger_module()
+    value = {
+        "error": {
+            "code": -32602,
+            "message": "Pipeline already running. Resume task task-owner.",
+            "data": {
+                "recoverableTaskId": "task-owner",
+                "contextId": "ctx-1",
+                "sidecarStatus": "running",
+            },
+        }
+    }
+
+    message = debugger._jsonrpc_error_message(value)
+
+    assert message == "Pipeline already running. Resume task task-owner."
+
+
 def test_message_stream_route_forwards_sse_and_uses_stream_payload() -> None:
     debugger = load_debugger_module()
     SseTargetHandler.requests = []
@@ -1738,6 +2083,81 @@ def test_message_stream_route_forwards_sse_and_uses_stream_payload() -> None:
     assert sent["params"]["message"]["metadata"] == {"iac_code": {"cwd": "/workspace/demo"}}
 
 
+def test_message_stream_route_forwards_image_parts() -> None:
+    debugger = load_debugger_module()
+    SseTargetHandler.requests = []
+
+    with serve_handler(SseTargetHandler) as target_url:
+        running = start_debugger_server(debugger)
+        try:
+            status, body = post_raw(
+                f"{running.url}/api/message/stream",
+                {
+                    "serverUrl": target_url,
+                    "cwd": "/workspace/demo",
+                    "contextId": "ctx-1",
+                    "prompt": "inspect this diagram",
+                    "images": [
+                        {
+                            "filename": "diagram.png",
+                            "mediaType": "image/png",
+                            "bytes": "iVBORw0KGgo=",
+                        }
+                    ],
+                },
+            )
+        finally:
+            running.close()
+
+    assert status == 200
+    assert "data: " in body
+    sent = json.loads(SseTargetHandler.requests[0]["body"])
+    assert sent["params"]["message"]["parts"] == [
+        {"text": "inspect this diagram"},
+        {
+            "data": {"filename": "diagram.png", "bytes": "iVBORw0KGgo="},
+            "mediaType": "image/png",
+        },
+    ]
+
+
+def test_message_stream_route_allows_image_only_prompt() -> None:
+    debugger = load_debugger_module()
+    SseTargetHandler.requests = []
+
+    with serve_handler(SseTargetHandler) as target_url:
+        running = start_debugger_server(debugger)
+        try:
+            status, body = post_raw(
+                f"{running.url}/api/message/stream",
+                {
+                    "serverUrl": target_url,
+                    "cwd": "/workspace/demo",
+                    "contextId": "ctx-1",
+                    "prompt": "",
+                    "images": [
+                        {
+                            "filename": "diagram.png",
+                            "mediaType": "image/png",
+                            "bytes": "iVBORw0KGgo=",
+                        }
+                    ],
+                },
+            )
+        finally:
+            running.close()
+
+    assert status == 200
+    assert "data: " in body
+    sent = json.loads(SseTargetHandler.requests[0]["body"])
+    assert sent["params"]["message"]["parts"] == [
+        {
+            "data": {"filename": "diagram.png", "bytes": "iVBORw0KGgo="},
+            "mediaType": "image/png",
+        },
+    ]
+
+
 def test_message_stream_route_writes_sse_debugger_log(tmp_path: Path) -> None:
     debugger = load_debugger_module()
     SseTargetHandler.requests = []
@@ -1795,6 +2215,35 @@ def test_message_stream_route_logs_empty_upstream_stream(tmp_path: Path) -> None
     assert records[-1]["raw"] == {"type": "stream_empty", "statusCode": 200}
 
 
+def test_message_stream_route_converts_jsonrpc_error_to_sse_error(tmp_path: Path) -> None:
+    debugger = load_debugger_module()
+
+    with serve_handler(JsonRpcErrorTargetHandler) as target_url:
+        running = start_logged_debugger_server(debugger, log_dir=tmp_path)
+        try:
+            status, body = post_raw(
+                f"{running.url}/api/message/stream",
+                {
+                    "serverUrl": target_url,
+                    "cwd": "/workspace/demo",
+                    "contextId": "ctx-1",
+                    "prompt": "inspect image",
+                },
+            )
+        finally:
+            running.close()
+
+    assert status == 200
+    assert "data: " in body
+    assert "Current model text-only-model does not support image input." in body
+    assert "task-owner" in body
+    records = read_jsonl(tmp_path / "sse-events.jsonl")
+    assert records[-1]["parsedEventType"] == "error"
+    assert records[-1]["raw"]["type"] == "error"
+    assert records[-1]["raw"]["body"]["error"]["code"] == -32602
+    assert records[-1]["raw"]["body"]["error"]["data"]["recoverableTaskId"] == "task-owner"
+
+
 def test_message_stream_route_ignores_client_disconnect_without_traceback(capsys: pytest.CaptureFixture[str]) -> None:
     debugger = load_debugger_module()
 
diff --git a/tests/a2a/test_pipeline_events.py b/tests/a2a/test_pipeline_events.py
index 81426691..306b64ef 100644
--- a/tests/a2a/test_pipeline_events.py
+++ b/tests/a2a/test_pipeline_events.py
@@ -58,6 +58,61 @@ def test_pipeline_started_has_stable_envelope() -> None:
     assert envelope["data"]["totalSteps"] == 4
 
 
+def test_pipeline_warning_translates_to_non_terminal_envelope() -> None:
+    translator = PipelineEventTranslator(_ctx())
+
+    [envelope] = translator.translate(
+        PipelineEvent(
+            type=PipelineEventType.PIPELINE_WARNING,
+            step_id="deploying",
+            timestamp=1717821600.0,
+            data={
+                "reason": "cleanup_tracking_unavailable",
+                "operation": "record_observed",
+                "ledger_path": "/Users/alice/.iac-code/projects/demo/cleanup.yaml",
+                "load_error": "while parsing /Users/alice/.iac-code/projects/demo/cleanup.yaml",
+            },
+        )
+    )
+
+    assert envelope["eventType"] == "pipeline_warning"
+    assert envelope["scope"] == "pipeline"
+    assert envelope["status"] == "working"
+    assert envelope["data"]["reason"] == "cleanup_tracking_unavailable"
+    assert "ledger_path" not in envelope["data"]
+    assert "load_error" not in envelope["data"]
+
+
+def test_manual_cleanup_event_normalizes_cleanup_data_keys() -> None:
+    translator = PipelineEventTranslator(_ctx())
+
+    event = translator.manual_event(
+        "cleanup_started",
+        "cleanup",
+        data={
+            "resource_count": 1,
+            "status_message": "检测到 1 个回滚残留资源，开始清理流程。",
+            "resource_id": "stack-123",
+            "region_id": "cn-hangzhou",
+            "stack_status": "DELETE_IN_PROGRESS",
+            "cleanup_tool_use_id": "toolu-get",
+            "progress_percentage": 60,
+            "last_error": "DELETE_FAILED",
+        },
+    )
+
+    assert event["eventType"] == "cleanup_started"
+    assert event["scope"] == "cleanup"
+    assert event["data"]["resourceCount"] == 1
+    assert event["data"]["statusMessage"] == "检测到 1 个回滚残留资源，开始清理流程。"
+    assert event["data"]["resourceId"] == "stack-123"
+    assert event["data"]["regionId"] == "cn-hangzhou"
+    assert event["data"]["stackStatus"] == "DELETE_IN_PROGRESS"
+    assert event["data"]["cleanupToolUseId"] == "toolu-get"
+    assert event["data"]["progressPercentage"] == 60
+    assert event["data"]["lastError"] == "DELETE_FAILED"
+
+
 def test_parent_step_attempt_increments_after_rollback() -> None:
     translator = PipelineEventTranslator(_ctx())
     translator.translate(
@@ -768,6 +823,48 @@ def test_show_candidate_detail_tool_result_recovers_detail_from_tool_input() ->
     assert detail_event["data"]["detail"]["costItems"] == [{"name": "ecs", "monthly_cost": "CNY 60"}]
 
 
+@pytest.mark.parametrize(
+    ("stream_event", "event_type"),
+    [
+        (TextDeltaEvent(text="开始部署资源"), "text_delta"),
+        (
+            ToolResultEvent(
+                tool_use_id="toolu-read",
+                tool_name="read_file",
+                result="template content",
+                is_error=False,
+            ),
+            "tool_result",
+        ),
+        (
+            PermissionRequestEvent(
+                tool_name="ros_stack",
+                tool_input={"action": "CreateStack"},
+                tool_use_id="toolu-stack",
+            ),
+            "permission_requested",
+        ),
+    ],
+)
+def test_parent_stream_events_include_current_step_coordinate(stream_event: object, event_type: str) -> None:
+    translator = PipelineEventTranslator(_ctx())
+    translator.translate(
+        PipelineEvent(
+            type=PipelineEventType.STEP_STARTED,
+            step_id="deploying",
+            timestamp=time.time(),
+            data={"index": 5, "total": 5},
+        )
+    )
+
+    [envelope] = translator.translate(stream_event)
+
+    assert envelope["eventType"] == event_type
+    assert envelope["scope"] == "step"
+    assert envelope["step"]["id"] == "deploying"
+    assert envelope["step"]["runId"] == "step-deploying-1"
+
+
 def test_stack_current_changed_is_disabled_by_default() -> None:
     translator = PipelineEventTranslator(_ctx())
     translator.translate(
@@ -964,7 +1061,7 @@ def test_stack_current_changed_emits_after_successful_ros_create_stack() -> None
     }
 
 
-def test_stack_current_changed_clears_current_stack_after_successful_delete() -> None:
+def test_stack_current_changed_keeps_current_stack_after_statusless_successful_delete() -> None:
     ctx = _ctx()
     ctx.emit_stack_events = True
     translator = PipelineEventTranslator(ctx)
@@ -993,6 +1090,48 @@ def test_stack_current_changed_clears_current_stack_after_successful_delete() ->
     assert stack_event["eventType"] == "stack_current_changed"
     assert stack_event["data"]["action"] == "DeleteStack"
     assert stack_event["data"]["stackId"] == "stack-123"
+    assert stack_event["data"]["stackStatus"] == "DELETE_REQUESTED"
+    assert stack_event["data"]["current"] is True
+    assert "cleared" not in stack_event["data"]
+
+
+def test_stack_current_changed_clears_current_stack_after_delete_complete() -> None:
+    ctx = _ctx()
+    ctx.emit_stack_events = True
+    translator = PipelineEventTranslator(ctx)
+    translator.translate(
+        ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="ros_stack",
+            input={
+                "action": "DeleteStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123", "StackName": "demo"},
+            },
+        )
+    )
+
+    envelopes = translator.translate(
+        ToolResultEvent(
+            tool_use_id="toolu-delete",
+            tool_name="ros_stack",
+            result=json.dumps(
+                {
+                    "stack_id": "stack-123",
+                    "stack_name": "demo",
+                    "status": "DELETE_COMPLETE",
+                    "is_success": True,
+                }
+            ),
+            is_error=False,
+        )
+    )
+
+    stack_event = envelopes[0]
+    assert stack_event["eventType"] == "stack_current_changed"
+    assert stack_event["data"]["action"] == "DeleteStack"
+    assert stack_event["data"]["stackId"] == "stack-123"
+    assert stack_event["data"]["stackStatus"] == "DELETE_COMPLETE"
     assert stack_event["data"]["current"] is False
     assert stack_event["data"]["cleared"] is True
 
diff --git a/tests/a2a/test_pipeline_executor.py b/tests/a2a/test_pipeline_executor.py
index 7b69d52a..a7f90725 100644
--- a/tests/a2a/test_pipeline_executor.py
+++ b/tests/a2a/test_pipeline_executor.py
@@ -14,10 +14,15 @@
 
 from iac_code.a2a.executor import IacCodeA2AExecutor
 from iac_code.a2a.metrics import NoOpA2AMetrics
+from iac_code.a2a.persistence import A2APersistenceStore
 from iac_code.a2a.pipeline_journal import A2APipelineJournal
 from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore, reduce_pipeline_events
 from iac_code.a2a.task_store import A2ATaskStore
+from iac_code.agent.message import ImageBlock
+from iac_code.pipeline.engine.cleanup import CleanupLedger, CleanupResource
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+from iac_code.pipeline.engine.interrupt import InterruptVerdict
+from iac_code.pipeline.engine.user_input import PipelineUserInput
 from iac_code.types.stream_events import AskUserQuestionEvent, TextDeltaEvent
 
 from .fakes import FakeEventQueue, FakeRequestContext
@@ -26,10 +31,63 @@
 AUTH_TEXT = "Authentication required. Configure credentials and retry."
 
 
+def test_active_sidecar_mismatch_error_exposes_jsonrpc_data() -> None:
+    from iac_code.a2a.pipeline_executor import _active_sidecar_mismatch_error
+
+    error = _active_sidecar_mismatch_error(
+        recoverable_task_id="task-owner",
+        context_id="ctx-1",
+        sidecar_status="running",
+    )
+
+    assert error.code == -32602
+    assert error.data == {
+        "recoverableTaskId": "task-owner",
+        "contextId": "ctx-1",
+        "sidecarStatus": "running",
+    }
+    assert "task-owner" in error.message
+
+
+def test_active_sidecar_mismatch_error_serializes_raw_jsonrpc_data() -> None:
+    from iac_code.a2a.jsonrpc_passthrough import install_jsonrpc_error_data_passthrough
+    from iac_code.a2a.pipeline_executor import _active_sidecar_mismatch_error
+
+    install_jsonrpc_error_data_passthrough()
+    from a2a.server.request_handlers.response_helpers import build_error_response
+
+    error = _active_sidecar_mismatch_error(
+        recoverable_task_id="task-owner",
+        context_id="ctx-1",
+        sidecar_status="waiting_input",
+    )
+
+    response = build_error_response("req-1", error)
+
+    assert response["error"]["code"] == -32602
+    assert response["error"]["data"] == {
+        "recoverableTaskId": "task-owner",
+        "contextId": "ctx-1",
+        "sidecarStatus": "waiting_input",
+    }
+
+
 def dump(event):
     return MessageToDict(event, preserving_proto_field_name=False)
 
 
+def image_interrupt_input() -> PipelineUserInput:
+    return PipelineUserInput(
+        content=[ImageBlock(media_type="image/png", data="aGVsbG8=")],
+        display_text="[Image input]",
+        has_images=True,
+    )
+
+
+def _display_text(value):
+    return value.display_text if isinstance(value, PipelineUserInput) else value
+
+
 class FakePipeline:
     def __init__(self, events, *, session_dir: Path) -> None:
         self.events = events
@@ -46,14 +104,14 @@ def __init__(self, events, *, session_dir: Path) -> None:
         self.handoff_summary = "handoff summary"
 
     async def run(self, prompt: str):
-        self.run_prompts.append(prompt)
+        self.run_prompts.append(_display_text(prompt))
         for event in self.events:
             if isinstance(event, BaseException):
                 raise event
             yield event
 
     async def resume(self, prompt: str):
-        self.resume_prompts.append(prompt)
+        self.resume_prompts.append(_display_text(prompt))
         for event in self.events:
             if isinstance(event, BaseException):
                 raise event
@@ -61,7 +119,7 @@ async def resume(self, prompt: str):
 
     def continue_from_sidecar(self, user_input: str | None = None):
         self.continue_calls += 1
-        self.continue_inputs.append(user_input)
+        self.continue_inputs.append(_display_text(user_input))
         return self.run(user_input or "continued")
 
     def clear_sidecar(self) -> None:
@@ -254,6 +312,96 @@ def fake_create_pipeline(*args, **kwargs):
     assert messages[-1].content == "[Pipeline Handoff Context]\nPipeline: selling"
 
 
+@pytest.mark.asyncio
+async def test_executor_publishes_normal_handoff_ready_with_cleanup_resources(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    session_dir = tmp_path / "sidecar"
+    ledger = CleanupLedger(session_dir / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                resource_name="selling-stack",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback from deploying",
+    )
+    fake_pipeline = FakePipeline(
+        [
+            PipelineEvent(
+                type=PipelineEventType.PIPELINE_COMPLETED,
+                step_id=None,
+                timestamp=1717821601.0,
+                data={"total_steps": 1},
+            ),
+        ],
+        session_dir=session_dir,
+    )
+    fake_pipeline.handoff_enabled = True
+    fake_pipeline.handoff_summary = "[Pipeline Handoff Context]\nPipeline: selling"
+    fake_pipeline.cleanup_ledger = lambda: ledger
+
+    def fake_create_pipeline(*args, **kwargs):
+        fake_pipeline._session_storage = kwargs["session_storage"]
+        fake_pipeline._session_id = kwargs["session_id"]
+        fake_pipeline._cwd = kwargs["cwd"]
+        return fake_pipeline
+
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_pipeline", fake_create_pipeline)
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_agent_runtime", lambda options: _fake_runtime())
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics())
+    executor = IacCodeA2AExecutor(task_store=store, model="qwen3.6-plus")
+    queue = FakeEventQueue()
+
+    await executor.execute(FakeRequestContext(metadata={"iac_code": {"cwd": str(tmp_path)}}), queue)
+
+    pipeline_events = [
+        dump(event)["metadata"]["iac_code"]["pipeline"]
+        for event in queue.events
+        if isinstance(event, TaskStatusUpdateEvent)
+        and "pipeline" in dump(event).get("metadata", {}).get("iac_code", {})
+    ]
+    handoff = pipeline_events[-1]
+    cleanup = handoff["data"]["cleanup"]
+    assert cleanup["status"] == "pending"
+    assert cleanup["resourceCount"] == 1
+    assert cleanup["statusMessage"] == "Detected 1 rollback cleanup resources; starting cleanup."
+    assert "prompt" not in cleanup
+    assert "ledgerPath" not in cleanup
+    assert cleanup["resources"] == [
+        {
+            "provider": "ros",
+            "resourceType": "stack",
+            "resourceId": "stack-123",
+            "resourceName": "selling-stack",
+            "regionId": "cn-hangzhou",
+            "sourceStepId": "deploying",
+            "cleanupStatus": "pending",
+            "progressStatus": None,
+            "lastError": None,
+        }
+    ]
+
+    snapshot = A2APipelineSnapshotStore(session_dir).load()
+    assert snapshot is not None
+    assert snapshot["cleanup"]["status"] == "pending"
+    assert snapshot["cleanup"]["resourceCount"] == 1
+    assert snapshot["normalHandoff"]["data"]["cleanup"]["resourceCount"] == 1
+    assert "prompt" not in snapshot["cleanup"]
+    assert "ledgerPath" not in snapshot["cleanup"]
+    assert "prompt" not in snapshot["normalHandoff"]["data"]["cleanup"]
+    assert "ledgerPath" not in snapshot["normalHandoff"]["data"]["cleanup"]
+
+
 @pytest.mark.asyncio
 async def test_executor_sets_pipeline_telemetry_correlation(
     monkeypatch: pytest.MonkeyPatch,
@@ -272,8 +420,10 @@ async def test_executor_sets_pipeline_telemetry_correlation(
         session_dir=tmp_path / "sidecar",
     )
     fake_pipeline.set_telemetry_correlation = MagicMock()
+    create_pipeline_kwargs = {}
 
     def fake_create_pipeline(*args, **kwargs):
+        create_pipeline_kwargs.update(kwargs)
         fake_pipeline._session_storage = kwargs["session_storage"]
         fake_pipeline._session_id = kwargs["session_id"]
         fake_pipeline._cwd = kwargs["cwd"]
@@ -295,6 +445,7 @@ def fake_create_pipeline(*args, **kwargs):
         context_id="ctx-1",
         pipeline_run_id="ctx-1",
     )
+    assert create_pipeline_kwargs["surface"] == "a2a"
 
 
 @pytest.mark.asyncio
@@ -775,12 +926,10 @@ async def test_executor_clears_previous_task_terminal_sidecar_and_runs_new_task(
 @pytest.mark.parametrize(
     ("sidecar_status", "event_type", "event_status"),
     [
-        ("waiting_input", "input_required", "waiting_input"),
-        ("running", "pipeline_started", "working"),
         ("completed", "pipeline_completed", "completed"),
     ],
 )
-async def test_executor_replaces_restored_pipeline_when_sidecar_owner_mismatches(
+async def test_executor_replaces_terminal_restored_pipeline_when_sidecar_owner_mismatches(
     monkeypatch: pytest.MonkeyPatch,
     tmp_path: Path,
     sidecar_status: str,
@@ -857,6 +1006,102 @@ def fake_create_pipeline(*args, **kwargs):
     assert "".join(record.output_text) == "fresh output"
 
 
+@pytest.mark.asyncio
+@pytest.mark.parametrize(
+    ("sidecar_status", "event_type", "event_status"),
+    [
+        ("waiting_input", "input_required", "waiting_input"),
+        ("running", "pipeline_started", "working"),
+    ],
+)
+async def test_executor_rejects_active_restored_pipeline_owner_mismatch_without_clearing(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+    sidecar_status: str,
+    event_type: str,
+    event_status: str,
+) -> None:
+    from iac_code.a2a.pipeline_executor import (
+        IacCodeA2APipelineExecutor,
+        RecoverablePipelineInvalidParamsError,
+    )
+
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    session_dir = tmp_path / "sidecar"
+    owner_event = {
+        "schemaVersion": "1.0",
+        "extensionUri": "urn:iac-code:a2a:pipeline-events:v1",
+        "eventId": "evt-owner",
+        "sequence": 1,
+        "createdAt": "2026-06-08T10:00:00Z",
+        "eventType": event_type,
+        "scope": "pipeline",
+        "pipelineRunId": "ctx-1",
+        "taskId": "task-owner",
+        "contextId": "ctx-1",
+        "pipelineName": "selling",
+        "status": event_status,
+        "data": {"prompt": "owner choice"} if event_type == "input_required" else {},
+    }
+    journal = A2APipelineJournal(session_dir)
+    journal.append(owner_event)
+    A2APipelineSnapshotStore(session_dir).save(reduce_pipeline_events([owner_event]))
+    restored_pipeline = FakePipeline(
+        [
+            TextDeltaEvent(text="stale restored output"),
+            PipelineEvent(type=PipelineEventType.PIPELINE_COMPLETED, step_id=None, timestamp=1717821601.0, data={}),
+        ],
+        session_dir=session_dir,
+    )
+    restored_pipeline.sidecar_status = sidecar_status
+    created_pipelines: list[FakePipeline] = []
+
+    def fake_create_pipeline(*args, **kwargs):
+        created_pipelines.append(restored_pipeline)
+        return restored_pipeline
+
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_pipeline", fake_create_pipeline)
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_agent_runtime", lambda options: _fake_runtime())
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics())
+    executor = IacCodeA2APipelineExecutor(
+        task_store=store,
+        model="qwen3.6-plus",
+        metrics=NoOpA2AMetrics(),
+        artifact_store=None,
+        push_notifier=None,
+        permission_resolver=None,
+        auto_approve_permissions=False,
+        thinking_exposure_types=None,
+    )
+
+    with pytest.raises(RecoverablePipelineInvalidParamsError) as exc_info:
+        await executor.execute(
+            context=FakeRequestContext(
+                task_id="task-new",
+                context_id="ctx-1",
+                text="new request",
+                metadata={"iac_code": {"cwd": str(tmp_path)}},
+            ),
+            event_queue=FakeEventQueue(),
+            task=await store.get_or_create_task(task_id="task-new", context_id="ctx-1"),
+            task_id="task-new",
+            context_id="ctx-1",
+            cwd=str(tmp_path),
+            prompt="new request",
+        )
+
+    assert exc_info.value.data == {
+        "recoverableTaskId": "task-owner",
+        "contextId": "ctx-1",
+        "sidecarStatus": sidecar_status,
+    }
+    assert len(created_pipelines) == 1
+    assert restored_pipeline.clear_sidecar_calls == 0
+    assert restored_pipeline.run_prompts == []
+    assert journal.read_all() == [owner_event]
+
+
 @pytest.mark.asyncio
 async def test_executor_keeps_a2a_metadata_when_mismatch_clears_pipeline_sidecar(
     monkeypatch: pytest.MonkeyPatch,
@@ -1602,10 +1847,12 @@ async def test_executor_does_not_resume_nonterminal_sidecar_when_a2a_state_is_te
 
 
 @pytest.mark.asyncio
-async def test_executor_clears_previous_task_waiting_sidecar_and_runs_new_task(
+async def test_executor_rejects_previous_task_waiting_sidecar_without_starting_new_task(
     monkeypatch: pytest.MonkeyPatch,
     tmp_path: Path,
 ) -> None:
+    from iac_code.a2a.pipeline_executor import RecoverablePipelineInvalidParamsError
+
     monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
     session_dir = tmp_path / "sidecar"
     old_input = {
@@ -1638,19 +1885,25 @@ async def test_executor_clears_previous_task_waiting_sidecar_and_runs_new_task(
 
     executor = IacCodeA2AExecutor(task_store=A2ATaskStore(metrics=NoOpA2AMetrics()), model="qwen3.6-plus")
 
-    await executor.execute(
-        FakeRequestContext(
-            task_id="task-new",
-            context_id="ctx-1",
-            text="new request",
-            metadata={"iac_code": {"cwd": str(tmp_path)}},
-        ),
-        FakeEventQueue(),
-    )
+    with pytest.raises(RecoverablePipelineInvalidParamsError) as exc_info:
+        await executor.execute(
+            FakeRequestContext(
+                task_id="task-new",
+                context_id="ctx-1",
+                text="new request",
+                metadata={"iac_code": {"cwd": str(tmp_path)}},
+            ),
+            FakeEventQueue(),
+        )
 
-    assert fake_pipeline.clear_sidecar_calls == 1
+    assert exc_info.value.data == {
+        "recoverableTaskId": "task-old",
+        "contextId": "ctx-1",
+        "sidecarStatus": "waiting_input",
+    }
+    assert fake_pipeline.clear_sidecar_calls == 0
     assert fake_pipeline.resume_prompts == []
-    assert fake_pipeline.run_prompts == ["new request"]
+    assert fake_pipeline.run_prompts == []
 
 
 @pytest.mark.asyncio
@@ -1668,6 +1921,8 @@ async def test_executor_does_not_attach_current_sidecar_to_historical_task(
     event_type: str,
     event_status: str,
 ) -> None:
+    from iac_code.a2a.pipeline_executor import RecoverablePipelineInvalidParamsError
+
     monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
     session_dir = tmp_path / "sidecar"
     old_event = {
@@ -1712,21 +1967,27 @@ async def test_executor_does_not_attach_current_sidecar_to_historical_task(
 
     executor = IacCodeA2AExecutor(task_store=A2ATaskStore(metrics=NoOpA2AMetrics()), model="qwen3.6-plus")
 
-    await executor.execute(
-        FakeRequestContext(
-            task_id="task-old",
-            context_id="ctx-1",
-            text="old followup",
-            metadata={"iac_code": {"cwd": str(tmp_path)}},
-        ),
-        FakeEventQueue(),
-    )
+    with pytest.raises(RecoverablePipelineInvalidParamsError) as exc_info:
+        await executor.execute(
+            FakeRequestContext(
+                task_id="task-old",
+                context_id="ctx-1",
+                text="old followup",
+                metadata={"iac_code": {"cwd": str(tmp_path)}},
+            ),
+            FakeEventQueue(),
+        )
 
-    assert fake_pipeline.clear_sidecar_calls == 1
+    assert exc_info.value.data == {
+        "recoverableTaskId": "task-current",
+        "contextId": "ctx-1",
+        "sidecarStatus": sidecar_status,
+    }
+    assert fake_pipeline.clear_sidecar_calls == 0
     assert fake_pipeline.resume_prompts == []
     assert fake_pipeline.continue_calls == 0
-    assert fake_pipeline.run_prompts == ["old followup"]
-    assert journal.read_all()[-1]["taskId"] == "task-old"
+    assert fake_pipeline.run_prompts == []
+    assert journal.read_all()[-1]["taskId"] == "task-current"
 
 
 @pytest.mark.asyncio
@@ -1891,10 +2152,12 @@ async def test_executor_routes_waiting_input_pause_confirmation_through_interrup
 
 
 @pytest.mark.asyncio
-async def test_executor_clears_previous_task_running_sidecar_and_runs_new_task(
+async def test_executor_rejects_previous_task_running_sidecar_without_starting_new_task(
     monkeypatch: pytest.MonkeyPatch,
     tmp_path: Path,
 ) -> None:
+    from iac_code.a2a.pipeline_executor import RecoverablePipelineInvalidParamsError
+
     monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
     session_dir = tmp_path / "sidecar"
     old_running = {
@@ -1927,37 +2190,144 @@ async def test_executor_clears_previous_task_running_sidecar_and_runs_new_task(
 
     executor = IacCodeA2AExecutor(task_store=A2ATaskStore(metrics=NoOpA2AMetrics()), model="qwen3.6-plus")
 
-    await executor.execute(
-        FakeRequestContext(
-            task_id="task-new",
-            context_id="ctx-1",
-            text="new request",
-            metadata={"iac_code": {"cwd": str(tmp_path)}},
-        ),
-        FakeEventQueue(),
-    )
+    with pytest.raises(RecoverablePipelineInvalidParamsError) as exc_info:
+        await executor.execute(
+            FakeRequestContext(
+                task_id="task-new",
+                context_id="ctx-1",
+                text="new request",
+                metadata={"iac_code": {"cwd": str(tmp_path)}},
+            ),
+            FakeEventQueue(),
+        )
 
-    assert fake_pipeline.clear_sidecar_calls == 1
+    assert exc_info.value.data == {
+        "recoverableTaskId": "task-old",
+        "contextId": "ctx-1",
+        "sidecarStatus": "running",
+    }
+    assert fake_pipeline.clear_sidecar_calls == 0
     assert fake_pipeline.continue_calls == 0
-    assert fake_pipeline.run_prompts == ["new request"]
+    assert fake_pipeline.run_prompts == []
 
 
 @pytest.mark.asyncio
-async def test_pipeline_executor_routes_second_prompt_as_interrupt(tmp_path: Path) -> None:
-    from iac_code.a2a.pipeline_events import PipelineA2AContext, PipelineEventTranslator
-    from iac_code.a2a.pipeline_executor import A2APipelineRuntime, IacCodeA2APipelineExecutor
-    from iac_code.a2a.pipeline_journal import A2APipelineJournal
-    from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
-    from iac_code.a2a.pipeline_stream import PipelineA2AEventPublisher
+async def test_executor_rejected_active_sidecar_mismatch_does_not_persist_new_working_task(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    from iac_code.a2a.pipeline_executor import RecoverablePipelineInvalidParamsError
 
-    class InterruptiblePipeline(FakePipeline):
-        def __init__(self, *, session_dir: Path) -> None:
-            super().__init__([TextDeltaEvent(text="running")], session_dir=session_dir)
-            self.interrupts: list[str] = []
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    session_dir = tmp_path / "sidecar"
+    owner_event = {
+        "schemaVersion": "1.0",
+        "extensionUri": "urn:iac-code:a2a:pipeline-events:v1",
+        "eventId": "evt-owner-running",
+        "sequence": 1,
+        "createdAt": "2026-06-08T10:00:00Z",
+        "eventType": "pipeline_started",
+        "scope": "pipeline",
+        "pipelineRunId": "ctx-1",
+        "taskId": "task-owner",
+        "contextId": "ctx-1",
+        "pipelineName": "selling",
+        "status": "working",
+        "data": {},
+    }
+    A2APipelineJournal(session_dir).append(owner_event)
+    A2APipelineSnapshotStore(session_dir).save(reduce_pipeline_events([owner_event]))
+    fake_pipeline = FakePipeline(
+        [
+            TextDeltaEvent(text="new output"),
+            PipelineEvent(type=PipelineEventType.PIPELINE_COMPLETED, step_id=None, timestamp=1717821601.0, data={}),
+        ],
+        session_dir=session_dir,
+    )
+    fake_pipeline.sidecar_status = "running"
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_pipeline", lambda *args, **kwargs: fake_pipeline)
+    monkeypatch.setattr("iac_code.a2a.pipeline_executor.create_agent_runtime", lambda options: _fake_runtime())
 
-        async def handle_user_interrupt(self, message: str) -> SimpleNamespace:
-            self.interrupts.append(message)
-            return SimpleNamespace(
+    task_store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    executor = IacCodeA2AExecutor(task_store=task_store, model="qwen3.6-plus")
+
+    with pytest.raises(RecoverablePipelineInvalidParamsError):
+        await executor.execute(
+            FakeRequestContext(
+                task_id="task-new",
+                context_id="ctx-1",
+                text="new request",
+                metadata={"iac_code": {"cwd": str(tmp_path)}},
+            ),
+            FakeEventQueue(),
+        )
+
+    assert fake_pipeline.clear_sidecar_calls == 0
+    assert fake_pipeline.run_prompts == []
+    rejected_task = persistence.load_task("task-new")
+    assert rejected_task is not None
+    assert rejected_task.state != "working"
+    assert [task.task_id for task in persistence.list_tasks() if task.state == "working"] == []
+
+
+def test_cleanup_handoff_missing_ledger_ignores_empty_public_cleanup_snapshot(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_executor import _pipeline_cleanup_handoff_data_from_session
+
+    cleanup = _pipeline_cleanup_handoff_data_from_session(
+        cwd=str(tmp_path),
+        session_id="session-empty-cleanup",
+        public_snapshot={"cleanup": {"resourceCount": 0, "resources": [], "status": ""}},
+    )
+
+    assert cleanup is None
+
+
+def test_cleanup_handoff_missing_ledger_does_not_reconstruct_prompt_from_public_snapshot(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_executor import _pipeline_cleanup_handoff_data_from_session
+
+    cleanup = _pipeline_cleanup_handoff_data_from_session(
+        cwd=str(tmp_path),
+        session_id="session-public-cleanup-only",
+        public_snapshot={
+            "cleanup": {
+                "resourceCount": 1,
+                "resources": [
+                    {
+                        "provider": "ros",
+                        "resourceType": "stack",
+                        "resourceId": "stack-public-only",
+                        "cleanupStatus": "pending",
+                    }
+                ],
+                "status": "pending",
+            }
+        },
+    )
+
+    assert cleanup is not None
+    assert cleanup["status"] == "unavailable"
+    assert "prompt" not in cleanup
+    assert "resources" not in cleanup
+    assert "stack-public-only" not in repr(cleanup)
+
+
+@pytest.mark.asyncio
+async def test_pipeline_executor_routes_second_prompt_as_interrupt(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_events import PipelineA2AContext, PipelineEventTranslator
+    from iac_code.a2a.pipeline_executor import A2APipelineRuntime, IacCodeA2APipelineExecutor
+    from iac_code.a2a.pipeline_journal import A2APipelineJournal
+    from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
+    from iac_code.a2a.pipeline_stream import PipelineA2AEventPublisher
+
+    class InterruptiblePipeline(FakePipeline):
+        def __init__(self, *, session_dir: Path) -> None:
+            super().__init__([TextDeltaEvent(text="running")], session_dir=session_dir)
+            self.interrupts: list[str] = []
+
+        async def handle_user_interrupt(self, message: str) -> SimpleNamespace:
+            self.interrupts.append(message)
+            return SimpleNamespace(
                 action="supplement",
                 reason="added context",
                 rollback_target=None,
@@ -2942,7 +3312,7 @@ async def handle_user_interrupt(self, message: str) -> SimpleNamespace:
         task_id="task-1",
         context_id="ctx-1",
         cwd=str(tmp_path),
-        prompt="Nginx 网站",
+        pipeline_input="Nginx 网站",
         preserve_task_record=True,
     )
 
@@ -3035,7 +3405,7 @@ async def handle_user_interrupt(self, message: str) -> SimpleNamespace:
         task_id="task-1",
         context_id="ctx-1",
         cwd=str(tmp_path),
-        prompt="Nginx 网站",
+        pipeline_input="Nginx 网站",
         preserve_task_record=True,
     )
 
@@ -3351,6 +3721,120 @@ def test_waiting_input_task_id_from_sidecar_accepts_candidate_selection(tmp_path
     assert waiting_input_task_id_from_sidecar(cwd=str(cwd), session_id=session_id, context_id=context_id) == "task-1"
 
 
+def test_cancel_waiting_input_sidecar_appends_cancel_handoff_as_durable_group(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    from iac_code.a2a.pipeline_executor import cancel_waiting_input_task_from_sidecar
+    from iac_code.a2a.pipeline_paths import a2a_pipeline_dir_for_session
+
+    cwd = tmp_path / "workspace"
+    session_id = "session-ctx-1"
+    context_id = "ctx-1"
+    pipeline_dir = a2a_pipeline_dir_for_session(cwd=str(cwd), session_id=session_id)
+    pending = {
+        "schemaVersion": "1.0",
+        "extensionUri": "urn:iac-code:a2a:pipeline-events:v1",
+        "eventId": "evt-selection",
+        "sequence": 1,
+        "createdAt": "2026-06-08T10:00:00Z",
+        "eventType": "input_required",
+        "scope": "step",
+        "pipelineRunId": context_id,
+        "taskId": "task-1",
+        "contextId": context_id,
+        "pipelineName": "selling",
+        "status": "input_required",
+        "step": {"runId": "step-confirm_and_select-1", "id": "confirm_and_select", "attempt": 1},
+        "input": {
+            "inputId": "input-confirm_and_select-1",
+            "kind": "candidate_selection",
+            "prompt": "请选择方案",
+            "options": [{"name": "方案A", "candidate_index": 0}],
+        },
+    }
+    A2APipelineJournal(pipeline_dir).append(pending)
+    A2APipelineSnapshotStore(pipeline_dir).save(reduce_pipeline_events([pending]))
+    append_many_calls = []
+    original_append_many = A2APipelineJournal.append_many
+
+    def recording_append_many(self, events, durable: bool = False):
+        append_many_calls.append(([event["eventType"] for event in events], durable))
+        return original_append_many(self, events, durable=durable)
+
+    monkeypatch.setattr(A2APipelineJournal, "append_many", recording_append_many)
+
+    canceled = cancel_waiting_input_task_from_sidecar(
+        cwd=str(cwd),
+        session_id=session_id,
+        context_id=context_id,
+        task_id="task-1",
+        reason="user canceled",
+    )
+
+    assert canceled is True
+    assert append_many_calls[-1] == (["pipeline_canceled", "pipeline_handoff_ready"], True)
+    events = A2APipelineJournal(pipeline_dir).read_all()
+    assert [event["eventType"] for event in events[-2:]] == ["pipeline_canceled", "pipeline_handoff_ready"]
+
+
+def test_cancel_waiting_input_sidecar_returns_false_when_durable_group_fails(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    from iac_code.a2a.pipeline_executor import cancel_waiting_input_task_from_sidecar
+    from iac_code.a2a.pipeline_paths import a2a_pipeline_dir_for_session
+
+    cwd = tmp_path / "workspace"
+    session_id = "session-ctx-1"
+    context_id = "ctx-1"
+    pipeline_dir = a2a_pipeline_dir_for_session(cwd=str(cwd), session_id=session_id)
+    pending = {
+        "schemaVersion": "1.0",
+        "extensionUri": "urn:iac-code:a2a:pipeline-events:v1",
+        "eventId": "evt-selection",
+        "sequence": 1,
+        "createdAt": "2026-06-08T10:00:00Z",
+        "eventType": "input_required",
+        "scope": "step",
+        "pipelineRunId": context_id,
+        "taskId": "task-1",
+        "contextId": context_id,
+        "pipelineName": "selling",
+        "status": "input_required",
+        "step": {"runId": "step-confirm_and_select-1", "id": "confirm_and_select", "attempt": 1},
+        "input": {
+            "inputId": "input-confirm_and_select-1",
+            "kind": "candidate_selection",
+            "prompt": "请选择方案",
+            "options": [{"name": "方案A", "candidate_index": 0}],
+        },
+    }
+    A2APipelineJournal(pipeline_dir).append(pending)
+    A2APipelineSnapshotStore(pipeline_dir).save(reduce_pipeline_events([pending]))
+
+    def fail_append_many(self, events, durable: bool = False):
+        assert durable is True
+        assert [event["eventType"] for event in events] == ["pipeline_canceled", "pipeline_handoff_ready"]
+        raise OSError("journal locked")
+
+    monkeypatch.setattr(A2APipelineJournal, "append_many", fail_append_many)
+
+    canceled = cancel_waiting_input_task_from_sidecar(
+        cwd=str(cwd),
+        session_id=session_id,
+        context_id=context_id,
+        task_id="task-1",
+        reason="user canceled",
+    )
+
+    assert canceled is False
+    assert [event["eventType"] for event in A2APipelineJournal(pipeline_dir).read_all()] == ["input_required"]
+    snapshot = A2APipelineSnapshotStore(pipeline_dir).load()
+    assert snapshot is not None
+    assert snapshot["status"] == "waiting_input"
+
+
 @pytest.mark.asyncio
 async def test_executor_recovers_pending_ask_from_journal_when_snapshot_is_missing(
     monkeypatch: pytest.MonkeyPatch,
@@ -4283,3 +4767,363 @@ async def test_same_task_non_interruptible_active_context_preserves_active_recor
     final_status = _status_events(queue)[-1]["status"]
     assert final_status["state"] == "TASK_STATE_FAILED"
     assert final_status["message"]["parts"][0]["text"] == "Task is already working."
+
+
+@pytest.mark.asyncio
+async def test_active_pipeline_interrupt_receives_structured_image_input(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_executor import IacCodeA2APipelineExecutor
+
+    store = A2ATaskStore(metrics=NoOpA2AMetrics())
+    task = await store.get_or_create_task(task_id="task-1", context_id="ctx-1")
+    task.active_task = asyncio.current_task()
+    ctx = await store.get_or_create_context(
+        context_id="ctx-1",
+        cwd=str(tmp_path),
+        runtime_factory=lambda session_id: _fake_runtime(),
+    )
+    ctx.active_task_id = "task-1"
+    received = []
+
+    class InterruptPipeline(FakePipeline):
+        async def handle_user_interrupt(self, message):
+            received.append(message)
+            return InterruptVerdict(action="continue", reason="keep going")
+
+        def pause_agent_loops(self) -> None:
+            pass
+
+        def resume_agent_loops(self) -> None:
+            pass
+
+    pipeline = InterruptPipeline([], session_dir=tmp_path / "pipeline")
+    publisher = SimpleNamespace(
+        publish_interrupt_received=AsyncMock(),
+        publish_interrupt=AsyncMock(),
+        journal=A2APipelineJournal(tmp_path / "pipeline"),
+        snapshot_store=A2APipelineSnapshotStore(tmp_path / "pipeline"),
+    )
+    ctx.runtime = SimpleNamespace(
+        agent_runtime=_fake_runtime(),
+        pipeline=pipeline,
+        publisher=publisher,
+        current_stream=None,
+        restart_after_interrupt=False,
+        pause_after_interrupt=False,
+        restart_requested=asyncio.Event(),
+    )
+    store.mirror_context(ctx)
+    pipeline_input = image_interrupt_input()
+
+    executor = IacCodeA2APipelineExecutor(
+        task_store=store,
+        model="qwen3.6-plus",
+        metrics=NoOpA2AMetrics(),
+        artifact_store=None,
+        push_notifier=None,
+        permission_resolver=None,
+        auto_approve_permissions=False,
+        thinking_exposure_types=None,
+    )
+    await executor.execute(
+        context=FakeRequestContext(metadata={"iac_code": {"cwd": str(tmp_path)}}),
+        event_queue=FakeEventQueue(),
+        task=task,
+        task_id="task-1",
+        context_id="ctx-1",
+        cwd=str(tmp_path),
+        pipeline_input=pipeline_input,
+    )
+
+    assert received == [pipeline_input]
+    publisher.publish_interrupt_received.assert_awaited_once_with(prompt="[Image input]")
+
+
+@pytest.mark.asyncio
+async def test_active_pending_question_answer_preserves_image_input(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_executor import IacCodeA2APipelineExecutor, _PendingAskUserQuestion
+
+    future = asyncio.get_running_loop().create_future()
+    injected = []
+
+    class Pipeline:
+        def inject_pending_question_supplement(self, message, *, envelope):
+            injected.append((message, envelope))
+
+    runtime = SimpleNamespace(
+        pending_question=_PendingAskUserQuestion(
+            event=AskUserQuestionEvent(
+                tool_use_id="toolu_1",
+                question="Upload diagram",
+                options=[],
+                response_future=future,
+            ),
+            envelope={"scope": "pipeline", "inputId": "ask-toolu_1"},
+        ),
+        pipeline=Pipeline(),
+        publisher=SimpleNamespace(
+            publish_manual=AsyncMock(return_value=object()),
+        ),
+    )
+    pipeline_input = image_interrupt_input()
+    executor = IacCodeA2APipelineExecutor(
+        task_store=A2ATaskStore(metrics=NoOpA2AMetrics()),
+        model="qwen3.6-plus",
+        metrics=NoOpA2AMetrics(),
+        artifact_store=None,
+        push_notifier=None,
+        permission_resolver=None,
+        auto_approve_permissions=False,
+        thinking_exposure_types=None,
+    )
+
+    result = await executor._route_pending_question_answer(runtime, pipeline_input)
+
+    assert result == "answered"
+    answer = future.result()
+    assert answer == {"selected_id": "", "selected_label": "", "free_text": "[Image input]"}
+    assert injected == [(pipeline_input.content, {"scope": "pipeline", "inputId": "ask-toolu_1"})]
+
+
+@pytest.mark.asyncio
+async def test_active_pending_question_image_injection_failure_is_not_marked_answered(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_executor import IacCodeA2APipelineExecutor, _PendingAskUserQuestion
+
+    future = asyncio.get_running_loop().create_future()
+
+    class Pipeline:
+        def inject_pending_question_supplement(self, message, *, envelope):
+            return False
+
+    runtime = SimpleNamespace(
+        pending_question=_PendingAskUserQuestion(
+            event=AskUserQuestionEvent(
+                tool_use_id="toolu_1",
+                question="Upload diagram",
+                options=[],
+                response_future=future,
+            ),
+            envelope={"scope": "pipeline", "inputId": "ask-toolu_1"},
+        ),
+        pipeline=Pipeline(),
+        publisher=SimpleNamespace(
+            publish_manual=AsyncMock(return_value=object()),
+        ),
+    )
+    pipeline_input = image_interrupt_input()
+    executor = IacCodeA2APipelineExecutor(
+        task_store=A2ATaskStore(metrics=NoOpA2AMetrics()),
+        model="qwen3.6-plus",
+        metrics=NoOpA2AMetrics(),
+        artifact_store=None,
+        push_notifier=None,
+        permission_resolver=None,
+        auto_approve_permissions=False,
+        thinking_exposure_types=None,
+    )
+
+    with pytest.raises(RuntimeError, match="image supplement could not be delivered"):
+        await executor._route_pending_question_answer(runtime, pipeline_input)
+
+    assert future.done() is False
+    assert runtime.pending_question is not None
+
+
+@pytest.mark.asyncio
+async def test_active_pending_question_image_injection_failure_restores_snapshot_pending_input(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_events import PipelineA2AContext, PipelineEventTranslator
+    from iac_code.a2a.pipeline_executor import IacCodeA2APipelineExecutor, _PendingAskUserQuestion
+    from iac_code.a2a.pipeline_journal import A2APipelineJournal
+    from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
+    from iac_code.a2a.pipeline_stream import PipelineA2AEventPublisher
+
+    future = asyncio.get_running_loop().create_future()
+
+    class Pipeline:
+        def inject_pending_question_supplement(self, message, *, envelope):
+            return False
+
+    publisher = PipelineA2AEventPublisher(
+        event_queue=FakeEventQueue(),
+        translator=PipelineEventTranslator(
+            PipelineA2AContext(
+                pipeline_run_id="ctx-1",
+                task_id="task-1",
+                context_id="ctx-1",
+                pipeline_name="selling",
+            )
+        ),
+        journal=A2APipelineJournal(tmp_path / "pipeline"),
+        snapshot_store=A2APipelineSnapshotStore(tmp_path / "pipeline"),
+    )
+    await publisher.publish_manual(
+        "input_required",
+        "pipeline",
+        status="input_required",
+        data={
+            "kind": "ask_user_question",
+            "inputId": "ask-toolu_1",
+            "toolUseId": "toolu_1",
+            "question": "Upload diagram",
+            "prompt": "Upload diagram",
+            "options": [],
+            "required": True,
+        },
+    )
+    assert publisher.snapshot_store.load()["pendingInput"]["inputId"] == "ask-toolu_1"
+
+    runtime = SimpleNamespace(
+        pending_question=_PendingAskUserQuestion(
+            event=AskUserQuestionEvent(
+                tool_use_id="toolu_1",
+                question="Upload diagram",
+                options=[],
+                response_future=future,
+            ),
+            envelope={"scope": "pipeline", "inputId": "ask-toolu_1"},
+        ),
+        pipeline=Pipeline(),
+        publisher=publisher,
+    )
+    executor = IacCodeA2APipelineExecutor(
+        task_store=A2ATaskStore(metrics=NoOpA2AMetrics()),
+        model="qwen3.6-plus",
+        metrics=NoOpA2AMetrics(),
+        artifact_store=None,
+        push_notifier=None,
+        permission_resolver=None,
+        auto_approve_permissions=False,
+        thinking_exposure_types=None,
+    )
+
+    with pytest.raises(RuntimeError, match="image supplement could not be delivered"):
+        await executor._route_pending_question_answer(runtime, image_interrupt_input())
+
+    snapshot = publisher.snapshot_store.load()
+    assert snapshot["status"] == "waiting_input"
+    assert snapshot["pendingInput"]["inputId"] == "ask-toolu_1"
+    assert future.done() is False
+    assert runtime.pending_question is not None
+
+
+@pytest.mark.asyncio
+async def test_execute_reports_active_pending_question_image_injection_failure(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_events import PipelineA2AContext, PipelineEventTranslator
+    from iac_code.a2a.pipeline_executor import (
+        A2APipelineRuntime,
+        IacCodeA2APipelineExecutor,
+        _PendingAskUserQuestion,
+    )
+    from iac_code.a2a.pipeline_journal import A2APipelineJournal
+    from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
+    from iac_code.a2a.pipeline_stream import PipelineA2AEventPublisher
+
+    future = asyncio.get_running_loop().create_future()
+
+    class Pipeline:
+        def inject_pending_question_supplement(self, message, *, envelope):
+            return False
+
+    queue = FakeEventQueue()
+    publisher = PipelineA2AEventPublisher(
+        event_queue=queue,
+        translator=PipelineEventTranslator(
+            PipelineA2AContext(
+                pipeline_run_id="ctx-1",
+                task_id="task-1",
+                context_id="ctx-1",
+                pipeline_name="selling",
+            )
+        ),
+        journal=A2APipelineJournal(tmp_path / "pipeline"),
+        snapshot_store=A2APipelineSnapshotStore(tmp_path / "pipeline"),
+    )
+    publisher.publish_manual = AsyncMock(return_value=object())  # type: ignore[method-assign]
+    runtime = A2APipelineRuntime(agent_runtime=_fake_runtime(), pipeline=Pipeline(), publisher=publisher)
+    runtime.pending_question = _PendingAskUserQuestion(
+        event=AskUserQuestionEvent(
+            tool_use_id="toolu_1",
+            question="Upload diagram",
+            options=[],
+            response_future=future,
+        ),
+        envelope={"scope": "pipeline", "inputId": "ask-toolu_1"},
+    )
+    store = A2ATaskStore(metrics=NoOpA2AMetrics())
+    task = await store.get_or_create_task(task_id="task-1", context_id="ctx-1")
+    task.state = "input-required"
+    ctx = await store.get_or_create_context(
+        context_id="ctx-1",
+        cwd=str(tmp_path),
+        runtime_factory=lambda _session_id: _fake_runtime(),
+    )
+    ctx.runtime = runtime
+    ctx.active_task_id = "task-1"
+    executor = IacCodeA2APipelineExecutor(
+        task_store=store,
+        model="qwen3.6-plus",
+        metrics=NoOpA2AMetrics(),
+        artifact_store=None,
+        push_notifier=None,
+        permission_resolver=None,
+        auto_approve_permissions=False,
+        thinking_exposure_types=None,
+    )
+
+    await executor.execute(
+        context=FakeRequestContext(task_id="task-1", context_id="ctx-1"),
+        event_queue=queue,
+        task=task,
+        task_id="task-1",
+        context_id="ctx-1",
+        cwd=str(tmp_path),
+        pipeline_input=image_interrupt_input(),
+    )
+
+    states = [dump(event)["status"]["state"] for event in queue.events if isinstance(event, TaskStatusUpdateEvent)]
+    assert "TASK_STATE_FAILED" in states
+    assert future.done() is False
+    assert runtime.pending_question is not None
+
+
+@pytest.mark.asyncio
+async def test_pending_ask_user_question_resume_preserves_image_input(tmp_path: Path) -> None:
+    from iac_code.a2a.pipeline_executor import _resume_pending_ask_user_question_stream
+
+    pipeline_input = image_interrupt_input()
+    received = {}
+
+    class AskPipeline(FakePipeline):
+        sidecar_status = "waiting_input"
+
+        async def resume_ask_user_question(self, answer, **kwargs):
+            received["answer"] = answer
+            received["supplemental_input"] = kwargs.get("supplemental_input")
+            yield PipelineEvent(
+                type=PipelineEventType.PIPELINE_COMPLETED,
+                step_id="ask",
+                timestamp=0.0,
+                data={"total_steps": 1},
+            )
+
+    pending_input = {
+        "kind": "ask_user_question",
+        "toolUseId": "toolu_1",
+        "inputId": "ask-toolu_1",
+    }
+    pipeline = AskPipeline([], session_dir=tmp_path / "pipeline")
+    publisher = SimpleNamespace(
+        snapshot_store=SimpleNamespace(load=lambda: {"status": "waiting_input"}),
+        publish_manual=AsyncMock(return_value=object()),
+    )
+
+    stream = _resume_pending_ask_user_question_stream(
+        pipeline=pipeline,
+        publisher=publisher,
+        pending_input=pending_input,
+        prompt="[Image input]",
+        pipeline_input=pipeline_input,
+    )
+    events = [event async for event in stream]
+
+    assert events
+    assert received["supplemental_input"] == pipeline_input
diff --git a/tests/a2a/test_pipeline_journal.py b/tests/a2a/test_pipeline_journal.py
index 16bf1986..19a997dd 100644
--- a/tests/a2a/test_pipeline_journal.py
+++ b/tests/a2a/test_pipeline_journal.py
@@ -1,5 +1,7 @@
 from __future__ import annotations
 
+import pytest
+
 from iac_code.a2a.pipeline_journal import A2APipelineJournal
 
 
@@ -37,6 +39,42 @@ def test_read_after_filters_by_sequence(tmp_path) -> None:
     assert [event["eventId"] for event in journal.read_after(1)] == ["evt-2", "evt-3"]
 
 
+def test_append_many_replays_group_as_events(tmp_path) -> None:  # a grouped write reads back as two events
+    journal = A2APipelineJournal(tmp_path / "pipeline")
+
+    journal.append_many([_event(1, "evt-cancel"), _event(2, "evt-handoff")], durable=True)
+
+    assert [event["eventId"] for event in journal.read_all_strict()] == ["evt-cancel", "evt-handoff"]
+
+
+def test_append_many_sorts_group_events_with_regular_events(tmp_path) -> None:
+    journal = A2APipelineJournal(tmp_path / "pipeline")
+
+    journal.append(_event(3, "evt-after"))  # written first; 3 is presumably its sequence number
+    journal.append_many([_event(1, "evt-cancel"), _event(2, "evt-handoff")], durable=True)
+
+    assert [event["eventId"] for event in journal.read_all()] == ["evt-cancel", "evt-handoff", "evt-after"]
+
+
+@pytest.mark.parametrize("write_method", ["append", "append_many"])
+def test_durable_append_fsyncs_parent_directory_when_journal_is_created(
+    tmp_path,
+    monkeypatch: pytest.MonkeyPatch,
+    write_method: str,
+) -> None:
+    journal = A2APipelineJournal(tmp_path / "pipeline")
+    calls = []  # arguments passed to the patched fsync_parent_dir
+
+    monkeypatch.setattr("iac_code.a2a.pipeline_journal.fsync_parent_dir", calls.append, raising=False)
+
+    if write_method == "append":
+        journal.append(_event(1, "evt-1"), durable=True)
+    else:
+        journal.append_many([_event(1, "evt-1"), _event(2, "evt-2")], durable=True)
+
+    assert calls == [journal.path]  # called exactly once, with journal.path
+
+
 def test_invalid_json_lines_are_skipped(tmp_path) -> None:
     journal = A2APipelineJournal(tmp_path / "pipeline")
     journal.append(_event(1, "evt-1"))
diff --git a/tests/a2a/test_pipeline_recovery.py b/tests/a2a/test_pipeline_recovery.py
index bd5f7a98..2250646a 100644
--- a/tests/a2a/test_pipeline_recovery.py
+++ b/tests/a2a/test_pipeline_recovery.py
@@ -60,6 +60,49 @@ async def test_recovery_returns_snapshot_and_replay_events(tmp_path) -> None:
     assert [event["eventId"] for event in state["events"]] == ["evt-2"]
 
 
+@pytest.mark.asyncio
+async def test_recovery_keeps_pipeline_warning_visible_after_snapshot_sequence(tmp_path) -> None:
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    await store.get_or_create_context(
+        context_id="ctx-1",
+        cwd=str(tmp_path),
+        runtime_factory=lambda session_id: object(),
+    )
+    context = await store.get_context_record("ctx-1")
+    pipeline_dir = SessionStorage().session_dir(str(tmp_path), context.session_id) / "pipeline"
+    started = _event(1, "evt-1")
+    warning = _event(2, "evt-warning")
+    warning["eventType"] = "pipeline_warning"
+    warning["data"] = {  # ledger_path and load_error are asserted absent from the recovered state below
+        "reason": "cleanup_tracking_unavailable",
+        "operation": "record_observed",
+        "ledger_path": "/Users/alice/.iac-code/projects/demo/cleanup.yaml",
+        "load_error": "while parsing /Users/alice/.iac-code/projects/demo/cleanup.yaml",
+    }
+    journal = A2APipelineJournal(pipeline_dir)
+    journal.append(started)
+    journal.append(warning)
+    A2APipelineSnapshotStore(pipeline_dir).save(reduce_pipeline_events([started, warning]))
+
+    service = A2APipelineRecoveryService(task_store=store)
+    state = await service.get_state(context_id="ctx-1")  # no after_sequence given
+
+    assert state["events"] == []
+    assert state["snapshot"]["lastSequence"] == 2
+    assert state["snapshot"]["control"]["warningHistory"][0]["eventId"] == "evt-warning"
+    assert state["snapshot"]["control"]["warningHistory"][0]["data"]["reason"] == "cleanup_tracking_unavailable"
+    assert "ledger_path" not in state["snapshot"]["control"]["warningHistory"][0]["data"]
+    assert "load_error" not in state["snapshot"]["control"]["warningHistory"][0]["data"]
+
+    replay_state = await service.get_state(context_id="ctx-1", after_sequence=1)  # replay after sequence 1
+
+    assert replay_state["events"][0]["eventType"] == "pipeline_warning"
+    assert replay_state["events"][0]["data"]["reason"] == "cleanup_tracking_unavailable"
+    assert "ledger_path" not in replay_state["events"][0]["data"]
+    assert "load_error" not in replay_state["events"][0]["data"]
+
+
 @pytest.mark.asyncio
 async def test_recovery_sanitizes_legacy_artifact_file_uris_from_snapshot_and_replay(tmp_path) -> None:
     persistence = A2APersistenceStore(tmp_path / "a2a")
@@ -245,6 +288,108 @@ async def test_recovery_rejects_task_id_when_pipeline_state_belongs_to_different
         await service.get_state(task_id="task-2")
 
 
+@pytest.mark.asyncio
+async def test_recovery_resolves_cleanup_snapshot_from_normal_delivery_task_id(tmp_path) -> None:
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_task(A2ATaskSnapshot(task_id="task-pipeline", context_id="ctx-1", state="completed"))
+    persistence.save_task(A2ATaskSnapshot(task_id="task-normal", context_id="ctx-1", state="input-required"))
+    persistence.save_context(A2AContextSnapshot(context_id="ctx-1", session_id="session-1", cwd=str(tmp_path)))
+    pipeline_dir = SessionStorage().session_dir(str(tmp_path), "session-1") / "pipeline"
+    raw_error = (  # fake secrets and a home path; asserted absent from the result below
+        "DeleteStack failed AccessKeySecret=super-secret token=sk-live-1234567890 "
+        "at /Users/alice/.iac-code/projects/session/pipeline/cleanup.yaml"
+    )
+    pipeline_started = _event_for_task(1, "evt-pipeline-started", task_id="task-pipeline")
+    cleanup_started = _event_for_task(2, "evt-cleanup-started", task_id="task-pipeline")
+    cleanup_started.update(
+        {
+            "eventType": "cleanup_started",
+            "scope": "cleanup",
+            "deliveryTaskId": "task-normal",
+            "data": {
+                "status": "started",
+                "resourceCount": 1,
+                "prompt": "hidden cleanup prompt for stack-123",
+                "ledgerPath": "/Users/alice/.iac-code/projects/session/pipeline/cleanup.yaml",
+                "provider": "ros",
+                "resourceType": "stack",
+                "resourceId": "stack-123",
+                "regionId": "cn-hangzhou",
+                "cleanupStatus": "started",
+                "progressStatus": "DELETE_STARTED",
+                "lastError": raw_error,
+            },
+        }
+    )
+    journal = A2APipelineJournal(pipeline_dir)
+    journal.append(pipeline_started)
+    journal.append(cleanup_started)
+    A2APipelineSnapshotStore(pipeline_dir).save(reduce_pipeline_events([pipeline_started, cleanup_started]))
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    service = A2APipelineRecoveryService(task_store=store)
+
+    state = await service.get_state(task_id="task-normal", after_sequence=0)  # query by the delivery task id
+
+    assert state["snapshot"]["taskId"] == "task-pipeline"  # snapshot belongs to the pipeline task
+    assert state["snapshot"]["cleanup"]["status"] == "started"
+    assert state["snapshot"]["cleanup"]["resources"][0]["resourceId"] == "stack-123"
+    assert "prompt" not in state["snapshot"]["cleanup"]
+    assert "ledgerPath" not in state["snapshot"]["cleanup"]
+    assert "prompt" not in state["snapshot"]["cleanup"]["history"][0]["data"]
+    assert "ledgerPath" not in state["snapshot"]["cleanup"]["history"][0]["data"]
+    assert raw_error not in state["snapshot"]["cleanup"]["history"][0]["data"]["lastError"]
+    assert [event["eventId"] for event in state["events"]] == ["evt-cleanup-started"]
+    assert "prompt" not in state["events"][0]["data"]
+    assert "ledgerPath" not in state["events"][0]["data"]
+    assert raw_error not in state["events"][0]["data"]["lastError"]
+    rendered = json.dumps(state, ensure_ascii=False)  # scan the whole payload for leaked values
+    assert "super-secret" not in rendered
+    assert "sk-live-1234567890" not in rendered
+    assert "/Users/alice" not in rendered
+
+
+@pytest.mark.asyncio
+async def test_recovery_by_delivery_task_catches_up_stale_pipeline_snapshot(tmp_path) -> None:
+    persistence = A2APersistenceStore(tmp_path / "a2a")
+    persistence.save_task(A2ATaskSnapshot(task_id="task-pipeline", context_id="ctx-1", state="completed"))
+    persistence.save_task(A2ATaskSnapshot(task_id="task-normal", context_id="ctx-1", state="input-required"))
+    persistence.save_context(A2AContextSnapshot(context_id="ctx-1", session_id="session-1", cwd=str(tmp_path)))
+    pipeline_dir = SessionStorage().session_dir(str(tmp_path), "session-1") / "pipeline"
+    pipeline_started = _event_for_task(1, "evt-pipeline-started", task_id="task-pipeline")
+    cleanup_started = _event_for_task(2, "evt-cleanup-started", task_id="task-pipeline")
+    cleanup_started.update(
+        {
+            "eventType": "cleanup_started",
+            "scope": "cleanup",
+            "deliveryTaskId": "task-normal",
+            "data": {
+                "status": "started",
+                "resourceCount": 1,
+                "provider": "ros",
+                "resourceType": "stack",
+                "resourceId": "stack-123",
+                "regionId": "cn-hangzhou",
+                "cleanupStatus": "started",
+                "progressStatus": "DELETE_STARTED",
+            },
+        }
+    )
+    journal = A2APipelineJournal(pipeline_dir)
+    journal.append(pipeline_started)
+    journal.append(cleanup_started)  # in the journal, but left out of the snapshot saved below
+    A2APipelineSnapshotStore(pipeline_dir).save(reduce_pipeline_events([pipeline_started]))
+    store = A2ATaskStore(metrics=NoOpA2AMetrics(), persistence=persistence)
+    service = A2APipelineRecoveryService(task_store=store)
+
+    state = await service.get_state(task_id="task-normal")
+
+    assert state["snapshot"]["lastSequence"] == 2  # returned snapshot includes the journal-only event
+    assert state["snapshot"]["cleanup"]["status"] == "started"
+    assert state["snapshot"]["cleanup"]["resources"][0]["resourceId"] == "stack-123"
+    assert "prompt" not in state["snapshot"]["cleanup"]
+    assert "ledgerPath" not in state["snapshot"]["cleanup"]
+
+
 @pytest.mark.asyncio
 async def test_recovery_rejects_context_id_that_does_not_match_task_id(tmp_path) -> None:
     persistence = A2APersistenceStore(tmp_path / "a2a")
diff --git a/tests/a2a/test_pipeline_snapshot.py b/tests/a2a/test_pipeline_snapshot.py
index 508bfc32..30ff10f2 100644
--- a/tests/a2a/test_pipeline_snapshot.py
+++ b/tests/a2a/test_pipeline_snapshot.py
@@ -1,5 +1,6 @@
 from __future__ import annotations
 
+import json
 import logging
 from pathlib import Path
 
@@ -49,10 +50,10 @@ def test_snapshot_load_logs_parse_failures(tmp_path, caplog) -> None:
 def test_snapshot_save_cleans_temp_file_when_replace_fails(monkeypatch, tmp_path, caplog) -> None:
     store = A2APipelineSnapshotStore(tmp_path)
 
-    def fail_replace(self: Path, target: Path) -> Path:
-        raise PermissionError(f"locked: {target}")
+    def fail_write(path: Path, value: dict, *, durable: bool = True) -> None:
+        raise PermissionError(f"locked: {path}")
 
-    monkeypatch.setattr(Path, "replace", fail_replace)
+    monkeypatch.setattr(pipeline_snapshot, "atomic_write_json", fail_write)
     caplog.set_level(logging.WARNING, logger="iac_code.a2a.pipeline_snapshot")
 
     assert store.save({"status": "working"}) is False
@@ -90,6 +91,26 @@ def test_reduce_steps_and_pending_input() -> None:
     assert snapshot["pendingInput"]["inputId"] == "input-confirm_and_select-1"
 
 
+def test_pipeline_warning_does_not_change_terminal_snapshot_status() -> None:
+    started = _base("evt-start", 1, "pipeline_started")
+    warning = _base("evt-warning", 2, "pipeline_warning", status="working")
+    warning["data"] = {"reason": "cleanup_tracking_unavailable"}
+
+    snapshot = reduce_pipeline_events([started, warning])
+
+    assert snapshot["status"] == "working"  # still working after the warning
+    assert snapshot["lastSequence"] == 2
+    assert snapshot.get("completedAt") is None  # no completion time was recorded
+    assert snapshot["control"]["warningHistory"] == [  # exactly one entry, built from the warning event
+        {
+            "eventId": "evt-warning",
+            "sequence": 2,
+            "createdAt": "2026-06-08T10:00:00Z",
+            "data": {"reason": "cleanup_tracking_unavailable"},
+        }
+    ]
+
+
 def test_reduce_input_received_completes_waiting_step() -> None:
     step = _base("evt-1", 1, "step_started", scope="step")
     step["step"] = {
@@ -114,6 +135,173 @@ def test_reduce_input_received_completes_waiting_step() -> None:
     assert snapshot["steps"][0]["completedAt"] == "2026-06-08T10:00:00Z"
 
 
+def test_reduce_cleanup_handoff_updates_snapshot_cleanup() -> None:
+    handoff = _base("evt-cleanup-handoff", 1, "pipeline_handoff_ready", status="completed")
+    handoff["data"] = {
+        "action": "switch_to_normal",
+        "targetMode": "normal",
+        "outcome": "completed",
+        "summary": "[Pipeline Handoff Context]",
+        "cleanup": {
+            "status": "pending",
+            "resourceCount": 1,
+            "statusMessage": "检测到 1 个回滚残留资源，开始清理流程。",
+            "resources": [{"resourceId": "stack-123", "regionId": "cn-hangzhou"}],
+        },
+    }
+
+    snapshot = reduce_pipeline_events([handoff])  # the handoff is the only event
+
+    assert snapshot["cleanup"]["status"] == "pending"
+    assert snapshot["cleanup"]["resourceCount"] == 1
+    assert snapshot["cleanup"]["resources"] == [{"resourceId": "stack-123", "regionId": "cn-hangzhou"}]
+    assert snapshot["cleanup"]["history"][-1]["eventType"] == "pipeline_handoff_ready"
+    assert snapshot["normalHandoff"]["data"]["cleanup"]["resourceCount"] == 1  # also kept under normalHandoff
+
+
+def test_reduce_cleanup_progress_events_update_snapshot_cleanup() -> None:
+    started = _base("evt-cleanup-started", 1, "cleanup_started", scope="cleanup")
+    started["data"] = {
+        "status": "started",
+        "resourceCount": 1,
+        "resources": [{"resourceId": "stack-123", "regionId": "cn-hangzhou"}],
+    }
+    progress = _base("evt-cleanup-progress", 2, "cleanup_progress", scope="cleanup")
+    progress["data"] = {
+        "status": "in_progress",
+        "resourceId": "stack-123",
+        "regionId": "cn-hangzhou",
+        "stackStatus": "DELETE_IN_PROGRESS",
+    }
+    completed = _base("evt-cleanup-completed", 3, "cleanup_completed", scope="cleanup", status="completed")
+    completed["data"] = {
+        "status": "completed",
+        "resourceId": "stack-123",
+        "regionId": "cn-hangzhou",
+        "stackStatus": "DELETE_COMPLETE",
+    }
+
+    snapshot = reduce_pipeline_events([started, progress, completed])
+
+    assert snapshot["cleanup"]["status"] == "completed"
+    assert snapshot["cleanup"]["resourceCount"] == 1
+    assert snapshot["cleanup"]["resources"][0]["resourceId"] == "stack-123"
+    assert snapshot["cleanup"]["resources"][0]["stackStatus"] == "DELETE_COMPLETE"  # value from the last event
+    assert [item["eventType"] for item in snapshot["cleanup"]["history"]] == [  # one entry per event, in order
+        "cleanup_started",
+        "cleanup_progress",
+        "cleanup_completed",
+    ]
+
+
+def test_reduce_cleanup_status_aggregates_multiple_resources() -> None:
+    started = _base("evt-cleanup-started", 1, "cleanup_started", scope="cleanup")
+    started["data"] = {
+        "status": "pending",
+        "resourceCount": 2,
+        "resources": [
+            {
+                "provider": "ros",
+                "resourceType": "stack",
+                "resourceId": "stack-a",
+                "regionId": "cn-hangzhou",
+                "cleanupStatus": "pending",
+            },
+            {
+                "provider": "ros",
+                "resourceType": "stack",
+                "resourceId": "stack-b",
+                "regionId": "cn-hangzhou",
+                "cleanupStatus": "pending",
+            },
+        ],
+    }
+    completed_one = _base("evt-cleanup-one-complete", 2, "cleanup_completed", scope="cleanup")
+    completed_one["data"] = {
+        "status": "completed",
+        "provider": "ros",
+        "resourceType": "stack",
+        "resourceId": "stack-a",
+        "regionId": "cn-hangzhou",
+        "cleanupStatus": "completed",
+        "stackStatus": "DELETE_COMPLETE",
+    }
+    failed_one = _base("evt-cleanup-one-failed", 3, "cleanup_failed", scope="cleanup")
+    failed_one["data"] = {
+        "status": "failed",
+        "provider": "ros",
+        "resourceType": "stack",
+        "resourceId": "stack-b",
+        "regionId": "cn-hangzhou",
+        "cleanupStatus": "failed",
+        "stackStatus": "DELETE_FAILED",
+    }
+
+    partial = reduce_pipeline_events([started, completed_one])  # no event for stack-b after the start
+    failed = reduce_pipeline_events([started, completed_one, failed_one])
+
+    assert partial["cleanup"]["status"] == "pending"  # one completed resource does not complete the whole
+    assert failed["cleanup"]["status"] == "failed"  # a failed resource makes the overall status failed
+
+
+def test_reduce_cleanup_progress_distinguishes_provider_and_resource_type() -> None:
+    started = _base("evt-cleanup-started", 1, "cleanup_started", scope="cleanup")
+    started["data"] = {
+        "status": "started",
+        "resourceCount": 3,
+        "resources": [  # all three share resourceId and regionId; only provider/resourceType differ
+            {
+                "provider": "ros",
+                "resourceType": "stack",
+                "resourceId": "shared-id",
+                "regionId": "cn-hangzhou",
+                "stackStatus": "DELETE_IN_PROGRESS",
+            },
+            {
+                "provider": "ros",
+                "resourceType": "stack_set",
+                "resourceId": "shared-id",
+                "regionId": "cn-hangzhou",
+                "stackStatus": "DELETE_IN_PROGRESS",
+            },
+            {
+                "provider": "terraform",
+                "resourceType": "stack",
+                "resourceId": "shared-id",
+                "regionId": "cn-hangzhou",
+                "stackStatus": "DELETE_IN_PROGRESS",
+            },
+        ],
+    }
+    type_progress = _base("evt-cleanup-type-progress", 2, "cleanup_progress", scope="cleanup")
+    type_progress["data"] = {
+        "status": "in_progress",
+        "provider": "ros",
+        "resourceType": "stack_set",
+        "resourceId": "shared-id",
+        "regionId": "cn-hangzhou",
+        "stackStatus": "DELETE_COMPLETE",
+    }
+    provider_progress = _base("evt-cleanup-provider-progress", 3, "cleanup_progress", scope="cleanup")
+    provider_progress["data"] = {
+        "status": "in_progress",
+        "provider": "terraform",
+        "resourceType": "stack",
+        "resourceId": "shared-id",
+        "regionId": "cn-hangzhou",
+        "stackStatus": "DELETE_FAILED",
+    }
+
+    snapshot = reduce_pipeline_events([started, type_progress, provider_progress])
+
+    resources = {  # keyed by (provider, resourceType)
+        (resource["provider"], resource["resourceType"]): resource for resource in snapshot["cleanup"]["resources"]
+    }
+    assert resources[("ros", "stack")]["stackStatus"] == "DELETE_IN_PROGRESS"  # no progress event targeted it
+    assert resources[("ros", "stack_set")]["stackStatus"] == "DELETE_COMPLETE"
+    assert resources[("terraform", "stack")]["stackStatus"] == "DELETE_FAILED"
+
+
 def test_reduce_input_received_records_candidate_selection_details_on_step() -> None:
     step = _base("evt-1", 1, "step_started", scope="step")
     step["step"] = {
@@ -729,6 +917,7 @@ def test_reduce_stack_current_changed_updates_snapshot_stack_state() -> None:
         "regionId": "cn-hangzhou",
         "stackId": "stack-123",
         "stackName": "demo",
+        "stackStatus": "DELETE_COMPLETE",
         "isSuccess": True,
         "current": False,
         "cleared": True,
@@ -744,6 +933,40 @@ def test_reduce_stack_current_changed_updates_snapshot_stack_state() -> None:
     assert [item["eventId"] for item in deleted_snapshot["stacks"]["history"]] == ["evt-create", "evt-delete"]
 
 
+def test_reduce_stack_current_changed_keeps_current_for_delete_requested() -> None:
+    created = _base("evt-create", 1, "stack_current_changed", scope="stack")
+    created["data"] = {
+        "toolName": "aliyun_api",
+        "toolUseId": "toolu-create",
+        "provider": "ros",
+        "action": "CreateStack",
+        "regionId": "cn-hangzhou",
+        "stackId": "stack-123",
+        "stackName": "demo",
+        "isSuccess": True,
+        "current": True,
+    }
+    delete_requested = _base("evt-delete-requested", 2, "stack_current_changed", scope="stack")
+    delete_requested["data"] = {
+        "toolName": "ros_stack",
+        "toolUseId": "toolu-delete",
+        "provider": "ros",
+        "action": "DeleteStack",
+        "regionId": "cn-hangzhou",
+        "stackId": "stack-123",
+        "stackName": "demo",
+        "stackStatus": "DELETE_REQUESTED",
+        "isSuccess": True,
+        "current": True,  # the delete event itself still marks the stack as current
+    }
+
+    snapshot = reduce_pipeline_events([created, delete_requested])
+
+    assert snapshot["stacks"]["current"]["stackId"] == "stack-123"  # stack is still the current one
+    assert snapshot["stacks"]["byId"]["stack-123"]["current"] is True
+    assert snapshot["stacks"]["byId"]["stack-123"]["stackStatus"] == "DELETE_REQUESTED"
+
+
 def test_reduce_artifact_created_prefers_top_level_artifact_metadata() -> None:
     artifact = _base("evt-1", 1, "artifact_created", scope="step")
     artifact["step"] = {"runId": "step-a-1", "id": "a", "index": 1, "total": 1, "attempt": 1}
@@ -940,6 +1163,81 @@ def test_store_sanitizes_non_finite_and_non_json_values(tmp_path) -> None:
     assert loaded["display"]["candidateDetails"][0]["raw"].startswith("<object object at ")
 
 
+def test_store_sanitizes_cleanup_private_fields_without_dropping_input_prompt(tmp_path) -> None:
+    store = A2APipelineSnapshotStore(tmp_path / "pipeline")
+    raw_error = (  # fake secrets and a home path; asserted absent from loaded snapshots below
+        "DeleteStack failed AccessKeySecret=super-secret token=sk-live-1234567890 "
+        "at /Users/alice/.iac-code/projects/session/pipeline/cleanup.yaml"
+    )
+    snapshot = reduce_pipeline_events([_base("evt-1", 1, "pipeline_started")])
+    snapshot["pendingInput"] = {"prompt": "choose deployment target"}
+    snapshot["control"]["inputHistory"] = [{"prompt": "choose deployment target"}]
+    snapshot["control"]["handoffHistory"] = [
+        {
+            "data": {
+                "cleanup": {
+                    "prompt": "hidden cleanup prompt",
+                    "ledgerPath": "/tmp/cleanup.yaml",
+                    "lastError": raw_error,
+                }
+            }
+        }
+    ]
+    snapshot["normalHandoff"] = {
+        "data": {
+            "cleanup": {
+                "prompt": "hidden cleanup prompt",
+                "ledgerPath": "/tmp/cleanup.yaml",
+                "lastError": raw_error,
+            }
+        }
+    }
+    snapshot["cleanup"] = {
+        "status": "pending",
+        "resourceCount": 1,
+        "resources": [{"resourceId": "stack-123", "lastError": raw_error}],
+        "history": [
+            {"data": {"prompt": "hidden cleanup prompt", "ledgerPath": "/tmp/cleanup.yaml", "lastError": raw_error}}
+        ],
+        "prompt": "hidden cleanup prompt",
+        "ledgerPath": "/tmp/cleanup.yaml",
+        "last_error": raw_error,
+    }
+
+    store.save(snapshot)  # first round trip: save() then load()
+
+    loaded = store.load()
+    assert loaded is not None
+    assert loaded["pendingInput"]["prompt"] == "choose deployment target"  # input prompts are kept
+    assert loaded["control"]["inputHistory"][0]["prompt"] == "choose deployment target"
+    assert "prompt" not in loaded["control"]["handoffHistory"][0]["data"]["cleanup"]  # cleanup prompts are dropped
+    assert raw_error not in loaded["control"]["handoffHistory"][0]["data"]["cleanup"]["lastError"]
+    assert "ledgerPath" not in loaded["normalHandoff"]["data"]["cleanup"]
+    assert raw_error not in loaded["normalHandoff"]["data"]["cleanup"]["lastError"]
+    assert "prompt" not in loaded["cleanup"]
+    assert raw_error not in loaded["cleanup"]["last_error"]
+    assert raw_error not in loaded["cleanup"]["resources"][0]["lastError"]
+    assert "ledgerPath" not in loaded["cleanup"]["history"][0]["data"]
+    assert raw_error not in loaded["cleanup"]["history"][0]["data"]["lastError"]
+    rendered = json.dumps(loaded, ensure_ascii=False)
+    assert "super-secret" not in rendered
+    assert "sk-live-1234567890" not in rendered
+    assert "/Users/alice" not in rendered
+    assert "[REDACTED]" in rendered
+    assert "[PATH]" in rendered
+
+    store.path.write_text(json.dumps(snapshot), encoding="utf-8")  # write the file directly, bypassing save()
+    loaded = store.load()
+    assert loaded is not None
+    assert loaded["pendingInput"]["prompt"] == "choose deployment target"
+    assert "prompt" not in loaded["normalHandoff"]["data"]["cleanup"]
+    assert "ledgerPath" not in loaded["cleanup"]
+    rendered = json.dumps(loaded, ensure_ascii=False)
+    assert "super-secret" not in rendered
+    assert "sk-live-1234567890" not in rendered
+    assert "/Users/alice" not in rendered
+
+
 def test_store_returns_none_for_invalid_utf8_snapshot(tmp_path) -> None:
     store = A2APipelineSnapshotStore(tmp_path / "pipeline")
     store.pipeline_dir.mkdir(parents=True)
diff --git a/tests/a2a/test_pipeline_stream.py b/tests/a2a/test_pipeline_stream.py
index ca1d1f65..3a14f93c 100644
--- a/tests/a2a/test_pipeline_stream.py
+++ b/tests/a2a/test_pipeline_stream.py
@@ -15,7 +15,7 @@
 from iac_code.a2a.pipeline_events import PipelineA2AContext, PipelineEventTranslator
 from iac_code.a2a.pipeline_journal import A2APipelineJournal
 from iac_code.a2a.pipeline_snapshot import A2APipelineSnapshotStore
-from iac_code.a2a.pipeline_stream import PipelineA2AEventPublisher
+from iac_code.a2a.pipeline_stream import PipelineA2AEventPublisher, is_recovery_semantic_event
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
 from iac_code.types.stream_events import (
     AskUserQuestionEvent,
@@ -81,6 +81,17 @@ def _envelope(event_type: str, status: str = "working") -> dict[str, Any]:
     }
 
 
+def test_pipeline_warning_is_recovery_semantic() -> None:
+    assert is_recovery_semantic_event(_envelope("pipeline_warning")) is True  # status defaults to "working"
+
+
+def test_unknown_working_step_event_is_recovery_semantic() -> None:
+    envelope = _envelope("custom_step_progress")  # status defaults to "working"
+    envelope["scope"] = "step"
+
+    assert is_recovery_semantic_event(envelope) is True
+
+
 @pytest.mark.asyncio
 async def test_publish_text_writes_a2a_metadata_journal_and_snapshot(tmp_path: Path) -> None:
     publisher, queue = _publisher(tmp_path)
@@ -300,7 +311,7 @@ async def test_publish_permission_denies_future_when_permission_metadata_is_not_
     publisher, queue = _publisher(tmp_path)
     future: asyncio.Future[bool] = asyncio.get_running_loop().create_future()
 
-    def fail_append(_event: dict[str, Any]) -> None:
+    def fail_append(_event: dict[str, Any], durable: bool = False) -> None:
         raise OSError("append failed")
 
     def fail_save(_snapshot: dict[str, Any]) -> bool:
@@ -324,6 +335,91 @@ def fail_save(_snapshot: dict[str, Any]) -> bool:
     assert queue.events == []
 
 
+@pytest.mark.asyncio
+async def test_recovery_semantic_event_is_not_enqueued_when_metadata_persistence_fails(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    publisher, queue = _publisher(tmp_path)
+
+    def fail_append(_event: dict[str, Any], durable: bool = False) -> None:
+        raise OSError("journal locked")  # every journal append fails
+
+    monkeypatch.setattr(publisher.journal, "append", fail_append)
+    monkeypatch.setattr(publisher.snapshot_store, "save", lambda _snapshot: False)  # save reports failure
+
+    result = await publisher.publish_manual("pipeline_started", "pipeline")
+
+    assert result is None
+    assert queue.events == []  # nothing was enqueued
+
+
+@pytest.mark.asyncio
+async def test_text_delta_can_be_enqueued_when_only_durable_metadata_fails(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    publisher, queue = _publisher(tmp_path)
+
+    def fail_append(event: dict[str, Any], durable: bool = False) -> None:
+        if durable:  # only durable writes fail
+            raise OSError("journal locked")
+        A2APipelineJournal.append(publisher.journal, event)  # otherwise use the real append
+
+    monkeypatch.setattr(publisher.journal, "append", fail_append)
+    monkeypatch.setattr(publisher.snapshot_store, "save", lambda _snapshot: False)  # save reports failure
+
+    returned = await publisher.publish(TextDeltaEvent(text="hello"))
+
+    assert returned == "hello"
+    assert len(queue.events) == 1  # the text delta was still enqueued
+
+
+@pytest.mark.asyncio
+async def test_manual_recovery_event_routes_durable_metadata_without_explicit_request(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    publisher, _queue = _publisher(tmp_path)
+    durable_flags: list[bool] = []  # durable argument of each journal append call
+
+    def record_append(event: dict[str, Any], durable: bool = False) -> None:
+        durable_flags.append(durable)
+        A2APipelineJournal.append(publisher.journal, event)  # then perform the real append
+
+    monkeypatch.setattr(publisher.journal, "append", record_append)
+
+    await publisher.publish_manual("pipeline_started", "pipeline")  # no durability argument is passed here
+
+    assert durable_flags == [True]  # one append, made with durable=True
+
+
+@pytest.mark.asyncio
+async def test_translated_recovery_event_routes_durable_metadata_without_explicit_request(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    publisher, _queue = _publisher(tmp_path)
+    durable_flags: list[bool] = []  # durable argument of each journal append call
+
+    def record_append(event: dict[str, Any], durable: bool = False) -> None:
+        durable_flags.append(durable)
+        A2APipelineJournal.append(publisher.journal, event)  # then perform the real append
+
+    monkeypatch.setattr(publisher.journal, "append", record_append)
+
+    await publisher.publish(  # a pipeline engine event rather than a manual envelope
+        PipelineEvent(
+            type=PipelineEventType.STEP_STARTED,
+            step_id="confirm_and_select",
+            timestamp=1717821600.0,
+            data={"index": 1, "total": 2},
+        )
+    )
+
+    assert durable_flags == [True]  # one append, made with durable=True
+
+
 @pytest.mark.asyncio
 async def test_publish_permission_redacts_and_truncates_tool_input_in_status_metadata_and_journal(
     tmp_path: Path,
@@ -702,7 +798,7 @@ async def test_publish_does_not_emit_artifact_update_when_artifact_metadata_is_n
     store = A2AArtifactStore(tmp_path / "artifacts")
     publisher, queue = _publisher(tmp_path, artifact_store=store, exposure_types=[A2AExposureType.TOOL_TRACE])
 
-    def fail_append(_event: dict[str, Any]) -> None:
+    def fail_append(_event: dict[str, Any], durable: bool = False) -> None:
         raise OSError("append failed")
 
     def fail_save(_snapshot: dict[str, Any]) -> None:
@@ -896,7 +992,7 @@ async def test_publish_candidate_failure_keeps_a2a_task_working(tmp_path: Path)
 async def test_publish_continues_when_pipeline_persistence_fails(tmp_path: Path) -> None:
     publisher, queue = _publisher(tmp_path)
 
-    def fail_append(_event: dict[str, Any]) -> None:
+    def fail_append(_event: dict[str, Any], durable: bool = False) -> None:
         raise OSError("disk full")
 
     publisher.journal.append = fail_append  # type: ignore[method-assign]
@@ -984,7 +1080,7 @@ async def test_publish_rebuilds_missing_snapshot_with_current_event_when_journal
     await publisher.publish(TextDeltaEvent(text="old"))
     publisher.snapshot_store.path.unlink()
 
-    def fail_append(_event: dict[str, Any]) -> None:
+    def fail_append(_event: dict[str, Any], durable: bool = False) -> None:
         raise OSError("disk full")
 
     publisher.journal.append = fail_append  # type: ignore[method-assign]
@@ -1115,6 +1211,25 @@ async def test_publish_ask_user_question_maps_to_input_required_snapshot(tmp_pat
     assert snapshot["pendingInput"]["question"] == "请选择部署目标"
 
 
+@pytest.mark.asyncio
+async def test_pipeline_input_received_is_not_enqueued_when_metadata_persistence_fails(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    publisher, queue = _publisher(tmp_path)
+
+    def fail_append(_event: dict[str, Any], durable: bool = False) -> None:
+        raise OSError("journal locked")  # every journal append fails
+
+    monkeypatch.setattr(publisher.journal, "append", fail_append)
+    monkeypatch.setattr(publisher.snapshot_store, "save", lambda _snapshot: False)  # save reports failure
+
+    result = await publisher.publish_manual("input_received", "pipeline")
+
+    assert result is None
+    assert queue.events == []  # nothing was enqueued
+
+
 @pytest.mark.asyncio
 @pytest.mark.parametrize(
     ("failed", "expected_state"),
diff --git a/tests/a2a/test_selling_console_frontend.py b/tests/a2a/test_selling_console_frontend.py
new file mode 100644
index 00000000..b175b305
--- /dev/null
+++ b/tests/a2a/test_selling_console_frontend.py
@@ -0,0 +1,4893 @@
+from __future__ import annotations
+
+import json
+import os
+import shutil
+import subprocess
+import tempfile
+from pathlib import Path
+
+import pytest
+
+APP_JS = Path(__file__).resolve().parents[2] / "scripts" / "a2a" / "selling_console_web" / "app.js"
+STYLES_CSS = APP_JS.parent / "styles.css"
+NODE_RELATIVE_PATH = Path(".cache/codex-runtimes/codex-primary-runtime/dependencies/node/bin/node")
+
+
+def bundled_node_candidates() -> list[Path]:
+    override = os.environ.get("IAC_CODE_TEST_NODE")  # explicit interpreter path, if set
+    if override:
+        return [Path(override).expanduser()]  # the override is the only candidate returned
+    candidates = [Path.home() / NODE_RELATIVE_PATH]
+    home_env = os.environ.get("HOME")  # probed in addition to Path.home()
+    if home_env:
+        candidates.append(Path(home_env).expanduser() / NODE_RELATIVE_PATH)
+    candidates.extend(parent / NODE_RELATIVE_PATH for parent in APP_JS.parents)  # every ancestor of app.js
+    return candidates  # existence is not checked here; callers filter
+
+
+def node_command() -> list[str]:
+    node = shutil.which("node")  # a node on PATH is preferred over any bundled candidate
+    if node:
+        return [node]
+    for fallback in bundled_node_candidates():
+        if fallback.exists():  # first existing candidate wins
+            return [str(fallback)]
+    pytest.skip("node is not installed")  # no interpreter found: skip the calling test
+
+
+def run_node_script(source: str) -> dict:
+    with tempfile.TemporaryDirectory(prefix="iac-code-selling-console-test-") as temp_dir:
+        script_path = Path(temp_dir) / "script.js"
+        script_path.write_text(source, encoding="utf-8")  # the script is passed to node as a file path
+        result = subprocess.run(
+            [*node_command(), str(script_path)],
+            capture_output=True,
+            text=True,
+            encoding="utf-8",
+            check=False,  # the exit status is asserted below with stderr as the message
+        )
+    assert result.returncode == 0, result.stderr
+    return json.loads(result.stdout)  # stdout is parsed as one JSON document
+
+
+def test_run_node_script_uses_file_instead_of_inline_eval(monkeypatch: pytest.MonkeyPatch) -> None:
+    source = 'console.log(JSON.stringify({"ok": true}));'
+    command_seen: list[str] = []  # argv captured by the fake subprocess.run
+
+    def fake_run(command, *, capture_output, text, check, encoding):
+        command_seen.extend(str(part) for part in command)
+        assert capture_output is True
+        assert text is True
+        assert check is False
+        assert encoding == "utf-8"
+        assert "-e" not in command_seen  # no inline-eval flag in argv
+        script_path = Path(command_seen[-1])  # last argv entry is the script file
+        assert script_path.read_text(encoding="utf-8") == source
+        return subprocess.CompletedProcess(command, 0, stdout='{"ok": true}\n', stderr="")
+
+    monkeypatch.setattr(shutil, "which", lambda name: "/usr/bin/node" if name == "node" else None)
+    monkeypatch.setattr(subprocess, "run", fake_run)  # no real node process is started
+
+    assert run_node_script(source) == {"ok": True}
+    assert command_seen[:1] == ["/usr/bin/node"]
+
+
+def test_node_command_falls_back_to_home_bundled_node_when_path_is_empty(
+    monkeypatch: pytest.MonkeyPatch, tmp_path: Path
+) -> None:
+    fake_node = tmp_path / NODE_RELATIVE_PATH  # stand-in interpreter under a fake home directory
+    fake_node.parent.mkdir(parents=True)
+    fake_node.write_text("#!/bin/sh\n", encoding="utf-8")
+    fake_node.chmod(0o755)
+    monkeypatch.setenv("PATH", "")
+    monkeypatch.delenv("IAC_CODE_TEST_NODE", raising=False)  # make sure the override branch is not taken
+    monkeypatch.setenv("HOME", str(tmp_path))
+    assert shutil.which("node") is None  # precondition: the PATH lookup finds nothing
+
+    command = node_command()
+
+    assert command == [str(fake_node)]
+    assert Path(command[0]).exists()
+
+
+def test_node_command_uses_env_override_when_path_is_empty(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> None:
+    fake_node = tmp_path / "node"  # stand-in interpreter referenced only through the env override
+    fake_node.write_text("#!/bin/sh\n", encoding="utf-8")
+    fake_node.chmod(0o755)
+    monkeypatch.setenv("PATH", "")
+    monkeypatch.setenv("IAC_CODE_TEST_NODE", str(fake_node))
+
+    command = node_command()
+
+    assert command == [str(fake_node)]  # the override path is returned as the whole command
+
+
+def reducer_harness(expression: str) -> dict:
+    app_source = APP_JS.read_text(encoding="utf-8")  # app.js is inlined after the window/document stubs
+    script = f"""
+const assert = require("assert");
+global.window = {{}};
+global.document = {{
+  readyState: "loading",
+  addEventListener() {{}},
+  querySelector() {{ return null; }},
+  querySelectorAll() {{ return []; }},
+  getElementById() {{ return null; }}
+}};
+{app_source}
+const reducers = window.SellingConsoleReducers;
+const output = (() => {{
+  {expression}
+}})();
+console.log(JSON.stringify(output));
+"""
+    return run_node_script(script)  # `expression` must `return` a JSON-serializable value
+
+
+def controller_harness(expression: str) -> dict:
+    app_source = APP_JS.read_text(encoding="utf-8")  # app.js is inlined after the fake DOM defined below
+    script = f"""
+class FakeElement {{
+  constructor(tagName, id = "") {{
+    this.tagName = tagName.toUpperCase();
+    this.id = id;
+    this.children = [];
+    this.attributes = {{}};
+    this.listeners = {{}};
+    this.className = "";
+    this.textContent = "";
+    this.value = "";
+    this.hidden = false;
+    this.scrollTop = 0;
+    this.scrollHeight = 100;
+    this.clientHeight = 30;
+  }}
+  appendChild(child) {{
+    this.children.push(child);
+    return child;
+  }}
+  replaceChildren(...children) {{
+    this.children = children;
+    this.textContent = "";
+  }}
+  setAttribute(name, value) {{
+    this.attributes[name] = String(value);
+  }}
+  getAttribute(name) {{
+    return Object.prototype.hasOwnProperty.call(this.attributes, name) ? this.attributes[name] : null;
+  }}
+  addEventListener(name, listener) {{
+    this.listeners[name] = this.listeners[name] || [];
+    this.listeners[name].push(listener);
+  }}
+  click() {{
+    (this.listeners.click || []).forEach((listener) => listener({{type: "click"}}));
+  }}
+}}
+function walk(element, callback) {{
+  if (!element) {{
+    return;
+  }}
+  callback(element);
+  (element.children || []).forEach((child) => walk(child, callback));
+}}
+function textOf(element) {{
+  if (!element) {{
+    return "";
+  }}
+  return [element.textContent || "", ...(element.children || []).map(textOf)].join("");
+}}
+const elements = {{
+  "step-list": new FakeElement("div", "step-list"),
+  "composer-progress": new FakeElement("div", "composer-progress"),
+  "debug-drawer": new FakeElement("details", "debug-drawer"),
+  "progress-debug-panel": new FakeElement("div", "progress-debug-panel"),
+  "debug-output": new FakeElement("pre", "debug-output"),
+  "debug-session-info": new FakeElement("div", "debug-session-info"),
+  "normal-handoff-notice": new FakeElement("div", "normal-handoff-notice"),
+  "plans-grid": new FakeElement("div", "plans-grid"),
+  "status-pill": new FakeElement("span", "status-pill"),
+  "status-alert": new FakeElement("div", "status-alert"),
+  "server-url": new FakeElement("input", "server-url"),
+  cwd: new FakeElement("input", "cwd"),
+  "composer-input": new FakeElement("textarea", "composer-input"),
+  "send-button": new FakeElement("button", "send-button"),
+  "health-button": new FakeElement("button", "health-button"),
+  "fetch-state-button": new FakeElement("button", "fetch-state-button"),
+  "cancel-button": new FakeElement("button", "cancel-button"),
+}};
+elements["normal-handoff-notice"].hidden = true;
+const debugPre = elements["debug-output"];
+const roots = Object.values(elements);
+global.window = {{SELLING_CONSOLE_DEFAULTS: {{serverUrl: "http://127.0.0.1:41299", cwd: "/workspace"}}}};
+global.document = {{
+  readyState: "loading",
+  addEventListener() {{}},
+  createElement(tagName) {{ return new FakeElement(tagName); }},
+  getElementById(id) {{ return elements[id] || null; }},
+  querySelector(selector) {{
+    if (selector === "#debug-drawer pre") {{
+      return debugPre;
+    }}
+    if (selector.startsWith("#")) {{
+      return elements[selector.slice(1)] || null;
+    }}
+    return null;
+  }},
+  querySelectorAll(selector) {{
+    const matches = [];
+    roots.forEach((root) => walk(root, (element) => {{
+      if (selector === "[data-step-id]" && element.getAttribute("data-step-id") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-event-kind]" && element.getAttribute("data-step-event-kind") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-state-icon]" && element.getAttribute("data-step-state-icon") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-toggle]" && element.getAttribute("data-step-toggle") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-result-field]" && element.getAttribute("data-step-result-field") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-result-option]" && element.getAttribute("data-step-result-option") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-candidate-result]" && element.getAttribute("data-step-candidate-result") !== null) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-step-candidate-result-summary]" &&
+        element.getAttribute("data-step-candidate-result-summary") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-step-candidate-result-process]" &&
+        element.getAttribute("data-step-candidate-result-process") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-step-candidate-progress]" &&
+        element.getAttribute("data-step-candidate-progress") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-step-candidate-progress-head]" &&
+        element.getAttribute("data-step-candidate-progress-head") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-pending-input-kind]" && element.getAttribute("data-pending-input-kind") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-pending-input-option]" && element.getAttribute("data-pending-input-option") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-progress-step]" && element.getAttribute("data-progress-step") !== null) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-progress-variant-option]" &&
+        element.getAttribute("data-progress-variant-option") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-progress-param]" && element.getAttribute("data-progress-param") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-progress-param-group]" && element.getAttribute("data-progress-param-group") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-progress-step-option]" && element.getAttribute("data-progress-step-option") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-candidate-choice]" && element.getAttribute("data-candidate-choice") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-candidate-index]" && element.getAttribute("data-candidate-index") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-candidate-status]" && element.getAttribute("data-candidate-status") !== null) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-candidate-subpipeline]" &&
+        element.getAttribute("data-candidate-subpipeline") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-candidate-subpipeline-body]" &&
+        element.getAttribute("data-candidate-subpipeline-body") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-candidate-subpipeline-event]" &&
+        element.getAttribute("data-candidate-subpipeline-event") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-candidate-subpipeline-toggle]" &&
+        element.getAttribute("data-candidate-subpipeline-toggle") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-candidate-substep]" &&
+        element.getAttribute("data-candidate-substep") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-process]" && element.getAttribute("data-step-process") !== null) {{
+        matches.push(element);
+      }}
+      if (selector === "[data-step-event-list]" && element.getAttribute("data-step-event-list") !== null) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-step-process-event]" &&
+        element.getAttribute("data-step-process-event") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-debug-session-field]" &&
+        element.getAttribute("data-debug-session-field") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-normal-handoff-message]" &&
+        element.getAttribute("data-normal-handoff-message") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-chat-message]" &&
+        element.getAttribute("data-chat-message") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-chat-avatar]" &&
+        element.getAttribute("data-chat-avatar") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-normal-turn]" &&
+        element.getAttribute("data-normal-turn") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-normal-process]" &&
+        element.getAttribute("data-normal-process") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-normal-process-event]" &&
+        element.getAttribute("data-normal-process-event") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-normal-answer]" &&
+        element.getAttribute("data-normal-answer") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-markdown-node]" &&
+        element.getAttribute("data-markdown-node") !== null
+      ) {{
+        matches.push(element);
+      }}
+      if (
+        selector === "[data-template-popover]" &&
+        element.getAttribute("data-template-popover") !== null
+      ) {{
+        matches.push(element);
+      }}
+    }}));
+    return matches;
+  }},
+}};
+{app_source}
+(async () => {{
+  const output = await (async () => {{
+    const controller = window.SellingConsoleController;
+    const debug = window.SellingConsoleDebug;
+    const reducers = window.SellingConsoleReducers;
+    const elementById = (id) => elements[id];
+    const all = (selector) => document.querySelectorAll(selector);
+    const text = textOf;
+    const debugText = () => debugPre.textContent;
+    {expression}
+  }})();
+  console.log(JSON.stringify(output));
+}})().catch((error) => {{
+  console.error(error && error.stack ? error.stack : String(error));
+  process.exit(1);
+}});
+"""
+    return run_node_script(script)  # `expression` runs in an async body and must `return` JSON-serializable data
+
+
+def test_reducer_maps_pipeline_steps_to_console_sections() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({serverUrl: "http://127.0.0.1:41299", cwd: "/workspace"});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    taskId: "task-1",
+    contextId: "ctx-1",
+    sequence: 3,
+    step: {id: "architecture_planning", name: "架构规划", status: "completed"}
+  }}}
+});
+return {
+  taskId: next.pipelineTaskId,
+  contextId: next.contextId,
+  sequence: next.lastSequence,
+  architectureStatus: next.steps.architecture_planning.status
+};
+"""
+    )
+    # Task id, context id and sequence are lifted from the pipeline envelope; the step ends up completed.
+    assert output == {
+        "taskId": "task-1",
+        "contextId": "ctx-1",
+        "sequence": 3,
+        "architectureStatus": "completed",
+    }
+
+
+def test_reducer_uses_event_type_to_mark_completed_step_when_envelope_status_is_working() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {
+      conclusion: {
+        scenario: "Nginx 静态站点",
+        region: "华东 1（杭州）",
+        budget: "低成本"
+      }
+    }
+  }}}
+});
+return {
+  status: next.steps.intent_parsing.status,
+  eventCount: next.steps.intent_parsing.events.length
+};
+"""
+    )
+    # The step carries no status of its own; eventType step_completed decides, not the envelope's "working".
+    assert output == {
+        "status": "completed",
+        "eventCount": 1,
+    }
+
+
+def test_reducer_keeps_parent_step_working_when_candidate_sub_step_completes() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+state.steps.evaluate_candidates.status = "working";
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimating"},
+    data: {summary: "候选方案费用已估算"}
+  }}}
+});
+return {
+  status: next.steps.evaluate_candidates.status,
+  eventCount: next.steps.evaluate_candidates.events.length
+};
+"""
+    )
+    # A candidate_step_completed event is recorded on the parent step but leaves its status at working.
+    assert output == {
+        "status": "working",
+        "eventCount": 1,
+    }
+
+
+def test_reducer_collects_candidate_details_from_tool_display() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState();
+const next = reducers.reducePipelinePayload(state, {
+  snapshot: {
+    status: "waiting_input",
+    display: {
+      candidateDetails: [{
+        candidateName: "ECS 经典网络方案",
+        candidateIndex: 0,
+        summary: "VPC + ECS + EIP",
+        totalMonthlyCost: "¥33.89/月",
+        costItems: [{name: "ECS", spec: "1vCPU/1GiB", monthly_cost: "¥33.89/月"}]
+      }]
+    },
+    pendingInput: {
+      kind: "ask_user_question",
+      prompt: "请选择方案",
+      options: [{id: "0", label: "ECS 经典网络方案"}]
+    }
+  }
+});
+return {
+  candidateCount: next.candidates.length,
+  candidateName: next.candidates[0].name,
+  candidateCost: next.candidates[0].totalMonthlyCost,
+  pendingPrompt: next.pendingInput.prompt
+};
+"""
+    )
+    # snapshot.display.candidateDetails feeds state.candidates; snapshot.pendingInput is kept as well.
+    assert output == {
+        "candidateCount": 1,
+        "candidateName": "ECS 经典网络方案",
+        "candidateCost": "¥33.89/月",
+        "pendingPrompt": "请选择方案",
+    }
+
+
+def test_reducer_preserves_zero_candidate_total_monthly_cost() -> None:
+    output = reducer_harness(
+        """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  snapshot: {
+    display: {
+      candidateDetails: [{
+        candidateName: "免费方案",
+        candidateIndex: 0,
+        totalMonthlyCost: 0
+      }]
+    }
+  }
+});
+return {
+  totalMonthlyCost: next.candidates[0].totalMonthlyCost
+};
+"""
+    )
+    # A numeric 0 cost must come through the reducer unchanged.
+    assert output == {"totalMonthlyCost": 0}
+
+
+def test_reducer_collects_candidate_details_from_detail_wrapper() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+const next = reducers.reducePipelinePayload(state, {
+  snapshot: {
+    status: "waiting_input",
+    display: {
+      candidateDetails: [{
+        detailId: "detail-1",
+        candidate: {index: 0},
+        step: {id: "confirm_and_select"},
+        detail: {
+          candidateName: "低成本 ECS 方案",
+          summary: "single ecs",
+          totalMonthlyCost: "CNY 60",
+          costItems: [{name: "ecs", monthly_cost: "CNY 60"}]
+        }
+      }]
+    }
+  }
+});
+return {
+  candidateCount: next.candidates.length,
+  firstName: next.candidates[0].name,
+  firstIndex: next.candidates[0].candidateIndex,
+  firstSummary: next.candidates[0].summary,
+  firstCost: next.candidates[0].totalMonthlyCost,
+  firstCostItemName: next.candidates[0].costItems[0].name
+};
+"""
+    )
+    # Fields nested under `detail` end up on the candidate; its index comes from `candidate.index`.
+    assert output == {
+        "candidateCount": 1,
+        "firstName": "低成本 ECS 方案",
+        "firstIndex": 0,
+        "firstSummary": "single ecs",
+        "firstCost": "CNY 60",
+        "firstCostItemName": "ecs",
+    }
+
+
+def test_reducer_collects_candidate_options_from_complete_step_conclusion() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    step: {id: "complete_step", status: "completed"},
+    data: {
+      conclusion: {
+        options: [{
+          title: "轻量应用服务器一体化方案",
+          index: 1,
+          summary: "开箱即用，管理简单。",
+          totalMonthlyCost: "¥0/月"
+        }]
+      }
+    }
+  }}}
+});
+return {
+  count: next.candidates.length,
+  name: next.candidates[0] && next.candidates[0].name,
+  index: next.candidates[0] && next.candidates[0].candidateIndex,
+  cost: next.candidates[0] && next.candidates[0].totalMonthlyCost
+};
+"""
+    )
+    # conclusion.options entries become candidates: title -> name, index -> candidateIndex.
+    assert output == {
+        "count": 1,
+        "name": "轻量应用服务器一体化方案",
+        "index": 1,
+        "cost": "¥0/月",
+    }
+
+
+def test_reducer_populates_candidate_summary_and_price_from_nested_candidate_payload() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    step: {id: "architecture_planning", status: "completed"},
+    data: {
+      conclusion: {
+        candidates: [{
+          index: 0,
+          template: "创建基础 VPC 专有网络",
+          candidate: {
+            output_path: "templates/1-basic-vpc.yml",
+            pros: "满足基础网络隔离需求、零成本、可按需扩展子网和安全组",
+            cons: "仅含 VPC，需后续手动添加 VSwitch",
+            monthly_estimate: 0
+          },
+          cost: {
+            monthly_estimate: "¥0/月",
+            currency: "CNY"
+          }
+        }]
+      }
+    }
+  }}}
+});
+return {
+  count: next.candidates.length,
+  name: next.candidates[0].name,
+  summary: next.candidates[0].summary,
+  totalMonthlyCost: next.candidates[0].totalMonthlyCost,
+  outputPath: next.candidates[0].outputPath
+};
+"""
+    )
+    # The string in cost.monthly_estimate is expected, not the numeric candidate.monthly_estimate.
+    assert output == {
+        "count": 1,
+        "name": "创建基础 VPC 专有网络",
+        "summary": "满足基础网络隔离需求、零成本、可按需扩展子网和安全组",
+        "totalMonthlyCost": "¥0/月",
+        "outputPath": "templates/1-basic-vpc.yml",
+    }
+
+
+def test_reducer_collects_step_two_draft_candidates_from_architecture_completion() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    step: {id: "architecture_planning", status: "completed"},
+    data: {
+      conclusion: {
+        draft_candidates: [{
+          candidate_index: 0,
+          candidate_name: "基础 VPC 网络",
+          first_version_description: "创建一个基础 VPC，作为后续云资源的网络容器。",
+          rough_monthly_estimate: "¥0/月"
+        }]
+      }
+    }
+  }}}
+});
+return {
+  count: next.candidates.length,
+  name: next.candidates[0] && next.candidates[0].name,
+  summary: next.candidates[0] && next.candidates[0].summary,
+  cost: next.candidates[0] && next.candidates[0].totalMonthlyCost
+};
+"""
+    )
+    # draft_candidates: first_version_description -> summary, rough_monthly_estimate -> cost.
+    assert output == {
+        "count": 1,
+        "name": "基础 VPC 网络",
+        "summary": "创建一个基础 VPC，作为后续云资源的网络容器。",
+        "cost": "¥0/月",
+    }
+
+
+def test_reducer_updates_candidate_summary_and_price_from_candidate_completed_event() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+state.candidates = [{candidateIndex: 0, name: "基础 VPC 网络"}];
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {
+      candidate_name: "基础 VPC 网络",
+      summary: "VPC 本身免费，适合作为后续子网和云资源的基础容器。",
+      total_monthly_cost: "¥0/月"
+    }
+  }}}
+});
+return {
+  count: next.candidates.length,
+  name: next.candidates[0].name,
+  summary: next.candidates[0].summary,
+  cost: next.candidates[0].totalMonthlyCost,
+  subEventKind: next.candidates[0].subEvents[0].eventType
+};
+"""
+    )
+    # The pre-seeded candidate 0 is updated rather than duplicated, and the event is kept in subEvents.
+    assert output == {
+        "count": 1,
+        "name": "基础 VPC 网络",
+        "summary": "VPC 本身免费，适合作为后续子网和云资源的基础容器。",
+        "cost": "¥0/月",
+        "subEventKind": "candidate_completed",
+    }
+
+
+def test_reducer_updates_candidate_from_nested_candidate_completed_conclusions() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+state.candidates = [{
+  candidateIndex: 0,
+  name: "经济型演示方案",
+  summary: "成本最低，适合个人演示场景",
+  totalMonthlyCost: "¥50 - ¥80"
+}];
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0, name: "经济型演示方案"},
+    data: {
+      candidateIndex: 0,
+      candidateName: "经济型演示方案",
+      conclusions: {
+        template: {
+          file_path: "templates/1-economy-nginx.yml",
+          description: "经济型 Nginx 演示环境 - VPC 内单可用区部署一台 ECS。"
+        },
+        cost: {
+          monthly_estimate: "¥74/月",
+          resources: [
+            {type: "ECS 实例", cost: "¥34/月"},
+            {type: "系统盘", cost: "¥40/月"}
+          ]
+        }
+      }
+    }
+  }}}
+});
+return {
+  count: next.candidates.length,
+  name: next.candidates[0].name,
+  summary: next.candidates[0].summary,
+  cost: next.candidates[0].totalMonthlyCost,
+  outputPath: next.candidates[0].outputPath,
+  costItemCount: next.candidates[0].costItems.length
+};
+"""
+    )
+    # conclusions.template/cost replace the seeded summary and cost; two cost items are expected.
+    assert output == {
+        "count": 1,
+        "name": "经济型演示方案",
+        "summary": "经济型 Nginx 演示环境 - VPC 内单可用区部署一台 ECS。",
+        "cost": "¥74/月",
+        "outputPath": "templates/1-economy-nginx.yml",
+        "costItemCount": 2,
+    }
+
+
+def test_reducer_collects_snake_case_candidate_index_from_conclusion_options() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    step: {id: "complete_step", status: "completed"},
+    data: {
+      conclusion: {
+        options: [{
+          title: "低成本 ECS 方案",
+          candidate_index: 3,
+          total_monthly_cost: "¥33.89/月"
+        }]
+      }
+    }
+  }}}
+});
+reducers.selectCandidate(next, next.candidates[0].candidateIndex);
+return {
+  count: next.candidates.length,
+  index: next.candidates[0].candidateIndex,
+  cost: next.candidates[0].totalMonthlyCost,
+  prompt: reducers.promptForSelectedCandidate(next)
+};
+"""
+    )
+    # candidate_index 3 is kept as the candidate's index and appears in the selection prompt.
+    assert output == {
+        "count": 1,
+        "index": 3,
+        "cost": "¥33.89/月",
+        "prompt": "选择方案3",
+    }
+
+
+def test_reducer_does_not_mutate_original_state() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({serverUrl: "http://server", cwd: "/workspace"});
+const originalStep = state.steps.architecture_planning;
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    taskId: "task-1",
+    contextId: "ctx-1",
+    sequence: 1,
+    step: {id: "architecture_planning", status: "completed"}
+  }}}
+});
+return {
+  sameState: next === state,
+  sameSteps: next.steps === state.steps,
+  sameStep: next.steps.architecture_planning === originalStep,
+  originalTaskId: state.pipelineTaskId,
+  originalStepStatus: state.steps.architecture_planning.status,
+  originalEventCount: state.steps.architecture_planning.events.length,
+  nextTaskId: next.pipelineTaskId,
+  nextStepStatus: next.steps.architecture_planning.status,
+  nextEventCount: next.steps.architecture_planning.events.length
+};
+"""
+    )
+    # The input state stays at its initial values; the result uses new state, steps and step objects.
+    assert output == {
+        "sameState": False,
+        "sameSteps": False,
+        "sameStep": False,
+        "originalTaskId": "",
+        "originalStepStatus": "pending",
+        "originalEventCount": 0,
+        "nextTaskId": "task-1",
+        "nextStepStatus": "completed",
+        "nextEventCount": 1,
+    }
+
+
+def test_reducer_collects_realtime_candidate_detail_event() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    taskId: "task-1",
+    contextId: "ctx-1",
+    sequence: 7,
+    step: {id: "confirm_and_select", status: "working"},
+    candidate: {index: 0},
+    data: {
+      detailId: "detail-1",
+      detail: {
+        candidateName: "低成本 ECS 方案",
+        summary: "single ecs",
+        totalMonthlyCost: "CNY 60",
+        costItems: [{name: "ecs", monthly_cost: "CNY 60"}]
+      }
+    }
+  }}}
+});
+return {
+  count: next.candidates.length,
+  name: next.candidates[0].name,
+  index: next.candidates[0].candidateIndex,
+  cost: next.candidates[0].totalMonthlyCost,
+  eventCount: next.steps.confirm_and_select.events.length
+};
+"""
+    )
+    # A candidate_detail_shown event both creates the candidate and is logged on confirm_and_select.
+    assert output == {
+        "count": 1,
+        "name": "低成本 ECS 方案",
+        "index": 0,
+        "cost": "CNY 60",
+        "eventCount": 1,
+    }
+
+
+def test_reducer_does_not_retain_mutable_candidate_event_payload_references() -> None:
+    output = reducer_harness(
+        """
+const costItems = [{name: "ecs"}];
+const payload = {metadata: {iac_code: {pipeline: {
+  eventType: "candidate_detail_shown",
+  status: "working",
+  taskId: "task-1",
+  contextId: "ctx-1",
+  sequence: 7,
+  step: {id: "confirm_and_select", status: "working"},
+  candidate: {index: 0},
+  data: {
+    detailId: "detail-1",
+    detail: {
+      candidateName: "低成本 ECS 方案",
+      totalMonthlyCost: "CNY 60",
+      costItems
+    }
+  }
+}}}};
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), payload);
+costItems[0].name = "mutated";
+payload.metadata.iac_code.pipeline.data.detail.candidateName = "被污染";
+return {
+  eventName: next.steps.confirm_and_select.events[0].data.detail.candidateName,
+  eventCostItemName: next.steps.confirm_and_select.events[0].data.detail.costItems[0].name,
+  candidateName: next.candidates[0].name,
+  candidateCostItemName: next.candidates[0].costItems[0].name
+};
+"""
+    )
+    # Mutating the payload after reduction must not show up in the stored event or the candidate.
+    assert output == {
+        "eventName": "低成本 ECS 方案",
+        "eventCostItemName": "ecs",
+        "candidateName": "低成本 ECS 方案",
+        "candidateCostItemName": "ecs",
+    }
+
+
+def test_reducer_clones_existing_step_events_when_cloning_state() -> None:
+    output = reducer_harness(
+        """
+const state = reducers.createInitialState({});
+state.steps.confirm_and_select.events.push({
+  eventType: "candidate_detail_shown",
+  data: {detail: {candidateName: "旧事件", costItems: [{name: "ecs"}]}}
+});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    step: {id: "architecture_planning", status: "completed"}
+  }}}
+});
+state.steps.confirm_and_select.events[0].data.detail.candidateName = "mutated";
+state.steps.confirm_and_select.events[0].data.detail.costItems[0].name = "mutated";
+return {
+  sameEvent: next.steps.confirm_and_select.events[0] === state.steps.confirm_and_select.events[0],
+  eventName: next.steps.confirm_and_select.events[0].data.detail.candidateName,
+  costItemName: next.steps.confirm_and_select.events[0].data.detail.costItems[0].name
+};
+"""
+    )
+    # Events already on the input state are copied, so later mutation of the old state does not leak.
+    assert output == {
+        "sameEvent": False,
+        "eventName": "旧事件",
+        "costItemName": "ecs",
+    }
+
+
+def test_upsert_candidate_deep_clones_nested_payload() -> None:
+    """``upsertCandidate`` stores a deep copy, so later edits to the input's nested fields stay invisible."""
+    script = """
+const state = reducers.createInitialState({});
+const candidate = {
+  name: "方案",
+  candidateIndex: 0,
+  metadata: {source: {tool: "planner"}},
+  costItems: [{name: "ecs", detail: {region: "cn-hangzhou"}}]
+};
+const next = reducers.upsertCandidate(state, candidate);
+candidate.name = "mutated";
+candidate.metadata.source.tool = "mutated";
+candidate.costItems[0].detail.region = "mutated";
+return {
+  name: next.candidates[0].name,
+  tool: next.candidates[0].metadata.source.tool,
+  region: next.candidates[0].costItems[0].detail.region
+};
+"""
+    observed = reducer_harness(script)
+    expected = {
+        "name": "方案",
+        "tool": "planner",
+        "region": "cn-hangzhou",
+    }
+    assert observed == expected
+
+
+def test_reducer_events_only_payload_does_not_duplicate_first_event() -> None:
+    """An ``events``-only payload records each event once on its step and keeps the last sequence."""
+    script = """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  events: [
+    {eventType: "step_completed", sequence: 1, step: {id: "architecture_planning", status: "completed"}},
+    {eventType: "step_completed", sequence: 2, step: {id: "evaluate_candidates", status: "completed"}}
+  ]
+});
+return {
+  architectureEvents: next.steps.architecture_planning.events.length,
+  evaluateEvents: next.steps.evaluate_candidates.events.length,
+  lastSequence: next.lastSequence
+};
+"""
+    observed = reducer_harness(script)
+    expected = {
+        "architectureEvents": 1,
+        "evaluateEvents": 1,
+        "lastSequence": 2,
+    }
+    assert observed == expected
+
+
+def test_create_initial_state_does_not_alias_defaults_object() -> None:
+    """``createInitialState`` copies the defaults object instead of keeping a reference to it."""
+    script = """
+const defaults = {serverUrl: "http://server", cwd: "/workspace", nested: {mode: "x"}};
+const state = reducers.createInitialState(defaults);
+defaults.serverUrl = "mutated";
+defaults.nested.mode = "mutated";
+return {
+  serverUrl: state.serverUrl,
+  defaultsServerUrl: state.defaults.serverUrl,
+  defaultsMode: state.defaults.nested.mode
+};
+"""
+    observed = reducer_harness(script)
+    expected = {
+        "serverUrl": "http://server",
+        "defaultsServerUrl": "http://server",
+        "defaultsMode": "x",
+    }
+    assert observed == expected
+
+
+def test_reducer_clones_existing_defaults_when_cloning_state() -> None:
+    """``reducePipelinePayload`` returns state whose ``defaults`` is a separate deep copy."""
+    script = """
+const state = reducers.createInitialState({serverUrl: "http://server", cwd: "/workspace", nested: {mode: "x"}});
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    step: {id: "architecture_planning", status: "completed"}
+  }}}
+});
+state.defaults.nested.mode = "mutated";
+return {
+  sameDefaults: next.defaults === state.defaults,
+  nextMode: next.defaults.nested.mode
+};
+"""
+    observed = reducer_harness(script)
+    expected = {
+        "sameDefaults": False,
+        "nextMode": "x",
+    }
+    assert observed == expected
+
+
+def test_build_stream_payload_uses_active_task_before_handoff() -> None:
+    """``buildStreamPayload`` sends ``activeTaskId`` until ``normalHandoffReady`` is set, then an empty task id."""
+    script = """
+const state = reducers.createInitialState({serverUrl: "http://server", cwd: "/workspace"});
+state.contextId = "ctx-1";
+state.pipelineTaskId = "pipeline-task";
+state.activeTaskId = "active-task";
+const beforeHandoff = reducers.buildStreamPayload(state, "部署 nginx");
+state.normalHandoffReady = true;
+const afterHandoff = reducers.buildStreamPayload(state, "继续部署");
+return {
+  beforeHandoff,
+  afterHandoff
+};
+"""
+    observed = reducer_harness(script)
+    expected = {
+        "beforeHandoff": {
+            "serverUrl": "http://server",
+            "cwd": "/workspace",
+            "contextId": "ctx-1",
+            "taskId": "active-task",
+            "prompt": "部署 nginx",
+        },
+        "afterHandoff": {
+            "serverUrl": "http://server",
+            "cwd": "/workspace",
+            "contextId": "ctx-1",
+            "taskId": "",
+            "prompt": "继续部署",
+        },
+    }
+    assert observed == expected
+
+
+def test_candidate_selection_prompt_uses_zero_based_index() -> None:
+    """``selectCandidate`` returns the same state object and the prompt embeds the zero-based index."""
+    script = """
+const state = reducers.createInitialState({});
+state.candidates = [
+  {name: "ECS 经典网络方案", candidateIndex: 0},
+  {name: "轻量应用服务器一体化方案", candidateIndex: 1}
+];
+const selected = reducers.selectCandidate(state, 1);
+return {
+  sameState: selected === state,
+  selected: state.selectedCandidateIndex,
+  prompt: reducers.promptForSelectedCandidate(state),
+  emptyPrompt: reducers.promptForSelectedCandidate(reducers.createInitialState({}))
+};
+"""
+    observed = reducer_harness(script)
+    expected = {
+        "sameState": True,
+        "selected": 1,
+        "prompt": "选择方案1",
+        "emptyPrompt": "",
+    }
+    assert observed == expected
+
+
+def test_controller_initially_hides_left_steps_and_composer_progress() -> None:
+    """Right after ``init`` there are no step rows or progress steps and the composer progress is hidden."""
+    script = """
+controller.init();
+const leftSteps = all("[data-step-id]");
+const progressSteps = all("[data-progress-step]");
+return {
+  leftStepCount: leftSteps.length,
+  progressCount: progressSteps.length,
+  progressHidden: elementById("composer-progress").hidden,
+  variant: elementById("composer-progress").getAttribute("data-progress-variant"),
+  progressText: text(elementById("composer-progress"))
+};
+"""
+    observed = controller_harness(script)
+    expected = {
+        "leftStepCount": 0,
+        "progressCount": 0,
+        "progressHidden": True,
+        "variant": "b",
+        "progressText": "",
+    }
+    assert observed == expected
+
+
+def test_controller_reveals_composer_progress_after_pipeline_started() -> None:
+    """A ``pipeline_started`` event un-hides the composer progress and renders five pending steps."""
+    script = """
+controller.init();
+const initialHidden = elementById("composer-progress").hidden;
+const next = reducers.reducePipelinePayload(debug.state(), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "pipeline_started",
+    status: "working",
+    taskId: "task-1"
+  }}}
+});
+Object.assign(debug.state(), next);
+debug.render();
+const progressSteps = all("[data-progress-step]");
+return {
+  initialHidden,
+  progressHidden: elementById("composer-progress").hidden,
+  mode: elementById("composer-progress").getAttribute("data-progress-mode"),
+  progressCount: progressSteps.length,
+  progressStatuses: progressSteps.map((step) => step.getAttribute("data-status")),
+  progressText: text(elementById("composer-progress"))
+};
+"""
+    observed = controller_harness(script)
+    expected = {
+        "initialHidden": True,
+        "progressHidden": False,
+        "mode": "pipeline",
+        "progressCount": 5,
+        "progressStatuses": ["pending", "pending", "pending", "pending", "pending"],
+        "progressText": "需求理解架构规划方案评估方案选择确认部署",
+    }
+    assert observed == expected
+
+
+def test_selling_console_chat_column_is_two_thirds_original_width() -> None:
+    """The stylesheet contains both expected ``grid-template-columns`` declarations."""
+    stylesheet = STYLES_CSS.read_text(encoding="utf-8")
+    assert "grid-template-columns: minmax(280px, 400px) minmax(0, 1fr) 56px;" in stylesheet
+    assert "grid-template-columns: minmax(240px, 347px) minmax(0, 1fr);" in stylesheet
+
+
+def test_selling_console_removes_left_ai_navigation_rail() -> None:
+    """Neither ``index.html`` nor the stylesheet mentions the AI rail markup or its classes."""
+    page = (APP_JS.parent / "index.html").read_text(encoding="utf-8")
+    stylesheet = STYLES_CSS.read_text(encoding="utf-8")
+    assert 'class="ai-rail"' not in page
+    assert "rail-bot" not in page
+    assert "rail-button" not in page
+    assert ".ai-rail" not in stylesheet
+
+
+def test_selling_console_left_chat_scrolls_without_moving_composer() -> None:
+    """The workflow panel clips overflow, the step list scrolls, and the composer keeps a fixed flex basis."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    workflow_decls = sheet.split(".workflow-panel {", 1)[1].partition("}")[0]
+    step_list_decls = sheet.split(".step-list {", 1)[1].partition("}")[0]
+    completed_decls = sheet.split(".step-card.completed {", 1)[1].partition("}")[0]
+    composer_decls = sheet.split(".composer {", 1)[1].partition("}")[0]
+    assert "height: calc(100vh - 96px);" in workflow_decls
+    assert "overflow: hidden;" in workflow_decls
+    assert "align-content: start;" in step_list_decls
+    assert "align-items: start;" in step_list_decls
+    assert "overflow-y: auto;" in step_list_decls
+    assert "min-height: 0;" in step_list_decls
+    assert "flex: 1 1 auto;" in step_list_decls
+    assert "gap: 5px;" in step_list_decls
+    assert "padding: 8px 14px;" in step_list_decls
+    assert "grid-template-columns: 24px 1fr;" in completed_decls
+    assert "padding: 6px 8px;" in completed_decls
+    assert "flex: 0 0 auto;" in composer_decls
+    assert "border-top:" not in composer_decls
+
+
+def test_selling_console_chat_messages_have_im_layout_and_avatars() -> None:
+    """The stylesheet mentions user and system variants of chat messages and chat avatars."""
+    stylesheet = STYLES_CSS.read_text(encoding="utf-8")
+    assert ".chat-message.user" in stylesheet
+    assert ".chat-message.system" in stylesheet
+    assert ".chat-avatar.system" in stylesheet
+    assert ".chat-avatar.user" in stylesheet
+
+
+def test_selling_console_chat_and_progress_use_compact_spacing() -> None:
+    """Chat, step title, composer and signal-circuit rules carry the expected spacing declarations."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    chat_message_decls = sheet.split(".chat-message {", 1)[1].partition("}")[0]
+    step_title_decls = sheet.split(".step-card h2 {", 1)[1].partition("}")[0]
+    composer_decls = sheet.split(".composer {", 1)[1].partition("}")[0]
+    progress_decls = sheet.split(".composer-progress:not([hidden]) {", 1)[1].partition("}")[0]
+    circuit_decls = sheet.split(".signal-circuit {", 1)[1].partition("}")[0]
+    svg_decls = sheet.split(".signal-svg {", 1)[1].partition("}")[0]
+    labels_decls = sheet.split(".signal-labels {", 1)[1].partition("}")[0]
+    assert "gap: 7px;" in chat_message_decls
+    assert "font-size: 13px;" in step_title_decls
+    assert "padding: 6px 14px 10px;" in composer_decls
+    assert "margin-bottom: 8px;" in progress_decls
+    assert "padding-bottom: 8px;" in progress_decls
+    assert "height: 50px;" in circuit_decls
+    assert "height: 36px;" in svg_decls
+    assert "top: 32px;" in labels_decls
+
+
+def test_selling_console_step_rows_hide_sequence_numbers_and_use_compact_marker() -> None:
+    """The app script never mentions ``step-number`` and ``.step-index`` is a 22px square."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    marker_decls = sheet.split(".step-index {", 1)[1].partition("}")[0]
+    assert "step-number" not in APP_JS.read_text(encoding="utf-8")
+    assert "width: 22px;" in marker_decls
+    assert "height: 22px;" in marker_decls
+
+
+def test_selling_console_left_intro_and_top_alert_are_visually_hidden() -> None:
+    """Both ``.panel-heading`` and ``.status-alert`` rules declare ``display: none``."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    heading_decls = sheet.split(".panel-heading {", 1)[1].partition("}")[0]
+    alert_decls = sheet.split(".status-alert {", 1)[1].partition("}")[0]
+    assert "display: none;" in heading_decls
+    assert "display: none;" in alert_decls
+
+
+def test_selling_console_composer_uses_compact_input_box() -> None:
+    """The composer markup and its CSS rules (including the 560px media query) match the compact input box."""
+    page = (APP_JS.parent / "index.html").read_text(encoding="utf-8")
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    composer_decls = sheet.split(".composer {", 1)[1].partition("}")[0]
+    box_decls = sheet.split(".composer-box {", 1)[1].partition("}")[0]
+    input_decls = sheet.split("#composer-input {", 1)[1].partition("}")[0]
+    send_decls = sheet.split(".send-icon-button {", 1)[1].partition("}")[0]
+    mobile_section = sheet.split("@media (max-width: 560px)", 1)[1].partition(".plan-meta")[0]
+    assert 'class="composer-box"' in page
+    assert 'rows="2"' in page
+    assert 'placeholder="继续补充您的需求，比如降低成本、提升可用性或约束地域"' in page
+    assert 'aria-label="附件"' in page
+    assert 'aria-label="发送"' in page
+    assert "padding: 6px 14px 10px;" in composer_decls
+    assert "padding: 10px 10px 9px;" in box_decls
+    assert "min-height: 40px;" in input_decls
+    assert "border: 0;" in input_decls
+    assert "resize: none;" in input_decls
+    assert "width: 36px;" in send_decls
+    assert "height: 36px;" in send_decls
+    assert ".composer .send-icon-button" in mobile_section
+    assert "width: 36px;" in mobile_section
+    assert ".composer .icon-only-button" in mobile_section
+    assert "width: 32px;" in mobile_section
+
+
+def test_selling_console_connection_controls_live_in_debug_panel() -> None:
+    """Connection controls are absent from the plan header and present in the debug panel intro markup."""
+    page = (APP_JS.parent / "index.html").read_text(encoding="utf-8")
+    after_plan_header = page.split('<div class="plan-header">', 1)[1]
+    plan_header = after_plan_header.partition('<div id="plans-grid"')[0]
+    after_debug_panel = page.split('<div class="debug-panel">', 1)[1]
+    debug_panel_intro = after_debug_panel.partition('<div id="progress-debug-panel"')[0]
+
+    assert 'class="connection-controls"' not in plan_header
+    assert 'class="connection-controls"' in debug_panel_intro
+
+
+def test_selling_console_pipeline_diagnostics_output_is_collapsed_by_default() -> None:
+    """Pipeline Diagnostics is a ``<details>`` summary without the ``open`` attribute, not an ``<h2>``."""
+    page = (APP_JS.parent / "index.html").read_text(encoding="utf-8")
+    details_body = page.split('<details class="debug-output-block">', 1)[1].partition("</details>")[0]
+    assert "<summary>Pipeline Diagnostics</summary>" in details_body
+    assert '<details class="debug-output-block" open' not in page
+    assert "<h2>Pipeline Diagnostics</h2>" not in page
+
+
+def test_selling_console_has_handoff_notice_and_debug_session_info_slots() -> None:
+    """``index.html`` has the debug session info slot; ``normal-handoff-notice`` must be absent from it."""
+    page = (APP_JS.parent / "index.html").read_text(encoding="utf-8")
+    assert 'id="normal-handoff-notice"' not in page
+    assert 'id="debug-session-info"' in page
+    assert 'class="debug-session-info"' in page
+
+
+def test_selling_console_candidate_subpipeline_body_is_height_limited() -> None:
+    """Text after the first ``.candidate-subpipeline-body`` mention sets a max height and vertical scroll."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    assert ".candidate-subpipeline-body" in sheet
+    body_decls = sheet.split(".candidate-subpipeline-body", 1)[1].partition("}")[0]
+    assert "max-height:" in body_decls
+    assert "overflow-y: auto;" in body_decls
+
+
+def test_selling_console_running_step_event_list_is_height_limited() -> None:
+    """The ``.step-event-list`` rule sets a max height and vertical scrolling."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    list_decls = sheet.split(".step-event-list {", 1)[1].partition("}")[0]
+    assert "max-height:" in list_decls
+    assert "overflow-y: auto;" in list_decls
+
+
+def test_selling_console_template_popover_can_be_entered_and_scrolled() -> None:
+    """The template popover has hover selectors, scrolls, accepts pointer events and sets transition delays."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    base_decls = sheet.split(".template-popover {", 1)[1].partition("}")[0]
+    hover_decls = sheet.split(".template-popover:hover {", 1)[1].partition("}")[0]
+    assert ".template-popover-host:hover .template-popover" in sheet
+    assert ".template-popover:hover" in sheet
+    assert "max-height:" in base_decls
+    assert "overflow-y: auto;" in base_decls
+    assert "pointer-events: auto;" in base_decls
+    assert "transition-delay: 0ms, 0ms, 140ms;" in base_decls
+    assert "transition-delay: 500ms, 500ms, 500ms;" in hover_decls
+
+
+def test_selling_console_plan_grid_keeps_cards_top_aligned_when_process_expands() -> None:
+    """The text following the first ``.plans-grid`` mention declares ``align-items: start``."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    grid_decls = sheet.split(".plans-grid", 1)[1].partition("}")[0]
+    assert "align-items: start;" in grid_decls
+
+
+def test_selling_console_composer_progress_uses_separator_instead_of_floating_panel() -> None:
+    """Visible composer progress has only a bottom border: no top border, shadow or background."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    assert ".composer-progress[hidden]" in sheet
+    assert ".composer-progress:not([hidden])" in sheet
+    visible_decls = sheet.split(".composer-progress:not([hidden])", 1)[1].partition("}")[0]
+    assert "border-bottom: 1px solid var(--line);" in visible_decls
+    assert "border-top:" not in visible_decls
+    assert "box-shadow:" not in visible_decls
+    assert "background:" not in visible_decls
+
+
+def test_selling_console_progress_variants_match_unframed_visual_requirements() -> None:
+    """Chevron rules carry the expected sizing and ``.signal-circuit`` has no border or background."""
+    sheet = STYLES_CSS.read_text(encoding="utf-8")
+    chevron_root_decls = sheet.split(".composer-progress.chevrons {", 1)[1].partition("}")[0]
+    chevron_step_decls = sheet.split(".chevrons .step {", 1)[1].partition("}")[0]
+    circuit_decls = sheet.split(".signal-circuit {", 1)[1].partition("}")[0]
+    assert "height: 32px;" in chevron_root_decls
+    assert "font-size: 10px;" in chevron_step_decls
+    assert "padding: 0 10px 0 14px;" in chevron_step_decls
+    assert "border:" not in circuit_decls
+    assert "background:" not in circuit_decls
+
+
+def test_selling_console_progress_debug_panel_declares_three_adjustable_variants() -> None:
+    """The debug drawer starts closed and offers variants a/b/d with their parameters, b pressed by default."""
+    page = (APP_JS.parent / "index.html").read_text(encoding="utf-8")
+    assert '<details id="debug-drawer" class="debug-drawer">' in page
+    assert '<details id="debug-drawer" class="debug-drawer" open' not in page
+    assert 'id="progress-debug-panel"' in page
+    assert 'id="debug-output"' in page
+
+    script = """
+controller.init();
+const variantButtons = all("[data-progress-variant-option]").map((button) => ({
+  variant: button.getAttribute("data-progress-variant-option"),
+  pressed: button.getAttribute("aria-pressed"),
+  text: text(button)
+}));
+const paramGroups = all("[data-progress-param-group]").map((group) => ({
+  variant: group.getAttribute("data-progress-param-group"),
+  hidden: group.hidden
+}));
+const params = all("[data-progress-param]").map((input) => ({
+  name: input.getAttribute("data-progress-param"),
+  variant: input.getAttribute("data-progress-param-variant"),
+  value: input.value
+}));
+return {
+  progressVariant: elementById("composer-progress").getAttribute("data-progress-variant"),
+  variantButtons,
+  paramGroups,
+  params
+};
+"""
+    result = controller_harness(script)
+
+    assert result["progressVariant"] == "b"
+    assert result["variantButtons"] == [
+        {"variant": "a", "pressed": "false", "text": "A 箭头轨道"},
+        {"variant": "b", "pressed": "true", "text": "B 脉冲线路"},
+        {"variant": "d", "pressed": "false", "text": "D 输入框融合"},
+    ]
+    assert result["paramGroups"] == [
+        {"variant": "a", "hidden": True},
+        {"variant": "b", "hidden": False},
+        {"variant": "d", "hidden": True},
+    ]
+    assert {"variant": "a", "name": "sweepMs", "value": "1800"} in result["params"]
+    assert {"variant": "b", "name": "xPercent", "value": "28"} in result["params"]
+    assert {"variant": "b", "name": "yPercent", "value": "49"} in result["params"]
+    assert {"variant": "b", "name": "t1", "value": "140"} in result["params"]
+    assert {"variant": "b", "name": "t2", "value": "540"} in result["params"]
+    assert {"variant": "b", "name": "maxAmplitude", "value": "9"} in result["params"]
+    assert {"variant": "b", "name": "pauseTime", "value": "510"} in result["params"]
+    assert {"variant": "d", "name": "t1", "value": "1800"} in result["params"]
+    assert {"variant": "d", "name": "t2", "value": "300"} in result["params"]
+    assert all(param["name"] not in {"shineWidth", "lineWidth", "sweepWidth"} for param in result["params"])
+
+
+def test_selling_console_progress_debug_panel_switches_variant_and_updates_param() -> None:
+    """Clicking variant d shows only its parameter group; editing its ``t1`` input updates state and the input."""
+    script = """
+controller.init();
+const optionD = all("[data-progress-variant-option]").find((button) =>
+  button.getAttribute("data-progress-variant-option") === "d"
+);
+optionD.click();
+const afterSwitch = {
+  progressVariant: elementById("composer-progress").getAttribute("data-progress-variant"),
+  groups: all("[data-progress-param-group]").map((group) => ({
+    variant: group.getAttribute("data-progress-param-group"),
+    hidden: group.hidden
+  }))
+};
+const dT1 = all("[data-progress-param]").find((input) =>
+  input.getAttribute("data-progress-param-variant") === "d" &&
+  input.getAttribute("data-progress-param") === "t1"
+);
+dT1.value = "2200";
+(dT1.listeners.input || []).forEach((listener) => listener({type: "input"}));
+return {
+  afterSwitch,
+  progressVariant: elementById("composer-progress").getAttribute("data-progress-variant"),
+  stateValue: debug.state().progressUi.d.t1,
+  renderedValue: all("[data-progress-param]").find((input) =>
+    input.getAttribute("data-progress-param-variant") === "d" &&
+    input.getAttribute("data-progress-param") === "t1"
+  ).value
+};
+"""
+    observed = controller_harness(script)
+    expected = {
+        "afterSwitch": {
+            "progressVariant": "d",
+            "groups": [
+                {"variant": "a", "hidden": True},
+                {"variant": "b", "hidden": True},
+                {"variant": "d", "hidden": False},
+            ],
+        },
+        "progressVariant": "d",
+        "stateValue": 2200,
+        "renderedValue": "2200",
+    }
+    assert observed == expected
+
+
+def test_selling_console_debug_step_is_isolated_from_pipeline_progress() -> None:
+    """The debug step drives progress only while the drawer is open; pipeline events use their own index."""
+    script = """
+controller.init();
+const drawer = elementById("debug-drawer");
+const progress = elementById("composer-progress");
+const initial = {
+  hidden: progress.hidden,
+  stepCount: all("[data-progress-step]").length
+};
+drawer.open = true;
+(drawer.listeners.toggle || []).forEach((listener) => listener({type: "toggle"}));
+all("[data-progress-step-option]")[3].click();
+const debugOpen = {
+  hidden: progress.hidden,
+  mode: progress.getAttribute("data-progress-mode"),
+  activeIndex: progress.children[0].getAttribute("data-active-index"),
+  debugStep: debug.state().progressUi.activeStepIndex
+};
+drawer.open = false;
+(drawer.listeners.toggle || []).forEach((listener) => listener({type: "toggle"}));
+const closed = {
+  hidden: progress.hidden,
+  stepCount: all("[data-progress-step]").length,
+  debugStep: debug.state().progressUi.activeStepIndex
+};
+const next = reducers.reducePipelinePayload(debug.state(), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "intent_parsing"}
+  }}}
+});
+Object.assign(debug.state(), next);
+debug.render();
+const pipeline = {
+  hidden: progress.hidden,
+  mode: progress.getAttribute("data-progress-mode"),
+  activeIndex: progress.children[0].getAttribute("data-active-index"),
+  debugStep: debug.state().progressUi.activeStepIndex
+};
+return {initial, debugOpen, closed, pipeline};
+"""
+    observed = controller_harness(script)
+    expected = {
+        "initial": {"hidden": True, "stepCount": 0},
+        "debugOpen": {"hidden": False, "mode": "debug", "activeIndex": "3", "debugStep": 3},
+        "closed": {"hidden": True, "stepCount": 0, "debugStep": 3},
+        "pipeline": {"hidden": False, "mode": "pipeline", "activeIndex": "0", "debugStep": 3},
+    }
+    assert observed == expected
+
+
+def test_selling_console_progress_variants_use_prototype_dom_classes() -> None:
+    """Variants b, a and d render ``signal-circuit``, ``chevrons``/``step`` and ``fusion-label`` classes."""
+    script = """
+controller.init();
+const drawer = elementById("debug-drawer");
+drawer.open = true;
+(drawer.listeners.toggle || []).forEach((listener) => listener({type: "toggle"}));
+const progress = elementById("composer-progress");
+const bClass = progress.children[0].getAttribute("class");
+all("[data-progress-variant-option]")
+  .find((button) => button.getAttribute("data-progress-variant-option") === "a")
+  .click();
+const aRootClass = progress.getAttribute("class");
+const aStepClasses = progress.children.map((child) => child.getAttribute("class"));
+all("[data-progress-variant-option]")
+  .find((button) => button.getAttribute("data-progress-variant-option") === "d")
+  .click();
+const dClass = progress.children[0].getAttribute("class");
+return {
+  bClass,
+  aRootClass,
+  aStepClasses,
+  dClass
+};
+"""
+    result = controller_harness(script)
+
+    assert result["bClass"] == "signal-circuit"
+    assert "chevrons" in result["aRootClass"]
+    assert result["aStepClasses"][0].startswith("step ")
+    assert result["dClass"] == "fusion-label"
+
+
+def test_selling_console_progress_uses_pipeline_active_step_when_debug_step_is_unset() -> None:
+    """After loading demo candidates, progress reports active index 3 while the debug step stays unset."""
+    script = """
+controller.init();
+debug.loadDemoCandidates();
+const progress = elementById("composer-progress");
+return {
+  activeIndex: progress.children[0].getAttribute("data-active-index"),
+  uiActiveStepIndex: debug.state().progressUi.activeStepIndex
+};
+"""
+    observed = controller_harness(script)
+    expected = {
+        "activeIndex": "3",
+        "uiActiveStepIndex": None,
+    }
+    assert observed == expected
+
+
+def test_controller_reveals_running_step_events_then_collapses_completed_conclusion() -> None:
+    """A running step shows its events; once completed it collapses to a title whose toggle shows result fields."""
+    script = """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {summary: "开始理解需求"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {text: "正在分析地域与预算"}
+  }}}
+});
+const runningText = text(all("[data-step-id]")[0]);
+const runningProgress = all("[data-progress-step]").map((step) => ({
+  id: step.getAttribute("data-progress-step"),
+  status: step.getAttribute("data-status")
+}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {
+      conclusion: {
+        scenario: "Nginx 静态站点",
+        region: "华东 1（杭州）",
+        budget: "低成本"
+      }
+    }
+  }}}
+});
+const completedText = text(all("[data-step-id]")[0]);
+const resultFields = all("[data-step-result-field]").map((field) => ({
+  field: field.getAttribute("data-step-result-field"),
+  text: text(field)
+}));
+const completedEvents = all("[data-step-event-kind]").map((event) => event.getAttribute("data-step-event-kind"));
+const stateIcons = all("[data-step-state-icon]").map((icon) => ({
+  state: icon.getAttribute("data-step-state-icon"),
+  text: text(icon)
+}));
+const toggles = all("[data-step-toggle]");
+toggles[0].click();
+const expandedText = text(all("[data-step-id]")[0]);
+const expandedFields = all("[data-step-result-field]").map((field) => text(field));
+toggles[0].click();
+const recollapsedText = text(all("[data-step-id]")[0]);
+const completedProgress = all("[data-progress-step]").map((step) => ({
+  id: step.getAttribute("data-progress-step"),
+  status: step.getAttribute("data-status")
+}));
+return {
+  stepCount: all("[data-step-id]").length,
+  runningText,
+  runningProgress,
+  completedText,
+  resultFields,
+  completedEvents,
+  stateIcons,
+  toggleCount: toggles.length,
+  expandedText,
+  expandedFields,
+  recollapsedText,
+  completedProgress
+};
+"""
+    result = controller_harness(script)
+
+    assert result["stepCount"] == 1
+    assert "需求理解" in result["runningText"]
+    assert "思考中" in result["runningText"]
+    assert "开始理解需求" in result["runningText"]
+    assert "正在分析地域与预算" in result["runningText"]
+    assert {"id": "intent_parsing", "status": "working"} in result["runningProgress"]
+    assert result["completedText"] == "✓需求理解"
+    assert "思考完成" not in result["completedText"]
+    assert "场景：Nginx 静态站点" not in result["completedText"]
+    assert "地域：华东 1（杭州）" not in result["completedText"]
+    assert "预算：低成本" not in result["completedText"]
+    assert "；" not in result["completedText"]
+    assert result["resultFields"] == []
+    assert result["completedEvents"] == []
+    assert result["stateIcons"] == [{"state": "completed", "text": "✓"}]
+    assert result["toggleCount"] == 1
+    assert "场景：Nginx 静态站点" in result["expandedText"]
+    assert "地域：华东 1（杭州）" in result["expandedText"]
+    assert "预算：低成本" in result["expandedText"]
+    assert result["expandedFields"] == ["场景：Nginx 静态站点", "地域：华东 1（杭州）", "预算：低成本"]
+    assert "场景：Nginx 静态站点" not in result["recollapsedText"]
+    assert "正在分析地域与预算" not in result["completedText"]
+    assert {"id": "intent_parsing", "status": "completed"} in result["completedProgress"]
+
+
+def test_controller_renders_chat_messages_with_user_and_system_avatars() -> None:
+    """User and system chat messages render with ``U`` and ``AI`` avatars respectively."""
+    script = """
+controller.init();
+debug.state().userMessages = [{id: "u-1", text: "创建一个 VPC"}];
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {summary: "开始理解需求"}
+  }}}
+});
+return {
+  messages: all("[data-chat-message]").map((item) => ({
+    role: item.getAttribute("data-chat-message"),
+    text: text(item)
+  })),
+  avatars: all("[data-chat-avatar]").map((item) => ({
+    role: item.getAttribute("data-chat-avatar"),
+    text: text(item)
+  }))
+};
+"""
+    result = controller_harness(script)
+
+    assert result["messages"][0] == {"role": "user", "text": "U创建一个 VPC"}
+    assert result["messages"][1]["role"] == "system"
+    assert result["messages"][1]["text"].startswith("AI")
+    assert "需求理解思考中" in result["messages"][1]["text"]
+    assert result["avatars"][:2] == [{"role": "user", "text": "U"}, {"role": "system", "text": "AI"}]
+
+
+def test_controller_places_user_messages_after_related_pipeline_context() -> None:
+    """Later user messages render after the select-step message and the handoff message they follow."""
+    script = """
+controller.init();
+global.fetch = async () => ({
+  ok: true,
+  status: 200,
+  body: null,
+  text: async () => ""
+});
+
+elementById("composer-input").value = "选择一个已有vpc，创建一个vswitch";
+await controller.sendComposerMessage();
+
+const state = debug.state();
+state.pipelineStarted = true;
+state.steps.intent_parsing.status = "completed";
+state.steps.architecture_planning.status = "completed";
+state.steps.evaluate_candidates.status = "completed";
+state.steps.confirm_and_select.status = "waiting_input";
+state.status = "waiting_input";
+state.pendingInput = {
+  kind: "candidate_selection",
+  prompt: "请选择要部署的方案：",
+  options: [{id: "0", label: "方案0"}]
+};
+debug.render();
+
+elementById("composer-input").value = "选择方案0";
+await controller.sendComposerMessage();
+
+state.steps.confirm_and_select.status = "completed";
+state.steps.deploying.status = "completed";
+state.pendingInput = null;
+state.normalHandoffReady = true;
+state.status = "completed";
+debug.render();
+
+elementById("composer-input").value = "刚才创建了什么？";
+await controller.sendComposerMessage();
+
+const messages = all("[data-chat-message]").map((item) => ({
+  role: item.getAttribute("data-chat-message"),
+  text: text(item)
+}));
+const indexOf = (needle) => messages.findIndex((item) => item.text.includes(needle));
+return {
+  messages,
+  firstUser: indexOf("选择一个已有vpc"),
+  selectStep: indexOf("方案选择"),
+  secondUser: indexOf("选择方案0"),
+  handoff: indexOf("部署流程已完成"),
+  thirdUser: indexOf("刚才创建了什么")
+};
+"""
+    result = controller_harness(script)
+
+    assert result["firstUser"] >= 0
+    assert result["selectStep"] >= 0
+    assert result["secondUser"] > result["selectStep"]
+    assert result["handoff"] >= 0
+    assert result["thirdUser"] > result["handoff"]
+
+
+def test_controller_clears_composer_as_soon_as_message_is_submitted() -> None:
+    """The composer input is already empty when ``fetch`` runs, while the sent text shows up in the chat."""
+    script = """
+controller.init();
+let valueSeenByFetch = null;
+global.fetch = async () => {
+  valueSeenByFetch = elementById("composer-input").value;
+  return {
+    ok: true,
+    status: 200,
+    body: null,
+    text: async () => ""
+  };
+};
+elementById("composer-input").value = "创建一个 VPC";
+await controller.sendComposerMessage();
+return {
+  valueSeenByFetch,
+  finalValue: elementById("composer-input").value,
+  messages: all("[data-chat-message]").map((item) => text(item))
+};
+"""
+    result = controller_harness(script)
+
+    assert result["valueSeenByFetch"] == ""
+    assert result["finalValue"] == ""
+    assert any("创建一个 VPC" in message for message in result["messages"])
+
+
+def test_controller_scrolls_left_chat_to_bottom_after_step_updates() -> None:
+    """Rendering a step update leaves the step list's ``scrollTop`` equal to its ``scrollHeight``."""
+    script = """
+controller.init();
+const stepList = elementById("step-list");
+stepList.scrollTop = 0;
+stepList.scrollHeight = 240;
+stepList.clientHeight = 60;
+const next = reducers.reducePipelinePayload(debug.state(), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {text: "正在持续分析用户需求，内容已经超过可视区域"}
+  }}}
+});
+Object.assign(debug.state(), next);
+debug.render();
+return {
+  scrollTop: stepList.scrollTop,
+  scrollHeight: stepList.scrollHeight
+};
+"""
+    observed = controller_harness(script)
+
+    assert observed == {"scrollTop": 240, "scrollHeight": 240}
+
+
+def test_controller_scrolls_active_step_event_list_to_bottom_after_updates() -> None:
+    """Check that the first step event list is scrolled to its bottom after updates.
+
+    The script applies two ``text_delta`` payloads for ``intent_parsing`` (rendering
+    after each) and then reads the scroll metrics of the first
+    ``[data-step-event-list]`` element.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(text) {
+  const next = reducers.reducePipelinePayload(debug.state(), {
+    metadata: {iac_code: {pipeline: {
+      eventType: "text_delta",
+      status: "working",
+      step: {id: "intent_parsing"},
+      data: {text}
+    }}}
+  });
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload("第一段分析");
+applyPayload("第二段分析");
+const eventList = all("[data-step-event-list]")[0];
+return {
+  exists: Boolean(eventList),
+  scrollTop: eventList && eventList.scrollTop,
+  scrollHeight: eventList && eventList.scrollHeight
+};
+"""
+    )
+
+    # NOTE(review): 100 is presumably the harness's default scrollHeight for
+    # elements; confirm against controller_harness.
+    assert output == {"exists": True, "scrollTop": 100, "scrollHeight": 100}
+
+
+def test_controller_renders_normal_chat_answer_with_collapsible_process_after_handoff() -> None:
+    """Check how a streamed normal-chat reply is rendered once handoff is ready.
+
+    The stubbed ``fetch`` returns four ``data:``-prefixed JSON events for one
+    task: a thinking event, a completed ``read_file`` tool event, a working
+    status carrying the answer text, and a final input-required status. The
+    state is primed with ``normalHandoffReady: true`` before the message is sent.
+    """
+    output = controller_harness(
+        """
+controller.init();
+global.fetch = async () => ({
+  ok: true,
+  status: 200,
+  body: null,
+  text: async () => [
+    {
+      taskId: "normal-task",
+      contextId: "ctx-1",
+      status: {state: "TASK_STATE_WORKING"},
+      metadata: {iac_code: {thinking: {type: "raw_thinking", text: "读取刚才部署结果"}}}
+    },
+    {
+      taskId: "normal-task",
+      contextId: "ctx-1",
+      status: {state: "TASK_STATE_WORKING"},
+      metadata: {
+        iac_code: {
+          tool: {
+            status: "completed",
+            toolUseId: "toolu-read",
+            name: "read_file",
+            result: {content: "读取部署摘要"}
+          }
+        }
+      }
+    },
+    {
+      taskId: "normal-task",
+      contextId: "ctx-1",
+      status: {state: "TASK_STATE_WORKING", message: {parts: [{text: "刚才创建了一个 VSwitch。"}]}}
+    },
+    {
+      taskId: "normal-task",
+      contextId: "ctx-1",
+      status: {state: "TASK_STATE_INPUT_REQUIRED"}
+    }
+  ].map((item) => `data: ${JSON.stringify(item)}`).join("\\n\\n")
+});
+Object.assign(debug.state(), {
+  contextId: "ctx-1",
+  normalHandoffReady: true,
+  status: "completed"
+});
+debug.render();
+elementById("composer-input").value = "刚才创建了什么？";
+await controller.sendComposerMessage();
+
+const messages = all("[data-chat-message]").map((item) => ({
+  role: item.getAttribute("data-chat-message"),
+  text: text(item)
+}));
+const turns = all("[data-normal-turn]").map((item) => ({
+  id: item.getAttribute("data-normal-turn"),
+  text: text(item)
+}));
+const process = all("[data-normal-process]")[0];
+const events = all("[data-normal-process-event]").map((item) => ({
+  kind: item.getAttribute("data-normal-process-event"),
+  text: text(item)
+}));
+return {
+  messages,
+  turns,
+  processOpen: process && process.open === true,
+  processText: process && text(process),
+  events,
+  answer: text(all("[data-normal-answer]")[0]),
+  normalStatus: debug.state().normalTurns[0] && debug.state().normalTurns[0].status
+};
+"""
+    )
+
+    # The user's question is shown and exactly one normal turn is rendered.
+    assert any(item["role"] == "user" and "刚才创建了什么？" in item["text"] for item in output["messages"])
+    assert len(output["turns"]) == 1
+    assert output["normalStatus"] == "completed"
+    # The process section exists but is not open once the turn has completed.
+    assert output["processOpen"] is False
+    # Thinking and tool events are listed in arrival order inside the process section.
+    assert output["events"] == [
+        {"kind": "thinking", "text": "思考读取刚才部署结果"},
+        {"kind": "tool", "text": "工具read_file 完成 读取部署摘要"},
+    ]
+    assert output["processText"].startswith("思考过程")
+    # The answer element holds only the status message text.
+    assert output["answer"] == "刚才创建了一个 VSwitch。"
+
+
+def test_controller_renders_normal_chat_answer_from_task_history_after_handoff() -> None:
+    """Check that the answer is taken from ``history`` in a JSON-RPC task result.
+
+    The stubbed ``fetch`` returns a single ``data:`` event whose ``result``
+    carries no status message, only a ``history`` with one user entry and one
+    agent entry made of two text parts.
+    """
+    output = controller_harness(
+        """
+controller.init();
+global.fetch = async () => ({
+  ok: true,
+  status: 200,
+  body: null,
+  text: async () => [
+    {
+      jsonrpc: "2.0",
+      result: {
+        id: "normal-task",
+        contextId: "ctx-1",
+        status: {state: "TASK_STATE_INPUT_REQUIRED"},
+        history: [
+          {
+            role: "user",
+            parts: [{root: {kind: "text", text: "你刚才创建了啥"}}]
+          },
+          {
+            role: "agent",
+            parts: [
+              {root: {kind: "text", text: "刚才在已有 VPC 中新建了一个 VSwitch。"}},
+              {root: {kind: "text", text: "VSwitch ID 是 vsw-123。"}}
+            ]
+          }
+        ]
+      }
+    }
+  ].map((item) => `data: ${JSON.stringify(item)}`).join("\\n\\n")
+});
+Object.assign(debug.state(), {
+  contextId: "ctx-1",
+  normalHandoffReady: true,
+  status: "completed"
+});
+debug.render();
+elementById("composer-input").value = "你刚才创建了啥";
+await controller.sendComposerMessage();
+
+return {
+  turns: all("[data-normal-turn]").length,
+  answer: text(all("[data-normal-answer]")[0]),
+  normalStatus: debug.state().normalTurns[0] && debug.state().normalTurns[0].status
+};
+"""
+    )
+
+    # The two agent text parts are concatenated, in order, into one answer.
+    assert output == {
+        "turns": 1,
+        "answer": "刚才在已有 VPC 中新建了一个 VSwitch。VSwitch ID 是 vsw-123。",
+        "normalStatus": "completed",
+    }
+
+
+def test_controller_expanded_step_shows_all_conclusion_fields() -> None:
+    """Check that an expanded step renders every field of its conclusion.
+
+    The script completes ``intent_parsing`` with an eight-key ``conclusion``,
+    clicks the first ``[data-step-toggle]``, and collects all
+    ``[data-step-result-field]`` elements.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {
+      conclusion: {
+        core_requirements: "VPC",
+        cloud_platform: "aliyun",
+        user_message_summary: "创建一个 VPC",
+        non_functional: "低成本",
+        additional_notes: "使用默认 CIDR",
+        business_type: "网络基础设施",
+        region_preference: "cn-hangzhou",
+        risk: "后续需补充交换机"
+      }
+    }
+  }}}
+});
+all("[data-step-toggle]")[0].click();
+return {
+  fields: all("[data-step-result-field]").map((field) => ({
+    key: field.getAttribute("data-step-result-field"),
+    text: text(field)
+  }))
+};
+"""
+    )
+
+    # Fields appear in the same order as the keys of the conclusion object.
+    assert [field["key"] for field in output["fields"]] == [
+        "core_requirements",
+        "cloud_platform",
+        "user_message_summary",
+        "non_functional",
+        "additional_notes",
+        "business_type",
+        "region_preference",
+        "risk",
+    ]
+    # The last field (risk) shows its value.
+    assert "后续需补充交换机" in output["fields"][-1]["text"]
+
+
+def test_controller_merges_contiguous_text_delta_events_into_typing_card() -> None:
+    """Check that consecutive ``text_delta`` events render as a single card.
+
+    The script sends one ``step_started`` event followed by three ``text_delta``
+    fragments for ``intent_parsing`` and collects every
+    ``[data-step-event-kind]`` card.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {summary: "开始理解需求"}
+  }}}
+});
+["正在分析", "地域、预算", "和部署约束"].forEach((fragment) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "intent_parsing"},
+    data: {text: fragment}
+  }}}
+}));
+const cards = all("[data-step-event-kind]").map((item) => ({
+  kind: item.getAttribute("data-step-event-kind"),
+  text: text(item)
+}));
+return {cards};
+"""
+    )
+
+    # Three deltas collapse into one text_delta card after the step_started card.
+    assert [card["kind"] for card in output["cards"]] == ["step_started", "text_delta"]
+    assert "思考片段" in output["cards"][1]["text"]
+    # The fragments are joined without separators.
+    assert "正在分析地域、预算和部署约束" in output["cards"][1]["text"]
+
+
+def test_controller_shows_distinct_icons_for_running_completed_and_waiting_steps() -> None:
+    """Check the state icon rendered for completed, working, and input-waiting steps.
+
+    The script completes ``intent_parsing``, starts ``architecture_planning``,
+    and raises ``input_required`` on ``confirm_and_select``, then reads every
+    ``[data-step-state-icon]`` element.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "intent_parsing"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "architecture_planning"},
+    data: {summary: "规划网络拓扑"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    data: {kind: "ask_user_question", prompt: "请选择方案"}
+  }}}
+});
+return {
+  icons: all("[data-step-state-icon]").map((icon) => ({
+    state: icon.getAttribute("data-step-state-icon"),
+    text: text(icon)
+  }))
+};
+"""
+    )
+
+    # One icon per step, in the order the steps were reported.
+    assert output["icons"] == [
+        {"state": "completed", "text": "✓"},
+        {"state": "working", "text": "…"},
+        {"state": "waiting_input", "text": "?"},
+    ]
+
+
+def test_controller_renders_tool_events_as_structured_step_event_cards() -> None:
+    """Check that a ``tool_result`` event is rendered as its own step event card.
+
+    The script starts the ``deploying`` step and then sends a ``tool_result``
+    for ``CreateStack`` whose result holds a stack id and stack status.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "deploying"},
+    data: {summary: "准备部署"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "tool_result",
+    status: "working",
+    step: {id: "deploying"},
+    data: {
+      toolName: "CreateStack",
+      toolUseId: "tool-1",
+      result: {
+        stackId: "stack-123",
+        stackStatus: "CREATE_COMPLETE"
+      }
+    }
+  }}}
+});
+const eventCards = all("[data-step-event-kind]").map((item) => ({
+  kind: item.getAttribute("data-step-event-kind"),
+  text: text(item)
+}));
+return {
+  count: eventCards.length,
+  eventCards
+};
+"""
+    )
+
+    # One card for step_started plus one for the tool result.
+    assert output["count"] == 2
+    assert output["eventCards"][1]["kind"] == "tool_result"
+    assert "工具结果" in output["eventCards"][1]["text"]
+    assert "CreateStack" in output["eventCards"][1]["text"]
+    # The tool-use identifier is not shown in the card text.
+    assert "Tool Use" not in output["eventCards"][1]["text"]
+    assert "tool-1" not in output["eventCards"][1]["text"]
+    # The result values are shown.
+    assert "stack-123" in output["eventCards"][1]["text"]
+    assert "CREATE_COMPLETE" in output["eventCards"][1]["text"]
+
+
+def test_controller_renders_candidate_subpipeline_below_matching_plan_card() -> None:
+    """Check that sub-pipeline events are rendered only for the candidate they target.
+
+    The script shows details for candidates 0 and 1, then sends a
+    ``candidate_step_started`` event and two ``text_delta`` fragments that all
+    reference candidate 0.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+[
+  {index: 0, name: "标准 VPC 网络"},
+  {index: 1, name: "VPC 含可用区交换机"}
+].forEach((candidate) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: candidate.index},
+    data: {detail: {candidateName: candidate.name, candidateIndex: candidate.index}}
+  }}}
+}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimation", label: "成本估算", status: "working"},
+    data: {summary: "开始估算成本"}
+  }}}
+});
+["查询规格", "与价格"].forEach((fragment) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimation", label: "成本估算", status: "working"},
+    data: {text: fragment}
+  }}}
+}));
+const pipelines = all("[data-candidate-subpipeline]").map((item) => ({
+  candidate: item.getAttribute("data-candidate-subpipeline"),
+  open: item.open === true,
+  text: text(item)
+}));
+const events = all("[data-candidate-subpipeline-event]").map((item) => ({
+  kind: item.getAttribute("data-candidate-subpipeline-event"),
+  text: text(item)
+}));
+return {pipelines, events};
+"""
+    )
+
+    # Only candidate 0 received sub-step events, so only it has a sub-pipeline.
+    assert len(output["pipelines"]) == 1
+    assert output["pipelines"][0]["candidate"] == "0"
+    assert output["pipelines"][0]["open"] is True
+    assert "思考过程" in output["pipelines"][0]["text"]
+    assert "成本估算" in output["pipelines"][0]["text"]
+    assert "开始估算成本" in output["pipelines"][0]["text"]
+    # The two text_delta fragments are merged into a single event.
+    assert [event["kind"] for event in output["events"]] == ["candidate_step_started", "text_delta"]
+    assert "查询规格与价格" in output["events"][1]["text"]
+
+
+def test_controller_auto_collapses_completed_candidate_subpipeline_on_plan_card() -> None:
+    """Check that a candidate sub-pipeline is closed once evaluation has completed.
+
+    The script shows candidate 0, starts and completes its ``cost_estimation``
+    sub-step, and finally completes the ``evaluate_candidates`` step.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {detail: {candidateName: "标准 VPC", candidateIndex: 0, summary: "基础网络", totalMonthlyCost: "¥0/月"}}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimation", label: "成本估算", status: "working"},
+    data: {summary: "开始估算成本"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimation", label: "成本估算", status: "completed"},
+    data: {summary: "成本估算完成"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "completed",
+    step: {id: "evaluate_candidates"},
+    data: {conclusion: {summary: "方案评估完成"}}
+  }}}
+});
+const pipeline = all("[data-candidate-subpipeline]")[0];
+const eventKinds = all("[data-candidate-subpipeline-event]")
+  .map((item) => item.getAttribute("data-candidate-subpipeline-event"));
+return {
+  open: pipeline.open === true,
+  text: text(pipeline),
+  eventKinds
+};
+"""
+    )
+
+    assert output["open"] is False
+    # The heading text stays "思考过程" and does not switch to "思考完成".
+    assert "思考过程" in output["text"]
+    assert "思考完成" not in output["text"]
+    # Collapsing keeps the recorded sub-step events in the DOM.
+    assert output["eventKinds"] == ["candidate_step_started", "candidate_step_completed"]
+
+
+def test_controller_updates_plan_card_and_collapses_subpipeline_when_candidate_completes() -> None:
+    """Check the plan card before and after a ``candidate_completed`` event.
+
+    The script seeds one draft candidate through the ``architecture_planning``
+    conclusion, records the card text, starts a ``cost_estimation`` sub-step,
+    and then sends ``candidate_completed`` with a summary and a monthly cost.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "completed",
+    step: {id: "architecture_planning"},
+    data: {
+      conclusion: {
+        draft_candidates: [{
+          candidate_index: 0,
+          candidate_name: "基础 VPC 网络",
+          first_version_description: "创建一个基础 VPC，作为后续云资源的网络容器。",
+          rough_monthly_estimate: "待估算"
+        }]
+      }
+    }
+  }}}
+});
+const before = text(all("[data-candidate-index]")[0]);
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimation", label: "成本估算", status: "working"},
+    data: {summary: "开始估算成本"}
+  }}}
+});
+let pipeline = all("[data-candidate-subpipeline]")[0];
+const openWhileWorking = pipeline.open === true;
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {
+      candidate_name: "基础 VPC 网络",
+      summary: "VPC 本身免费，适合作为后续子网和云资源的基础容器。",
+      total_monthly_cost: "¥0/月"
+    }
+  }}}
+});
+pipeline = all("[data-candidate-subpipeline]")[0];
+return {
+  before,
+  after: text(all("[data-candidate-index]")[0]),
+  openWhileWorking,
+  openAfterCandidateDone: pipeline.open === true,
+  substepTexts: all("[data-candidate-substep]").map((item) => text(item)),
+  subEventKinds: all("[data-candidate-subpipeline-event]")
+    .map((item) => item.getAttribute("data-candidate-subpipeline-event"))
+};
+"""
+    )
+
+    # Before evaluation the card shows the draft description and placeholder estimate.
+    assert "创建一个基础 VPC" in output["before"]
+    assert "待估算" in output["before"]
+    assert output["openWhileWorking"] is True
+    # After completion the card shows the summary and cost from the event data.
+    assert "VPC 本身免费" in output["after"]
+    assert "¥0/月" in output["after"]
+    assert output["openAfterCandidateDone"] is False
+    # candidate_completed is not rendered as a sub-step or as a sub-pipeline event.
+    assert not any("方案思考" in item for item in output["substepTexts"])
+    assert output["subEventKinds"] == ["candidate_step_started"]
+
+
+def test_controller_plan_card_marks_candidate_working_then_completed() -> None:
+    """Check the plan card status badge while a candidate is generated and once it is done.
+
+    The script seeds one candidate through the ``architecture_planning``
+    conclusion, starts its ``template_generating`` sub-step, and then sends
+    ``candidate_completed`` with nested ``conclusions.template`` and
+    ``conclusions.cost`` values.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "completed",
+    step: {id: "architecture_planning"},
+    data: {
+      conclusion: {
+        candidates: [{
+          name: "经济型演示方案",
+          candidate_index: 0,
+          topology: "VPC 内单可用区部署一台突发性能 ECS。",
+          monthly_estimate: "¥50 - ¥80"
+        }]
+      }
+    }
+  }}}
+});
+const initialCardText = text(all("[data-candidate-index]")[0]);
+const initialPriceCount = (initialCardText.match(/¥50 - ¥80/g) || []).length;
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0, name: "经济型演示方案"},
+    candidateStep: {id: "template_generating"}
+  }}}
+});
+const workingStatus = all("[data-candidate-status]")[0];
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0, name: "经济型演示方案"},
+    data: {
+      candidateIndex: 0,
+      candidateName: "经济型演示方案",
+      conclusions: {
+        template: {description: "经济型 Nginx 演示环境 - VPC 内单可用区部署一台 ECS。"},
+        cost: {monthly_estimate: "¥74/月"}
+      }
+    }
+  }}}
+});
+const completedStatus = all("[data-candidate-status]")[0];
+return {
+  initialCardText,
+  initialPriceCount,
+  workingStatus: {
+    value: workingStatus.getAttribute("data-candidate-status"),
+    text: text(workingStatus)
+  },
+  completedStatus: {
+    value: completedStatus.getAttribute("data-candidate-status"),
+    text: text(completedStatus)
+  },
+  completedCardText: text(all("[data-candidate-index]")[0])
+};
+"""
+    )
+
+    # The initial card shows the estimated price exactly once (no duplicated price line).
+    assert "预估价格" in output["initialCardText"]
+    assert output["initialPriceCount"] == 1
+    assert output["workingStatus"] == {"value": "working", "text": "生成中"}
+    assert output["completedStatus"] == {"value": "completed", "text": "已完成"}
+    # The completed card takes its description and price from the nested conclusions.
+    assert "经济型 Nginx 演示环境" in output["completedCardText"]
+    assert "¥74/月" in output["completedCardText"]
+
+
+def test_controller_groups_candidate_subpipeline_into_expandable_substeps() -> None:
+    """Check that sub-pipeline events are grouped under one element per sub-step id.
+
+    The script shows candidate 0 and then sends four events: start, tool result,
+    and completion for ``template_generating``, followed by the start of
+    ``cost_estimating``.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {detail: {candidateName: "基础 VPC 网络", candidateIndex: 0, summary: "基础网络", totalMonthlyCost: "¥0/月"}}
+  }}}
+});
+[
+  {
+    eventType: "candidate_step_started",
+    id: "template_generating",
+    label: "模板生成",
+    status: "working",
+    summary: "开始生成模板"
+  },
+  {
+    eventType: "tool_result",
+    id: "template_generating",
+    label: "模板生成",
+    status: "working",
+    summary: "写入模板",
+    toolName: "write_file"
+  },
+  {
+    eventType: "candidate_step_completed",
+    id: "template_generating",
+    label: "模板生成",
+    status: "completed",
+    summary: "模板生成完成"
+  },
+  {
+    eventType: "candidate_step_started",
+    id: "cost_estimating",
+    label: "成本估算",
+    status: "working",
+    summary: "开始估算成本"
+  }
+].forEach((item) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: item.eventType,
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: item.id, label: item.label, status: item.status},
+    data: {summary: item.summary, toolName: item.toolName}
+  }}}
+}));
+const pipeline = all("[data-candidate-subpipeline]")[0];
+const substeps = all("[data-candidate-substep]").map((item) => ({
+  id: item.getAttribute("data-candidate-substep"),
+  open: item.open === true,
+  text: text(item)
+}));
+const events = all("[data-candidate-subpipeline-event]")
+  .map((item) => item.getAttribute("data-candidate-subpipeline-event"));
+return {
+  pipelineOpen: pipeline.open === true,
+  pipelineClickListeners: (pipeline.listeners.click || []).length,
+  substeps,
+  events
+};
+"""
+    )
+
+    assert output["pipelineOpen"] is True
+    # The sub-pipeline element has at least one click listener attached.
+    assert output["pipelineClickListeners"] >= 1
+    # One sub-step element per distinct candidateStep id, in first-seen order.
+    assert [item["id"] for item in output["substeps"]] == ["template_generating", "cost_estimating"]
+    assert "模板生成" in output["substeps"][0]["text"]
+    assert "成本估算" in output["substeps"][1]["text"]
+    # The sub-step that is still working is open.
+    assert output["substeps"][1]["open"] is True
+    # All four events are rendered, in arrival order.
+    assert output["events"] == [
+        "candidate_step_started",
+        "tool_result",
+        "candidate_step_completed",
+        "candidate_step_started",
+    ]
+
+
+def test_controller_marks_candidate_substeps_complete_after_evaluation_step_completes() -> None:
+    """Check that a sub-step left "working" is shown as complete after evaluation ends.
+
+    The script starts ``template_generating`` for candidate 0 and sends one
+    ``text_delta``, but never sends ``candidate_step_completed``. It then
+    completes ``evaluate_candidates`` and raises ``input_required`` on
+    ``confirm_and_select``.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {detail: {candidateName: "基础 VPC 网络", candidateIndex: 0, summary: "基础网络", totalMonthlyCost: "¥0/月"}}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "template_generating", status: "working"},
+    data: {summary: "开始生成模板"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "template_generating", status: "working"},
+    data: {text: "模板内容已生成"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    data: {conclusion: {summary: "方案评估完成"}}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    data: {kind: "candidate_selection", prompt: "请选择购买方案", options: [{id: "0", label: "基础 VPC 网络"}]}
+  }}}
+});
+const substeps = all("[data-candidate-substep]").map((item) => ({
+  id: item.getAttribute("data-candidate-substep"),
+  open: item.open === true,
+  text: text(item)
+}));
+return {substeps};
+"""
+    )
+
+    # The sub-step is closed and its text carries "完成" even though no
+    # candidate_step_completed event was sent for it.
+    assert output["substeps"] == [
+        {
+            "id": "template_generating",
+            "open": False,
+            "text": "模板生成完成子步骤开始开始生成模板思考片段模板内容已生成",
+        }
+    ]
+
+
+def test_controller_preserves_open_candidate_subpipeline_when_events_update() -> None:
+    """Check that a sub-pipeline toggled open stays open across a re-render.
+
+    The script sets ``open = true`` on the sub-pipeline element and invokes its
+    registered ``toggle`` listeners by hand, then applies another ``text_delta``
+    (which re-renders) and re-queries the element.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {detail: {candidateName: "基础 VPC 网络", candidateIndex: 0, summary: "基础网络"}}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "template_generating", status: "working"},
+    data: {summary: "开始生成模板"}
+  }}}
+});
+let pipeline = all("[data-candidate-subpipeline]")[0];
+pipeline.open = true;
+(pipeline.listeners.toggle || []).forEach((listener) => listener({type: "toggle"}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "template_generating", status: "working"},
+    data: {text: "继续生成"}
+  }}}
+});
+pipeline = all("[data-candidate-subpipeline]")[0];
+return {
+  openAfterUpdate: pipeline.open === true,
+  stored: debug.state().expandedCandidateSubpipelines["0"] === true
+};
+"""
+    )
+
+    # The open flag is recorded in state under the candidate index and survives the update.
+    assert output == {"openAfterUpdate": True, "stored": True}
+
+
+def test_controller_auto_opens_and_scrolls_candidate_subpipeline_while_evaluating() -> None:
+    """Check that an evaluating candidate's sub-pipeline is open and scrolled to the bottom.
+
+    The script starts ``evaluate_candidates``, shows candidate 0, starts its
+    ``template_generating`` sub-step, and sends one ``text_delta``. Nothing in
+    the script opens the sub-pipeline by hand.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    data: {summary: "开始评估方案"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {detail: {candidateName: "基础 VPC 网络", candidateIndex: 0, summary: "基础网络"}}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "template_generating", status: "working"},
+    data: {summary: "开始生成模板"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "template_generating", status: "working"},
+    data: {text: "继续生成"}
+  }}}
+});
+const pipeline = all("[data-candidate-subpipeline]")[0];
+const body = all("[data-candidate-subpipeline-body]")[0];
+return {
+  open: pipeline.open === true,
+  scrollTop: body && body.scrollTop,
+  scrollHeight: body && body.scrollHeight
+};
+"""
+    )
+
+    # NOTE(review): 100 is presumably the harness's default scrollHeight for
+    # elements; confirm against controller_harness.
+    assert output == {"open": True, "scrollTop": 100, "scrollHeight": 100}
+
+
+def test_controller_candidate_subpipeline_keeps_all_chinese_substeps_and_auto_opens_body() -> None:
+    """Check that every sub-step is kept and labelled in Chinese, never by its raw id.
+
+    The script shows candidate 0 and then, for each of ``template_generating``,
+    ``cost_estimating`` and ``quality_review``, sends nine events: one start,
+    seven ``text_delta`` fragments, and one completion. No ``label`` is supplied
+    in ``candidateStep``, so the rendered names cannot come from the payload.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {detail: {candidateName: "基础 VPC 网络", candidateIndex: 0, summary: "基础网络", totalMonthlyCost: "¥0/月"}}
+  }}}
+});
+[
+  "template_generating",
+  "cost_estimating",
+  "quality_review"
+].forEach((stepId, stepIndex) => {
+  for (let index = 0; index < 9; index += 1) {
+    const isLast = index === 8;
+    applyPayload({
+      metadata: {iac_code: {pipeline: {
+        eventType: isLast ? "candidate_step_completed" : index === 0 ? "candidate_step_started" : "text_delta",
+        status: "working",
+        step: {id: "evaluate_candidates"},
+        candidate: {index: 0},
+        candidateStep: {id: stepId, status: isLast ? "completed" : "working"},
+        data: {text: `片段 ${stepIndex}-${index}`, summary: `子步骤 ${stepIndex}-${index}`}
+      }}}
+    });
+  }
+});
+const pipeline = all("[data-candidate-subpipeline]")[0];
+const toggle = all("[data-candidate-subpipeline-toggle]")[0];
+const substeps = all("[data-candidate-substep]").map((item) => text(item));
+return {
+  pipelineOpen: pipeline.open === true,
+  pipelineText: text(pipeline),
+  toggleText: text(toggle),
+  substeps
+};
+"""
+    )
+
+    assert output["pipelineOpen"] is True
+    # The toggle label stays "思考过程" even though every sub-step has completed.
+    assert output["toggleText"] == "思考过程"
+    assert "思考完成" not in output["pipelineText"]
+    # All three sub-steps are present under their Chinese labels.
+    assert any("模板生成" in item for item in output["substeps"])
+    assert any("成本估算" in item for item in output["substeps"])
+    assert any("质量复核" in item for item in output["substeps"])
+    # No raw sub-step id may leak into the rendered text. All three ids fed to the
+    # script are checked; the original assertion omitted "quality_review".
+    raw_step_ids = ("template_generating", "cost_estimating", "quality_review")
+    assert not any(step_id in item for item in output["substeps"] for step_id in raw_step_ids)
+
+
+def test_controller_collapses_step_three_completion_in_left_chat_without_duplicate_option_details() -> None:
+    """Check that the completed evaluation step does not repeat option details in its text.
+
+    The script starts ``evaluate_candidates`` and completes it with a
+    ``conclusion.options`` list of two candidates. It does not click the step
+    toggle before reading the first ``[data-step-id]`` element.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    data: {summary: "开始评估候选方案"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    data: {
+      conclusion: {
+        options: [
+          {
+            title: "标准 VPC 网络",
+            candidateIndex: 0,
+            summary: "成本较低，扩展性一般",
+            totalMonthlyCost: "¥33.89/月"
+          },
+          {
+            title: "VPC 含可用区交换机",
+            candidateIndex: 1,
+            summary: "自动创建交换机，部署更顺滑",
+            totalMonthlyCost: "¥60/月"
+          }
+        ]
+      }
+    }
+  }}}
+});
+const stepText = text(all("[data-step-id]")[0]);
+const resultOptions = all("[data-step-result-option]").map((item) => ({
+  option: item.getAttribute("data-step-result-option"),
+  text: text(item)
+}));
+return {stepText, resultOptions};
+"""
+    )
+
+    # No "；"-joined flattened summary and no option count line in the step text.
+    assert "；" not in output["stepText"]
+    assert "已生成 2 个方案" not in output["stepText"]
+    # Per-option summaries are not repeated in the step text.
+    assert "成本较低，扩展性一般" not in output["stepText"]
+    assert "自动创建交换机，部署更顺滑" not in output["stepText"]
+    # No option elements are rendered in the step result.
+    assert output["resultOptions"] == []
+
+
+def test_controller_renders_step_three_nested_candidate_conclusion_without_flat_object_text() -> None:
+    """Check rendering of an evaluation conclusion keyed by candidate index.
+
+    The script completes ``evaluate_candidates`` with a conclusion whose only
+    key is ``0``, holding nested ``template``, ``cost`` and ``candidate``
+    values, and then clicks the first ``[data-step-toggle]``.
+    """
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    data: {
+      conclusion: {
+        0: {
+          template: "基础 VPC 网络模板，创建 CIDR 192.168.0.0/16 的专有网络",
+          cost: {
+            template_fixed: false,
+            monthly_estimate: "¥0/月",
+            currency: "CNY",
+            api_raw_summary: "GetTemplateEstimateCost 返回 Resources: {}，VPC 为免费资源"
+          },
+          candidate: {
+            name: "基础 VPC 网络",
+            output_path: "templates/1-basic-vpc.yml",
+            pros: "满足基础网络隔离需求、零成本、可按需扩展子网和安全组",
+            monthly_estimate: 0,
+            cons: "仅含 VPC，需后续手动添加 VSwitch"
+          }
+        }
+      }
+    }
+  }}}
+});
+all("[data-step-toggle]")[0].click();
+const stepText = text(all("[data-step-id]")[0]);
+const resultOptions = all("[data-step-result-option]").map((item) => text(item));
+const candidateResults = all("[data-step-candidate-result]").map((item) => text(item));
+const resultFields = all("[data-step-result-field]").map((field) => text(field));
+return {stepText, resultOptions, candidateResults, resultFields};
+"""
+    )
+
+    # The nested objects are not dumped as flat "key：value" text joined by "；".
+    assert "cost：" not in output["stepText"]
+    assert "candidate：" not in output["stepText"]
+    assert "template fixed" not in output["stepText"]
+    assert "；" not in output["stepText"]
+    # No generic field or option elements are rendered for this conclusion shape.
+    assert output["resultFields"] == []
+    assert output["resultOptions"] == []
+    # One candidate result element shows the name, template text, and monthly estimate.
+    assert len(output["candidateResults"]) == 1
+    assert "基础 VPC 网络" in output["candidateResults"][0]
+    assert "基础 VPC 网络模板" in output["candidateResults"][0]
+    assert "¥0/月" in output["candidateResults"][0]
+
+
+def test_controller_compacts_long_template_text_in_step_three_candidate_result() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+const fullTemplate = [
+  "ROSTemplateFormatVersion: '2015-09-01'",
+  "Description:",
+  "  zh-cn: 经济型突发实例方案，使用 Nginx 托管静态网站",
+  "Resources:",
+  "  WebServer:",
+  "    Type: ALIYUN::ECS::Instance",
+  "    Properties:",
+  "      InstanceType: ecs.t6-c1m1.large",
+  "      SystemDiskCategory: cloud_essd",
+  "      InternetMaxBandwidthOut: 1"
+].join("\\n");
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    data: {
+      detail: {
+        candidateName: "经济型突发实例方案",
+        candidateIndex: 0,
+        template: fullTemplate,
+        totalMonthlyCost: "¥24.51/月"
+      }
+    }
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "completed",
+    step: {id: "evaluate_candidates"},
+    data: {conclusion: {summary: "方案评估完成"}}
+  }}}
+});
+all("[data-step-toggle]")[0].click();
+const result = all("[data-step-candidate-result]")[0];
+const planCard = all("[data-candidate-index]")[0];
+const summary = all("[data-step-candidate-result-summary]")[0] || null;
+const popovers = all("[data-template-popover]").map((popover) => text(popover));
+return {
+  resultText: text(result),
+  resultTitle: result ? result.getAttribute("title") : null,
+  planTitle: planCard ? planCard.getAttribute("title") : null,
+  summaryText: summary ? text(summary) : "",
+  summaryTitle: summary ? summary.getAttribute("title") : null,
+  popovers
+};
+"""
+    )
+
+    assert "经济型突发实例方案" in output["resultText"]
+    assert "¥24.51/月" in output["resultText"]
+    assert "ROSTemplateFormatVersion" not in output["summaryText"]
+    assert "Resources:" not in output["summaryText"]
+    assert "模板内容已生成" in output["summaryText"]
+    assert output["resultTitle"] is None
+    assert output["planTitle"] is None
+    assert output["summaryTitle"] is None
+    assert len(output["popovers"]) == 2
+    assert all("ROSTemplateFormatVersion" in item for item in output["popovers"])
+    assert all("Resources:" in item for item in output["popovers"])
+
+
+def test_controller_step_three_expansion_groups_summary_and_process_by_candidate() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+[
+  {index: 0, name: "基础 VPC 网络", summary: "VPC 本身免费，适合先建立网络容器", price: "¥0/月"},
+  {index: 1, name: "VPC 含交换机", summary: "自动创建交换机，后续部署更顺滑", price: "¥0/月"}
+].forEach((candidate) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: candidate.index},
+    data: {
+      detail: {
+        candidateName: candidate.name,
+        candidateIndex: candidate.index,
+        summary: candidate.summary,
+        totalMonthlyCost: candidate.price
+      }
+    }
+  }}}
+}));
+[
+  {candidateIndex: 0, stepId: "template_generating", text: "生成 VPC 模板"},
+  {candidateIndex: 0, stepId: "cost_estimating", text: "确认 VPC 免费"},
+  {candidateIndex: 1, stepId: "template_generating", text: "生成 VPC 与交换机模板"},
+  {candidateIndex: 1, stepId: "cost_estimating", text: "确认网络资源免费"}
+].forEach((item) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "text_delta",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: item.candidateIndex},
+    candidateStep: {id: item.stepId, status: "working"},
+    data: {text: item.text}
+  }}}
+}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    data: {conclusion: {
+      0: {candidate: {name: "基础 VPC 网络"}, summary: "VPC 本身免费，适合先建立网络容器"},
+      1: {candidate: {name: "VPC 含交换机"}, summary: "自动创建交换机，后续部署更顺滑"}
+    }}
+  }}}
+});
+all("[data-step-toggle]")[0].click();
+const results = all("[data-step-candidate-result]").map((item) => ({
+  candidate: item.getAttribute("data-step-candidate-result"),
+  text: text(item)
+}));
+const processes = all("[data-step-candidate-result-process]").map((item) => ({
+  candidate: item.getAttribute("data-step-candidate-result-process"),
+  open: item.open === true,
+  text: text(item)
+}));
+return {results, processes};
+"""
+    )
+
+    assert [item["candidate"] for item in output["results"]] == ["0", "1"]
+    assert "基础 VPC 网络" in output["results"][0]["text"]
+    assert "VPC 本身免费" in output["results"][0]["text"]
+    assert "VPC 含交换机" in output["results"][1]["text"]
+    assert "自动创建交换机" in output["results"][1]["text"]
+    assert [item["candidate"] for item in output["processes"]] == ["0", "1"]
+    assert output["processes"][0]["open"] is False
+    assert "模板生成" in output["processes"][0]["text"]
+    assert "成本估算" in output["processes"][0]["text"]
+    assert "生成 VPC 模板" in output["processes"][0]["text"]
+    assert "生成 VPC 与交换机模板" in output["processes"][1]["text"]
+
+
+def test_controller_completed_step_expansion_includes_collapsible_process() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+[
+  {eventType: "step_started", status: "working", data: {summary: "开始理解需求"}},
+  {eventType: "text_delta", status: "working", data: {text: "识别 VPC"}},
+  {eventType: "tool_result", status: "working", data: {toolName: "read_context", result: {status: "success"}}},
+  {eventType: "step_completed", status: "working", data: {conclusion: {
+    core_requirements: "VPC",
+    cloud_platform: "aliyun",
+    user_message_summary: "创建一个 VPC"
+  }}}
+].forEach((event) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    ...event,
+    step: {id: "intent_parsing"}
+  }}}
+}));
+all("[data-step-toggle]")[0].click();
+const step = all("[data-step-id]")[0];
+const process = all("[data-step-process]")[0];
+const processEvents = all("[data-step-process-event]").map((item) => ({
+  kind: item.getAttribute("data-step-process-event"),
+  text: text(item)
+}));
+return {
+  stepText: text(step),
+  processOpen: process.open === true,
+  processText: text(process),
+  processEvents
+};
+"""
+    )
+
+    assert "VPC" in output["stepText"]
+    assert "思考过程" in output["processText"]
+    assert output["processOpen"] is False
+    assert [event["kind"] for event in output["processEvents"]] == [
+        "step_started",
+        "text_delta",
+        "tool_result",
+        "step_completed",
+    ]
+    assert "识别 VPC" in output["processEvents"][1]["text"]
+
+
+def test_controller_summarizes_step_three_left_chat_by_candidate_latest_progress() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+[
+  {
+    index: 0,
+    name: "基础 VPC 网络",
+    summary: "使用 192.168.0.0/16 网段，作为后续网络资源的基础容器。"
+  },
+  {
+    index: 1,
+    name: "VPC 含可用区交换机",
+    summary: "创建 VPC 和可用区交换机，后续可直接部署 ECS。"
+  }
+].forEach((candidate) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: candidate.index},
+    data: {detail: {
+      candidateName: candidate.name,
+      candidateIndex: candidate.index,
+      summary: candidate.summary,
+      totalMonthlyCost: "¥0/月"
+    }}
+  }}}
+}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimating", label: "成本估算"},
+    data: {summary: "开始估算成本"}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "tool_result",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 0},
+    candidateStep: {id: "cost_estimating", label: "成本估算"},
+    data: {toolName: "GetTemplateEstimateCost", result: {status: "success"}}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_step_started",
+    status: "working",
+    step: {id: "evaluate_candidates"},
+    candidate: {index: 1},
+    candidateStep: {id: "template_validating", label: "模板校验"},
+    data: {summary: "校验模板参数"}
+  }}}
+});
+const stepText = text(all("[data-step-id]")[0]);
+const heads = all("[data-step-candidate-progress-head]").map((item) => text(item));
+const summaries = all("[data-step-candidate-progress]").map((item) => ({
+  index: item.getAttribute("data-step-candidate-progress"),
+  text: text(item)
+}));
+return {stepText, heads, summaries};
+"""
+    )
+
+    assert output["heads"] == ["方案 0基础 VPC 网络", "方案 1VPC 含可用区交换机"]
+    assert len(output["summaries"]) == 2
+    assert output["summaries"] == [
+        {"index": "0", "text": "方案 0基础 VPC 网络工具结果GetTemplateEstimateCost"},
+        {"index": "1", "text": "方案 1VPC 含可用区交换机模板校验校验模板参数"},
+    ]
+    assert "使用 192.168.0.0/16 网段" not in output["stepText"]
+    assert "创建 VPC 和可用区交换机" not in output["stepText"]
+
+
+def test_controller_renders_generic_pending_input_options_in_left_chat() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    input: {
+      kind: "ask_user_question",
+      inputId: "ask-1",
+      question: "请选择部署目标",
+      options: [
+        {id: "nginx", label: "Nginx 网站", description: "托管静态站点"},
+        {id: "api", label: "API 服务", description: "后端接口"}
+      ]
+    }
+  }}}
+});
+const cards = all("[data-pending-input-kind]");
+const options = all("[data-pending-input-option]").map((option) => ({
+  id: option.getAttribute("data-pending-input-option"),
+  text: text(option)
+}));
+all("[data-pending-input-option]")[1].click();
+const optionsAfter = all("[data-pending-input-option]").map((option) => ({
+  id: option.getAttribute("data-pending-input-option"),
+  pressed: option.getAttribute("aria-pressed"),
+  className: option.getAttribute("class")
+}));
+return {
+  cardCount: cards.length,
+  options,
+  optionsAfter,
+  pendingKind: debug.state().pendingInput.kind,
+  pendingPrompt: debug.state().pendingInput.prompt,
+  pendingOptionCount: debug.state().pendingInput.options.length,
+  selectedPendingInputOptionId: debug.state().selectedPendingInputOptionId,
+  composerValue: elementById("composer-input").value
+};
+"""
+    )
+
+    assert output == {
+        "cardCount": 1,
+        "options": [
+            {"id": "nginx", "text": "Nginx 网站托管静态站点"},
+            {"id": "api", "text": "API 服务后端接口"},
+        ],
+        "optionsAfter": [
+            {"id": "nginx", "pressed": "false", "className": "pending-input-option"},
+            {"id": "api", "pressed": "true", "className": "pending-input-option selected"},
+        ],
+        "pendingKind": "ask_user_question",
+        "pendingPrompt": "请选择部署目标",
+        "pendingOptionCount": 2,
+        "selectedPendingInputOptionId": "api",
+        "composerValue": "api",
+    }
+
+
+def test_controller_renders_pending_input_markdown_for_questions_and_candidate_selection() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "intent_parsing"},
+    input: {
+      kind: "ask_user_question",
+      question: "请选择 **部署目标**：\\n\\n- Nginx 网站\\n- API 服务\\n\\n查看 [帮助](https://example.com/docs)",
+      options: [
+        {id: "nginx", label: "Nginx 网站", description: "用于 **静态站点**"}
+      ]
+    }
+  }}}
+});
+const askCard = all("[data-pending-input-kind]")[0];
+const askMarkdown = all("[data-markdown-node]").map((node) => ({
+  kind: node.getAttribute("data-markdown-node"),
+  tag: node.tagName,
+  text: text(node),
+  href: node.getAttribute("href")
+}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    input: {
+      kind: "candidate_select",
+      question: "请选择要部署的方案：**方案 0** 或 **方案 1**",
+      options: [
+        {id: "0", label: "经济型方案", description: "适合 **低成本** 演示"}
+      ]
+    }
+  }}}
+});
+const candidateCard = all("[data-pending-input-kind]")[0];
+const candidateMarkdown = all("[data-markdown-node]").map((node) => ({
+  kind: node.getAttribute("data-markdown-node"),
+  tag: node.tagName,
+  text: text(node),
+  href: node.getAttribute("href")
+}));
+return {
+  askText: text(askCard),
+  askMarkdown,
+  candidateText: text(candidateCard),
+  candidateMarkdown
+};
+"""
+    )
+
+    assert "**部署目标**" not in output["askText"]
+    assert "查看 帮助" in output["askText"]
+    assert {"kind": "strong", "tag": "STRONG", "text": "部署目标", "href": None} in output["askMarkdown"]
+    assert {"kind": "li", "tag": "LI", "text": "Nginx 网站", "href": None} in output["askMarkdown"]
+    assert {"kind": "a", "tag": "A", "text": "帮助", "href": "https://example.com/docs"} in output["askMarkdown"]
+    assert "**方案 0**" not in output["candidateText"]
+    assert "方案 0" in output["candidateText"]
+    assert {"kind": "strong", "tag": "STRONG", "text": "方案 0", "href": None} in output["candidateMarkdown"]
+    assert {"kind": "strong", "tag": "STRONG", "text": "低成本", "href": None} in output["candidateMarkdown"]
+
+
+def test_controller_renders_inline_numbered_pending_input_as_ordered_list() -> None:
+    output = controller_harness(
+        """
+controller.init();
+const next = reducers.reducePipelinePayload(debug.state(), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "intent_parsing"},
+    input: {
+      kind: "ask_user_question",
+      question: "请补充以下信息： 1. 演示内容：**静态页面**、反向代理还是其他？ 2. 是否需要公网访问？ 3. 预算偏好？"
+    }
+  }}}
+});
+Object.assign(debug.state(), next);
+debug.render();
+const card = all("[data-pending-input-kind]")[0];
+const markdown = all("[data-markdown-node]").map((node) => ({
+  kind: node.getAttribute("data-markdown-node"),
+  tag: node.tagName,
+  text: text(node)
+}));
+return {cardText: text(card), markdown};
+"""
+    )
+
+    assert "1. 演示内容" not in output["cardText"]
+    assert {
+        "kind": "ol",
+        "tag": "OL",
+        "text": "演示内容：静态页面、反向代理还是其他？是否需要公网访问？预算偏好？",
+    } in output["markdown"]
+    assert {"kind": "li", "tag": "LI", "text": "演示内容：静态页面、反向代理还是其他？"} in output["markdown"]
+    assert {"kind": "li", "tag": "LI", "text": "是否需要公网访问？"} in output["markdown"]
+    assert {"kind": "li", "tag": "LI", "text": "预算偏好？"} in output["markdown"]
+    assert {"kind": "strong", "tag": "STRONG", "text": "静态页面"} in output["markdown"]
+
+
+def test_controller_ask_user_question_candidate_option_syncs_with_right_plan_card() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+[
+  {index: 0, name: "经济型演示方案", summary: "成本最低", price: "¥74/月"},
+  {index: 1, name: "均衡型演示方案", summary: "性能稳定", price: "¥291/月"}
+].forEach((candidate) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "confirm_and_select"},
+    candidate: {index: candidate.index},
+    data: {
+      detail: {
+        candidateName: candidate.name,
+        candidateIndex: candidate.index,
+        summary: candidate.summary,
+        totalMonthlyCost: candidate.price
+      }
+    }
+  }}}
+}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    input: {
+      kind: "ask_user_question",
+      question: "请选择要部署的方案",
+      options: [
+        {id: "use-economy", label: "选择经济型", candidate_index: 0},
+        {id: "use-balanced", label: "选择均衡型", candidate_index: 1}
+      ]
+    }
+  }}}
+});
+all("[data-pending-input-option]")
+  .find((option) => option.getAttribute("data-pending-input-option") === "use-balanced")
+  .click();
+const leftOptions = all("[data-pending-input-option]").map((option) => ({
+  id: option.getAttribute("data-pending-input-option"),
+  candidateChoice: option.getAttribute("data-candidate-choice"),
+  pressed: option.getAttribute("aria-pressed"),
+  className: option.getAttribute("class")
+}));
+const rightCards = all("[data-candidate-index]").map((card) => ({
+  index: card.getAttribute("data-candidate-index"),
+  pressed: card.getAttribute("aria-pressed"),
+  className: card.getAttribute("class")
+}));
+return {
+  leftOptions,
+  rightCards,
+  selectedCandidateIndex: debug.state().selectedCandidateIndex,
+  selectedPendingInputOptionId: debug.state().selectedPendingInputOptionId,
+  composerValue: elementById("composer-input").value
+};
+"""
+    )
+
+    assert output == {
+        "leftOptions": [
+            {
+                "id": "use-economy",
+                "candidateChoice": "0",
+                "pressed": "false",
+                "className": "pending-input-option",
+            },
+            {
+                "id": "use-balanced",
+                "candidateChoice": "1",
+                "pressed": "true",
+                "className": "pending-input-option selected",
+            },
+        ],
+        "rightCards": [
+            {"index": "0", "pressed": "false", "className": "plan-card"},
+            {"index": "1", "pressed": "true", "className": "plan-card selected recommended"},
+        ],
+        "selectedCandidateIndex": 1,
+        "selectedPendingInputOptionId": "use-balanced",
+        "composerValue": "use-balanced",
+    }
+
+
+def test_controller_renders_candidate_selection_pending_input_as_options() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "confirm_and_select"},
+    candidate: {index: 1},
+    data: {
+      detail: {
+        candidateName: "轻量应用服务器",
+        candidateIndex: 1,
+        summary: "开箱即用",
+        totalMonthlyCost: "¥0/月",
+        costItems: []
+      }
+    }
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    data: {
+      kind: "candidate_selection",
+      prompt: "请选择购买方案",
+      options: [{id: "1", label: "轻量应用服务器", summary: "开箱即用", totalMonthlyCost: "¥0/月"}]
+    }
+  }}}
+});
+const cards = all("[data-pending-input-kind]");
+const options = all("[data-pending-input-option]");
+const planCard = all("[data-candidate-index]")[0];
+const stepText = text(all("[data-step-id]").find((step) => step.getAttribute("data-step-id") === "confirm_and_select"));
+options[0].click();
+const selectedPlanText = text(all("[data-candidate-index]")[0]);
+return {
+  cardCount: cards.length,
+  optionCount: options.length,
+  stepText,
+  planText: selectedPlanText,
+  selectedCandidateIndex: debug.state().selectedCandidateIndex,
+  composerValue: elementById("composer-input").value
+};
+"""
+    )
+
+    assert output["cardCount"] == 1
+    assert output["optionCount"] == 1
+    assert "请选择购买方案" in output["stepText"]
+    assert "轻量应用服务器" in output["stepText"]
+    assert "开箱即用" in output["stepText"]
+    assert "¥0/月" in output["stepText"]
+    assert "思考过程" in output["stepText"]
+    assert output["planText"] == "已选方案 1轻量应用服务器开箱即用预估价格¥0/月"
+    assert output["selectedCandidateIndex"] == 1
+    assert output["composerValue"] == "选择方案1"
+
+
+def test_controller_step_four_selection_ui_syncs_with_right_plan_cards() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+[
+  {index: 0, name: "基础 VPC", summary: "成本最低", price: "¥0/月"},
+  {index: 1, name: "VPC 含交换机", summary: "部署更完整", price: "¥0/月"}
+].forEach((candidate) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "confirm_and_select"},
+    candidate: {index: candidate.index},
+    data: {
+      detail: {
+        candidateName: candidate.name,
+        candidateIndex: candidate.index,
+        summary: candidate.summary,
+        totalMonthlyCost: candidate.price
+      }
+    }
+  }}}
+}));
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    data: {
+      kind: "candidate_selection",
+      prompt: "请选择购买方案",
+      options: [
+        {id: "0", label: "基础 VPC", summary: "成本最低", totalMonthlyCost: "¥0/月"},
+        {id: "1", label: "VPC 含交换机", summary: "部署更完整", totalMonthlyCost: "¥0/月"}
+      ]
+    }
+  }}}
+});
+const choicesBefore = all("[data-candidate-choice]").map((choice) => ({
+  index: choice.getAttribute("data-candidate-choice"),
+  pressed: choice.getAttribute("aria-pressed"),
+  text: text(choice)
+}));
+all("[data-candidate-choice]")
+  .find((choice) => choice.getAttribute("data-candidate-choice") === "1")
+  .click();
+const choicesAfter = all("[data-candidate-choice]").map((choice) => ({
+  index: choice.getAttribute("data-candidate-choice"),
+  pressed: choice.getAttribute("aria-pressed"),
+  className: choice.getAttribute("class")
+}));
+const rightCards = all("[data-candidate-index]").map((card) => ({
+  index: card.getAttribute("data-candidate-index"),
+  pressed: card.getAttribute("aria-pressed"),
+  className: card.getAttribute("class")
+}));
+return {
+  choicesBefore,
+  choicesAfter,
+  rightCards,
+  selectedCandidateIndex: debug.state().selectedCandidateIndex,
+  composerValue: elementById("composer-input").value
+};
+"""
+    )
+
+    assert [choice["index"] for choice in output["choicesBefore"]] == ["0", "1"]
+    assert "基础 VPC" in output["choicesBefore"][0]["text"]
+    assert "VPC 含交换机" in output["choicesBefore"][1]["text"]
+    assert output["choicesAfter"] == [
+        {"index": "0", "pressed": "false", "className": "pending-input-option"},
+        {"index": "1", "pressed": "true", "className": "pending-input-option selected"},
+    ]
+    assert output["rightCards"] == [
+        {"index": "0", "pressed": "false", "className": "plan-card"},
+        {"index": "1", "pressed": "true", "className": "plan-card selected recommended"},
+    ]
+    assert output["selectedCandidateIndex"] == 1
+    assert output["composerValue"] == "选择方案1"
+
+
+def test_controller_step_four_waiting_input_keeps_thinking_process_available() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+[
+  {eventType: "step_started", data: {summary: "准备选择方案"}},
+  {eventType: "text_delta", data: {text: "比较方案偏好"}},
+  {eventType: "input_required", data: {
+    kind: "candidate_selection",
+    prompt: "请选择购买方案",
+    options: [{id: "0", label: "基础 VPC", summary: "成本最低"}]
+  }}
+].forEach((event) => applyPayload({
+  metadata: {iac_code: {pipeline: {
+    ...event,
+    status: event.eventType === "input_required" ? "input_required" : "working",
+    step: {id: "confirm_and_select"}
+  }}}
+}));
+const step = all("[data-step-id]").find((item) => item.getAttribute("data-step-id") === "confirm_and_select");
+const process = all("[data-step-process]")
+  .find((item) => item.getAttribute("data-step-process") === "confirm_and_select");
+return {
+  stepText: text(step),
+  processText: text(process),
+  processEvents: all("[data-step-process-event]").map((item) => item.getAttribute("data-step-process-event"))
+};
+"""
+    )
+
+    assert "请选择购买方案" in output["stepText"]
+    assert "基础 VPC" in output["stepText"]
+    assert "思考过程" in output["processText"]
+    assert output["processEvents"] == ["step_started", "text_delta", "input_required"]
+
+
+def test_controller_accepts_candidate_select_pending_input_alias() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "confirm_and_select"},
+    candidate: {index: 1},
+    data: {detail: {candidateName: "轻量应用服务器", candidateIndex: 1}}
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    data: {
+      kind: "candidate_select",
+      prompt: "请选择购买方案",
+      options: [{id: "1", label: "轻量应用服务器"}]
+    }
+  }}}
+});
+const cards = all("[data-pending-input-kind]");
+const options = all("[data-pending-input-option]");
+options[0].click();
+return {
+  cardCount: cards.length,
+  optionCount: options.length,
+  selectedCandidateIndex: debug.state().selectedCandidateIndex,
+  composerValue: elementById("composer-input").value
+};
+"""
+    )
+
+    assert output == {
+        "cardCount": 1,
+        "optionCount": 1,
+        "selectedCandidateIndex": 1,
+        "composerValue": "选择方案1",
+    }
+
+
+def test_controller_candidate_select_uses_candidate_index_when_option_id_is_not_numeric() -> None:
+    output = controller_harness(
+        """
+controller.init();
+function applyPayload(payload) {
+  const next = reducers.reducePipelinePayload(debug.state(), payload);
+  Object.assign(debug.state(), next);
+  debug.render();
+}
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "candidate_detail_shown",
+    status: "working",
+    step: {id: "confirm_and_select"},
+    candidate: {index: 1},
+    data: {
+      detail: {
+        candidateName: "均衡型演示方案",
+        candidateIndex: 1,
+        summary: "性能稳定",
+        totalMonthlyCost: "¥291/月"
+      }
+    }
+  }}}
+});
+applyPayload({
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    data: {
+      kind: "candidate_select",
+      prompt: "请选择购买方案",
+      options: [{id: "balanced-plan", label: "均衡型演示方案", candidate_index: 1}]
+    }
+  }}}
+});
+all("[data-pending-input-option]")[0].click();
+const option = all("[data-pending-input-option]")[0];
+const plan = all("[data-candidate-index]")[0];
+return {
+  optionId: option.getAttribute("data-pending-input-option"),
+  candidateChoice: option.getAttribute("data-candidate-choice"),
+  optionPressed: option.getAttribute("aria-pressed"),
+  optionClass: option.getAttribute("class"),
+  planPressed: plan.getAttribute("aria-pressed"),
+  planClass: plan.getAttribute("class"),
+  selectedCandidateIndex: debug.state().selectedCandidateIndex,
+  selectedPendingInputOptionId: debug.state().selectedPendingInputOptionId,
+  composerValue: elementById("composer-input").value
+};
+"""
+    )
+
+    assert output == {
+        "optionId": "balanced-plan",
+        "candidateChoice": "1",
+        "optionPressed": "true",
+        "optionClass": "pending-input-option selected",
+        "planPressed": "true",
+        "planClass": "plan-card selected recommended",
+        "selectedCandidateIndex": 1,
+        "selectedPendingInputOptionId": "balanced-plan",
+        "composerValue": "选择方案1",
+    }
+
+
+def test_controller_candidate_choices_show_in_left_chat_and_sync_with_right_cards() -> None:
+    output = controller_harness(
+        """
+controller.init();
+debug.loadDemoCandidates();
+const leftChoiceCountBefore = all("[data-pending-input-option]").length;
+all("[data-pending-input-option]")[1].click();
+const leftChoiceCountAfter = all("[data-pending-input-option]").length;
+const planCards = all("[data-candidate-index]").map((card) => ({
+  index: card.getAttribute("data-candidate-index"),
+  pressed: card.getAttribute("aria-pressed")
+}));
+return {
+  leftChoiceCountBefore,
+  leftChoiceCountAfter,
+  selectedCandidateIndex: debug.state().selectedCandidateIndex,
+  selectedPlan: planCards.find((card) => card.index === "1"),
+  prompt: reducers.promptForSelectedCandidate(debug.state())
+};
+"""
+    )
+
+    assert output == {
+        "leftChoiceCountBefore": 2,
+        "leftChoiceCountAfter": 2,
+        "selectedCandidateIndex": 1,
+        "selectedPlan": {
+            "index": "1",
+            "pressed": "true",
+        },
+        "prompt": "选择方案1",
+    }
+
+
+def test_controller_shows_normal_chat_notice_in_dialog_after_pipeline_handoff() -> None:
+    output = controller_harness(  # JS below reduces a pipeline_handoff_ready event, then re-renders
+        """
+controller.init();
+const next = reducers.reducePipelinePayload(debug.state(), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "pipeline_handoff_ready",
+    status: "completed",
+    contextId: "ctx-1",
+    taskId: "task-pipeline",
+    data: {action: "switch_to_normal", targetMode: "normal"}
+  }}}
+});
+Object.assign(debug.state(), next);
+debug.render();
+const messages = all("[data-normal-handoff-message]").map((item) => text(item));
+return {
+  messages,
+  composerNoticeHidden: elementById("normal-handoff-notice").hidden,
+  activeTaskId: debug.state().activeTaskId,
+  normalHandoffReady: debug.state().normalHandoffReady
+};
+"""
+    )
+
+    assert output == {  # one handoff message element is rendered; the notice element is hidden
+        "messages": ["部署流程已完成，已进入普通会话。可以继续追问资源、运维或变更需求。"],
+        "composerNoticeHidden": True,
+        "activeTaskId": "",
+        "normalHandoffReady": True,
+    }
+
+
+def test_controller_renders_debug_session_info_for_issue_reports() -> None:
+    output = controller_harness(  # JS below seeds session state, renders, and reads the debug fields
+        """
+controller.init();
+Object.assign(debug.state(), {
+  contextId: "ctx-1",
+  pipelineTaskId: "task-pipeline",
+  activeTaskId: "task-active",
+  lastSequence: 42,
+  status: "working",
+  normalHandoffReady: false
+});
+debug.render();
+const fields = all("[data-debug-session-field]").map((field) => ({
+  key: field.getAttribute("data-debug-session-field"),
+  text: text(field)
+}));
+return {fields};
+"""
+    )
+
+    assert output["fields"] == [  # order matters; each text is the label directly followed by the value
+        {"key": "serverUrl", "text": "Server URLhttp://127.0.0.1:41299"},
+        {"key": "cwd", "text": "CWD/workspace"},
+        {"key": "contextId", "text": "Context IDctx-1"},
+        {"key": "pipelineTaskId", "text": "Pipeline Tasktask-pipeline"},
+        {"key": "activeTaskId", "text": "Active Tasktask-active"},
+        {"key": "lastSequence", "text": "Last Sequence42"},
+        {"key": "status", "text": "Statusworking"},
+        {"key": "handoff", "text": "Normal Handoff否"},
+        {"key": "logs", "text": "Logs默认 ~/.iac-code/logs，或 IAC_CODE_CONFIG_DIR/logs"},
+    ]
+
+
+def test_controller_plan_card_selection_updates_left_candidate_choice() -> None:
+    output = controller_harness(  # JS below clicks the 2nd candidate card, then reads both selectors
+        """
+controller.init();
+debug.loadDemoCandidates();
+all("[data-candidate-index]")[1].click();
+return {
+  leftChoices: all("[data-candidate-choice]").map((choice) => ({
+    index: choice.getAttribute("data-candidate-choice"),
+    pressed: choice.getAttribute("aria-pressed")
+  })),
+  rightCards: all("[data-candidate-index]").map((card) => ({
+    index: card.getAttribute("data-candidate-index"),
+    pressed: card.getAttribute("aria-pressed")
+  })),
+  prompt: reducers.promptForSelectedCandidate(debug.state())
+};
+"""
+    )
+
+    assert output == {  # both lists report index "1" as the only pressed entry
+        "leftChoices": [
+            {"index": "0", "pressed": "false"},
+            {"index": "1", "pressed": "true"},
+        ],
+        "rightCards": [
+            {"index": "0", "pressed": "false"},
+            {"index": "1", "pressed": "true"},
+        ],
+        "prompt": "选择方案1",
+    }
+
+
+def test_controller_reports_sse_error_event_as_failed_send() -> None:
+    output = controller_harness(  # JS below stubs fetch with an SSE body carrying {"ok": false, "error": ...}
+        """
+controller.init();
+elementById("composer-input").value = "继续部署";
+global.fetch = async () => ({
+  ok: true,
+  status: 200,
+  body: null,
+  text: async () => 'data: {"ok": false, "error": "upstream timed out"}\\n\\n'
+});
+await controller.sendComposerMessage();
+return {
+  alertText: elementById("status-alert").textContent,
+  alertKind: elementById("status-alert").getAttribute("data-kind"),
+  debug: debugText()
+};
+"""
+    )
+
+    assert output["alertText"] == "消息发送失败：upstream timed out"  # alert carries the upstream error string
+    assert output["alertKind"] == "error"
+    assert "upstream timed out" in output["debug"]
+
+
+def test_controller_yields_between_sse_blocks_so_streaming_can_paint_incrementally() -> None:
+    output = controller_harness(  # JS below counts requestAnimationFrame calls while one read yields two SSE blocks
+        """
+controller.init();
+debug.state().progressUi.variant = "a";
+elementById("composer-input").value = "创建 VPC";
+let paintCount = 0;
+global.requestAnimationFrame = (callback) => {
+  paintCount += 1;
+  return setTimeout(() => callback(Date.now()), 0);
+};
+global.cancelAnimationFrame = (id) => clearTimeout(id);
+const encoder = new TextEncoder();
+let readCount = 0;
+global.fetch = async () => ({
+  ok: true,
+  status: 200,
+  body: {
+    getReader() {
+      return {
+        async read() {
+          readCount += 1;
+          if (readCount === 1) {
+            return {
+              done: false,
+              value: encoder.encode([
+                'data: {"metadata":{"iac_code":{"pipeline":' +
+                  '{"eventType":"step_started","status":"working","step":{"id":"intent_parsing"},' +
+                  '"data":{"summary":"开始理解需求"}}}}}',
+                'data: {"metadata":{"iac_code":{"pipeline":' +
+                  '{"eventType":"text_delta","status":"working","step":{"id":"intent_parsing"},' +
+                  '"data":{"text":"正在分析预算"}}}}}'
+              ].join("\\n\\n") + "\\n\\n")
+            };
+          }
+          return {done: true};
+        },
+        async cancel() {}
+      };
+    }
+  }
+});
+await controller.sendComposerMessage();
+return {
+  paintCount,
+  cardKinds: all("[data-step-event-kind]").map((item) => item.getAttribute("data-step-event-kind"))
+};
+"""
+    )
+
+    assert output["paintCount"] >= 2  # the two SSE blocks arrived in a single read() chunk
+    assert output["cardKinds"] == ["step_started", "text_delta"]
+
+
+def test_reducer_deep_clones_existing_permission_and_diagnostics() -> None:
+    output = reducer_harness(  # JS below mutates the input state after reducing and inspects the result
+        """
+const state = reducers.createInitialState({});
+state.permission = {decision: {allowed: true}};
+state.diagnostics = {
+  requests: [{meta: {id: "req-1"}}],
+  sse: [{meta: {id: "sse-1"}}],
+  snapshots: [{meta: {id: "snap-1"}}]
+};
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "step_completed",
+    step: {id: "architecture_planning", status: "completed"}
+  }}}
+});
+state.permission.decision.allowed = false;
+state.diagnostics.requests[0].meta.id = "mutated";
+state.diagnostics.sse[0].meta.id = "mutated";
+state.diagnostics.snapshots[0].meta.id = "mutated";
+return {
+  permissionAllowed: next.permission.decision.allowed,
+  requestId: next.diagnostics.requests[0].meta.id,
+  sseId: next.diagnostics.sse[0].meta.id,
+  snapshotId: next.diagnostics.snapshots[0].meta.id
+};
+"""
+    )
+
+    assert output == {  # the reduced state must not see the later mutations
+        "permissionAllowed": True,
+        "requestId": "req-1",
+        "sseId": "sse-1",
+        "snapshotId": "snap-1",
+    }
+
+
+def test_candidate_from_display_item_deep_clones_cost_item_nested_fields() -> None:
+    output = reducer_harness(  # JS below mutates the source item after conversion
+        """
+const source = {
+  candidateName: "方案",
+  candidateIndex: 0,
+  costItems: [{name: "ecs", detail: {region: "cn-hangzhou"}}]
+};
+const candidate = reducers.candidateFromDisplayItem(source);
+source.costItems[0].detail.region = "mutated";
+return {
+  name: candidate.name,
+  region: candidate.costItems[0].detail.region
+};
+"""
+    )
+
+    assert output == {  # nested costItems detail is not shared with the source
+        "name": "方案",
+        "region": "cn-hangzhou",
+    }
+
+
+def test_reducer_sets_and_clears_realtime_pending_input() -> None:
+    output = reducer_harness(  # JS below sends input_required followed by input_received
+        """
+const state = reducers.createInitialState({});
+const waiting = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    taskId: "task-1",
+    contextId: "ctx-1",
+    input: {
+      inputId: "ask-1",
+      kind: "ask_user_question",
+      question: "请选择部署目标",
+      options: [{id: "nginx", label: "Nginx 网站"}]
+    }
+  }}}
+});
+const received = reducers.reducePipelinePayload(waiting, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_received",
+    status: "working",
+    taskId: "task-1",
+    contextId: "ctx-1"
+  }}}
+});
+return {
+  prompt: waiting.pendingInput.prompt,
+  optionLabel: waiting.pendingInput.options[0].label,
+  candidateCount: waiting.candidates.length,
+  originalPending: state.pendingInput,
+  waitingStatus: waiting.status,
+  cleared: received.pendingInput === null
+};
+"""
+    )
+
+    assert output == {  # envelope status "input_required" is reported as state status "waiting_input"
+        "prompt": "请选择部署目标",
+        "optionLabel": "Nginx 网站",
+        "candidateCount": 0,
+        "originalPending": None,
+        "waitingStatus": "waiting_input",
+        "cleared": True,
+    }
+
+
+def test_reducer_does_not_turn_pending_input_data_options_into_candidates() -> None:
+    output = reducer_harness(  # JS below puts question/options under data, with no kind field
+        """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    data: {
+      question: "请选择部署目标",
+      options: [{id: "nginx", label: "Nginx 网站"}]
+    }
+  }}}
+});
+return {
+  candidateCount: next.candidates.length,
+  prompt: next.pendingInput.prompt,
+  optionLabel: next.pendingInput.options[0].label
+};
+"""
+    )
+
+    assert output == {  # the options feed pendingInput only, not candidates
+        "candidateCount": 0,
+        "prompt": "请选择部署目标",
+        "optionLabel": "Nginx 网站",
+    }
+
+
+def test_reducer_collects_candidate_selection_options_from_pending_input() -> None:
+    output = reducer_harness(  # JS below sends data.kind "candidate_selection" with one option
+        """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    step: {id: "confirm_and_select"},
+    data: {
+      kind: "candidate_selection",
+      prompt: "请选择购买方案",
+      options: [{
+        id: "1",
+        label: "标准 VPC",
+        description: "在 cn-hangzhou 创建一个标准 VPC，使用默认网段 172.16.0.0/12。",
+        price: "¥0/月"
+      }]
+    }
+  }}}
+});
+return {
+  candidateCount: next.candidates.length,
+  name: next.candidates[0] && next.candidates[0].name,
+  index: next.candidates[0] && next.candidates[0].candidateIndex,
+  summary: next.candidates[0] && next.candidates[0].summary,
+  cost: next.candidates[0] && next.candidates[0].totalMonthlyCost,
+  pendingPrompt: next.pendingInput.prompt
+};
+"""
+    )
+
+    assert output == {  # expected mapping: label->name, id "1"->index 1, description->summary, price->cost
+        "candidateCount": 1,
+        "name": "标准 VPC",
+        "index": 1,
+        "summary": "在 cn-hangzhou 创建一个标准 VPC，使用默认网段 172.16.0.0/12。",
+        "cost": "¥0/月",
+        "pendingPrompt": "请选择购买方案",
+    }
+
+
+def test_reducer_deep_clones_realtime_pending_input_payload() -> None:
+    output = reducer_harness(  # JS below mutates the input object after it has been reduced
+        """
+const input = {
+  question: "请选择部署目标",
+  extra: {source: "planner"},
+  options: [{id: "nginx", label: "Nginx 网站", meta: {score: 1}}]
+};
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  metadata: {iac_code: {pipeline: {
+    eventType: "input_required",
+    status: "input_required",
+    taskId: "task-1",
+    contextId: "ctx-1",
+    input
+  }}}
+});
+input.extra.source = "mutated";
+input.options[0].meta.score = 99;
+return {
+  prompt: next.pendingInput.prompt,
+  source: next.pendingInput.extra.source,
+  score: next.pendingInput.options[0].meta.score
+};
+"""
+    )
+
+    assert output == {  # extra fields and nested option data keep their pre-mutation values
+        "prompt": "请选择部署目标",
+        "source": "planner",
+        "score": 1,
+    }
+
+
+def test_reducer_handles_snake_case_input_required_envelope() -> None:
+    output = reducer_harness(  # JS below uses event_type/task_id/context_id/pending_input keys
+        """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  metadata: {iac_code: {pipeline: {
+    event_type: "input_required",
+    status: "input_required",
+    task_id: "task-1",
+    context_id: "ctx-1",
+    pending_input: {
+      question: "请选择部署目标",
+      options: [{id: "nginx", label: "Nginx 网站"}]
+    }
+  }}}
+});
+return {
+  taskId: next.pipelineTaskId,
+  contextId: next.contextId,
+  status: next.status,
+  prompt: next.pendingInput && next.pendingInput.prompt
+};
+"""
+    )
+
+    assert output == {  # snake_case keys are expected to land on pipelineTaskId/contextId/pendingInput
+        "taskId": "task-1",
+        "contextId": "ctx-1",
+        "status": "waiting_input",
+        "prompt": "请选择部署目标",
+    }
+
+
+def test_reducer_extracts_realtime_envelope_from_a2a_status_update_wrapper() -> None:
+    output = reducer_harness(  # JS below nests the envelope under result.statusUpdate.metadata
+        """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  result: {
+    statusUpdate: {
+      metadata: {iac_code: {pipeline: {
+        eventType: "input_required",
+        status: "input_required",
+        taskId: "task-1",
+        contextId: "ctx-1",
+        input: {
+          question: "请选择部署目标",
+          options: [{id: "nginx", label: "Nginx 网站"}]
+        }
+      }}}
+    }
+  }
+});
+return {
+  taskId: next.pipelineTaskId,
+  contextId: next.contextId,
+  status: next.status,
+  prompt: next.pendingInput && next.pendingInput.prompt
+};
+"""
+    )
+
+    assert output == {  # the wrapped envelope is expected to be applied like an unwrapped one
+        "taskId": "task-1",
+        "contextId": "ctx-1",
+        "status": "waiting_input",
+        "prompt": "请选择部署目标",
+    }
+
+
+def test_reducer_restores_pipeline_state_snapshot_and_applies_events() -> None:
+    output = reducer_harness(  # JS below supplies a snapshot (lastSequence 7) plus one event (sequence 8)
+        """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  snapshot: {
+    taskId: "task-1",
+    contextId: "ctx-1",
+    lastSequence: 7,
+    status: "working",
+    steps: [{id: "architecture_planning", status: "completed"}]
+  },
+  events: [{
+    eventType: "step_completed",
+    status: "working",
+    taskId: "task-1",
+    contextId: "ctx-1",
+    sequence: 8,
+    step: {id: "evaluate_candidates", status: "completed"}
+  }]
+});
+return {
+  taskId: next.pipelineTaskId,
+  contextId: next.contextId,
+  lastSequence: next.lastSequence,
+  architectureStatus: next.steps.architecture_planning.status,
+  evaluateStatus: next.steps.evaluate_candidates.status,
+  evaluateEvents: next.steps.evaluate_candidates.events.length
+};
+"""
+    )
+
+    assert output == {  # lastSequence advances to the event's sequence
+        "taskId": "task-1",
+        "contextId": "ctx-1",
+        "lastSequence": 8,
+        "architectureStatus": "completed",
+        "evaluateStatus": "completed",
+        "evaluateEvents": 1,
+    }
+
+
+def test_reducer_does_not_roll_back_last_sequence_from_replay_event() -> None:
+    output = reducer_harness(  # JS below: snapshot last_sequence is the string "10", replay event is sequence 8
+        """
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), {
+  snapshot: {
+    task_id: "task-1",
+    context_id: "ctx-1",
+    last_sequence: "10",
+    status: "working"
+  },
+  events: [{
+    event_type: "step_completed",
+    sequence: 8,
+    step: {id: "evaluate_candidates", status: "completed"}
+  }]
+});
+return {
+  lastSequence: next.lastSequence,
+  evaluateEvents: next.steps.evaluate_candidates.events.length
+};
+"""
+    )
+
+    assert output == {  # stays at numeric 10, yet the older event is still recorded on its step
+        "lastSequence": 10,
+        "evaluateEvents": 1,
+    }
+
+
+def test_reducer_snapshot_pending_input_null_clears_stale_pending_input() -> None:
+    output = reducer_harness(  # JS below seeds a stale pendingInput, then applies a snapshot with null
+        """
+const state = reducers.createInitialState({});
+state.pendingInput = {prompt: "旧问题", options: [{id: "old", label: "旧选项"}]};
+const next = reducers.reducePipelinePayload(state, {
+  snapshot: {status: "working", pendingInput: null}
+});
+return {
+  originalPrompt: state.pendingInput.prompt,
+  nextPending: next.pendingInput
+};
+"""
+    )
+
+    assert output == {  # cleared on the result; the input state keeps its value
+        "originalPrompt": "旧问题",
+        "nextPending": None,
+    }
+
+
+def test_reducer_snapshot_normal_handoff_switches_to_normal_mode() -> None:
+    output = reducer_harness(  # JS below applies a snapshot carrying normalHandoff
+        """
+const state = reducers.createInitialState({});
+state.activeTaskId = "pipeline-task";
+const next = reducers.reducePipelinePayload(state, {
+  snapshot: {
+    status: "completed",
+    normalHandoff: {action: "switch_to_normal", targetMode: "normal"}
+  }
+});
+return {
+  normalHandoffReady: next.normalHandoffReady,
+  activeTaskId: next.activeTaskId,
+  status: next.status,
+  originalActiveTaskId: state.activeTaskId
+};
+"""
+    )
+
+    assert output == {  # activeTaskId is emptied on the result only
+        "normalHandoffReady": True,
+        "activeTaskId": "",
+        "status": "completed",
+        "originalActiveTaskId": "pipeline-task",
+    }
+
+
+def test_reducer_snapshot_snake_case_normal_handoff_switches_to_normal_mode() -> None:
+    output = reducer_harness(  # JS below applies a snapshot carrying normal_handoff/target_mode
+        """
+const state = reducers.createInitialState({});
+state.activeTaskId = "pipeline-task";
+const next = reducers.reducePipelinePayload(state, {
+  snapshot: {
+    status: "completed",
+    normal_handoff: {action: "switch_to_normal", target_mode: "normal"}
+  }
+});
+return {
+  normalHandoffReady: next.normalHandoffReady,
+  activeTaskId: next.activeTaskId,
+  status: next.status,
+  originalActiveTaskId: state.activeTaskId
+};
+"""
+    )
+
+    assert output == {  # activeTaskId is emptied on the result only
+        "normalHandoffReady": True,
+        "activeTaskId": "",
+        "status": "completed",
+        "originalActiveTaskId": "pipeline-task",
+    }
+
+
+def test_reducer_attaches_pipeline_scoped_events_to_current_step() -> None:
+    output = reducer_harness(  # JS below reduces five events; the middle three have scope "pipeline", no step
+        """
+let state = reducers.createInitialState({});
+[
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "step_started",
+      status: "working",
+      step: {id: "deploying"},
+      data: {summary: "开始部署"}
+    }}}
+  },
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "text_delta",
+      status: "working",
+      scope: "pipeline",
+      data: {text: "开始部署流程"}
+    }}}
+  },
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "permission_requested",
+      status: "working",
+      scope: "pipeline",
+      data: {toolName: "ros_stack", reason: "创建资源栈"}
+    }}}
+  },
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "tool_result",
+      status: "working",
+      scope: "pipeline",
+      data: {toolName: "ros_stack", result: {stackId: "stack-1", stackStatus: "CREATE_COMPLETE"}}
+    }}}
+  },
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "step_completed",
+      status: "completed",
+      step: {id: "deploying"},
+      data: {conclusion: {summary: "部署完成"}}
+    }}}
+  }
+].forEach((payload) => {
+  state = reducers.reducePipelinePayload(state, payload);
+});
+return {
+  currentStepId: state.currentStepId,
+  deployingEvents: state.steps.deploying.events.map((event) => event.eventType)
+};
+"""
+    )
+
+    assert output == {  # all five land on the "deploying" step, in arrival order
+        "currentStepId": "deploying",
+        "deployingEvents": ["step_started", "text_delta", "permission_requested", "tool_result", "step_completed"],
+    }
+
+
+def test_reducer_does_not_attach_pipeline_scoped_events_to_completed_step() -> None:
+    output = reducer_harness(  # JS below sends a pipeline-scoped text_delta after step_completed
+        """
+let state = reducers.createInitialState({});
+[
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "step_started",
+      status: "working",
+      step: {id: "deploying"},
+      data: {summary: "开始部署"}
+    }}}
+  },
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "step_completed",
+      status: "completed",
+      step: {id: "deploying"},
+      data: {conclusion: {summary: "部署完成"}}
+    }}}
+  },
+  {
+    metadata: {iac_code: {pipeline: {
+      eventType: "text_delta",
+      status: "completed",
+      scope: "pipeline",
+      data: {text: "流程结束后的普通消息"}
+    }}}
+  }
+].forEach((payload) => {
+  state = reducers.reducePipelinePayload(state, payload);
+});
+return {
+  currentStepId: state.currentStepId,
+  deployingEvents: state.steps.deploying.events.map((event) => event.eventType || event.event_type)
+};
+"""
+    )
+
+    assert output == {  # the late text_delta is absent from the step's events
+        "currentStepId": "deploying",
+        "deployingEvents": ["step_started", "step_completed"],
+    }
+
+
+def test_reducer_applies_raw_snapshot_like_payload_with_snake_case_aliases() -> None:
+    output = reducer_harness(  # JS below passes a flat payload (no snapshot/metadata wrapper), snake_case keys
+        """
+const state = reducers.createInitialState({});
+state.activeTaskId = "pipeline-task";
+state.pendingInput = {prompt: "旧问题", options: [{id: "old", label: "旧选项"}]};
+const next = reducers.reducePipelinePayload(state, {
+  status: "input_required",
+  task_id: "task-1",
+  context_id: "ctx-1",
+  last_sequence: "12",
+  pending_input: {
+    question: "请选择部署目标",
+    options: [{id: "nginx", label: "Nginx 网站"}]
+  },
+  normal_handoff: {action: "switch_to_normal", target_mode: "normal"}
+});
+return {
+  status: next.status,
+  taskId: next.pipelineTaskId,
+  contextId: next.contextId,
+  lastSequence: next.lastSequence,
+  prompt: next.pendingInput && next.pendingInput.prompt,
+  activeTaskId: next.activeTaskId,
+  normalHandoffReady: next.normalHandoffReady,
+  originalPrompt: state.pendingInput.prompt
+};
+"""
+    )
+
+    assert output == {  # last_sequence "12" is expected as the number 12; activeTaskId is emptied
+        "status": "waiting_input",
+        "taskId": "task-1",
+        "contextId": "ctx-1",
+        "lastSequence": 12,
+        "prompt": "请选择部署目标",
+        "activeTaskId": "",
+        "normalHandoffReady": True,
+        "originalPrompt": "旧问题",
+    }
+
+
+def test_reducer_does_not_retain_mutable_candidate_payload_references() -> None:
+    output = reducer_harness(  # JS below mutates the payload and a shared costItems array after reducing
+        """
+const costItems = [{name: "ecs"}];
+const payload = {snapshot: {display: {candidateDetails: [{
+  candidateName: "方案",
+  candidateIndex: 0,
+  costItems
+}]}}};
+const next = reducers.reducePipelinePayload(reducers.createInitialState({}), payload);
+payload.snapshot.display.candidateDetails[0].candidateName = "被污染";
+costItems[0].name = "mutated";
+return {
+  name: next.candidates[0].name,
+  costItemName: next.candidates[0].costItems[0].name
+};
+"""
+    )
+
+    assert output == {  # the stored candidate keeps the pre-mutation values
+        "name": "方案",
+        "costItemName": "ecs",
+    }
+
+
+def test_upsert_candidate_does_not_mutate_original_state() -> None:
+    output = reducer_harness(  # JS below upserts over an existing candidate with the same candidateIndex
+        """
+const state = reducers.createInitialState({});
+state.candidates = [{name: "旧方案", candidateIndex: 0, costItems: []}];
+const next = reducers.upsertCandidate(state, {
+  name: "新方案",
+  candidateIndex: 0,
+  totalMonthlyCost: "CNY 80",
+  costItems: [{name: "ecs"}]
+});
+return {
+  sameState: next === state,
+  sameCandidates: next.candidates === state.candidates,
+  originalName: state.candidates[0].name,
+  originalCost: state.candidates[0].totalMonthlyCost || "",
+  nextName: next.candidates[0].name,
+  nextCost: next.candidates[0].totalMonthlyCost,
+  nextCostItem: next.candidates[0].costItems[0].name
+};
+"""
+    )
+
+    assert output == {  # new state and array objects; the original candidate is unchanged
+        "sameState": False,
+        "sameCandidates": False,
+        "originalName": "旧方案",
+        "originalCost": "",
+        "nextName": "新方案",
+        "nextCost": "CNY 80",
+        "nextCostItem": "ecs",
+    }
+
+
+def test_upsert_candidate_deduplicates_numeric_string_candidate_index() -> None:
+    output = reducer_harness(  # JS below upserts candidateIndex "1" (string) over existing index 1 (number)
+        """
+const state = reducers.createInitialState({});
+state.candidates = [{name: "旧方案", candidateIndex: 1, costItems: []}];
+const next = reducers.upsertCandidate(state, {
+  name: "新方案",
+  candidateIndex: "1",
+  totalMonthlyCost: "¥0/月"
+});
+return {
+  count: next.candidates.length,
+  index: next.candidates[0].candidateIndex,
+  name: next.candidates[0].name,
+  originalName: state.candidates[0].name
+};
+"""
+    )
+
+    assert output == {  # a single entry remains and its index is reported as the number 1
+        "count": 1,
+        "index": 1,
+        "name": "新方案",
+        "originalName": "旧方案",
+    }
+
+
+def test_upsert_candidate_merges_indexed_detail_into_same_name_placeholder() -> None:
+    output = reducer_harness(  # JS below upserts an indexed candidate over a same-name entry with index null
+        """
+const state = reducers.createInitialState({});
+state.candidates = [{
+  name: "标准 VPC 网络",
+  candidateIndex: null,
+  summary: "",
+  totalMonthlyCost: "",
+  costItems: []
+}];
+const next = reducers.upsertCandidate(state, {
+  name: "标准 VPC 网络",
+  candidateIndex: 0,
+  summary: "仅创建 VPC，作为后续子网和云资源的网络容器。",
+  totalMonthlyCost: "¥33.89/月",
+  costItems: [{name: "VPC", monthly_cost: "免费"}]
+});
+const candidate = next.candidates.find((item) => item.candidateIndex === 0) || next.candidates[0];
+return {
+  count: next.candidates.length,
+  index: candidate.candidateIndex,
+  name: candidate.name,
+  summary: candidate.summary,
+  cost: candidate.totalMonthlyCost,
+  costItem: candidate.costItems[0] && candidate.costItems[0].name
+};
+"""
+    )
+
+    assert output == {  # one merged entry carrying the new index and details
+        "count": 1,
+        "index": 0,
+        "name": "标准 VPC 网络",
+        "summary": "仅创建 VPC，作为后续子网和云资源的网络容器。",
+        "cost": "¥33.89/月",
+        "costItem": "VPC",
+    }
+
+
+def test_upsert_candidate_does_not_overwrite_existing_detail_with_empty_fields() -> None:
+    output = reducer_harness(  # JS below upserts empty summary/cost/costItems over a populated candidate
+        """
+const state = reducers.createInitialState({});
+state.candidates = [{
+  name: "VPC 含可用区交换机",
+  candidateIndex: 1,
+  summary: "创建 VPC 及一个可用区交换机，开箱即用。",
+  totalMonthlyCost: "¥0/月",
+  costItems: [{name: "VPC", monthly_cost: "免费"}]
+}];
+const next = reducers.upsertCandidate(state, {
+  name: "VPC 含可用区交换机",
+  candidateIndex: 1,
+  summary: "",
+  totalMonthlyCost: "",
+  costItems: []
+});
+return {
+  count: next.candidates.length,
+  summary: next.candidates[0].summary,
+  cost: next.candidates[0].totalMonthlyCost,
+  costItemCount: next.candidates[0].costItems.length
+};
+"""
+    )
+
+    assert output == {  # the existing non-empty values survive the upsert
+        "count": 1,
+        "summary": "创建 VPC 及一个可用区交换机，开箱即用。",
+        "cost": "¥0/月",
+        "costItemCount": 1,
+    }
+
+
+def test_extract_pipeline_envelope_handles_snapshot_metadata_wrapper() -> None:
+    output = reducer_harness(  # JS below wraps the envelope as snapshot.metadata.iac_code.pipeline
+        """
+const envelope = reducers.extractPipelineEnvelope({
+  snapshot: {
+    metadata: {iac_code: {pipeline: {
+      eventType: "step_completed",
+      taskId: "task-1",
+      contextId: "ctx-1",
+      step: {id: "architecture_planning"}
+    }}}
+  }
+});
+return {
+  taskId: envelope.taskId,
+  contextId: envelope.contextId,
+  stepId: envelope.step.id
+};
+"""
+    )
+
+    assert output == {  # the inner pipeline object's fields are returned
+        "taskId": "task-1",
+        "contextId": "ctx-1",
+        "stepId": "architecture_planning",
+    }
+
+
+def test_reducer_clears_active_task_on_normal_handoff() -> None:
+    output = reducer_harness(  # JS below calls createInitialState() with no argument, then reduces a handoff
+        """
+const state = reducers.createInitialState();
+state.pipelineTaskId = "pipeline-task";
+state.activeTaskId = "pipeline-task";
+const next = reducers.reducePipelinePayload(state, {
+  metadata: {iac_code: {pipeline: {
+    eventType: "pipeline_handoff_ready",
+    taskId: "pipeline-task",
+    contextId: "ctx-1",
+    status: "completed",
+    data: {action: "switch_to_normal", targetMode: "normal"}
+  }}}
+});
+return {
+  normalHandoffReady: next.normalHandoffReady,
+  activeTaskId: next.activeTaskId,
+  contextId: next.contextId
+};
+"""
+    )
+
+    assert output == {  # contextId matches the event; activeTaskId is emptied
+        "normalHandoffReady": True,
+        "activeTaskId": "",
+        "contextId": "ctx-1",
+    }
diff --git a/tests/a2a/test_selling_console_script.py b/tests/a2a/test_selling_console_script.py
new file mode 100644
index 00000000..9c160a4a
--- /dev/null
+++ b/tests/a2a/test_selling_console_script.py
@@ -0,0 +1,1054 @@
+from __future__ import annotations
+
+import html as html_lib
+import importlib.util
+import json
+import os
+import shutil
+import socket
+import subprocess
+import sys
+import threading
+from contextlib import contextmanager
+from http.client import RemoteDisconnected
+from http.server import BaseHTTPRequestHandler, ThreadingHTTPServer
+from pathlib import Path
+from typing import Any
+from urllib.error import HTTPError
+from urllib.parse import urlencode, urlparse
+from urllib.request import Request, urlopen
+
+import pytest
+
+SCRIPT_PATH = Path(__file__).resolve().parents[2] / "scripts" / "a2a" / "selling_console.py"
+SCRIPTS_README_PATH = Path(__file__).resolve().parents[2] / "scripts" / "README.md"
+NODE_RELATIVE_PATH = Path(".cache/codex-runtimes/codex-primary-runtime/dependencies/node/bin/node")
+RECOVERABLE_JSONRPC_ERROR = {  # canned JSON-RPC 2.0 error response used as a fixture
+    "jsonrpc": "2.0",
+    "id": "1",
+    "error": {
+        "code": -32602,  # "Invalid params" in the JSON-RPC 2.0 error table
+        "message": "Pipeline already running.",
+        "data": {
+            "recoverableTaskId": "task-owner",
+            "contextId": "ctx-1",
+            "sidecarStatus": "running",
+        },
+    },
+}
+
+
+def bundled_node_candidates() -> list[Path]:  # ordered candidate node paths; existence is not checked here
+    override = os.environ.get("IAC_CODE_TEST_NODE")
+    if override:  # an explicit override is returned as the only candidate
+        return [Path(override).expanduser()]
+    candidates = [Path.home() / NODE_RELATIVE_PATH]
+    home_env = os.environ.get("HOME")
+    if home_env:  # $HOME is tried as well; it may duplicate Path.home()
+        candidates.append(Path(home_env).expanduser() / NODE_RELATIVE_PATH)
+    candidates.extend(parent / NODE_RELATIVE_PATH for parent in SCRIPT_PATH.parents)  # every script ancestor
+    return candidates
+
+
+def node_command() -> list[str]:  # argv prefix for running node; calls pytest.skip when none is found
+    node = shutil.which("node")
+    if node:  # a node on PATH wins over the bundled fallbacks
+        return [node]
+    for fallback in bundled_node_candidates():
+        if fallback.exists():  # the first existing candidate is used
+            return [str(fallback)]
+    pytest.skip("node is not installed")
+
+
+def test_scripts_readme_mentions_selling_console() -> None:  # guards the scripts/README.md entry
+    readme = SCRIPTS_README_PATH.read_text(encoding="utf-8")
+
+    assert "a2a/selling_console.py" in readme
+    assert "Selling pipeline console" in readme
+
+
+def load_module():  # imports the script at SCRIPT_PATH by file path; every call re-executes it
+    spec = importlib.util.spec_from_file_location("selling_console", SCRIPT_PATH)
+    assert spec is not None
+    module = importlib.util.module_from_spec(spec)
+    assert spec.loader is not None
+    sys.modules[spec.name] = module  # registered before exec_module runs the module body
+    spec.loader.exec_module(module)
+    return module
+
+
+class JsonTargetHandler(BaseHTTPRequestHandler):  # stub HTTP target: records requests, replies with canned JSON
+    response_status = 200  # these class-level attributes are read via self.__class__ on every request
+    response_body: dict[str, Any] = {"ok": True}
+    response_headers: dict[str, str] = {"Content-Type": "application/json"}
+    requests: list[dict[str, Any]] = []  # request log, appended to by _record_request
+
+    def log_message(self, format: str, *args: object) -> None:  # silences the base class request logging
+        return None
+
+    def do_GET(self) -> None:
+        self._record_request()
+        self._send_response()
+
+    def do_POST(self) -> None:
+        self._record_request()
+        self._send_response()
+
+    def _record_request(self) -> None:
+        raw_body = self.rfile.read(int(self.headers.get("Content-Length", "0") or "0"))  # missing/empty -> 0
+        self.__class__.requests.append(
+            {
+                "method": self.command,
+                "path": self.path,
+                "headers": dict(self.headers.items()),
+                "body": raw_body.decode("utf-8") if raw_body else "",
+            }
+        )
+
+    def _send_response(self) -> None:
+        body = json.dumps(self.__class__.response_body).encode("utf-8")
+        self.send_response(self.__class__.response_status)
+        for name, value in self.__class__.response_headers.items():
+            self.send_header(name, value)
+        self.send_header("Content-Length", str(len(body)))  # always sent, after the configured headers
+        self.end_headers()
+        self.wfile.write(body)
+
+
+class SseTargetHandler(BaseHTTPRequestHandler):  # stub target answering every POST with one fixed SSE event
+    requests: list[dict[str, Any]] = []  # log of received POSTs (headers and decoded body only)
+
+    def log_message(self, format: str, *args: object) -> None:  # silences the base class request logging
+        return None
+
+    def do_POST(self) -> None:
+        raw_body = self.rfile.read(int(self.headers.get("Content-Length", "0") or "0"))
+        self.__class__.requests.append(
+            {
+                "headers": dict(self.headers.items()),
+                "body": raw_body.decode("utf-8"),
+            }
+        )
+        body = (  # a single "data:" line terminated by a blank line
+            b'data: {"jsonrpc":"2.0","result":{"id":"task-1","contextId":"ctx-1",'
+            b'"status":{"state":"TASK_STATE_WORKING"}}}\n\n'
+        )
+        self.send_response(200)
+        self.send_header("Content-Type", "text/event-stream")
+        self.send_header("Content-Length", str(len(body)))
+        self.end_headers()
+        self.wfile.write(body)
+
+
+@contextmanager
+def serve_handler(handler_cls: type[BaseHTTPRequestHandler]):  # yields the base URL of a background server
+    server = ThreadingHTTPServer(("127.0.0.1", 0), handler_cls)  # port 0: the OS picks a free port
+    thread = threading.Thread(target=server.serve_forever, daemon=True)
+    thread.start()
+    try:
+        host, port = server.server_address
+        yield f"http://{host}:{port}"
+    finally:  # runs on normal exit and when the with-body raises
+        server.shutdown()
+        server.server_close()
+        thread.join(timeout=2)
+
+
+def start_console(console, *, default_cwd: str = "/workspace/demo"):  # returns a handle with .url and .close()
+    config = console.SellingConsoleConfig(
+        host="127.0.0.1",
+        port=0,
+        default_server_url="http://127.0.0.1:41299",
+        default_cwd=default_cwd,
+    )
+    server = console.create_server(config)
+    thread = threading.Thread(target=server.serve_forever, daemon=True)
+    thread.start()
+    host, port = server.server_address  # read back from the server because port=0 was requested
+
+    class RunningServer:  # small handle closing over server and thread
+        url = f"http://{host}:{port}"
+
+        def close(self) -> None:  # the caller is responsible for calling this
+            server.shutdown()
+            server.server_close()
+            thread.join(timeout=2)
+
+    return RunningServer()
+
+
+def test_create_server_disables_address_reuse_on_windows(monkeypatch) -> None:
+    """With ``sys.platform`` patched to ``win32``, the created server must not allow address reuse."""
+    console = load_module()
+    monkeypatch.setattr(console.sys, "platform", "win32")
+    windows_config = console.SellingConsoleConfig(
+        host="127.0.0.1",
+        port=0,
+        default_server_url="http://127.0.0.1:41299",
+        default_cwd="/workspace/demo",
+    )
+    httpd = console.create_server(windows_config)
+    try:
+        assert httpd.allow_reuse_address is False
+    finally:
+        httpd.server_close()
+
+
+def get_text(url: str) -> tuple[int, str, str]:  # returns (status, Content-Type, body text)
+    with urlopen(url, timeout=5) as reply:
+        return reply.status, reply.headers.get("Content-Type", ""), reply.read().decode("utf-8")
+
+
+def get_json(url: str) -> tuple[int, dict[str, Any]]:  # returns (status, parsed JSON body)
+    with urlopen(url, timeout=5) as reply:
+        return reply.status, json.loads(reply.read().decode("utf-8"))
+
+
+def get_json_error(url: str) -> tuple[int, dict[str, Any]]:
+    """GET ``url`` and return ``(status, parsed JSON)``, including for HTTP error responses."""
+    try:
+        with urlopen(url, timeout=5) as reply:
+            return reply.status, json.loads(reply.read().decode("utf-8"))
+    except HTTPError as http_error:
+        try:
+            return http_error.code, json.loads(http_error.read().decode("utf-8"))
+        finally:
+            http_error.close()
+
+
+def post_json(url: str, body: dict[str, Any]) -> tuple[int, dict[str, Any]]:
+    """POST ``body`` as JSON to ``url`` and return ``(status, parsed JSON body)``."""
+    encoded = json.dumps(body).encode("utf-8")
+    request = Request(url, data=encoded, headers={"Content-Type": "application/json"}, method="POST")
+    with urlopen(request, timeout=5) as reply:
+        status = reply.status
+        raw_reply = reply.read()
+    # Parsing happens after the response is closed; the bytes are already in memory.
+    return status, json.loads(raw_reply.decode("utf-8"))
+
+
+def post_json_error(url: str, body: dict[str, Any]) -> tuple[int, dict[str, Any]]:
+    """POST ``body`` as JSON to ``url`` and return ``(status, parsed JSON)``.
+
+    HTTP error responses are returned the same way as successful ones instead of being raised.
+    """
+    encoded = json.dumps(body).encode("utf-8")
+    request = Request(url, data=encoded, headers={"Content-Type": "application/json"}, method="POST")
+    try:
+        with urlopen(request, timeout=5) as reply:
+            return reply.status, json.loads(reply.read().decode("utf-8"))
+    except HTTPError as http_error:
+        # The HTTPError carries the error response, so its body is read from the exception itself.
+        try:
+            return http_error.code, json.loads(http_error.read().decode("utf-8"))
+        finally:
+            http_error.close()
+
+
+def post_raw(url: str, body: dict[str, Any]) -> tuple[int, str, str]:
+    """POST ``body`` as JSON to ``url`` and return ``(status, body text, content type)``."""
+    encoded = json.dumps(body).encode("utf-8")
+    request = Request(url, data=encoded, headers={"Content-Type": "application/json"}, method="POST")
+    with urlopen(request, timeout=5) as reply:
+        status = reply.status
+        text = reply.read().decode("utf-8")
+        content_type = reply.headers.get("Content-Type", "")
+    return status, text, content_type
+
+
+def post_raw_response(url: str, body: dict[str, Any]) -> tuple[int, str, str]:
+    """POST ``body`` as JSON to ``url`` and return ``(status, body text, content type)``.
+
+    HTTP error responses are returned rather than raised; a dropped connection yields status ``0``.
+    """
+    encoded = json.dumps(body).encode("utf-8")
+    request = Request(url, data=encoded, headers={"Content-Type": "application/json"}, method="POST")
+    try:
+        with urlopen(request, timeout=5) as reply:
+            return reply.status, reply.read().decode("utf-8"), reply.headers.get("Content-Type", "")
+    except HTTPError as http_error:
+        try:
+            error_text = http_error.read().decode("utf-8")
+        finally:
+            http_error.close()
+        return http_error.code, error_text, http_error.headers.get("Content-Type", "")
+    except RemoteDisconnected as dropped:
+        return 0, str(dropped), ""
+
+
+def raw_http_request(url: str, request_text: str) -> tuple[int, str]:
+    """Send ``request_text`` verbatim over TCP; return ``(status, body)``, with status 0 if unparsable."""
+    parsed = urlparse(url)
+    assert parsed.hostname is not None
+    assert parsed.port is not None
+    chunks = []
+    with socket.create_connection((parsed.hostname, parsed.port), timeout=5) as sock:
+        sock.settimeout(5)
+        sock.sendall(request_text.encode("ascii"))
+        while True:
+            try:
+                chunk = sock.recv(65536)
+            except TimeoutError:
+                break  # keep whatever arrived before the read timed out
+            if not chunk:
+                break
+            chunks.append(chunk)
+
+    response = b"".join(chunks).decode("utf-8", errors="replace")
+    status_parts = response.splitlines()[0].split() if response else []
+    has_code = len(status_parts) >= 2 and status_parts[0].startswith("HTTP/") and status_parts[1].isdecimal()
+    _, _, body = response.partition("\r\n\r\n")
+    return (int(status_parts[1]) if has_code else 0), body
+
+
+def test_pipeline_state_route_requires_context_or_task() -> None:
+    """The state route answers 400 when neither contextId nor taskId is supplied.
+
+    The error body is fetched with ``get_json_error`` so it is read while the server is still up.
+    """
+    console = load_module()
+    running = start_console(console)
+    try:
+        query = urlencode({"serverUrl": "http://127.0.0.1:41299"})
+        # get_json_error also closes the HTTPError, so no response handle outlives this block.
+        status, response_body = get_json_error(f"{running.url}/api/pipeline/state?{query}")
+    finally:
+        running.close()
+
+    assert status == 400
+    assert response_body == {"ok": False, "error": "contextId or taskId is required"}
+
+
+def test_pipeline_state_route_proxies_query_parameters() -> None:
+    """State queries reach the target's ``/iac-code/pipeline/state`` route without ``serverUrl``."""
+    console = load_module()
+    JsonTargetHandler.requests = []
+    JsonTargetHandler.response_body = {"snapshot": {"status": "working"}}
+
+    with serve_handler(JsonTargetHandler) as target:
+        running = start_console(console)
+        try:
+            params = {"serverUrl": target, "contextId": "ctx-1", "taskId": "task-1", "afterSequence": "7"}
+            status, body = get_json(f"{running.url}/api/pipeline/state?{urlencode(params)}")
+        finally:
+            running.close()
+
+    assert status == 200
+    assert body == {"snapshot": {"status": "working"}}
+    proxied_path = JsonTargetHandler.requests[0]["path"]
+    assert proxied_path == "/iac-code/pipeline/state?contextId=ctx-1&taskId=task-1&afterSequence=7"
+
+
+def test_task_get_route_sends_get_task_jsonrpc() -> None:
+    """``/api/task/get`` becomes a ``GetTask`` JSON-RPC call with ``historyLength`` sent as a number."""
+    console = load_module()
+    JsonTargetHandler.requests = []
+    JsonTargetHandler.response_body = {"jsonrpc": "2.0", "result": {"id": "task-1"}}
+    with serve_handler(JsonTargetHandler) as target:
+        running = start_console(console)
+        try:
+            params = {"serverUrl": target, "taskId": "task-1", "historyLength": "2"}
+            status, body = get_json(f"{running.url}/api/task/get?{urlencode(params)}")
+        finally:
+            running.close()
+
+    assert status == 200
+    assert body == {"jsonrpc": "2.0", "result": {"id": "task-1"}}
+    sent = json.loads(JsonTargetHandler.requests[0]["body"])
+    assert sent["method"] == "GetTask"
+    assert sent["params"] == {"id": "task-1", "historyLength": 2}
+
+
+def test_task_cancel_route_sends_cancel_task_jsonrpc() -> None:
+    """``/api/task/cancel`` becomes a ``CancelTask`` JSON-RPC call carrying only the task id."""
+    console = load_module()
+    JsonTargetHandler.requests = []
+    JsonTargetHandler.response_body = {"jsonrpc": "2.0", "result": {"id": "task-1"}}
+    with serve_handler(JsonTargetHandler) as target:
+        running = start_console(console)
+        try:
+            status, body = post_json(f"{running.url}/api/task/cancel", {"serverUrl": target, "taskId": "task-1"})
+        finally:
+            running.close()
+
+    assert status == 200
+    assert body == {"jsonrpc": "2.0", "result": {"id": "task-1"}}
+    sent = json.loads(JsonTargetHandler.requests[0]["body"])
+    assert sent["method"] == "CancelTask"
+    assert sent["params"] == {"id": "task-1"}
+
+
+def test_message_stream_route_forwards_sse_and_cwd_metadata() -> None:
+    """The stream route relays the target's SSE body and sends ``cwd`` as ``iac_code`` metadata."""
+    console = load_module()
+    SseTargetHandler.requests = []
+
+    with serve_handler(SseTargetHandler) as target:
+        running = start_console(console)
+        stream_request = {"serverUrl": target, "cwd": "/workspace/demo", "prompt": "部署一个静态网站"}
+        try:
+            status, text, content_type = post_raw(f"{running.url}/api/message/stream", stream_request)
+        finally:
+            running.close()
+
+    assert status == 200
+    assert "event-stream" in content_type
+    assert "TASK_STATE_WORKING" in text
+    # Inspect what the console actually sent upstream.
+    sent = json.loads(SseTargetHandler.requests[0]["body"])
+    assert sent["method"] == "SendStreamingMessage"
+    assert sent["params"]["message"]["metadata"] == {"iac_code": {"cwd": "/workspace/demo"}}
+
+
+def test_message_stream_route_surfaces_recoverable_task_id_from_jsonrpc_error() -> None:
+    """A JSON (non-SSE) JSON-RPC error from the target still reaches the client as an SSE data event."""
+    console = load_module()
+    JsonTargetHandler.response_status = 200
+    JsonTargetHandler.response_body = RECOVERABLE_JSONRPC_ERROR
+    JsonTargetHandler.response_headers = {"Content-Type": "application/json"}
+    JsonTargetHandler.requests = []
+
+    with serve_handler(JsonTargetHandler) as target:
+        running = start_console(console)
+        stream_request = {"serverUrl": target, "cwd": "/workspace/demo", "prompt": "部署一个静态网站"}
+        try:
+            status, text, content_type = post_raw(f"{running.url}/api/message/stream", stream_request)
+        finally:
+            running.close()
+
+    # The error message and the owning task id must both be visible in the streamed text.
+    assert status == 200
+    assert "event-stream" in content_type
+    assert "data: " in text
+    assert "Pipeline already running." in text
+    assert "task-owner" in text
+
+
+def test_selling_console_web_extracts_delivery_task_aliases() -> None:
+    """The frontend script must mention both delivery alias keys as quoted strings."""
+    app_js = (load_module().WEB_ROOT / "app.js").read_text(encoding="utf-8")
+
+    for alias_key in ('"deliveryTaskId"', '"deliveryContextId"'):
+        assert alias_key in app_js
+
+
+def test_message_stream_route_keeps_read_errors_in_sse_body(monkeypatch: pytest.MonkeyPatch) -> None:
+    """A read timeout after the first event is reported inside the SSE body, not as new HTTP headers."""
+    console = load_module()
+    stream_request = {
+        "serverUrl": "http://127.0.0.1:41299",
+        "cwd": "/workspace/demo",
+        "prompt": "部署一个静态网站",
+    }
+
+    # Upstream stand-in: yields one event, then raises TimeoutError on the next read.
+    class TimedOutSseStream:
+        status = 200
+
+        def __init__(self) -> None:
+            self._emitted = False
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, exc_type, exc_value, traceback) -> None:
+            return None
+
+        def __iter__(self):
+            return self
+
+        def __next__(self) -> bytes:
+            if not self._emitted:
+                self._emitted = True
+                return b'data: {"ok": true, "event": "first"}\n\n'
+            raise TimeoutError("upstream timed out")
+
+    def open_sse_stream(server_url: str, payload: dict[str, Any]) -> TimedOutSseStream:
+        assert server_url == "http://127.0.0.1:41299"
+        assert payload["method"] == "SendStreamingMessage"
+        return TimedOutSseStream()
+
+    monkeypatch.setattr(console.a2a_debugger, "_open_sse_stream", open_sse_stream)
+
+    running = start_console(console)
+    try:
+        status, text, content_type = post_raw(f"{running.url}/api/message/stream", stream_request)
+    finally:
+        running.close()
+
+    assert status == 200
+    assert "event-stream" in content_type
+    assert 'data: {"ok": true, "event": "first"}' in text
+    assert '"ok": false' in text
+    assert "upstream timed out" in text
+    assert "HTTP/" not in text
+    assert "Content-Type:" not in text
+
+
+def test_message_stream_route_reports_upstream_reset_before_headers(monkeypatch: pytest.MonkeyPatch) -> None:
+    """A reset raised while opening the upstream stream is answered with a 502 SSE error."""
+    console = load_module()
+    stream_request = {
+        "serverUrl": "http://127.0.0.1:41299",
+        "cwd": "/workspace/demo",
+        "prompt": "部署一个静态网站",
+    }
+
+    # Fail before any upstream response object exists.
+    def open_sse_stream(server_url: str, payload: dict[str, Any]):
+        assert server_url == "http://127.0.0.1:41299"
+        assert payload["method"] == "SendStreamingMessage"
+        raise ConnectionResetError("upstream reset before headers")
+
+    monkeypatch.setattr(console.a2a_debugger, "_open_sse_stream", open_sse_stream)
+
+    running = start_console(console)
+    try:
+        status, text, content_type = post_raw_response(f"{running.url}/api/message/stream", stream_request)
+    finally:
+        running.close()
+
+    assert status == 502
+    assert "event-stream" in content_type
+    assert '"ok": false' in text
+    assert "upstream reset before headers" in text
+
+
+def test_message_stream_route_keeps_upstream_reset_during_stream_in_sse_body(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """A connection reset after the first event is reported inside the SSE body, not as new HTTP headers."""
+    console = load_module()
+    stream_request = {
+        "serverUrl": "http://127.0.0.1:41299",
+        "cwd": "/workspace/demo",
+        "prompt": "部署一个静态网站",
+    }
+
+    # Upstream stand-in: yields one event, then raises ConnectionResetError on the next read.
+    class ResettingSseStream:
+        status = 200
+
+        def __init__(self) -> None:
+            self._emitted = False
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, exc_type, exc_value, traceback) -> None:
+            return None
+
+        def __iter__(self):
+            return self
+
+        def __next__(self) -> bytes:
+            if not self._emitted:
+                self._emitted = True
+                return b'data: {"ok": true, "event": "first"}\n\n'
+            raise ConnectionResetError("upstream reset during stream")
+
+    def open_sse_stream(server_url: str, payload: dict[str, Any]) -> ResettingSseStream:
+        assert server_url == "http://127.0.0.1:41299"
+        assert payload["method"] == "SendStreamingMessage"
+        return ResettingSseStream()
+
+    monkeypatch.setattr(console.a2a_debugger, "_open_sse_stream", open_sse_stream)
+
+    running = start_console(console)
+    try:
+        status, text, content_type = post_raw(f"{running.url}/api/message/stream", stream_request)
+    finally:
+        running.close()
+
+    assert status == 200
+    assert "event-stream" in content_type
+    assert 'data: {"ok": true, "event": "first"}' in text
+    assert '"ok": false' in text
+    assert "upstream reset during stream" in text
+    assert "HTTP/" not in text
+    assert "Content-Type:" not in text
+
+
+def test_message_stream_route_does_not_rewrite_headers_after_client_write_error(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """If writing the first event to the client fails, ``_send_sse_error`` must not be called."""
+    console = load_module()
+    send_sse_error_calls: list[tuple[int, str]] = []
+    write_attempts: list[bytes] = []
+    stream_request = {
+        "serverUrl": "http://127.0.0.1:41299",
+        "cwd": "/workspace/demo",
+        "prompt": "部署一个静态网站",
+    }
+
+    class OneLineSseStream:
+        status = 200
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, exc_type, exc_value, traceback) -> None:
+            return None
+
+        def __iter__(self):
+            yield b'data: {"ok": true, "event": "first"}\n\n'
+
+    class BodyWriteFailingWriter:
+        def __init__(self, wrapped) -> None:
+            self._wrapped = wrapped
+
+        def write(self, data: bytes) -> int:
+            write_attempts.append(data)
+            raise OSError("disk full-ish write failure")
+
+        def __getattr__(self, name: str):
+            return getattr(self._wrapped, name)
+
+    def open_sse_stream(server_url: str, payload: dict[str, Any]) -> OneLineSseStream:
+        assert server_url == "http://127.0.0.1:41299"
+        assert payload["method"] == "SendStreamingMessage"
+        return OneLineSseStream()
+
+    real_end_headers = console.BaseHTTPRequestHandler.end_headers
+
+    # Swap in the failing writer only after the real headers have been emitted.
+    def end_headers(handler) -> None:
+        real_end_headers(handler)
+        if handler.path == "/api/message/stream":
+            handler.wfile = BodyWriteFailingWriter(handler.wfile)
+
+    def send_sse_error(handler, status: int, message: str) -> None:
+        send_sse_error_calls.append((status, message))
+
+    monkeypatch.setattr(console.a2a_debugger, "_open_sse_stream", open_sse_stream)
+    monkeypatch.setattr(console.BaseHTTPRequestHandler, "end_headers", end_headers)
+    monkeypatch.setattr(console.a2a_debugger, "_send_sse_error", send_sse_error)
+
+    running = start_console(console)
+    try:
+        status, _text, content_type = post_raw(f"{running.url}/api/message/stream", stream_request)
+    finally:
+        running.close()
+
+    assert status == 200
+    assert "event-stream" in content_type
+    assert write_attempts == [b'data: {"ok": true, "event": "first"}\n\n']
+    assert send_sse_error_calls == []
+
+
+def test_message_stream_route_does_not_rewrite_headers_when_sse_error_event_write_fails(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """If the second body write fails, neither ``_send_json`` nor ``_send_sse_error`` may be called."""
+    console = load_module()
+    send_json_calls: list[tuple[int, Any]] = []
+    send_sse_error_calls: list[tuple[int, str]] = []
+    write_attempts: list[bytes] = []
+    stream_request = {
+        "serverUrl": "http://127.0.0.1:41299",
+        "cwd": "/workspace/demo",
+        "prompt": "部署一个静态网站",
+    }
+
+    class TimedOutSseStream:
+        status = 200
+
+        def __init__(self) -> None:
+            self._emitted = False
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, exc_type, exc_value, traceback) -> None:
+            return None
+
+        def __iter__(self):
+            return self
+
+        def __next__(self) -> bytes:
+            if not self._emitted:
+                self._emitted = True
+                return b'data: {"ok": true, "event": "first"}\n\n'
+            raise TimeoutError("upstream timed out")
+
+    class ErrorEventWriteFailingWriter:
+        def __init__(self, wrapped) -> None:
+            self._wrapped = wrapped
+
+        def write(self, data: bytes) -> int:
+            write_attempts.append(data)
+            # Let the first body write through and fail the second one.
+            if len(write_attempts) == 2:
+                raise OSError("cannot write error event")
+            return self._wrapped.write(data)
+
+        def __getattr__(self, name: str):
+            return getattr(self._wrapped, name)
+
+    def open_sse_stream(server_url: str, payload: dict[str, Any]) -> TimedOutSseStream:
+        assert server_url == "http://127.0.0.1:41299"
+        assert payload["method"] == "SendStreamingMessage"
+        return TimedOutSseStream()
+
+    real_end_headers = console.BaseHTTPRequestHandler.end_headers
+
+    def end_headers(handler) -> None:
+        real_end_headers(handler)
+        if handler.path == "/api/message/stream":
+            handler.wfile = ErrorEventWriteFailingWriter(handler.wfile)
+
+    def send_json(handler, status: int, value: Any) -> None:
+        send_json_calls.append((status, value))
+
+    def send_sse_error(handler, status: int, message: str) -> None:
+        send_sse_error_calls.append((status, message))
+
+    monkeypatch.setattr(console.a2a_debugger, "_open_sse_stream", open_sse_stream)
+    monkeypatch.setattr(console.BaseHTTPRequestHandler, "end_headers", end_headers)
+    monkeypatch.setattr(console.a2a_debugger, "_send_json", send_json)
+    monkeypatch.setattr(console.a2a_debugger, "_send_sse_error", send_sse_error)
+
+    running = start_console(console)
+    try:
+        status, text, content_type = post_raw(f"{running.url}/api/message/stream", stream_request)
+    finally:
+        running.close()
+
+    assert status == 200
+    assert "event-stream" in content_type
+    assert text == 'data: {"ok": true, "event": "first"}\n\n'
+    assert [attempt.startswith(b"data: ") for attempt in write_attempts] == [True, True]
+    assert send_json_calls == []
+    assert send_sse_error_calls == []
+
+
+def test_implemented_post_route_rejects_malformed_json() -> None:
+    """A known POST route answers 400 when the request body is not valid JSON.
+
+    The request is written by hand over a raw socket; its declared one-byte body is a lone ``{``.
+    """
+    console = load_module()
+    running = start_console(console)
+    try:
+        target = urlparse(running.url)
+        request_lines = [
+            "POST /api/task/cancel HTTP/1.1",
+            f"Host: {target.hostname}:{target.port}",
+            "Content-Type: application/json",
+            "Content-Length: 1",
+            "Connection: close",
+            "",
+            "{",
+        ]
+        status, body = raw_http_request(running.url, "\r\n".join(request_lines))
+    finally:
+        running.close()
+
+    assert status == 400
+    error_body = json.loads(body)
+    assert error_body["ok"] is False
+    assert error_body["error"] == "Request body must be valid JSON"
+
+
+def test_unimplemented_post_route_ignores_malformed_content_length() -> None:
+    """An unknown POST route answers 404 even when ``Content-Length`` is not a number.
+
+    The request is written by hand over a raw socket so the malformed header is sent unchanged.
+    """
+    console = load_module()
+    running = start_console(console)
+    try:
+        target = urlparse(running.url)
+        request_lines = [
+            "POST /api/not-found HTTP/1.1",
+            f"Host: {target.hostname}:{target.port}",
+            "Content-Type: application/json",
+            "Content-Length: nope",
+            "Connection: close",
+            "",
+            "",
+        ]
+        status, body = raw_http_request(running.url, "\r\n".join(request_lines))
+    finally:
+        running.close()
+
+    assert status == 404
+    assert json.loads(body)["error"] == "Not found"
+
+
+def test_parse_args_defaults_to_loopback_and_current_directory(monkeypatch, tmp_path: Path) -> None:
+    """With no CLI arguments, the parser yields loopback defaults and the working directory as cwd."""
+    console = load_module()
+    monkeypatch.chdir(tmp_path)
+
+    parsed = console.parse_args([])
+    assert parsed.host == "127.0.0.1"
+    assert parsed.port == 41980
+    assert parsed.default_server_url == "http://127.0.0.1:41299"
+    assert parsed.default_cwd == str(tmp_path)
+
+
+def test_script_help_exits_successfully() -> None:
+    """Running the script with ``--help`` exits 0 and prints the console description."""
+    completed = subprocess.run(
+        [sys.executable, str(SCRIPT_PATH), "--help"],
+        check=False,
+        capture_output=True,
+        text=True,
+    )
+    assert completed.returncode == 0
+    assert "Run a local A2A selling pipeline console." in completed.stdout
+
+
+def test_index_route_serves_selling_console_html(tmp_path: Path) -> None:
+    """The index route returns HTML containing the page text and the configured defaults."""
+    running = start_console(load_module(), default_cwd=str(tmp_path))
+    try:
+        status, content_type, page = get_text(running.url)
+    finally:
+        running.close()
+
+    assert status == 200
+    assert "text/html" in content_type
+    assert "阿里云" in page
+    assert "您的购买方案" in page
+    assert "window.SELLING_CONSOLE_DEFAULTS" in page
+    assert "http://127.0.0.1:41299" in page
+    assert str(tmp_path) in page
+
+
+def test_index_html_escapes_defaults_json_for_script_context() -> None:
+    """A ``</script>`` sequence in the defaults must be escaped inside the inline script block."""
+    console = load_module()
+    hostile_config = console.SellingConsoleConfig(
+        host="127.0.0.1",
+        port=41980,
+        default_server_url="http://127.0.0.1:41299",
+        default_cwd="</script><script>alert(1)</script>",
+    )
+    html = console.render_index_html(hostile_config)
+
+    defaults_start = html.index("window.SELLING_CONSOLE_DEFAULTS = ")
+    script_end = html.index("</script>", defaults_start)
+    defaults_assignment = html[defaults_start:script_end]
+
+    assert "</script><script>" not in defaults_assignment
+    assert "<\\/script><script>alert(1)<\\/script>" in defaults_assignment
+
+
+def test_index_html_escapes_visible_default_input_values() -> None:
+    """Defaults are HTML-escaped in the input ``value`` attributes yet round-trip through the JSON."""
+    console = load_module()
+    default_server_url = "http://example.test/<api>?x='single'&y=\"q\""
+    default_cwd = "/tmp/<demo> & 'single' \"quoted\""
+
+    config = console.SellingConsoleConfig(
+        host="127.0.0.1",
+        port=41980,
+        default_server_url=default_server_url,
+        default_cwd=default_cwd,
+    )
+    html = console.render_index_html(config)
+
+    def input_tag(marker: str) -> str:
+        tag_start = html.rindex("<input", 0, html.index(marker))
+        return html[tag_start : html.index(">", tag_start)]
+
+    server_tag = input_tag('id="server-url"')
+    cwd_tag = input_tag('id="cwd"')
+
+    assert 'value="http://example.test/&lt;api&gt;?x=&#x27;single&#x27;&amp;y=&quot;q&quot;"' in server_tag
+    assert "<api>" not in server_tag
+    assert "x='single'" not in server_tag
+    assert 'y="q"' not in server_tag
+    assert 'value="/tmp/&lt;demo&gt; &amp; &#x27;single&#x27; &quot;quoted&quot;"' in cwd_tag
+    assert "<demo>" not in cwd_tag
+    assert "& 'single'" not in cwd_tag
+    assert '"quoted"' not in cwd_tag
+
+    defaults_start = html.index("window.SELLING_CONSOLE_DEFAULTS = ") + len("window.SELLING_CONSOLE_DEFAULTS = ")
+    defaults_end = html.index(";", defaults_start)
+    assert json.loads(html[defaults_start:defaults_end]) == {
+        "serverUrl": default_server_url,
+        "cwd": default_cwd,
+    }
+
+
+def test_index_html_does_not_reprocess_template_placeholders_inside_defaults() -> None:
+    """Defaults that look like template placeholders are emitted literally, not substituted again."""
+    console = load_module()
+    default_server_url = "__DEFAULT_CWD_ATTR__"
+    default_cwd = "__DEFAULT_SERVER_URL_ATTR__"
+    config = console.SellingConsoleConfig(
+        host="127.0.0.1",
+        port=41980,
+        default_server_url=default_server_url,
+        default_cwd=default_cwd,
+    )
+    html = console.render_index_html(config)
+
+    defaults_start = html.index("window.SELLING_CONSOLE_DEFAULTS = ") + len("window.SELLING_CONSOLE_DEFAULTS = ")
+    defaults_end = html.index(";", defaults_start)
+    assert json.loads(html[defaults_start:defaults_end]) == {
+        "serverUrl": default_server_url,
+        "cwd": default_cwd,
+    }
+
+    def input_tag(marker: str) -> str:
+        tag_start = html.rindex("<input", 0, html.index(marker))
+        return html[tag_start : html.index(">", tag_start)]
+
+    server_tag = input_tag('id="server-url"')
+    cwd_tag = input_tag('id="cwd"')
+
+    assert 'value="&#95;&#95;DEFAULT&#95;CWD&#95;ATTR&#95;&#95;"' in server_tag
+    assert 'value="&#95;&#95;DEFAULT&#95;SERVER&#95;URL&#95;ATTR&#95;&#95;"' in cwd_tag
+    assert 'value="__DEFAULT_CWD_ATTR__"' in html_lib.unescape(server_tag)
+    assert 'value="__DEFAULT_SERVER_URL_ATTR__"' in html_lib.unescape(cwd_tag)
+    assert "__DEFAULTS_JSON__" not in html
+    assert "__DEFAULT_SERVER_URL_ATTR__" not in html
+    assert "__DEFAULT_CWD_ATTR__" not in html
+
+
+def test_index_html_contains_screenshot_layout_regions() -> None:
+    """The rendered page contains every expected layout marker and no pre-rendered current step card."""
+    console = load_module()
+    config = console.SellingConsoleConfig(
+        host="127.0.0.1",
+        port=41980,
+        default_server_url="http://127.0.0.1:41299",
+        default_cwd="/workspace/demo",
+    )
+    html = console.render_index_html(config)
+
+    required_markers = [
+        'class="topbar"',
+        'id="workflow-panel"',
+        'id="status-pill"',
+        'id="status-alert"',
+        'id="step-list"',
+        'aria-label="Pipeline 实时步骤"',
+        'id="composer-progress"',
+        'aria-label="Pipeline 总进度"',
+        'id="plans-grid"',
+        'id="composer-input"',
+        'id="send-button"',
+        'id="deep-think-button"',
+        'id="debug-drawer"',
+        'id="server-url"',
+        'id="cwd"',
+        'id="health-button"',
+        'id="fetch-state-button"',
+        'id="cancel-button"',
+        'aria-label="帮助"',
+        'aria-label="刷新"',
+        'aria-label="反馈"',
+        'aria-label="设置"',
+        "您的购买方案",
+        "内容由 AI 生成，方案与价格仅供参考",
+    ]
+    for marker in required_markers:
+        assert marker in html
+    assert '<article class="step-card current">' not in html
+
+
+def test_index_html_uses_cache_busted_static_assets() -> None:
+    """Static asset URLs carry a ``?v=`` query, with no fixed or unreplaced version marker left."""
+    console = load_module()
+
+    config = console.SellingConsoleConfig(
+        host="127.0.0.1",
+        port=41980,
+        default_server_url="http://127.0.0.1:41299",
+        default_cwd="/workspace/demo",
+    )
+    html = console.render_index_html(config)
+
+    assert 'href="/styles.css?v=' in html
+    assert 'src="/app.js?v=' in html
+    assert "selling-console-20260618" not in html
+    assert "__STATIC_ASSET_VERSION__" not in html
+
+
+def test_styles_define_console_layout_tokens() -> None:
+    """The stylesheet must contain each expected variable, selector and responsive rule."""
+    css = (SCRIPT_PATH.parent / "selling_console_web" / "styles.css").read_text(encoding="utf-8")
+    for required_token in (
+        "--aliyun-orange",
+        ".console-shell",
+        ".workflow-panel",
+        ".plan-card",
+        ".price",
+        ".utility-rail",
+        "@media (max-width: 980px)",
+        "overflow-x: hidden",
+        "minmax(0, 1fr)",
+        ":focus-visible",
+        ":focus-within",
+        "overflow-wrap: anywhere",
+    ):
+        assert required_token in css
+
+
+def test_frontend_javascript_is_syntax_valid() -> None:
+    """``app.js`` must pass a ``--check`` run of the command returned by ``node_command()``."""
+    app_js = SCRIPT_PATH.parent / "selling_console_web" / "app.js"
+    check_command = [*node_command(), "--check", str(app_js)]
+    completed = subprocess.run(check_command, capture_output=True, text=True, check=False)
+    assert completed.returncode == 0, completed.stderr
+
+
+def test_static_asset_route_serves_css_and_js() -> None:
+    """CSS and JS are served with fitting content types, with or without a ``?v=`` query string."""
+    console = load_module()
+    running = start_console(console)
+    try:
+        css_status, css_type, css = get_text(f"{running.url}/styles.css")
+        js_status, js_type, js = get_text(f"{running.url}/app.js")
+        versioned_css = get_text(f"{running.url}/styles.css?v=test")
+        versioned_js = get_text(f"{running.url}/app.js?v=test")
+    finally:
+        running.close()
+
+    assert css_status == 200
+    assert "text/css" in css_type
+    assert ".topbar" in css
+    assert js_status == 200
+    assert "javascript" in js_type
+    assert "SellingConsoleReducers" in js
+    # Each tuple is (status, content type, text); the query string must not change the content.
+    assert versioned_css[0] == 200 and "text/css" in versioned_css[1]
+    assert versioned_css[2] == css
+    assert versioned_js[0] == 200 and "javascript" in versioned_js[1]
+    assert versioned_js[2] == js
+
+
+def test_static_asset_route_rejects_path_traversal() -> None:
+    """A request path containing ``/../`` must be answered with a JSON 404."""
+    running = start_console(load_module())
+    try:
+        status, error_body = get_json_error(f"{running.url}/../debugger.py")
+    finally:
+        running.close()
+
+    assert status == 404
+    assert error_body["error"] == "Not found"
+
+
+def test_health_route_proxies_a2a_health_and_agent_card() -> None:
+    """``/api/health`` queries the target's ``/health`` and agent-card paths, in that order."""
+    console = load_module()
+    JsonTargetHandler.requests = []
+    JsonTargetHandler.response_body = {"status": "ok"}
+    with serve_handler(JsonTargetHandler) as target:
+        running = start_console(console)
+        try:
+            query = urlencode({"serverUrl": target})
+            status, body = get_json(f"{running.url}/api/health?{query}")
+        finally:
+            running.close()
+
+    assert status == 200
+    assert body["ok"] is True
+    assert [seen["path"] for seen in JsonTargetHandler.requests] == ["/health", "/.well-known/agent-card.json"]
diff --git a/tests/a2a/test_transport_dispatcher.py b/tests/a2a/test_transport_dispatcher.py
index 5e9ae89b..7b4dd76a 100644
--- a/tests/a2a/test_transport_dispatcher.py
+++ b/tests/a2a/test_transport_dispatcher.py
@@ -1,4 +1,5 @@
 import asyncio
+import base64
 from types import SimpleNamespace
 
 import pytest
@@ -80,6 +81,54 @@ async def test_dispatcher_stream_yields_events(monkeypatch, tmp_path) -> None:
     await components.aclose()
 
 
+@pytest.mark.asyncio
+async def test_dispatcher_rejects_pipeline_image_before_executor_runs(monkeypatch, tmp_path) -> None:
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    monkeypatch.setattr(
+        "iac_code.a2a.parts.maybe_resize_and_downsample",
+        lambda raw: SimpleNamespace(data=raw, media_type="image/png"),
+    )
+    monkeypatch.setattr("iac_code.a2a.executor.is_model_multimodal", lambda *args, **kwargs: False)
+
+    async def fail_if_called(*args, **kwargs):
+        raise AssertionError("executor should not run for invalid image input")
+
+    monkeypatch.setattr("iac_code.a2a.executor.IacCodeA2AExecutor.execute", fail_if_called)
+    components = create_runtime_components(model="text-only-model", host="127.0.0.1", port=41242)
+    dispatcher = A2AJsonRpcDispatcher(components)
+
+    response = await dispatcher.dispatch(
+        {
+            "jsonrpc": "2.0",
+            "id": "image-invalid",
+            "method": "SendStreamingMessage",
+            "params": {
+                "message": {
+                    "messageId": "msg-image-invalid",
+                    "contextId": "ctx-image-invalid",
+                    "role": "ROLE_USER",
+                    "parts": [
+                        {
+                            "data": {
+                                "filename": "initial.png",
+                                "bytes": base64.b64encode(b"fake image").decode("ascii"),
+                            },
+                            "mediaType": "image/png",
+                        }
+                    ],
+                    "metadata": {"iac_code": {"cwd": str(tmp_path)}},
+                },
+                "configuration": {"acceptedOutputModes": ["text/plain"]},
+            },
+        }
+    )
+
+    assert response["id"] == "image-invalid"
+    assert response["error"]["code"] == -32602
+    assert response["error"]["message"] == "Current model text-only-model does not support image input."
+    await components.aclose()
+
+
 @pytest.mark.asyncio
 async def test_dispatcher_routes_second_pipeline_stream_as_interrupt(monkeypatch, tmp_path) -> None:
     monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
diff --git a/tests/a2a_e2e/test_run_recovery_scenarios.py b/tests/a2a_e2e/test_run_recovery_scenarios.py
index f3d13b23..d5ec6678 100644
--- a/tests/a2a_e2e/test_run_recovery_scenarios.py
+++ b/tests/a2a_e2e/test_run_recovery_scenarios.py
@@ -1,5 +1,6 @@
 from __future__ import annotations
 
+import base64
 import importlib.util
 import json
 import sys
@@ -67,6 +68,111 @@ def test_normal_running_recovery_prompt_ignores_continue() -> None:
     assert "更早的方案选择消息" in runner.DEFAULT_NORMAL_RUNNING_RECOVERY_PROMPT
 
 
+def test_text_image_fixture_store_writes_png_and_manifest(tmp_path: Path) -> None:
+    runner = _load_runner()
+    store = runner.TextImageFixtureStore(tmp_path / "image-fixtures")
+
+    part = store.part("runtime-only", runner.DEFAULT_INITIAL_PROMPT)
+
+    assert part["filename"] == "runtime-only.png"
+    assert part["mediaType"] == "image/png"
+    assert base64.b64decode(part["bytes"]).startswith(b"\x89PNG\r\n\x1a\n")
+    assert (tmp_path / "image-fixtures" / "runtime-only.png").is_file()
+    manifest = json.loads((tmp_path / "image-fixtures" / "manifest.json").read_text(encoding="utf-8"))
+    assert manifest["runtime-only"]["text"] == runner.DEFAULT_INITIAL_PROMPT
+    assert manifest["runtime-only"]["mediaType"] == "image/png"
+    assert manifest["runtime-only"]["source"] == "generated"
+
+
+def test_static_text_image_fixtures_cover_fixed_image_prompts() -> None:
+    runner = _load_runner()
+    manifest = json.loads((runner.STATIC_TEXT_IMAGE_FIXTURE_ROOT / "manifest.json").read_text(encoding="utf-8"))
+
+    assert set(manifest) == set(runner.STATIC_TEXT_IMAGE_FIXTURES)
+    for key, text in runner.STATIC_TEXT_IMAGE_FIXTURES.items():
+        entry = manifest[key]
+        fixture_path = runner.STATIC_TEXT_IMAGE_FIXTURE_ROOT / entry["filename"]
+        assert entry["text"] == text
+        assert entry["mediaType"] == "image/png"
+        assert fixture_path.read_bytes().startswith(b"\x89PNG\r\n\x1a\n")
+
+
+def test_text_image_fixture_store_prefers_static_fixture(monkeypatch, tmp_path: Path) -> None:
+    runner = _load_runner()
+    store = runner.TextImageFixtureStore(tmp_path / "image-fixtures")
+    static_manifest = json.loads((runner.STATIC_TEXT_IMAGE_FIXTURE_ROOT / "manifest.json").read_text(encoding="utf-8"))
+
+    def fail_render(_text: str) -> bytes:
+        raise AssertionError("static fixtures should avoid runtime image rendering")
+
+    monkeypatch.setattr(runner, "_render_text_png", fail_render)
+
+    part = store.part("initial", runner.STATIC_TEXT_IMAGE_FIXTURES["initial"])
+
+    static_path = runner.STATIC_TEXT_IMAGE_FIXTURE_ROOT / static_manifest["initial"]["filename"]
+    assert part["filename"] == static_path.name
+    assert part["mediaType"] == "image/png"
+    assert base64.b64decode(part["bytes"]) == static_path.read_bytes()
+    manifest = json.loads((tmp_path / "image-fixtures" / "manifest.json").read_text(encoding="utf-8"))
+    assert manifest["initial"]["source"] == "static"
+    assert manifest["initial"]["path"] == str(static_path)
+
+
+def test_scenario_harness_stream_passes_image_parts(monkeypatch, tmp_path: Path) -> None:
+    runner = _load_runner()
+    captured: dict[str, object] = {}
+
+    args = SimpleNamespace(
+        server_cwd=str(tmp_path),
+        cwd="",
+        port=0,
+        host="127.0.0.1",
+        no_auto_approve_permissions=False,
+        provider="",
+        model="",
+        api_base="",
+        deterministic=False,
+        fault_at="",
+        stream_timeout=1,
+        run_dir=str(tmp_path / "run"),
+        run_root=str(tmp_path / "runs"),
+        python=sys.executable,
+        leave_server_running=False,
+    )
+    harness = runner.ScenarioHarness(args, scenario="image-initial")
+    image = {"filename": "initial.png", "mediaType": "image/png", "bytes": "iVBORw0KGgo="}
+
+    def fake_stream_message(**kwargs):
+        captured.update(kwargs)
+        return runner.StreamSummary(
+            name=kwargs["name"],
+            prompt=kwargs["prompt"],
+            request_task_id=kwargs["task_id"],
+            task_id="task-1",
+            context_id="ctx-1",
+        )
+
+    monkeypatch.setattr(runner, "stream_message", fake_stream_message)
+
+    harness.stream(prompt=runner.IMAGE_TEXT_PROMPT, name="01-image", context_id="", task_id="", images=[image])
+
+    assert captured["images"] == [image]
+
+
+def test_image_recovery_scenarios_are_registered() -> None:
+    runner = _load_runner()
+
+    for scenario in [
+        "image-initial",
+        "image-ask-waiting",
+        "image-selection-waiting",
+        "image-normal-handoff",
+        "image-interrupt",
+    ]:
+        assert scenario in runner._SCENARIOS
+        assert scenario in runner._REAL_CLOUD_SCENARIOS
+
+
 def test_answer_intervening_ask_inputs_reaches_selection(tmp_path: Path) -> None:
     runner = _load_runner()
     initial = runner.StreamSummary(
@@ -245,6 +351,1019 @@ def test_fault_after_snapshot_allows_explicit_real_cloud_opt_in() -> None:
     runner._validate_scenario_execution(args, "fault-after-snapshot")
 
 
+def test_rollback_step5_cleanup_scenarios_are_registered_and_require_real_cloud() -> None:
+    runner = _load_runner()
+
+    assert runner._SCENARIOS["rollback-step5-cleanup"] is runner.run_rollback_step5_cleanup
+    assert runner._SCENARIOS["rollback-step5-cleanup-recovery"] is runner.run_rollback_step5_cleanup_recovery
+
+    for scenario in ("rollback-step5-cleanup", "rollback-step5-cleanup-recovery"):
+        args = SimpleNamespace(allow_real_cloud=False, deterministic=False)
+        try:
+            runner._validate_scenario_execution(args, scenario)
+        except SystemExit as exc:
+            assert "--allow-real-cloud" in str(exc)
+        else:
+            raise AssertionError(f"{scenario} should require --allow-real-cloud")
+
+
+def test_stack_cleanup_snapshot_helpers_distinguish_deleted_and_retained_stacks() -> None:
+    runner = _load_runner()
+    snapshot = {
+        "snapshot": {
+            "cleanup": {
+                "resources": [
+                    {
+                        "provider": "ros",
+                        "resourceType": "stack",
+                        "resourceId": "stack-1",
+                        "regionId": "cn-hangzhou",
+                        "cleanupStatus": "completed",
+                        "stackStatus": "DELETE_COMPLETE",
+                    }
+                ]
+            },
+            "stacks": {
+                "current": {"stackId": "stack-2", "regionId": "cn-hangzhou", "current": True},
+                "byId": {
+                    "stack-1": {"stackId": "stack-1", "current": False, "cleared": True},
+                    "stack-2": {"stackId": "stack-2", "current": True},
+                    "stack-3": {"stackId": "stack-3", "isSuccess": False, "stackStatus": "CREATE_FAILED"},
+                },
+            },
+        }
+    }
+
+    cleanup_resource = runner._cleanup_resource_for_stack(snapshot, "stack-1")
+    assert cleanup_resource["cleanupStatus"] == "completed"
+    assert runner._cleanup_resource_completed(cleanup_resource) is True
+    assert runner._cleanup_resource_completed({"cleanupStatus": "completed"}) is False
+    assert runner._snapshot_current_stack_id(snapshot, exclude={"stack-1"}) == "stack-2"
+    assert runner._snapshot_current_stack_id(snapshot, exclude={"stack-2"}) is None
+    assert runner._ros_stack_deleted({"status": "DELETE_COMPLETE"}) is True
+    assert runner._ros_stack_deleted({"not_found": True}) is True
+    assert runner._ros_stack_retained({"status": "CREATE_COMPLETE"}) is True
+    assert runner._ros_stack_retained({"status": "DELETE_COMPLETE"}) is False
+    assert runner._ros_stack_retained({"status": "DELETE_ROLLBACK_COMPLETE"}) is False
+
+
+def _stack_current_changed_event(
+    *,
+    action: str,
+    stack_id: str,
+    status: str,
+    is_success: bool,
+    cleared: bool = False,
+) -> dict:
+    return {
+        "result": {
+            "statusUpdate": {
+                "metadata": {
+                    "iac_code": {
+                        "pipeline": {
+                            "eventType": "stack_current_changed",
+                            "data": {
+                                "provider": "ros",
+                                "action": action,
+                                "stackId": stack_id,
+                                "stackStatus": status,
+                                "isSuccess": is_success,
+                                "cleared": cleared,
+                            },
+                        }
+                    }
+                }
+            }
+        }
+    }
+
+
+def test_wait_for_created_stack_uses_successful_stack_event() -> None:
+    runner = _load_runner()
+    summary = runner.StreamSummary(name="02-create-first-stack", prompt="deploy")
+    events = [
+        _stack_current_changed_event(
+            action="CreateStack",
+            stack_id="failed-stack",
+            status="CREATE_FAILED",
+            is_success=False,
+        ),
+        _stack_current_changed_event(
+            action="DeleteStack",
+            stack_id="failed-stack",
+            status="DELETE_COMPLETE",
+            is_success=True,
+            cleared=True,
+        ),
+        _stack_current_changed_event(
+            action="CreateStack",
+            stack_id="created-stack",
+            status="CREATE_COMPLETE",
+            is_success=True,
+        ),
+    ]
+
+    class FakeStream:
+        name = "02-create-first-stack"
+
+        def wait_for(self, predicate, *, description: str, timeout: float):
+            for event in events:
+                if predicate(event, summary):
+                    return runner.EventMatch(description=description, event=event, summary=summary)
+            raise TimeoutError(description)
+
+    assert runner._wait_for_created_stack(FakeStream(), exclude=set(), timeout=1) == "created-stack"
+
+
+def test_created_stack_id_from_stream_uses_only_that_stream_successes() -> None:
+    runner = _load_runner()
+
+    stream = SimpleNamespace(
+        events=[
+            _stack_current_changed_event(
+                action="CreateStack",
+                stack_id="failed-stack",
+                status="CREATE_FAILED",
+                is_success=False,
+            ),
+            _stack_current_changed_event(
+                action="CreateStack",
+                stack_id="rollback-stack",
+                status="CREATE_COMPLETE",
+                is_success=True,
+            ),
+            _stack_current_changed_event(
+                action="CreateStack",
+                stack_id="second-stack",
+                status="CREATE_COMPLETE",
+                is_success=True,
+            ),
+        ]
+    )
+
+    assert runner._created_stack_id_from_stream(stream, exclude={"rollback-stack"}) == "second-stack"
+
+
+def test_post_rollback_timeout_allows_step_regeneration_time() -> None:
+    runner = _load_runner()
+
+    args = SimpleNamespace(event_timeout=300, stream_timeout=2400)
+
+    assert runner._post_rollback_timeout(args) == 900
+
+
+def test_wait_any_ignores_finished_stream_when_another_stream_matches() -> None:
+    runner = _load_runner()
+    match = runner.EventMatch(
+        description="target",
+        event={"ok": True},
+        summary=runner.StreamSummary(name="active", prompt=""),
+    )
+
+    class FinishedStream:
+        name = "finished"
+
+        def wait_for(self, *_args, **_kwargs):
+            raise RuntimeError("finished ended before target")
+
+    class ActiveStream:
+        name = "active"
+
+        def wait_for(self, *_args, **_kwargs):
+            return match
+
+    assert (
+        runner._wait_any([FinishedStream(), ActiveStream()], lambda *_args: True, description="target", timeout=1)
+        is match
+    )
+
+
+def test_cleanup_ledger_items_use_a2a_context_session_id(monkeypatch, tmp_path: Path) -> None:
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", str(tmp_path / "config"))
+    runner = _load_runner()
+
+    cwd = str((tmp_path / "workspace").resolve())
+    Path(cwd).mkdir()
+    run_dir = tmp_path / "run"
+    contexts_dir = run_dir / "a2a-persistence" / "contexts"
+    contexts_dir.mkdir(parents=True)
+    (contexts_dir / "ctx-1.json").write_text(
+        json.dumps({"context_id": "ctx-1", "session_id": "session-1", "cwd": cwd}),
+        encoding="utf-8",
+    )
+
+    from iac_code.services.session_storage import SessionStorage
+
+    ledger_dir = SessionStorage().session_dir(cwd, "session-1") / "pipeline"
+    ledger_dir.mkdir(parents=True)
+    (ledger_dir / "cleanup.yaml").write_text(
+        "\n".join(
+            [
+                "schema_version: 1",
+                "observed_resources:",
+                "- provider: ros",
+                "  resource_type: stack",
+                "  resource_id: stack-1",
+                "  observed_action: CreateStack",
+                "cleanup_resources: []",
+                "history: []",
+            ]
+        ),
+        encoding="utf-8",
+    )
+
+    harness = SimpleNamespace(context_id="ctx-1", cwd=cwd, run_dir=run_dir)
+
+    items = runner._cleanup_ledger_items(harness, "observed_resources")
+
+    assert [item["resource_id"] for item in items] == ["stack-1"]
+
+
+def test_cleanup_activity_snapshot_helper_ignores_empty_default_cleanup() -> None:
+    runner = _load_runner()
+
+    assert (
+        runner._snapshot_has_cleanup_activity(
+            {"snapshot": {"cleanup": {"status": "none", "resourceCount": 0, "resources": [], "history": []}}}
+        )
+        is False
+    )
+    assert runner._snapshot_has_cleanup_activity({"snapshot": {"cleanup": {"resourceCount": "1"}}}) is True
+    assert runner._snapshot_has_cleanup_activity({"snapshot": {"cleanup": {"status": "pending"}}}) is True
+    assert (
+        runner._snapshot_has_cleanup_activity({"snapshot": {"cleanup": {"resources": [{"resourceId": "stack-1"}]}}})
+        is True
+    )
+    assert runner._snapshot_has_cleanup_activity({"snapshot": {"cleanup": {"history": [{"eventType": "x"}]}}}) is True
+
+
+def test_cleanup_activity_event_helper_detects_cleanup_events_and_handoff_data(tmp_path: Path) -> None:
+    runner = _load_runner()
+    normal_path = tmp_path / "normal.events.jsonl"
+    cleanup_path = tmp_path / "cleanup.events.jsonl"
+    handoff_path = tmp_path / "handoff.events.jsonl"
+    normal_path.write_text(
+        json.dumps(
+            _stack_current_changed_event(
+                action="CreateStack",
+                stack_id="stack-1",
+                status="CREATE_COMPLETE",
+                is_success=True,
+            )
+        ),
+        encoding="utf-8",
+    )
+    cleanup_path.write_text(
+        json.dumps(
+            {
+                "result": {
+                    "statusUpdate": {
+                        "metadata": {
+                            "iac_code": {
+                                "pipeline": {
+                                    "eventType": "cleanup_started",
+                                    "scope": "cleanup",
+                                    "data": {"resourceId": "stack-1"},
+                                }
+                            }
+                        }
+                    }
+                }
+            }
+        ),
+        encoding="utf-8",
+    )
+    handoff_path.write_text(
+        json.dumps(
+            {
+                "result": {
+                    "statusUpdate": {
+                        "metadata": {
+                            "iac_code": {
+                                "pipeline": {
+                                    "eventType": "pipeline_handoff_ready",
+                                    "data": {"cleanup": {"resourceCount": 1}},
+                                }
+                            }
+                        }
+                    }
+                }
+            }
+        ),
+        encoding="utf-8",
+    )
+
+    assert runner._events_file_has_cleanup_activity(normal_path) is False
+    assert runner._events_file_has_cleanup_activity(cleanup_path) is True
+    assert runner._events_file_has_cleanup_activity(handoff_path) is True
+    assert runner._run_dir_has_cleanup_events(tmp_path) is True
+
+
+def test_session_file_has_cleanup_prompt_uses_metadata_type(tmp_path: Path) -> None:
+    runner = _load_runner()
+    session_path = tmp_path / "session.jsonl"
+    session_path.write_text(
+        "\n".join(
+            [
+                json.dumps({"role": "user", "content": "visible"}),
+                json.dumps(
+                    {
+                        "role": "user",
+                        "content": "hidden cleanup prompt",
+                        "metadata": {"type": "pipeline_cleanup_prompt"},
+                    }
+                ),
+            ]
+        ),
+        encoding="utf-8",
+    )
+
+    assert runner._session_file_has_cleanup_prompt(session_path) is True
+
+
+def test_cleanup_ledger_required_resources_helper_ignores_observed_only() -> None:
+    runner = _load_runner()
+    harness = SimpleNamespace()
+
+    assert runner._cleanup_ledger_has_required_resources(harness) is False
+
+    original = runner._cleanup_ledger_items
+    try:
+        runner._cleanup_ledger_items = lambda _h, key: (
+            [{"resource_id": "stack-1", "cleanup_required": False}]
+            if key == "cleanup_resources"
+            else [{"resource_id": "stack-observed"}]
+        )
+        assert runner._cleanup_ledger_has_required_resources(harness) is False
+        runner._cleanup_ledger_items = lambda _h, key: (
+            [{"resource_id": "stack-2", "cleanup_required": True}] if key == "cleanup_resources" else []
+        )
+        assert runner._cleanup_ledger_has_required_resources(harness) is True
+    finally:
+        runner._cleanup_ledger_items = original
+
+
+def test_cleanup_deployment_prompts_use_distinct_run_scoped_stack_names(tmp_path: Path) -> None:
+    runner = _load_runner()
+    harness = SimpleNamespace(run_dir=tmp_path / "20260617T010203Z-12345-abcdef12")
+
+    first = runner._cleanup_deployment_prompt("你随便选一个方案。", harness, "first")
+    second = runner._cleanup_deployment_prompt("你随便选一个方案。", harness, "second")
+
+    assert "唯一成功条件是新建一个 ROS stack" in first
+    assert "任何已有 stack" in first
+    assert "不能作为部署成功依据" in first
+    assert "StackName" in first
+    assert "必须覆盖为 `iac-e2e-abcdef12-first`" in first
+    assert "不要调用 complete_step" in first
+    assert "等待用户下一条指令" in first
+    assert "iac-e2e-abcdef12-first" in first
+    assert "iac-e2e-abcdef12-second" in second
+    assert "complete_step 前必须" in second
+    assert first != second
+
+
+def test_rollback_step5_cleanup_flow_cleans_first_stack_and_keeps_second(monkeypatch, tmp_path: Path) -> None:
+    runner = _load_runner()
+    fake_harnesses = []
+
+    class FakeStream:
+        def __init__(self, summary: object, events: list[dict] | None = None) -> None:
+            self.summary = summary
+            self.name = summary.name
+            self.events = events or []
+
+        def wait_for(self, *_args, **_kwargs):
+            return None
+
+        def join(self, timeout: float):
+            return self.summary
+
+    class FakeHarness:
+        def __init__(self) -> None:
+            self.args = SimpleNamespace(stream_timeout=1, event_timeout=1)
+            self.run_dir = tmp_path
+            self.server_env = {}
+            self.cwd = str(tmp_path)
+            self.context_id = "ctx-1"
+            self.pipeline_task_id = "task-1"
+            self.checks: dict[str, bool] = {}
+            self.notes: list[str] = []
+            self.summaries = {}
+            self.snapshots = {}
+            self.stream_calls: list[dict] = []
+            self.started_streams: list[str] = []
+
+        def stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            self.stream_calls.append({"prompt": prompt, "name": name, "task_id": task_id})
+            is_initial = name == "01-initial"
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,
+                status_states=["TASK_STATE_INPUT_REQUIRED"] if is_initial else ["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["input_required"] if is_initial else ["pipeline_completed"],
+                last_input_required_step_id="confirm_and_select" if is_initial else "",
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            return summary
+
+        def start_stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            self.started_streams.append(name)
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,
+                status_states=["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["pipeline_completed"],
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            events = []
+            if name == "04-select-second-stack":
+                events.append(
+                    _stack_current_changed_event(
+                        action="CreateStack",
+                        stack_id="stack-2",
+                        status="CREATE_COMPLETE",
+                        is_success=True,
+                    )
+                )
+            return FakeStream(summary, events=events)
+
+        def fetch_state(self, name: str):
+            snapshot = {
+                "snapshot": {
+                    "status": "completed",
+                    "cleanup": {
+                        "status": "completed",
+                        "resources": [
+                            {
+                                "provider": "ros",
+                                "resourceType": "stack",
+                                "resourceId": "stack-1",
+                                "regionId": "cn-hangzhou",
+                                "cleanupStatus": "completed",
+                                "stackStatus": "DELETE_COMPLETE",
+                            }
+                        ],
+                    },
+                    "stacks": {
+                        "current": {"stackId": "stack-2", "regionId": "cn-hangzhou", "current": True},
+                        "byId": {"stack-2": {"stackId": "stack-2", "current": True}},
+                    },
+                }
+            }
+            self.snapshots[name] = snapshot
+            return snapshot
+
+        def kill9_and_restart(self) -> None:
+            self.notes.append("restarted")
+
+    def fake_run_with_harness(_args, _scenario, callback):
+        harness = FakeHarness()
+        fake_harnesses.append(harness)
+        callback(harness)
+        return 0 if all(harness.checks.values()) else 1
+
+    cleanup_ledger_items = [
+        {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": "stack-1",
+            "region_id": "cn-hangzhou",
+            "cleanup_required": True,
+        }
+    ]
+
+    monkeypatch.setattr(runner, "_run_with_harness", fake_run_with_harness)
+    monkeypatch.setattr(runner, "_answer_intervening_ask_inputs", lambda _h, summary, **_kwargs: summary)
+    monkeypatch.setattr(runner, "_wait_for_created_stack", lambda *_args, **_kwargs: "stack-1")
+    monkeypatch.setattr(runner, "_wait_any", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_finish_pipeline_after_possible_input", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(
+        runner,
+        "_cleanup_ledger_items",
+        lambda _h, key: cleanup_ledger_items if key == "cleanup_resources" else [],
+    )
+    monkeypatch.setattr(
+        runner,
+        "_capture_ros_stack_states",
+        lambda _h, stack_ids, name: {
+            "stack-1": {"status": "DELETE_COMPLETE"},
+            "stack-2": {"status": "CREATE_COMPLETE"},
+        },
+    )
+
+    args = SimpleNamespace(
+        event_timeout=1,
+        initial_prompt=runner.DEFAULT_INITIAL_PROMPT,
+        selection_prompt=runner.DEFAULT_SELECTION_PROMPT,
+        normal_followup_prompt=runner.DEFAULT_NORMAL_FOLLOWUP_PROMPT,
+    )
+
+    assert runner.run_rollback_step5_cleanup(args, "rollback-step5-cleanup") == 0
+    harness = fake_harnesses[0]
+    assert harness.stream_calls[-1]["task_id"] == ""
+    assert harness.checks["first rollback stack cleanup completed in snapshot"] is True
+    assert harness.checks["rollback cleanup stacks completed in snapshot"] is True
+    assert harness.checks["ROS first rollback stack deleted"] is True
+    assert harness.checks["ROS rollback cleanup stacks deleted"] is True
+    assert harness.checks["ROS second stack retained"] is True
+
+
+def test_rollback_step5_cleanup_recovery_uses_tool_safe_recovery_prompt(monkeypatch, tmp_path: Path) -> None:
+    runner = _load_runner()
+    fake_harnesses = []
+
+    class FakeStream:
+        def __init__(self, summary: object, events: list[dict] | None = None) -> None:
+            self.summary = summary
+            self.name = summary.name
+            self.events = events or []
+
+        def wait_for(self, *_args, **_kwargs):
+            return None
+
+        def join(self, timeout: float):
+            return self.summary
+
+    class FakeHarness:
+        def __init__(self) -> None:
+            self.args = SimpleNamespace(stream_timeout=1, event_timeout=1)
+            self.run_dir = tmp_path
+            self.server_env = {}
+            self.cwd = str(tmp_path)
+            self.context_id = "ctx-1"
+            self.pipeline_task_id = "task-1"
+            self.checks: dict[str, bool] = {}
+            self.notes: list[str] = []
+            self.summaries = {}
+            self.snapshots = {}
+            self.stream_calls: list[dict] = []
+
+        def stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            self.stream_calls.append({"prompt": prompt, "name": name, "task_id": task_id})
+            is_initial = name == "01-initial"
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,
+                status_states=["TASK_STATE_INPUT_REQUIRED"] if is_initial else ["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["input_required"] if is_initial else ["pipeline_completed"],
+                last_input_required_step_id="confirm_and_select" if is_initial else "",
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            return summary
+
+        def start_stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,
+                status_states=["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["pipeline_completed"],
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            events = []
+            if name == "04-select-second-stack":
+                events.append(
+                    _stack_current_changed_event(
+                        action="CreateStack",
+                        stack_id="stack-2",
+                        status="CREATE_COMPLETE",
+                        is_success=True,
+                    )
+                )
+            return FakeStream(summary, events=events)
+
+        def fetch_state(self, name: str):
+            snapshot = {
+                "snapshot": {
+                    "status": "completed",
+                    "cleanup": {
+                        "status": "completed",
+                        "resources": [
+                            {
+                                "provider": "ros",
+                                "resourceType": "stack",
+                                "resourceId": "stack-1",
+                                "regionId": "cn-hangzhou",
+                                "cleanupStatus": "completed",
+                                "stackStatus": "DELETE_COMPLETE",
+                            }
+                        ],
+                    },
+                    "stacks": {
+                        "current": {"stackId": "stack-2", "regionId": "cn-hangzhou", "current": True},
+                        "byId": {"stack-2": {"stackId": "stack-2", "current": True}},
+                    },
+                }
+            }
+            self.snapshots[name] = snapshot
+            return snapshot
+
+        def kill9_and_restart(self) -> None:
+            self.notes.append("restarted")
+
+    def fake_run_with_harness(_args, _scenario, callback):
+        harness = FakeHarness()
+        fake_harnesses.append(harness)
+        callback(harness)
+        return 0 if all(harness.checks.values()) else 1
+
+    cleanup_ledger_items = [
+        {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": "stack-1",
+            "region_id": "cn-hangzhou",
+            "cleanup_required": True,
+        }
+    ]
+
+    monkeypatch.setattr(runner, "_run_with_harness", fake_run_with_harness)
+    monkeypatch.setattr(runner, "_answer_intervening_ask_inputs", lambda _h, summary, **_kwargs: summary)
+    monkeypatch.setattr(runner, "_wait_for_created_stack", lambda *_args, **_kwargs: "stack-1")
+    monkeypatch.setattr(runner, "_wait_any", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_finish_pipeline_after_possible_input", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_wait_for_cleanup_started", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_join_after_kill", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(
+        runner,
+        "_events_file_has_cleanup_event",
+        lambda *_args, **_kwargs: True,
+    )
+    monkeypatch.setattr(
+        runner,
+        "_cleanup_ledger_items",
+        lambda _h, key: cleanup_ledger_items if key == "cleanup_resources" else [],
+    )
+    monkeypatch.setattr(
+        runner,
+        "_capture_ros_stack_states",
+        lambda _h, stack_ids, name: {
+            "stack-1": {"status": "DELETE_COMPLETE"},
+            "stack-2": {"status": "CREATE_COMPLETE"},
+        },
+    )
+
+    args = SimpleNamespace(
+        event_timeout=1,
+        initial_prompt=runner.DEFAULT_INITIAL_PROMPT,
+        selection_prompt=runner.DEFAULT_SELECTION_PROMPT,
+        normal_followup_prompt=runner.DEFAULT_NORMAL_FOLLOWUP_PROMPT,
+    )
+
+    assert runner.run_rollback_step5_cleanup_recovery(args, "rollback-step5-cleanup-recovery") == 0
+    recovery_prompt = next(
+        call["prompt"] for call in fake_harnesses[0].stream_calls if call["name"] == "06-cleanup-after-restart"
+    )
+    assert recovery_prompt != runner.CONTINUE_PROMPT
+    assert "不要调用任何工具" in recovery_prompt
+    assert "不要查询" in recovery_prompt
+    assert "不要删除" in recovery_prompt
+
+
+def test_rollback_step5_cleanup_flow_fails_when_any_cleanup_stack_is_left(monkeypatch, tmp_path: Path) -> None:
+    runner = _load_runner()  # object under test; its helpers are monkeypatched below
+
+    class FakeStream:  # stand-in for the object returned by FakeHarness.start_stream
+        def __init__(self, summary: object, events: list[dict] | None = None) -> None:
+            self.summary = summary
+            self.name = summary.name
+            self.events = events or []
+
+        def wait_for(self, *_args, **_kwargs):  # accepts anything and returns at once
+            return None
+
+        def join(self, timeout: float):  # timeout is unused; the canned summary is returned
+            return self.summary
+
+    class FakeHarness:  # in-memory stand-in handed to the scenario callback
+        def __init__(self) -> None:
+            self.args = SimpleNamespace(stream_timeout=1, event_timeout=1)
+            self.run_dir = tmp_path
+            self.server_env = {}
+            self.cwd = str(tmp_path)
+            self.context_id = "ctx-1"
+            self.pipeline_task_id = "task-1"
+            self.checks: dict[str, bool] = {}  # starts empty; the fake itself never writes to it
+            self.notes: list[str] = []
+            self.summaries = {}
+            self.snapshots = {}
+
+        def stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            is_initial = name == "01-initial"  # only this stream reports input-required
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,  # "" -> normal-task id
+                status_states=["TASK_STATE_INPUT_REQUIRED"] if is_initial else ["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["input_required"] if is_initial else ["pipeline_completed"],
+                last_input_required_step_id="confirm_and_select" if is_initial else "",
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            return summary
+
+        def start_stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,
+                status_states=["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["pipeline_completed"],
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            events = []
+            if name == "04-select-second-stack":  # only this stream carries a stack event
+                events.append(
+                    _stack_current_changed_event(
+                        action="CreateStack",
+                        stack_id="stack-2",
+                        status="CREATE_COMPLETE",
+                        is_success=True,
+                    )
+                )
+            return FakeStream(summary, events=events)
+
+        def fetch_state(self, name: str):  # same snapshot for every name
+            snapshot = {
+                "snapshot": {
+                    "status": "completed",
+                    "cleanup": {
+                        "status": "pending",  # cleanup is reported as unfinished
+                        "resources": [
+                            {
+                                "provider": "ros",
+                                "resourceType": "stack",
+                                "resourceId": "stack-1",
+                                "regionId": "cn-hangzhou",
+                                "cleanupStatus": "completed",
+                                "stackStatus": "DELETE_COMPLETE",
+                            },
+                            {  # second resource: cleanup still pending
+                                "provider": "ros",
+                                "resourceType": "stack",
+                                "resourceId": "stack-left",
+                                "regionId": "cn-hangzhou",
+                                "cleanupStatus": "pending",
+                                "stackStatus": "CREATE_COMPLETE",
+                            },
+                        ],
+                    },
+                    "stacks": {
+                        "current": {"stackId": "stack-2", "regionId": "cn-hangzhou", "current": True},
+                        "byId": {"stack-2": {"stackId": "stack-2", "current": True}},
+                    },
+                }
+            }
+            self.snapshots[name] = snapshot
+            return snapshot
+
+        def kill9_and_restart(self) -> None:
+            raise AssertionError("non-recovery scenario should not restart")
+
+    def fake_run_with_harness(_args, _scenario, callback):  # replaces runner._run_with_harness
+        harness = FakeHarness()
+        callback(harness)
+        return 0 if all(harness.checks.values()) else 1  # exit code 0 only when every check is truthy
+
+    cleanup_ledger_items = [
+        {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": "stack-1",
+            "region_id": "cn-hangzhou",
+            "cleanup_required": True,
+        },
+        {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": "stack-left",
+            "region_id": "cn-hangzhou",
+            "cleanup_required": True,
+        },
+    ]
+
+    monkeypatch.setattr(runner, "_run_with_harness", fake_run_with_harness)
+    monkeypatch.setattr(runner, "_answer_intervening_ask_inputs", lambda _h, summary, **_kwargs: summary)
+    monkeypatch.setattr(runner, "_wait_for_created_stack", lambda *_args, **_kwargs: "stack-1")
+    monkeypatch.setattr(runner, "_wait_any", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_finish_pipeline_after_possible_input", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(
+        runner,
+        "_cleanup_ledger_items",
+        lambda _h, key: cleanup_ledger_items if key == "cleanup_resources" else [],  # other keys: empty
+    )
+    monkeypatch.setattr(
+        runner,
+        "_capture_ros_stack_states",
+        lambda _h, stack_ids, name: {  # arguments are ignored; the mapping is fixed
+            "stack-1": {"status": "DELETE_COMPLETE"},
+            "stack-left": {"status": "CREATE_COMPLETE"},  # not DELETE_COMPLETE
+            "stack-2": {"status": "CREATE_COMPLETE"},
+        },
+    )
+
+    args = SimpleNamespace(
+        event_timeout=1,
+        initial_prompt=runner.DEFAULT_INITIAL_PROMPT,
+        selection_prompt=runner.DEFAULT_SELECTION_PROMPT,
+        normal_followup_prompt=runner.DEFAULT_NORMAL_FOLLOWUP_PROMPT,
+    )
+
+    assert runner.run_rollback_step5_cleanup(args, "rollback-step5-cleanup") == 1  # must report failure
+
+
+def test_rollback_step5_cleanup_recovery_kills_and_retriggers_cleanup(monkeypatch, tmp_path: Path) -> None:
+    runner = _load_runner()  # object under test; its helpers are monkeypatched below
+    fake_harnesses = []  # filled by fake_run_with_harness and inspected after the run
+
+    class FakeStream:  # stand-in for the object returned by FakeHarness.start_stream
+        def __init__(self, summary: object, events: list[dict] | None = None) -> None:
+            self.summary = summary
+            self.name = summary.name
+            self.events = events or []
+
+        def wait_for(self, *_args, **_kwargs):  # accepts anything and returns at once
+            return None
+
+        def join(self, timeout: float):  # timeout is unused; the canned summary is returned
+            return self.summary
+
+    class FakeHarness:  # in-memory stand-in handed to the scenario callback
+        def __init__(self) -> None:
+            self.args = SimpleNamespace(stream_timeout=1, event_timeout=1)
+            self.run_dir = tmp_path
+            self.server_env = {}
+            self.cwd = str(tmp_path)
+            self.context_id = "ctx-1"
+            self.pipeline_task_id = "task-1"
+            self.checks: dict[str, bool] = {}  # starts empty; the fake itself never writes to it
+            self.notes: list[str] = []
+            self.summaries = {}
+            self.snapshots = {}
+            self.stream_calls: list[dict] = []  # one entry per stream() call
+            self.started_streams: list[dict] = []  # one entry per start_stream() call
+            self.kill_count = 0  # incremented by kill9_and_restart()
+
+        def stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            self.stream_calls.append({"prompt": prompt, "name": name, "task_id": task_id})
+            is_initial = name == "01-initial"  # only this stream reports input-required
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,  # "" -> normal-task id
+                status_states=["TASK_STATE_INPUT_REQUIRED"] if is_initial else ["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["input_required"] if is_initial else ["pipeline_completed"],
+                last_input_required_step_id="confirm_and_select" if is_initial else "",
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            return summary
+
+        def start_stream(self, *, prompt: str, name: str, task_id: str | None = None, **_kwargs):
+            self.started_streams.append({"prompt": prompt, "name": name, "task_id": task_id})
+            summary = runner.StreamSummary(
+                name=name,
+                prompt=prompt,
+                request_task_id=self.pipeline_task_id if task_id is None else task_id,
+                context_id=self.context_id,
+                task_id="normal-task" if task_id == "" else self.pipeline_task_id,
+                status_states=["TASK_STATE_COMPLETED"],
+                pipeline_event_types=["pipeline_completed"],
+                normal_handoff_ready=True,
+                text="done",
+            )
+            self.summaries[name] = summary
+            events = []
+            if name == "04-select-second-stack":  # only this stream carries a stack event
+                events.append(
+                    _stack_current_changed_event(
+                        action="CreateStack",
+                        stack_id="stack-2",
+                        status="CREATE_COMPLETE",
+                        is_success=True,
+                    )
+                )
+            return FakeStream(summary, events=events)
+
+        def fetch_state(self, name: str):  # same snapshot for every name
+            snapshot = {
+                "snapshot": {
+                    "status": "completed",
+                    "cleanup": {
+                        "status": "completed",  # cleanup is reported as finished
+                        "resources": [
+                            {
+                                "provider": "ros",
+                                "resourceType": "stack",
+                                "resourceId": "stack-1",
+                                "regionId": "cn-hangzhou",
+                                "cleanupStatus": "completed",
+                                "stackStatus": "DELETE_COMPLETE",
+                            }
+                        ],
+                    },
+                    "stacks": {
+                        "current": {"stackId": "stack-2", "regionId": "cn-hangzhou", "current": True},
+                        "byId": {"stack-2": {"stackId": "stack-2", "current": True}},
+                    },
+                }
+            }
+            self.snapshots[name] = snapshot
+            return snapshot
+
+        def kill9_and_restart(self) -> None:
+            self.kill_count += 1  # the restart is only counted; nothing is killed
+
+    def fake_run_with_harness(_args, _scenario, callback):  # replaces runner._run_with_harness
+        harness = FakeHarness()
+        fake_harnesses.append(harness)
+        callback(harness)
+        return 0 if all(harness.checks.values()) else 1  # exit code 0 only when every check is truthy
+
+    cleanup_ledger_items = [
+        {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": "stack-1",
+            "region_id": "cn-hangzhou",
+            "cleanup_required": True,
+        }
+    ]
+
+    monkeypatch.setattr(runner, "_run_with_harness", fake_run_with_harness)
+    monkeypatch.setattr(runner, "_answer_intervening_ask_inputs", lambda _h, summary, **_kwargs: summary)
+    monkeypatch.setattr(runner, "_wait_for_created_stack", lambda *_args, **_kwargs: "stack-1")
+    monkeypatch.setattr(runner, "_wait_any", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_finish_pipeline_after_possible_input", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_wait_for_cleanup_started", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(runner, "_events_file_has_cleanup_event", lambda *_args, **_kwargs: True)
+    monkeypatch.setattr(
+        runner,
+        "_cleanup_ledger_items",
+        lambda _h, key: cleanup_ledger_items if key == "cleanup_resources" else [],  # other keys: empty
+    )
+    monkeypatch.setattr(
+        runner,
+        "_capture_ros_stack_states",
+        lambda _h, stack_ids, name: {  # arguments are ignored; the mapping is fixed
+            "stack-1": {"status": "DELETE_COMPLETE"},
+            "stack-2": {"status": "CREATE_COMPLETE"},
+        },
+    )
+
+    args = SimpleNamespace(
+        event_timeout=1,
+        initial_prompt=runner.DEFAULT_INITIAL_PROMPT,
+        selection_prompt=runner.DEFAULT_SELECTION_PROMPT,
+        normal_followup_prompt=runner.DEFAULT_NORMAL_FOLLOWUP_PROMPT,
+    )
+
+    assert runner.run_rollback_step5_cleanup_recovery(args, "rollback-step5-cleanup-recovery") == 0
+    harness = fake_harnesses[0]
+    assert harness.kill_count == 1  # exactly one restart
+    assert harness.started_streams[-1] == {  # last start_stream() call
+        "prompt": runner.DEFAULT_NORMAL_FOLLOWUP_PROMPT,
+        "name": "05-cleanup-running",
+        "task_id": "",
+    }
+    assert harness.stream_calls[-1] == {  # last stream() call
+        "prompt": runner.CLEANUP_RECOVERY_PROMPT,
+        "name": "06-cleanup-after-restart",
+        "task_id": "",
+    }
+    assert harness.checks["cleanup retriggered after restart"] is True  # key is written by the scenario, not the fake
+
+
 def test_rollback_accepts_security_group_deployment_from_handoff(monkeypatch) -> None:
     runner = _load_runner()
     handoff_summary = (
diff --git a/tests/agent/test_agent_loop_continue.py b/tests/agent/test_agent_loop_continue.py
index cf3a9eb5..cfb5e8dd 100644
--- a/tests/agent/test_agent_loop_continue.py
+++ b/tests/agent/test_agent_loop_continue.py
@@ -29,8 +29,8 @@ def __init__(self):
     def append(self, cwd, session_id, message, *, git_branch=None):
         self.appended.append((cwd, session_id, message, git_branch))
 
-    def save(self, cwd, session_id, messages, *, git_branch=None):
-        self.saved.append((cwd, session_id, messages, git_branch))
+    def save(self, cwd, session_id, messages, *, git_branch=None, preserve_cleanup_prompts=False):
+        self.saved.append((cwd, session_id, messages, git_branch, preserve_cleanup_prompts))  # flag recorded too
 
 
 @pytest.mark.asyncio
@@ -54,3 +54,24 @@ async def test_continue_streaming_uses_existing_context_without_appending_user_m
     assert provider.calls[0]["messages"][0].content == "already persisted prompt"
     appended_roles = [message.role for _cwd, _sid, message, _branch in storage.appended]
     assert appended_roles == ["assistant"]
+
+
+def test_stamp_last_turn_elapsed_preserves_cleanup_prompts():
+    storage = RecordingStorage()  # records each save() call as a tuple in .saved
+    loop = AgentLoop(
+        provider_manager=FakeProviderManager(),
+        system_prompt="system",
+        tool_registry=ToolRegistry(),
+        session_storage=storage,
+        session_id="session-cleanup",
+        resume_messages=[Message(role="user", content="later"), Message(role="assistant", content="done")],
+        cwd="/repo",
+    )
+
+    loop.stamp_last_turn_elapsed(1.5)
+
+    assert len(storage.saved) == 1  # stamping must persist exactly once
+    _cwd, _session_id, messages, _branch, preserve_cleanup_prompts = storage.saved[0]
+    assert [message.content for message in messages] == ["later", "done"]
+    assert messages[-1].elapsed_seconds == 1.5  # elapsed time lands on the last message
+    assert preserve_cleanup_prompts is True  # flag must be passed to save()
diff --git a/tests/agent/test_agent_loop_new.py b/tests/agent/test_agent_loop_new.py
index 1b683ec3..a476471f 100644
--- a/tests/agent/test_agent_loop_new.py
+++ b/tests/agent/test_agent_loop_new.py
@@ -2112,6 +2112,7 @@ async def test_auto_compact_persists_compacted_session(self, mock_provider, mock
             "auto-compact-session",
             compacted_messages,
             git_branch="main",
+            preserve_cleanup_prompts=True,
         )
 
     async def test_auto_compact_records_response_usage(self, mock_provider, mock_registry, tmp_path):
@@ -2216,6 +2217,7 @@ async def test_compact_persists_compacted_session(self, mock_provider, mock_regi
             "manual-compact-session",
             compacted_messages,
             git_branch="dev",
+            preserve_cleanup_prompts=True,
         )
 
     async def test_compact_records_response_usage(self, mock_provider, mock_registry, tmp_path):
diff --git a/tests/agent/test_permission_scenarios.py b/tests/agent/test_permission_scenarios.py
index c430eb73..1388a798 100644
--- a/tests/agent/test_permission_scenarios.py
+++ b/tests/agent/test_permission_scenarios.py
@@ -70,6 +70,21 @@ def _bash_turn(tool_use_id: str, command: str, *, text: str = "") -> list:
     return events
 
 
+def _read_file_turn(tool_use_id: str, path: str, *, text: str = "") -> list:
+    """Build a fake LLM turn that calls read_file with the given path."""
+    events = [MessageStartEvent(message_id=f"msg-{tool_use_id}")]  # message id is derived from the tool-use id
+    if text:  # optional text delta is emitted before the tool call
+        events.append(TextDeltaEvent(text=text))
+    events.extend(
+        [
+            ToolUseStartEvent(tool_use_id=tool_use_id, name="read_file"),
+            ToolUseEndEvent(tool_use_id=tool_use_id, name="read_file", input={"path": path}),
+            MessageEndEvent(stop_reason="tool_use", usage=Usage()),  # turn ends with stop_reason "tool_use"
+        ]
+    )
+    return events
+
+
 def _text_turn(text: str) -> list:
     """Build a fake LLM turn that just responds with text (no tool calls)."""
     return [
@@ -126,6 +141,69 @@ async def test_readonly_command_auto_allowed(self):
         results = _tool_results(events)
         assert any(not r.is_error for r in results)
 
+    @pytest.mark.asyncio
+    async def test_loop_trusted_read_roots_apply_to_read_file_permissions(self, tmp_path):
+        """Agent loop skill read roots should be available to permission checks and tool execution."""
+        project = tmp_path / "project"
+        skill_root = tmp_path / "skill"  # sibling of the project dir, so outside cwd
+        project.mkdir()
+        skill_root.mkdir()
+        reference = skill_root / "template-parameters.md"
+        reference.write_text("Skill reference content", encoding="utf-8")
+
+        provider = FakeProvider([_read_file_turn("t1", str(reference)), _text_turn("done")])  # absolute path
+        registry = ToolRegistry()
+        registry.register_default_tools()
+        loop = AgentLoop(
+            provider_manager=provider,
+            system_prompt="test",
+            tool_registry=registry,
+            cwd=str(project),
+            max_turns=2,
+            permission_context=ToolPermissionContext(cwd=str(project)),
+            tool_context_trusted_read_directories=[str(skill_root)],  # the setting under test
+        )
+
+        events = await _collect_events(loop, "read skill reference")
+
+        assert not _has_permission_request(events)  # the read must not prompt
+        results = _tool_results(events)
+        assert any("Skill reference content" in result.result for result in results)  # file was actually read
+
+    @pytest.mark.asyncio
+    async def test_session_trusted_read_roots_do_not_change_relative_read_lookup(self, tmp_path):
+        """Non-pipeline trusted read roots should not make read_file resolve relative paths from them."""
+        project = tmp_path / "project"
+        session_root = tmp_path / "session-artifacts"
+        project.mkdir()
+        reference = session_root / "references" / "template-parameters.md"  # exists only under session_root
+        reference.parent.mkdir(parents=True)
+        reference.write_text("Session reference content", encoding="utf-8")
+
+        provider = FakeProvider([_read_file_turn("t1", "references/template-parameters.md"), _text_turn("done")])
+        registry = ToolRegistry()
+        registry.register_default_tools()
+        loop = AgentLoop(
+            provider_manager=provider,
+            system_prompt="test",
+            tool_registry=registry,
+            cwd=str(project),
+            max_turns=2,
+            permission_context=ToolPermissionContext(
+                cwd=str(project),
+                trusted_read_directories=[str(session_root)],  # trusted, but must not become a lookup base
+            ),
+        )
+
+        events = await _collect_events(loop, "read session reference")
+
+        assert not _has_permission_request(events)
+        results = _tool_results(events)
+        assert any(result.is_error for result in results)  # the relative read is expected to fail
+        expected_error = f"File not found: {project / 'references' / 'template-parameters.md'}"
+        assert any(expected_error in result.result for result in results)  # path was resolved under project
+        assert not any("Session reference content" in result.result for result in results)
+
     @pytest.mark.asyncio
     async def test_curl_requires_permission(self):
         """curl should prompt for permission."""
diff --git a/tests/commands/test_prompt.py b/tests/commands/test_prompt.py
index 6df5e0da..661cca3a 100644
--- a/tests/commands/test_prompt.py
+++ b/tests/commands/test_prompt.py
@@ -6,6 +6,8 @@
 from iac_code.agent.message import Message as AgentMessage
 from iac_code.commands import create_default_registry
 from iac_code.commands import prompt as prompt_module
+from iac_code.pipeline.config import RunMode
+from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
 from iac_code.providers.base import ContentBlock, Message, ToolDefinition
 
 
@@ -112,6 +114,121 @@ def test_prompt_snapshot_prefers_last_provider_request_with_recalled_memory():
     assert "hidden conversation" in html
 
 
+def test_prompt_snapshot_includes_hidden_cleanup_prompt_from_session():
+    cleanup = create_cleanup_prompt_message(
+        "检测到 pipeline rollback 后仍需要清理的云资源。\n待清理资源：stack-123",
+        cleanup_status="pending",
+    )
+    repl = SimpleNamespace(  # minimal REPL double exposing only these attributes
+        _agent_loop=_FakeAgentLoopWithLastRequest(),
+        _session_storage=SimpleNamespace(load=lambda cwd, session_id: [cleanup]),
+        _original_cwd="/repo",
+        _session_id="session-123",
+        get_status_snapshot=lambda: {"session_id": "session-123", "cwd": "/repo"},
+    )
+
+    snapshot = prompt_module.build_prompt_snapshot(repl)
+    html = prompt_module.render_prompt_html(snapshot)
+
+    assert "待清理资源：stack-123" in html  # cleanup text is rendered
+    assert "cleanup prompt" in html
+    assert 'data-tab-target="cleanup"' in html  # cleanup tab markup is present
+    assert 'data-tab-panel="cleanup"' in html
+    assert "Cleanup Prompts" in html
+
+
+def test_prompt_snapshot_inserts_removed_cleanup_prompt_between_session_anchors():
+    class _AnchoredLastRequestLoop(_FakeAgentLoop):  # its last request contains no cleanup prompt
+        def get_last_provider_request_snapshot(self):
+            return {
+                "system_prompt": "# Sent System\nactual sent system",
+                "provider_messages": [
+                    Message.user("before cleanup"),
+                    Message(role="assistant", content="after cleanup"),
+                ],
+                "tools": [],
+            }
+
+    cleanup = create_cleanup_prompt_message(
+        "检测到 pipeline rollback 后仍需要清理的云资源。\n待清理资源：stack-anchored",
+        cleanup_status="completed",
+    )
+    repl = SimpleNamespace(
+        _agent_loop=_AnchoredLastRequestLoop(),
+        _session_storage=SimpleNamespace(
+            load=lambda cwd, session_id: [  # session has the cleanup prompt between the same two messages
+                AgentMessage(role="user", content="before cleanup"),
+                cleanup,
+                AgentMessage(role="assistant", content="after cleanup"),
+            ]
+        ),
+        _original_cwd="/repo",
+        _session_id="session-123",
+        get_status_snapshot=lambda: {"session_id": "session-123", "cwd": "/repo"},
+    )
+
+    snapshot = prompt_module.build_prompt_snapshot(repl)
+    messages = snapshot["provider_messages"]
+
+    assert [message["content"] for message in messages] == [  # cleanup text sits between the two anchors
+        "before cleanup",
+        "检测到 pipeline rollback 后仍需要清理的云资源。\n待清理资源：stack-anchored",
+        "after cleanup",
+    ]
+    assert messages[1]["badge"] == "cleanup prompt · removed"  # inserted entry carries the removed badge
+    assert snapshot["cleanup_prompts"][0]["content"].endswith("stack-anchored")
+
+
+def test_prompt_snapshot_keeps_unanchored_removed_cleanup_prompt_out_of_provider_messages():
+    class _UnanchoredLastRequestLoop(_FakeAgentLoop):  # its last request holds a single assistant message
+        def get_last_provider_request_snapshot(self):
+            return {
+                "system_prompt": "# Sent System\nactual sent system",
+                "provider_messages": [Message(role="assistant", content="after cleanup")],
+                "tools": [],
+            }
+
+    cleanup = create_cleanup_prompt_message(
+        "检测到 pipeline rollback 后仍需要清理的云资源。\n待清理资源：stack-unanchored",
+        cleanup_status="completed",
+    )
+    repl = SimpleNamespace(
+        _agent_loop=_UnanchoredLastRequestLoop(),
+        _session_storage=SimpleNamespace(
+            load=lambda cwd, session_id: [  # cleanup prompt is first, so nothing precedes it
+                cleanup,
+                AgentMessage(role="assistant", content="after cleanup"),
+            ]
+        ),
+        _original_cwd="/repo",
+        _session_id="session-123",
+        get_status_snapshot=lambda: {"session_id": "session-123", "cwd": "/repo"},
+    )
+
+    snapshot = prompt_module.build_prompt_snapshot(repl)
+    html = prompt_module.render_prompt_html(snapshot)
+
+    assert [message["content"] for message in snapshot["provider_messages"]] == ["after cleanup"]  # nothing inserted
+    assert snapshot["cleanup_prompts"][0]["content"].endswith("stack-unanchored")  # still listed separately
+    assert "待清理资源：stack-unanchored" in html
+    assert 'data-tab-target="cleanup"' in html
+
+
+def test_prompt_html_hides_cleanup_tab_when_no_cleanup_prompt():
+    html = prompt_module.render_prompt_html(
+        {  # snapshot literal deliberately has no "cleanup_prompts" key
+            "metadata": {"session_id": "abc"},
+            "system_prompt": "# System\nPrompt",
+            "system_sections": [{"title": "System", "content": "# System\nPrompt", "zone": "static"}],
+            "provider_messages": [{"role": "user", "content": "hello"}],
+            "tools": [],
+        }
+    )
+
+    assert 'data-tab-target="cleanup"' not in html  # no cleanup tab markup
+    assert 'data-tab-panel="cleanup"' not in html  # no cleanup panel markup
+
+
 @pytest.mark.asyncio
 async def test_prompt_command_exports_html_and_opens(tmp_path, monkeypatch):
     opened: list[object] = []
@@ -214,6 +331,52 @@ async def test_prompt_command_exports_pipeline_prompt_context(tmp_path):
     assert "original prompt" in html
 
 
+@pytest.mark.asyncio
+async def test_prompt_command_uses_normal_snapshot_with_cleanup_prompt_after_pipeline_handoff(tmp_path):
+    ensure = AsyncMock(return_value=False)  # NOTE(review): presumably means "no pipeline restored" — confirm
+    cleanup = create_cleanup_prompt_message(
+        "检测到 pipeline rollback 后仍需要清理的云资源。\n待清理资源：stack-cleanup",
+        cleanup_status="completed",
+    )
+    prompt_context = SimpleNamespace(  # pipeline context whose texts must not reach the HTML
+        scope="parent",
+        step_id="deploying",
+        system_prompt="stale pipeline prompt",
+        messages=[AgentMessage(role="user", content="stale pipeline message")],
+        agent_loop_session_id="transcript_deploying",
+        initial_prompt="",
+        candidate_index=None,
+        candidate_name="",
+        sub_pipeline_id="",
+    )
+    session_dir = tmp_path / "root-session"
+    repl = SimpleNamespace(
+        ensure_pipeline_restored_for_prompt=ensure,
+        _get_runtime_mode=lambda: RunMode.NORMAL,  # normal mode even though a pipeline object is attached
+        _pipeline=SimpleNamespace(get_prompt_contexts=lambda: [prompt_context]),
+        _agent_loop=_FakeAgentLoopWithLastRequest(),
+        _session_storage=SimpleNamespace(
+            load=lambda cwd, session_id: [cleanup],
+            session_dir=lambda cwd, session_id: session_dir,
+        ),
+        _original_cwd="/repo",
+        _session_id="root-session",
+        get_status_snapshot=lambda: {"session_id": "root-session", "cwd": "/repo"},
+    )
+    opened_urls: list[str] = []
+
+    await prompt_module.prompt_command(
+        context=SimpleNamespace(repl=repl),
+        browser_opener=lambda url: opened_urls.append(url) or True,  # records the URL and returns True
+    )
+
+    html = (session_dir / "prompt.html").read_text(encoding="utf-8")  # the command must have written this file
+    assert "待清理资源：stack-cleanup" in html
+    assert "cleanup prompt" in html
+    assert "stale pipeline prompt" not in html  # pipeline context is not exported
+    assert "stale pipeline message" not in html
+
+
 @pytest.mark.asyncio
 async def test_prompt_command_escapes_pipeline_prompt_html(tmp_path):
     ensure = AsyncMock(return_value=True)
diff --git a/tests/conftest.py b/tests/conftest.py
index 477146ad..32dc39b1 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -47,6 +47,20 @@ def _isolate_iac_home(tmp_path_factory, monkeypatch):
     monkeypatch.delenv("IAC_CODE_CONFIG_DIR", raising=False)
 
 
+@pytest.fixture(autouse=True)
+def _disable_tiktoken_encoding_downloads(monkeypatch):
+    """Keep tests from downloading tokenizer assets through tiktoken."""
+    try:
+        import tiktoken
+    except Exception:  # deliberately broad: any import failure just skips the patch
+        return  # tiktoken could not be imported, so there is nothing to patch
+    # NOTE(review): only tiktoken.get_encoding is replaced; other entry points may bypass it — confirm
+    def unavailable_encoding(_name):
+        raise RuntimeError("tiktoken encoding downloads are disabled in tests")
+
+    monkeypatch.setattr(tiktoken, "get_encoding", unavailable_encoding)  # undone by monkeypatch after each test
+
+
 @pytest.fixture(autouse=True)
 def _stamp_release_date(monkeypatch):
     """Simulate a packaged release build so the telemetry local-build gate
diff --git a/tests/memory/test_memory_tools.py b/tests/memory/test_memory_tools.py
index 5edf180a..ac7635f9 100644
--- a/tests/memory/test_memory_tools.py
+++ b/tests/memory/test_memory_tools.py
@@ -63,6 +63,28 @@ async def test_read_missing_memory_returns_error(self):
         assert result.is_error is True
         assert "not found" in result.content
 
+    async def test_read_missing_memory_returns_error_with_index_content(self):
+        manager = FakeMemoryManager()
+        manager.index_content = "- [role](role.md) — Role\n- [prefs](prefs.md) — Preferences\n"
+        tool = ReadMemoryTool(manager)
+
+        result = await tool.execute(tool_input={"name": "missing"}, context=ToolContext())  # name not in the index
+
+        assert result.is_error is True
+        assert "Memory 'missing' not found." in result.content
+        assert "Available memories:" in result.content  # index lines are echoed back in the error text
+        assert "- [role](role.md) — Role" in result.content
+        assert "- [prefs](prefs.md) — Preferences" in result.content
+        assert "Call read_memory again with one of these names" in result.content
+
+    async def test_read_missing_memory_returns_error_with_empty_index_message(self):
+        tool = ReadMemoryTool(FakeMemoryManager())  # manager used as constructed; index_content is not set here
+
+        result = await tool.execute(tool_input={"name": "missing"}, context=ToolContext())
+
+        assert result.is_error is True  # the whole message is compared below, not a substring
+        assert result.content == "Memory 'missing' not found.\n\nNo memories saved yet."
+
     async def test_read_without_name_returns_index_content(self):
         manager = FakeMemoryManager()
         manager.index_content = "memory index"
diff --git a/tests/pipeline/engine/test_cleanup.py b/tests/pipeline/engine/test_cleanup.py
new file mode 100644
index 00000000..ad727ddf
--- /dev/null
+++ b/tests/pipeline/engine/test_cleanup.py
@@ -0,0 +1,843 @@
+from __future__ import annotations
+
+import json
+import logging
+import threading
+import time
+
+import yaml
+
+import iac_code.pipeline.engine.cleanup as cleanup_module
+from iac_code.pipeline.engine.cleanup import (
+    CleanupLedger,
+    CleanupObserver,
+    CleanupResource,
+    ObservedResource,
+    cleanup_prompt_ledger_path,
+    create_cleanup_prompt_message,
+    is_active_cleanup_prompt_message,
+    mark_cleanup_prompt_message_completed,
+)
+from iac_code.types.stream_events import StackProgressEvent, ToolResultEvent, ToolUseEndEvent
+
+
+def _observed_stack() -> ObservedResource:  # shared sample: one "ros" stack observed via CreateStack
+    return ObservedResource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",  # id the tests below look up in the ledger
+        resource_name="demo",
+        region_id="cn-hangzhou",
+        source_step_id="deploying",
+        source_attempt_id="att_0001",
+        observed_action="CreateStack",
+        observed_at=1.0,
+        metadata={"tool_name": "ros_stack"},
+    )
+
+
+def test_ledger_persists_observed_and_required_resources(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    observed = _observed_stack()
+
+    ledger.record_observed(observed)
+    ledger.mark_cleanup_required(
+        [CleanupResource.from_observed(observed, reason="rollback requested")],
+        source_step_id="deploying",
+        reason="rollback requested",
+    )
+
+    restored = CleanupLedger(tmp_path / "cleanup.yaml")  # second instance on the same file path
+    assert restored.observed_resources()[0] == observed
+    pending = restored.pending_resources()
+    assert len(pending) == 1
+    assert pending[0].provider == "ros"  # identity fields mirror the values in _observed_stack()
+    assert pending[0].resource_type == "stack"
+    assert pending[0].resource_id == "stack-123"
+    assert pending[0].resource_name == "demo"
+    assert pending[0].region_id == "cn-hangzhou"
+    assert pending[0].cleanup_status == "pending"
+    assert pending[0].cleanup_required is True
+
+
+def test_pending_prompt_includes_active_resources_after_restart(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resources = [  # one resource each with status started / in_progress / completed
+        CleanupResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-started",
+            region_id="cn-hangzhou",
+            cleanup_status="started",
+            progress_status="DELETE_STARTED",
+        ),
+        CleanupResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-progress",
+            region_id="cn-hangzhou",
+            cleanup_status="in_progress",
+            progress_status="DELETE_IN_PROGRESS",
+        ),
+        CleanupResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-complete",
+            region_id="cn-hangzhou",
+            cleanup_status="completed",
+            progress_status="DELETE_COMPLETE",
+        ),
+    ]
+    ledger.mark_cleanup_required(resources, source_step_id="deploying", reason="rollback requested")
+
+    prompt = ledger.build_pending_prompt()
+
+    assert prompt is not None
+    assert [resource.resource_id for resource in prompt.resources] == ["stack-started", "stack-progress"]
+    assert "stack-started" in prompt.prompt
+    assert "stack-progress" in prompt.prompt
+    assert "stack-complete" not in prompt.prompt  # the completed resource is absent from the prompt text
+    assert "strict allowlist" in prompt.prompt  # remaining asserts pin exact phrases of the prompt wording
+    assert "delete only ids in the cleanup resources list below" in prompt.prompt
+    assert "Do not delete, modify, or roll back any stack or cloud resource outside the cleanup resources list" in (
+        prompt.prompt
+    )
+    assert "Do not call ListStacks or search for other stacks by name" in prompt.prompt
+    assert "verify that StackId exactly matches an id in the cleanup resources list" in prompt.prompt
+    assert "If StackId is not in the cleanup resources list, do not call DeleteStack" in prompt.prompt
+    assert "Do not infer extra cleanup targets from pipeline handoff" in prompt.prompt
+    assert "Do not expand cleanup scope for user follow-ups" in prompt.prompt
+    assert "When resuming cleanup, still process only resources listed in this prompt" in prompt.prompt
+    assert "如果用户只说“继续”" not in prompt.prompt  # zh: "if the user only says 'continue'"
+    assert "After all listed resources are DELETE_COMPLETE, stop this cleanup turn immediately" in prompt.prompt
+
+
+def test_ledger_records_prompt_queued_history(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    prompt = ledger.build_pending_prompt()
+    assert prompt is not None
+
+    ledger.record_prompt_queued(prompt, ui_surface="repl")
+
+    history = ledger._load()["history"]  # inspects the loaded data through the private loader
+    assert [entry["type"] for entry in history] == ["cleanup_required", "cleanup_prompt_queued"]
+    assert history[-1]["ui_surface"] == "repl"
+    assert history[-1]["resource_count"] == 1
+    assert history[-1]["resources"][0]["resource_id"] == "stack-123"
+    assert "prompt" not in history[-1]  # the queued entry carries no "prompt" key
+
+
+def test_cleanup_prompt_message_tracks_ledger_path_and_completion(tmp_path) -> None:
+    path = tmp_path / "cleanup.yaml"
+    message = create_cleanup_prompt_message(
+        "cleanup hidden prompt",
+        cleanup_ledger_path=path,
+        cleanup_status="pending",
+    )
+
+    assert cleanup_prompt_ledger_path(message) == str(path)  # path comes back as a string
+    assert is_active_cleanup_prompt_message(message)
+
+    assert mark_cleanup_prompt_message_completed(message, cleanup_ledger_path=path) is True
+
+    assert message.metadata["cleanupStatus"] == "completed"  # the same message object now reads completed
+    assert not is_active_cleanup_prompt_message(message)
+
+
+def test_observer_marks_ros_stack_delete_complete(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    observer = CleanupObserver(ledger)
+
+    observer.observe(  # tool-use event carrying the DeleteStack input
+        ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="ros_stack",
+            input={
+                "action": "DeleteStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123", "StackName": "demo"},
+            },
+        )
+    )
+    observer.observe(  # result event with the same tool_use_id
+        ToolResultEvent(
+            tool_use_id="toolu-delete",
+            tool_name="ros_stack",
+            result=json.dumps(
+                {
+                    "stack_id": "stack-123",
+                    "stack_name": "demo",
+                    "status": "DELETE_COMPLETE",
+                    "is_success": True,
+                }
+            ),
+            is_error=False,
+        )
+    )
+
+    [updated] = ledger.cleanup_resources()  # unpacking also requires exactly one resource
+    assert updated.cleanup_status == "completed"
+    assert updated.cleanup_tool_use_id == "toolu-delete"
+    assert updated.progress_status == "DELETE_COMPLETE"
+
+
+def test_observer_keeps_statusless_delete_stack_result_in_progress(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    observer = CleanupObserver(ledger)
+
+    observer.observe(
+        ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="ros_stack",
+            input={"action": "DeleteStack", "region_id": "cn-hangzhou", "params": {"StackId": "stack-123"}},
+        )
+    )
+    observer.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-delete",
+            tool_name="ros_stack",
+            result=json.dumps({"stack_id": "stack-123", "is_success": True}),  # no "status" key
+            is_error=False,
+        )
+    )
+
+    [updated] = ledger.cleanup_resources()
+    assert updated.cleanup_status == "in_progress"  # success without a status is not treated as completed
+    assert updated.progress_status == "DELETE_REQUESTED"
+    assert ledger.build_pending_prompt() is not None  # the resource still yields a pending prompt
+
+
+def test_observer_marks_ros_stack_delete_failed(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    observer = CleanupObserver(ledger)
+
+    observer.observe(
+        ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="ros_stack",
+            input={"action": "DeleteStack", "region_id": "cn-hangzhou", "params": {"StackId": "stack-123"}},
+        )
+    )
+    observer.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-delete",
+            tool_name="ros_stack",
+            result=json.dumps({"stack_id": "stack-123", "status": "DELETE_FAILED", "is_success": False}),
+            is_error=True,  # the result is flagged as an error and reports DELETE_FAILED
+        )
+    )
+
+    [updated] = ledger.cleanup_resources()
+    assert updated.cleanup_status == "failed"
+    assert updated.progress_status == "DELETE_FAILED"
+    assert updated.last_error  # only checks that some error text was stored, not its content
+
+
+def test_update_resource_sanitizes_durable_last_error(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="failed",
+        progress_status="DELETE_FAILED",
+        last_error=(  # sample text with secret-like tokens and a home-directory path
+            "AccessKeySecret=super-secret token=sk-live-1234567890 "
+            "Authorization: Bearer bearer-secret at /Users/alice/.iac-code/settings.yml"
+        ),
+    )
+
+    data = ledger._load()
+    resource_error = data["cleanup_resources"][0]["last_error"]
+    history_error = data["history"][-1]["last_error"]
+    for value in (resource_error, history_error):  # both stored copies must be scrubbed
+        assert "super-secret" not in value
+        assert "sk-live" not in value
+        assert "bearer-secret" not in value
+        assert "/Users/alice" not in value
+        assert "[REDACTED]" in value or "[PATH]" in value  # at least one placeholder is present
+
+
+def test_observer_tracks_aliyun_api_delete_then_get_stack_polling(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    observer = CleanupObserver(ledger)
+
+    observer.observe(
+        ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "DeleteStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+    )
+    observer.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-delete",
+            tool_name="aliyun_api",
+            result=json.dumps({"RequestId": "req-1"}),  # result has neither a stack id nor a status
+            is_error=False,
+        )
+    )
+    [started] = ledger.cleanup_resources()  # state after the DeleteStack call
+    assert started.cleanup_status == "in_progress"
+    assert started.progress_status == "DELETE_REQUESTED"
+
+    observer.observe(
+        ToolUseEndEvent(
+            tool_use_id="toolu-get-1",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "GetStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+    )
+    observer.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-get-1",
+            tool_name="aliyun_api",
+            result=json.dumps({"StackId": "stack-123", "Status": "DELETE_IN_PROGRESS"}),
+            is_error=False,
+        )
+    )
+    [progress] = ledger.cleanup_resources()  # state after the first GetStack poll
+    assert progress.cleanup_status == "in_progress"
+    assert progress.progress_status == "DELETE_IN_PROGRESS"
+
+    observer.observe(
+        ToolUseEndEvent(
+            tool_use_id="toolu-get-2",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "GetStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+    )
+    observer.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-get-2",
+            tool_name="aliyun_api",
+            result=json.dumps({"StackId": "stack-123", "Status": "DELETE_COMPLETE"}),
+            is_error=False,
+        )
+    )
+    [completed] = ledger.cleanup_resources()  # state after the second GetStack poll
+    assert completed.cleanup_status == "completed"
+    assert completed.progress_status == "DELETE_COMPLETE"
+
+
+def test_observer_clears_previous_error_after_retry_success(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="failed",  # start from a resource that already failed once
+        last_error="DELETE_FAILED",
+    )
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    observer = CleanupObserver(ledger)
+
+    observer.observe(
+        ToolUseEndEvent(
+            tool_use_id="toolu-get",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "GetStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+    )
+    observer.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-get",
+            tool_name="aliyun_api",
+            result=json.dumps({"StackId": "stack-123", "Status": "DELETE_COMPLETE"}),
+            is_error=False,
+        )
+    )
+
+    [completed] = ledger.cleanup_resources()
+    assert completed.cleanup_status == "completed"
+    assert completed.progress_status == "DELETE_COMPLETE"
+    assert completed.last_error is None  # the earlier "DELETE_FAILED" text is gone
+
+
+def test_terminal_cleanup_resource_ignores_late_nonterminal_or_failed_events(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",  # resource is already completed before any event arrives
+        progress_status="DELETE_COMPLETE",
+    )
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    observer = CleanupObserver(ledger)
+
+    observer.observe(  # late event 1: another DeleteStack call
+        ToolUseEndEvent(
+            tool_use_id="toolu-late-delete",
+            name="ros_stack",
+            input={"action": "DeleteStack", "region_id": "cn-hangzhou", "params": {"StackId": "stack-123"}},
+        )
+    )
+    observer.observe(  # late event 2: its status-less success result
+        ToolResultEvent(
+            tool_use_id="toolu-late-delete",
+            tool_name="ros_stack",
+            result=json.dumps({"stack_id": "stack-123", "is_success": True}),
+            is_error=False,
+        )
+    )
+    observer.observe(  # late event 3: a GetStack call
+        ToolUseEndEvent(
+            tool_use_id="toolu-late-get",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "GetStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+    )
+    observer.observe(  # late event 4: a DELETE_FAILED error result
+        ToolResultEvent(
+            tool_use_id="toolu-late-get",
+            tool_name="aliyun_api",
+            result=json.dumps({"StackId": "stack-123", "Status": "DELETE_FAILED"}),
+            is_error=True,
+        )
+    )
+
+    [completed] = ledger.cleanup_resources()
+    assert completed.cleanup_status == "completed"
+    assert completed.progress_status == "DELETE_COMPLETE"
+    assert completed.cleanup_tool_use_id is None  # neither late tool call was recorded on the resource
+    assert completed.last_error is None
+    assert ledger.build_pending_prompt() is None
+
+
+def test_mark_cleanup_required_skips_terminal_resources_without_history(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(  # first call: store one completed and one skipped resource
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-completed",
+                region_id="cn-hangzhou",
+                cleanup_status="completed",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-skipped",
+                region_id="cn-hangzhou",
+                cleanup_status="skipped",
+            ),
+        ],
+        source_step_id="deploying",
+        reason="rollback requested",
+    )
+    history_before = list(ledger._load()["history"])  # snapshot taken before the second call
+
+    ledger.mark_cleanup_required(  # second call: same ids re-submitted as pending
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-completed",
+                region_id="cn-hangzhou",
+                cleanup_status="pending",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-skipped",
+                region_id="cn-hangzhou",
+                cleanup_status="pending",
+            ),
+        ],
+        source_step_id="deploying",
+        reason="rollback requested again",
+    )
+
+    assert ledger._load()["history"] == history_before  # no history entry was appended
+    assert [resource.cleanup_status for resource in ledger.cleanup_resources()] == ["completed", "skipped"]
+
+
+def test_mark_cleanup_required_preserves_active_execution_fields(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    ledger.update_resource(  # put the resource into an in-progress delete with execution details
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="in_progress",
+        cleanup_tool_use_id="toolu-delete",
+        cleanup_action="DeleteStack",
+        progress_status="DELETE_IN_PROGRESS",
+        progress_percentage=30,
+        last_error="slow",
+    )
+
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested again")
+
+    [updated] = ledger.cleanup_resources()  # every field set by update_resource must be unchanged
+    assert updated.cleanup_status == "in_progress"
+    assert updated.cleanup_tool_use_id == "toolu-delete"
+    assert updated.cleanup_action == "DeleteStack"
+    assert updated.progress_status == "DELETE_IN_PROGRESS"
+    assert updated.progress_percentage == 30
+    assert updated.last_error == "slow"
+
+
+def test_observer_uses_persisted_tool_mapping_after_restart(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    CleanupObserver(ledger).observe(  # the first observer sees only the tool-use event
+        ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="ros_stack",
+            input={"action": "DeleteStack", "region_id": "cn-hangzhou", "params": {"StackId": "stack-123"}},
+        )
+    )
+
+    restarted = CleanupObserver(CleanupLedger(tmp_path / "cleanup.yaml"))  # new observer and ledger, same file
+    restarted.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-delete",
+            tool_name="ros_stack",
+            result=json.dumps({"stack_id": "stack-123", "status": "DELETE_COMPLETE"}),
+            is_error=False,
+        )
+    )
+
+    [updated] = CleanupLedger(tmp_path / "cleanup.yaml").cleanup_resources()  # read back via a third instance
+    assert updated.cleanup_status == "completed"
+
+
+def test_observer_rejects_persisted_mapping_result_stack_id_mismatch(tmp_path, caplog) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(provider="ros", resource_type="stack", resource_id="stack-a", region_id="cn-hangzhou"),
+            CleanupResource(provider="ros", resource_type="stack", resource_id="stack-b", region_id="cn-hangzhou"),
+        ],
+        source_step_id="deploying",
+        reason="rollback requested",
+    )
+    ledger.record_tool_use_mapping(  # mapping written directly; no ToolUseEndEvent is observed in this test
+        tool_use_id="toolu-delete-a",
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-a",
+        region_id="cn-hangzhou",
+        action="DeleteStack",
+        tool_name="ros_stack",
+        tool_input={"action": "DeleteStack", "region_id": "cn-hangzhou", "params": {"StackId": "stack-a"}},
+    )
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.cleanup")
+    unsafe_stack_id = "stack-b AccessKeySecret=super-secret /Users/alice/.iac-code/settings.yml"
+
+    CleanupObserver(CleanupLedger(tmp_path / "cleanup.yaml")).observe(
+        ToolResultEvent(
+            tool_use_id="toolu-delete-a",  # id mapped to stack-a above; the result names a different StackId
+            tool_name="ros_stack",
+            result=json.dumps({"StackId": unsafe_stack_id, "Status": "DELETE_COMPLETE"}),
+            is_error=False,
+        )
+    )
+
+    resources = {
+        resource.resource_id: resource for resource in CleanupLedger(tmp_path / "cleanup.yaml").cleanup_resources()
+    }
+    assert resources["stack-a"].cleanup_status == "pending"  # neither resource was updated
+    assert resources["stack-b"].cleanup_status == "pending"
+    history = CleanupLedger(tmp_path / "cleanup.yaml").history_entries()
+    assert history[-1]["type"] == "cleanup_tool_result_mismatch"
+    assert history[-1]["tool_use_id"] == "toolu-delete-a"
+    assert history[-1]["mapped_resource_id"] == "stack-a"
+    assert history[-1]["result_resource_id"] != unsafe_stack_id  # stored id is scrubbed, not the raw value
+    assert "super-secret" not in history[-1]["result_resource_id"]
+    assert "/Users/alice" not in history[-1]["result_resource_id"]
+    assert "[REDACTED]" in history[-1]["result_resource_id"]
+    assert "[PATH]" in history[-1]["result_resource_id"]
+    assert history[-1]["tool_name"] == "ros_stack"
+    assert "Mismatched cleanup tool result" in caplog.text  # the captured log text is held to the same scrubbing
+    assert "super-secret" not in caplog.text
+    assert "/Users/alice" not in caplog.text
+    assert "settings.yml" not in caplog.text
+    assert "[REDACTED]" in caplog.text
+    assert "[PATH]" in caplog.text
+
+
+def test_observer_rejects_in_memory_tool_result_stack_id_mismatch(tmp_path, caplog) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(provider="ros", resource_type="stack", resource_id="stack-a", region_id="cn-hangzhou"),
+            CleanupResource(provider="ros", resource_type="stack", resource_id="stack-b", region_id="cn-hangzhou"),
+        ],
+        source_step_id="deploying",
+        reason="rollback requested",
+    )
+    observer = CleanupObserver(ledger)  # the same observer sees both the tool use and its result
+    observer.observe(
+        ToolUseEndEvent(
+            tool_use_id="toolu-delete-a",
+            name="ros_stack",
+            input={"action": "DeleteStack", "region_id": "cn-hangzhou", "params": {"StackId": "stack-a"}},
+        )
+    )
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.cleanup")
+
+    observer.observe(
+        ToolResultEvent(
+            tool_use_id="toolu-delete-a",
+            tool_name="ros_stack",
+            result=json.dumps({"StackId": "stack-b", "Status": "DELETE_COMPLETE"}),  # names stack-b, not stack-a
+            is_error=False,
+        )
+    )
+
+    resources = {resource.resource_id: resource for resource in ledger.cleanup_resources()}
+    assert resources["stack-a"].cleanup_status == "started"  # not completed despite DELETE_COMPLETE in the result
+    assert resources["stack-b"].cleanup_status == "pending"
+    assert ledger.history_entries()[-1]["type"] == "cleanup_tool_result_mismatch"
+    assert "Mismatched cleanup tool result" in caplog.text
+
+
+def test_observer_records_history_warning_for_unmatched_cleanup_tool_result(tmp_path, caplog) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.cleanup")
+
+    CleanupObserver(ledger).observe(
+        ToolResultEvent(
+            tool_use_id="toolu-missing",  # no tool-use event or mapping exists for this id
+            tool_name="ros_stack",
+            result=json.dumps({"stack_id": "stack-123", "status": "DELETE_COMPLETE"}),
+            is_error=False,
+        )
+    )
+
+    [pending] = ledger.cleanup_resources()
+    assert pending.cleanup_status == "pending"  # the resource is not updated from the unmatched result
+    history = ledger.history_entries()
+    assert history[-1]["type"] == "cleanup_tool_result_unmatched"
+    assert history[-1]["tool_use_id"] == "toolu-missing"
+    assert history[-1]["tool_name"] == "ros_stack"
+    assert "Unmatched cleanup tool result" in caplog.text
+
+
+def test_corrupt_ledger_records_unavailable_without_overwrite(tmp_path) -> None:
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated YAML flow sequence
+    ledger = CleanupLedger(path)
+
+    status = ledger.mark_cleanup_required(
+        [CleanupResource.from_observed(_observed_stack(), reason="rollback")],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+
+    assert path.read_text(encoding="utf-8") == "[broken"  # file content is byte-for-byte unchanged
+    assert ledger.load_failed()
+    assert ledger.load_error()
+    assert status.written is False
+    assert status.unavailable is True
+    assert status.reason == "load_failed"
+    assert status.load_error
+
+
+def test_corrupt_ledger_record_observed_reports_unavailable_without_overwrite(tmp_path) -> None:
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated YAML flow sequence
+    ledger = CleanupLedger(path)
+
+    status = ledger.record_observed(_observed_stack())  # the returned status object is inspected below
+
+    assert path.read_text(encoding="utf-8") == "[broken"  # file content is byte-for-byte unchanged
+    assert status.written is False
+    assert status.unavailable is True
+    assert status.reason == "load_failed"
+    assert status.load_error
+
+
+def test_cleanup_ledger_save_uses_state_io_atomic_durable_write(tmp_path, monkeypatch) -> None:
+    calls = []  # (path, content, durable) tuples captured by the fake writer
+
+    def fake_atomic_write_text(path, content, *, durable=True, **_kwargs):
+        calls.append((path, content, durable))
+        path.write_text(content, encoding="utf-8")  # still write the file so later reads work
+
+    monkeypatch.setattr(cleanup_module, "atomic_write_text", fake_atomic_write_text, raising=False)
+    path = tmp_path / "cleanup.yaml"
+    ledger = CleanupLedger(path)
+
+    ledger.mark_cleanup_required(
+        [CleanupResource.from_observed(_observed_stack(), reason="rollback requested")],
+        source_step_id="deploying",
+        reason="rollback requested",
+    )
+
+    assert len(calls) == 1  # exactly one write for one mark_cleanup_required call
+    saved_path, content, durable = calls[0]
+    assert saved_path == path
+    assert durable is True
+    saved = yaml.safe_load(content)  # the written content must parse as YAML
+    assert saved["cleanup_resources"][0]["resource_id"] == "stack-123"
+
+
+def test_mark_cleanup_required_serializes_read_modify_write_for_same_path(tmp_path) -> None:
+    first_save_entered = threading.Event()  # set once the first writer has reached _save
+    save_lock = threading.Lock()
+    save_count = 0
+
+    class SlowFirstSaveLedger(CleanupLedger):
+        def _save(self, data):
+            nonlocal save_count
+            with save_lock:  # guards only the shared counter, not the save itself
+                save_count += 1
+                current_save = save_count
+            if current_save == 1:
+                first_save_entered.set()
+                time.sleep(0.25)  # hold the first save open so the second writer overlaps it
+            super()._save(data)
+
+    path = tmp_path / "cleanup.yaml"
+    errors = []  # exceptions raised inside worker threads, surfaced by the assert below
+
+    def mark_required(resource_id: str) -> None:
+        try:
+            resource = CleanupResource.from_observed(
+                ObservedResource(
+                    provider="ros",
+                    resource_type="stack",
+                    resource_id=resource_id,
+                    region_id="cn-hangzhou",
+                    source_step_id="deploying",
+                    observed_action="CreateStack",
+                ),
+                reason="rollback requested",
+            )
+            SlowFirstSaveLedger(path).mark_cleanup_required(  # each thread uses its own ledger instance
+                [resource],
+                source_step_id="deploying",
+                reason="rollback requested",
+            )
+        except Exception as exc:  # pragma: no cover - surfaced by assertion below
+            errors.append(exc)
+
+    first = threading.Thread(target=mark_required, args=("stack-one",), daemon=True)
+    second = threading.Thread(target=mark_required, args=("stack-two",), daemon=True)
+
+    first.start()
+    assert first_save_entered.wait(timeout=1)  # start the second writer only while the first is mid-save
+    second.start()
+    first.join(timeout=2)  # bounded wait; daemon threads cannot block interpreter exit if a writer hangs
+    second.join(timeout=2)
+
+    assert not first.is_alive()
+    assert not second.is_alive()
+    assert errors == []
+    resources = CleanupLedger(path).cleanup_resources()
+    assert sorted(resource.resource_id for resource in resources) == ["stack-one", "stack-two"]  # no lost update
+
+
+def test_corrupt_ledger_non_empty_writes_do_not_mutate_or_replace_file(tmp_path) -> None:
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated YAML flow sequence
+    ledger = CleanupLedger(path)
+
+    ledger.record_observed(_observed_stack())  # both write attempts carry real data
+    ledger.mark_cleanup_required(
+        [CleanupResource.from_observed(_observed_stack(), reason="rollback requested")],
+        source_step_id="deploying",
+        reason="rollback requested",
+    )
+
+    assert path.read_text(encoding="utf-8") == "[broken"
+    assert not list(tmp_path.glob("cleanup.yaml.corrupt*"))  # no cleanup.yaml.corrupt* sibling was created
+    assert ledger.load_failed() is True
+    assert ledger.observed_resources() == []  # reads on the corrupt ledger return empty lists
+    assert ledger.cleanup_resources() == []
+
+
+def test_corrupt_ledger_update_does_not_write_empty_replacement(tmp_path) -> None:
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated YAML flow sequence
+    ledger = CleanupLedger(path)
+
+    assert ledger.load_failed() is True  # the failure is reported before any write is attempted
+    assert ledger.load_error()
+
+    changed = ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+    )
+
+    assert changed is False  # update_resource reports that nothing changed
+    assert path.exists()
+    assert path.read_text(encoding="utf-8") == "[broken"
+    assert not list(tmp_path.glob("cleanup.yaml.corrupt*"))  # no cleanup.yaml.corrupt* sibling was created
+
+
+def test_observer_updates_progress_from_stack_progress_event(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    resource = CleanupResource.from_observed(_observed_stack(), reason="rollback requested")
+    ledger.mark_cleanup_required([resource], source_step_id="deploying", reason="rollback requested")
+    observer = CleanupObserver(ledger)
+
+    observer.observe(  # a progress event alone; no tool-use or tool-result events are sent
+        StackProgressEvent(
+            stack_id="stack-123",
+            stack_name="demo",
+            status="DELETE_IN_PROGRESS",
+            progress_percentage=60,
+            resources=[],
+            elapsed_seconds=12,
+        )
+    )
+
+    [updated] = ledger.cleanup_resources()
+    assert updated.cleanup_status == "in_progress"
+    assert updated.progress_status == "DELETE_IN_PROGRESS"  # status and percentage are taken from the event
+    assert updated.progress_percentage == 60
diff --git a/tests/pipeline/engine/test_complete_step_tool.py b/tests/pipeline/engine/test_complete_step_tool.py
index 0272e233..d31514cf 100644
--- a/tests/pipeline/engine/test_complete_step_tool.py
+++ b/tests/pipeline/engine/test_complete_step_tool.py
@@ -217,6 +217,176 @@ async def test_rejects_when_rollback_target_count_exceeds_limit(self):
 
 
 class TestCompletionGuards:
+    @staticmethod
+    def _deploying_success_guard() -> dict:  # completion guard config that _deploying_tool passes to CompleteStepTool
+        return {
+            "when_conclusion_field_equals": {"status": "success"},
+            "required_conclusion_field": "stack_id",
+            "require_tool_result": {
+                "tool": "ros_stack",
+                "action_in": ["CreateStack", "ContinueCreateStack"],
+                "is_success": True,
+                "status_in": ["CREATE_COMPLETE"],
+                "match_conclusion_field": "stack_id",
+            },
+            "message": "部署成功必须等待 ros_stack CreateStack 返回 CREATE_COMPLETE。",  # roughly: a successful deployment must wait for ros_stack CreateStack to return CREATE_COMPLETE
+        }
+
+    @staticmethod
+    def _deploying_tool(result_records: list[dict] | None = None) -> CompleteStepTool:  # tool for step "deploying" wired with the success guard
+        config = StepConfig(
+            step_id="deploying",
+            conclusion_field="deployment",
+            forward=None,
+            conclusion_schema={
+                "type": "object",
+                "required": ["status"],  # stack_id and error stay optional at schema level
+                "additionalProperties": False,
+                "properties": {
+                    "stack_id": {"type": "string"},
+                    "status": {"type": "string", "enum": ["success", "failed", "cancelled"]},
+                    "error": {"type": "string"},
+                },
+            },
+        )
+        return CompleteStepTool(
+            config,
+            completion_guards=[TestCompletionGuards._deploying_success_guard()],
+            completion_guard_state={
+                "successful_tools": set(),
+                "tool_results": {},
+                "tool_result_records": list(result_records or []),  # None becomes []; otherwise a shallow copy of the caller's list
+            },
+        )
+
+    @pytest.mark.asyncio
+    async def test_required_tool_result_rejects_deploying_success_without_create_stack_result(self):
+        tool = self._deploying_tool()
+        # Claim success although the guard state holds no tool result records at all.
+        result = await tool.execute(
+            tool_input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+            context=ToolContext(),
+        )
+        # Rejected; the error content should mention both the action and the required status.
+        assert result.is_error
+        assert "CreateStack" in result.content
+        assert "CREATE_COMPLETE" in result.content
+
+    @pytest.mark.asyncio
+    async def test_required_tool_result_rejects_deploying_success_when_stack_creation_failed(self):
+        tool = self._deploying_tool(
+            [
+                {
+                    "tool_name": "ros_stack",
+                    "input": {"action": "CreateStack", "params": {"StackName": "demo"}},
+                    "result": {"stack_id": "stack-123", "status": "CREATE_FAILED", "is_success": False},
+                    "is_error": True,
+                }
+            ]
+        )
+        # The conclusion claims success for stack-123 although the only record is a failed CreateStack.
+        result = await tool.execute(
+            tool_input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+            context=ToolContext(),
+        )
+        # Rejected; the error content should mention the status that was required.
+        assert result.is_error
+        assert "CREATE_COMPLETE" in result.content
+
+    @pytest.mark.asyncio
+    async def test_required_tool_result_rejects_deploying_success_when_stack_id_mismatches(self):
+        tool = self._deploying_tool(
+            [
+                {
+                    "tool_name": "ros_stack",
+                    "input": {"action": "CreateStack", "params": {"StackName": "demo"}},
+                    "result": {"stack_id": "stack-123", "status": "CREATE_COMPLETE", "is_success": True},
+                    "is_error": False,
+                }
+            ]
+        )
+        # The conclusion names stack-other while the recorded successful result is for stack-123.
+        result = await tool.execute(
+            tool_input={"conclusion": {"status": "success", "stack_id": "stack-other"}},
+            context=ToolContext(),
+        )
+        # Rejected; the error content should mention the mismatching field.
+        assert result.is_error
+        assert "stack_id" in result.content
+
+    @pytest.mark.asyncio
+    async def test_required_tool_result_accepts_matching_deploying_success(self):
+        tool = self._deploying_tool(
+            [
+                {
+                    "tool_name": "ros_stack",
+                    "input": {"action": "CreateStack", "params": {"StackName": "demo"}},
+                    "result": {"stack_id": "stack-123", "status": "CREATE_COMPLETE", "is_success": True},
+                    "is_error": False,
+                }
+            ]
+        )
+        # The conclusion's stack_id equals the stack_id of the recorded CREATE_COMPLETE result.
+        result = await tool.execute(
+            tool_input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+            context=ToolContext(),
+        )
+        # Accepted without error.
+        assert not result.is_error
+
+    @pytest.mark.asyncio
+    async def test_required_tool_result_accepts_matching_continue_create_stack_success(self):
+        tool = self._deploying_tool(
+            [
+                {
+                    "tool_name": "ros_stack",
+                    "input": {"action": "ContinueCreateStack", "params": {"StackName": "demo"}},
+                    "result": {"stack_id": "stack-123", "status": "CREATE_COMPLETE", "is_success": True},
+                    "is_error": False,
+                }
+            ]
+        )
+        # The recorded action is ContinueCreateStack, which the guard's action_in list also contains.
+        result = await tool.execute(
+            tool_input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+            context=ToolContext(),
+        )
+        # Accepted without error.
+        assert not result.is_error
+
+    @pytest.mark.asyncio
+    async def test_required_tool_result_rejects_non_matching_stack_action(self):
+        tool = self._deploying_tool(
+            [
+                {
+                    "tool_name": "ros_stack",
+                    "input": {"action": "UpdateStack", "params": {"StackName": "demo"}},
+                    "result": {"stack_id": "stack-123", "status": "CREATE_COMPLETE", "is_success": True},
+                    "is_error": False,
+                }
+            ]
+        )
+        # The only record is an UpdateStack call, which is not in the guard's action_in list.
+        result = await tool.execute(
+            tool_input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+            context=ToolContext(),
+        )
+        # Rejected; the error content should name the allowed actions.
+        assert result.is_error
+        assert "CreateStack" in result.content  # note: also a substring of "ContinueCreateStack"
+        assert "ContinueCreateStack" in result.content
+
+    @pytest.mark.asyncio
+    async def test_required_tool_result_does_not_block_failed_deploying_conclusion(self):
+        tool = self._deploying_tool()
+        # A failed conclusion does not satisfy the guard's status == "success" condition.
+        result = await tool.execute(
+            tool_input={"conclusion": {"status": "failed", "error": "CREATE_FAILED"}},
+            context=ToolContext(),
+        )
+        # Accepted without error even though no tool result records exist.
+        assert not result.is_error
+
     @pytest.mark.asyncio
     async def test_required_conclusion_any_of_accepts_clarification_text(self):
         config = StepConfig(step_id="intent_parsing", conclusion_field="intent", forward=None)
diff --git a/tests/pipeline/engine/test_display_replay.py b/tests/pipeline/engine/test_display_replay.py
index 3b88d57b..1a4eab1a 100644
--- a/tests/pipeline/engine/test_display_replay.py
+++ b/tests/pipeline/engine/test_display_replay.py
@@ -32,6 +32,26 @@ def test_recorder_and_reducer_preserve_repeated_attempts_after_rollback(tmp_path
     assert model.interrupted is True
 
 
+def test_display_replay_ignores_pipeline_warning_without_terminal_change(tmp_path) -> None:
+    path = tmp_path / "display.jsonl"
+    recorder = PipelineDisplayRecorder(path)
+    # Record a started pipeline and step, followed by a pipeline_warning for the same step.
+    recorder.record("pipeline_started", pipeline_name="selling", timestamp=1.0)
+    recorder.record("step_started", step_id="deploying", payload={"index": 1, "total": 1}, timestamp=1.5)
+    recorder.record(
+        "pipeline_warning",
+        step_id="deploying",
+        payload={"reason": "cleanup_tracking_unavailable"},
+        timestamp=2.0,
+    )
+    # Rebuild the display model from the events loaded back from the recorder's path.
+    model = PipelineDisplayReducer().reduce(load_display_events(path))
+    # The warning must not flip any terminal flag; the last attempt is still running.
+    assert model.interrupted is False
+    assert model.failed is False
+    assert model.attempts[-1].status == "running"
+
+
 def test_reducer_attaches_transcript_ids_from_event_payload_and_attempt_metadata(tmp_path):
     path = tmp_path / "display.jsonl"
     recorder = PipelineDisplayRecorder(path)
diff --git a/tests/pipeline/engine/test_interrupt.py b/tests/pipeline/engine/test_interrupt.py
index ee46e213..565ecefe 100644
--- a/tests/pipeline/engine/test_interrupt.py
+++ b/tests/pipeline/engine/test_interrupt.py
@@ -6,6 +6,9 @@
 
 import pytest
 
+from iac_code.agent.message import ImageBlock, TextBlock
+from iac_code.pipeline.engine.user_input import PipelineUserInput
+
 
 class TestInterruptVerdict:
     def test_verdict_creation(self):
@@ -101,6 +104,49 @@ async def test_judge_parses_valid_response(self):
         assert verdict.action == "hard_interrupt"
         assert verdict.rollback_target == "intent_parsing"
 
+    @pytest.mark.asyncio
+    async def test_judge_sends_image_blocks_to_provider(self):
+        from iac_code.pipeline.engine.interrupt import InterruptController
+        # Filled in by the stub provider so the test can inspect what judge() sent.
+        captured = {}
+        # Stub provider: stores the messages and returns an object whose .text is a "supplement" verdict JSON.
+        class ProviderManager:
+            async def complete(self, *, messages, system, tools=None, max_tokens=8192, cache_policy="default"):
+                captured["messages"] = messages
+                return type(
+                    "Response",
+                    (),
+                    {
+                        "text": (
+                            '{"action":"supplement","reason":"image updates current step",'
+                            '"rollback_target":null,"candidate_scope":null,'
+                            '"supplement_target":null,"rollback_context":null}'
+                        )
+                    },
+                )()
+        # The second argument is a callable returning a minimal pipeline description (its exact role is not visible here).
+        controller = InterruptController(
+            ProviderManager(),
+            lambda: {"pipeline_name": "selling", "steps": []},
+        )
+        image = ImageBlock(media_type="image/png", data="aGVsbG8=")
+        verdict = await controller.judge(
+            PipelineUserInput(
+                content=[TextBlock(text="see diagram"), image],
+                display_text="see diagram",
+                has_images=True,
+            )
+        )
+        # The first captured message should hold a text block followed by the image block, unchanged.
+        assert verdict.action == "supplement"
+        message = captured["messages"][0]
+        assert isinstance(message.content, list)
+        assert message.content[0].type == "text"
+        assert "用户同时提供了图片输入" in (message.content[0].text or "")  # roughly: "the user also provided image input"
+        assert message.content[1].type == "image"
+        assert message.content[1].media_type == "image/png"
+        assert message.content[1].data == "aGVsbG8="
+
     @pytest.mark.asyncio
     async def test_judge_invalid_json_returns_continue(self):
         from iac_code.pipeline.engine.interrupt import InterruptController
diff --git a/tests/pipeline/engine/test_loader.py b/tests/pipeline/engine/test_loader.py
index 9fd05d28..41597451 100644
--- a/tests/pipeline/engine/test_loader.py
+++ b/tests/pipeline/engine/test_loader.py
@@ -48,6 +48,32 @@ def test_loads_basic_pipeline(self, tmp_path):
         assert loaded.steps[1].context_fields == ["intent"]
         assert loaded.max_rollbacks == 2
 
+    def test_ignores_legacy_step_rollback_section(self, tmp_path):
+        yaml_content = dedent("""\
+            name: test
+            context_dependencies:
+              intent: []
+              architecture: [intent]
+            max_rollbacks: 2
+            steps:
+              - id: step_a
+                conclusion_field: intent
+                forward: step_b
+                prompt: prompts/step_a.md
+              - id: step_b
+                conclusion_field: architecture
+                forward: null
+                prompt: prompts/step_b.md
+                rollback:
+                  - target: step_a
+                    condition: revise_intent
+        """)
+        _write_pipeline(tmp_path, yaml_content, {"step_a.md": "Do A", "step_b.md": "Do B"})
+        # Loading is expected to succeed even though step_b still declares a rollback: section.
+        loaded = load_pipeline_dir(tmp_path)
+        # The loaded step_b exposes no rollback_rules attribute at all.
+        assert not hasattr(loaded.steps[1], "rollback_rules")
+
     def test_selling_iac_aliyun_skill_reference_file_uses_bundled_root_fallback(self, tmp_path):
         _write_pipeline(tmp_path, MINIMAL_YAML, {"step_a.md": "Do A", "step_b.md": "Do B with {intent}"})
         skill_dir = tmp_path / "skills" / "iac-aliyun-cost"
@@ -452,6 +478,34 @@ def test_inject_tools_default_empty(self, tmp_path):
         assert loaded.steps[0].inject_tools == []
 
 
+class TestSurfaceOverridesParsing:  # loader parsing of a step's surface_overrides mapping
+    def test_surface_overrides_parse_prompt_and_inject_tools(self, tmp_path):
+        yaml_content = dedent("""\
+            name: test
+            context_dependencies:
+              result: []
+            max_rollbacks: 1
+            steps:
+              - id: confirm
+                conclusion_field: result
+                forward: null
+                prompt: prompts/confirm.md
+                inject_tools: [show_architecture_diagram, show_candidate_detail]
+                surface_overrides:
+                  a2a:
+                    prompt: prompts/confirm.a2a.md
+                    inject_tools: []
+        """)
+        _write_pipeline(tmp_path, yaml_content, {"confirm.md": "C", "confirm.a2a.md": "A2A"})
+        # Load the pipeline and take its only step.
+        loaded = load_pipeline_dir(tmp_path)
+        step = loaded.steps[0]
+        # The a2a override keeps its own prompt file and an explicit empty tool list; the base tool list is unchanged.
+        assert step.surface_overrides["a2a"].prompt_file == "prompts/confirm.a2a.md"
+        assert step.surface_overrides["a2a"].inject_tools == []
+        assert step.inject_tools == ["show_architecture_diagram", "show_candidate_detail"]
+
+
 class TestUiMode:
     def test_ui_mode_parsed_from_yaml(self, tmp_path):
         yaml_content = dedent("""\
diff --git a/tests/pipeline/engine/test_loader_hooks.py b/tests/pipeline/engine/test_loader_hooks.py
new file mode 100644
index 00000000..233620c7
--- /dev/null
+++ b/tests/pipeline/engine/test_loader_hooks.py
@@ -0,0 +1,47 @@
+from __future__ import annotations
+
+import textwrap
+
+from iac_code.pipeline.engine.loader import load_pipeline_dir
+
+
+def test_loader_binds_cleanup_hook_functions(tmp_path) -> None:
+    (tmp_path / "pipeline.yaml").write_text(
+        textwrap.dedent(
+            """
+            name: cleanup-hooks
+            context_dependencies:
+              deployment: []
+            steps:
+              - id: deploying
+                conclusion_field: deployment
+                forward: null
+                prompt: deploying.md
+                hooks_file: hooks/deploying.py
+            """
+        ),
+        encoding="utf-8",
+    )
+    (tmp_path / "deploying.md").write_text("deploy", encoding="utf-8")
+    hooks_dir = tmp_path / "hooks"
+    hooks_dir.mkdir()
+    (hooks_dir / "deploying.py").write_text(
+        textwrap.dedent(
+            """
+            def on_resource_observed(*args, **kwargs):
+                return None
+
+            def on_rollback_cleanup_required(*args, **kwargs):
+                return []
+            """
+        ),
+        encoding="utf-8",
+    )
+    # Load the directory; the pipeline declares exactly one step.
+    loaded = load_pipeline_dir(tmp_path)
+    [step] = loaded.steps
+    # Both functions written to hooks/deploying.py should be bound on the step under their own names.
+    assert step.on_resource_observed is not None
+    assert step.on_resource_observed.__name__ == "on_resource_observed"
+    assert step.on_rollback_cleanup_required is not None
+    assert step.on_rollback_cleanup_required.__name__ == "on_rollback_cleanup_required"
diff --git a/tests/pipeline/engine/test_pipeline_observability.py b/tests/pipeline/engine/test_pipeline_observability.py
index 4ceb2885..e8edb61b 100644
--- a/tests/pipeline/engine/test_pipeline_observability.py
+++ b/tests/pipeline/engine/test_pipeline_observability.py
@@ -12,7 +12,7 @@
 from iac_code.pipeline.engine.pipeline_runner import PipelineRunner
 from iac_code.pipeline.engine.session import RestoreResult
 from iac_code.pipeline.engine.step_spec import LoadedPipeline, StepSpec, SubPipelineSpec
-from iac_code.pipeline.engine.types import RollbackRule, StepResult, StepStatus
+from iac_code.pipeline.engine.types import StepResult, StepStatus
 from iac_code.services.telemetry.config import ContentCaptureMode
 from iac_code.services.telemetry.names import Events, GenAiAttr, GenAiOperationName, GenAiSpanKind, Metrics, Spans
 
@@ -1491,7 +1491,6 @@ def test_restore_from_sidecar_emits_sidecar_failed_for_real_restore_failure(runn
 async def test_runner_emits_parent_rollback_telemetry(runner):
     runner._observability.rollback = MagicMock()
     runner.state_machine.advance()
-    runner.state_machine.current_step.rollback_rules.append(RollbackRule(target_step="a", condition="revise"))
 
     async def fake_execute(step, context, session_id, user_message=None, **kwargs):
         conclusion = {"value": step.step_id}
@@ -1529,7 +1528,6 @@ async def test_runner_distinguishes_step_attempts_after_parent_rollback(runner):
     runner._observability.step_completed = MagicMock()
     runner._observability.funnel_step = MagicMock()
     runner._observability.rollback = MagicMock()
-    runner.state_machine._steps["b"].rollback_rules.append(RollbackRule(target_step="a", condition="revise"))
     seen: dict[str, int] = {"a": 0, "b": 0}
 
     async def fake_execute(step, context, session_id, user_message=None, **kwargs):
diff --git a/tests/pipeline/engine/test_pipeline_runner.py b/tests/pipeline/engine/test_pipeline_runner.py
index 9fa33bd8..f00c47bf 100644
--- a/tests/pipeline/engine/test_pipeline_runner.py
+++ b/tests/pipeline/engine/test_pipeline_runner.py
@@ -9,6 +9,7 @@
 import yaml
 
 from iac_code.agent.message import Message, ToolResultBlock
+from iac_code.pipeline.engine.cleanup import CleanupLedger, CleanupResource, ObservedResource
 from iac_code.pipeline.engine.context import PipelineContext
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
 from iac_code.pipeline.engine.pipeline_runner import PipelineRunner
@@ -17,6 +18,7 @@
 from iac_code.pipeline.engine.transcript_storage import PipelineTranscriptStorage
 from iac_code.pipeline.engine.types import StepResult, StepStatus
 from iac_code.services.session_storage import SessionStorage
+from iac_code.types.stream_events import ResourceObservedEvent
 
 
 def _selling_dir() -> Path:
@@ -35,6 +37,19 @@ def session_path(self, cwd, session_id):
         return self._path
 
 
+class FailingAppendMetaSessionStorage(FakeSessionStorage):  # test double whose append_meta raises OSError on demand
+    def __init__(self, fail_types: set[str] | None = None):
+        super().__init__()
+        self.fail_types = fail_types  # None means every append_meta call fails
+        self.append_attempts = []
+
+    def append_meta(self, cwd, session_id, meta):
+        self.append_attempts.append(meta)  # recorded before any failure is raised
+        if self.fail_types is None or meta.get("type") in self.fail_types:
+            raise OSError("session meta unavailable")
+        super().append_meta(cwd, session_id, meta)
+
+
 class DirectorySessionStorage(FakeSessionStorage):
     def __init__(self, root: Path):
         super().__init__()
@@ -120,6 +135,41 @@ def save_rollback_sync(
         raise OSError("sidecar unavailable")
 
 
+class FailingAfterAdvancePipelineSession(RecordingPipelineSession):  # save_running fails only for the checkpoint with current_step "b" and reason "advanced from a"
+    async def save_running(
+        self, current_step, state_machine_snapshot, context_snapshot, pipeline_identity, reason=None, **kwargs
+    ):
+        self.calls.append(("running_attempted", current_step, state_machine_snapshot["current_index"], reason))  # logged before the failure check; the parent save_running is not called
+        if current_step == "b" and reason == "advanced from a":
+            raise OSError("sidecar unavailable")
+
+
+class FailingFinalCompletedPipelineSession(RecordingPipelineSession):  # save_completed always fails after logging the attempt
+    async def save_completed(
+        self, current_step, state_machine_snapshot, context_snapshot, pipeline_identity, reason=None, **kwargs
+    ):
+        self.calls.append(("completed_attempted", current_step, state_machine_snapshot["current_index"], reason))  # lets tests assert the save was attempted
+        raise OSError("sidecar unavailable")
+
+
+class FailingCandidateFailedPipelineSession(RecordingPipelineSession):  # save_running fails only when reason is "parallel candidate failed"
+    async def save_running(
+        self, current_step, state_machine_snapshot, context_snapshot, pipeline_identity, reason=None, **kwargs
+    ):
+        self.calls.append(("running_attempted", current_step, state_machine_snapshot["current_index"], reason))  # logged before the failure check; the parent save_running is not called
+        if reason == "parallel candidate failed":
+            raise OSError("sidecar unavailable")
+
+
+class FailingUserInputCheckpointPipelineSession(RecordingPipelineSession):  # save_running fails for the two user-input checkpoint reasons listed below
+    async def save_running(
+        self, current_step, state_machine_snapshot, context_snapshot, pipeline_identity, reason=None, **kwargs
+    ):
+        self.calls.append(("running_attempted", current_step, state_machine_snapshot["current_index"], reason))  # logged before the failure check; the parent save_running is not called
+        if reason in {"user input received", "pipeline pause confirmation received"}:
+            raise OSError("sidecar unavailable")
+
+
 class CapturingPipelineSession(RecordingPipelineSession):
     def __init__(self):
         super().__init__()
@@ -142,7 +192,7 @@ async def save_failed(
         )
 
 
-def _build_two_step_runner(tmp_path, *, auto_advance_first=True):
+def _build_two_step_runner(tmp_path, *, auto_advance_first=True, storage=None):
     (tmp_path / "prompts").mkdir(exist_ok=True)
     (tmp_path / "prompts" / "a.md").write_text("A", encoding="utf-8")
     (tmp_path / "prompts" / "b.md").write_text("B", encoding="utf-8")
@@ -173,7 +223,7 @@ def _build_two_step_runner(tmp_path, *, auto_advance_first=True):
         pipeline_dir=tmp_path,
         provider_manager=MagicMock(),
         base_tool_registry=MagicMock(),
-        session_storage=FakeSessionStorage(),
+        session_storage=storage or FakeSessionStorage(),
         session_id="test",
         cwd=str(tmp_path),
     )
@@ -208,9 +258,6 @@ def _build_parallel_runner(tmp_path, *, storage=None):
                 forward: null
                 prompt: prompts/cost.md
                 context_fields: [template]
-                rollback:
-                  - target: template_gen
-                    condition: needs_template_rework
         steps:
           - id: arch
             conclusion_field: architecture
@@ -353,14 +400,14 @@ async def fake_execute(step, context, session_id, user_message=None, **kwargs):
 
 
 @pytest.mark.asyncio
-async def test_sidecar_save_failure_does_not_abort_pipeline(tmp_path):
-    runner = _build_two_step_runner(tmp_path, auto_advance_first=False)
-    runner.session = FailingSavePipelineSession()
+async def test_sidecar_save_failure_stops_before_next_step(tmp_path):
+    runner = _build_two_step_runner(tmp_path)
+    runner.session = FailingAfterAdvancePipelineSession()
     executed_steps = []
 
     async def fake_execute(step, context, session_id, user_message=None, **kwargs):
         executed_steps.append(step.step_id)
-        conclusion = {"user_prompt": "choose", "options": ["one"]}
+        conclusion = {"value": step.step_id}
         context.set_conclusion(step.conclusion_field, conclusion)
         yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion=conclusion)
 
@@ -372,18 +419,114 @@ async def fake_execute(step, context, session_id, user_message=None, **kwargs):
 
     assert executed_steps == ["a"]
     assert any(
-        isinstance(event, PipelineEvent) and event.type == PipelineEventType.USER_INPUT_REQUIRED for event in events
+        isinstance(event, PipelineEvent)
+        and event.type == PipelineEventType.STEP_FAILED
+        and event.step_id == "a"
+        and "pipeline state persistence failed" in str(event.data).lower()
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.STEP_COMPLETED and event.step_id == "a"
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.STEP_STARTED and event.step_id == "b"
+        for event in events
+    )
+    assert runner.state_machine.current_step.step_id == "b"
+    assert ("running_attempted", "b", 1, "advanced from a") in runner.session.calls
+    assert runner.sidecar_status is None
+
+
+@pytest.mark.asyncio
+async def test_final_completed_save_failure_yields_persistence_failure_event(tmp_path):
+    runner = _build_two_step_runner(tmp_path)
+    runner.session = FailingFinalCompletedPipelineSession()
+    executed_steps = []
+    # Stub executor: records the step id and completes every step with a trivial conclusion.
+    async def fake_execute(step, context, session_id, user_message=None, **kwargs):
+        executed_steps.append(step.step_id)
+        conclusion = {"value": step.step_id}
+        context.set_conclusion(step.conclusion_field, conclusion)
+        yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion=conclusion)
+
+    runner._step_executor.execute = fake_execute
+    # Drain the runner's event stream.
+    events = []
+    async for event in runner._continue_from_current():
+        events.append(event)
+    # Both steps ran, but the failing save_completed should surface as STEP_FAILED on "b" with no PIPELINE_COMPLETED.
+    assert executed_steps == ["a", "b"]
+    assert any(
+        isinstance(event, PipelineEvent)
+        and event.type == PipelineEventType.STEP_FAILED
+        and event.step_id == "b"
+        and event.data["error_details"]["type"] == "PipelineStatePersistenceError"
+        for event in events
     )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.PIPELINE_COMPLETED for event in events
+    )
+    assert ("completed_attempted", "b", 2, "pipeline completed") in runner.session.calls
     assert runner.sidecar_status is None
 
 
+@pytest.mark.asyncio
+async def test_resume_input_save_failure_stops_before_input_received_event(tmp_path):
+    runner = _build_two_step_runner(tmp_path, auto_advance_first=False)
+    runner.session = FailingUserInputCheckpointPipelineSession()
+    # Stub executor that completes any step with an empty conclusion.
+    async def fake_execute(step, context, session_id, user_message=None, **kwargs):
+        yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion={})
+
+    runner._step_executor.execute = fake_execute
+    # Resume with user input; the session double raises on the "user input received" checkpoint.
+    events = []
+    async for event in runner.resume("continue"):
+        events.append(event)
+    # A persistence failure is reported and USER_INPUT_RECEIVED is never emitted.
+    assert any(
+        isinstance(event, PipelineEvent)
+        and event.type == PipelineEventType.STEP_FAILED
+        and event.data["error_details"]["type"] == "PipelineStatePersistenceError"
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.USER_INPUT_RECEIVED for event in events
+    )
+    assert ("running_attempted", "a", 0, "user input received") in runner.session.calls
+
+
+@pytest.mark.asyncio
+async def test_pause_confirmation_save_failure_stops_before_input_received_event(tmp_path):
+    runner = _build_two_step_runner(tmp_path)
+    runner.session = FailingUserInputCheckpointPipelineSession()
+    runner._set_pending_input_kind("pipeline_pause_confirmation")
+    # Continue from the sidecar; the session double raises on the "pipeline pause confirmation received" checkpoint.
+    events = []
+    async for event in runner.continue_from_sidecar("continue"):
+        events.append(event)
+    # A persistence failure is reported and USER_INPUT_RECEIVED is never emitted.
+    assert any(
+        isinstance(event, PipelineEvent)
+        and event.type == PipelineEventType.STEP_FAILED
+        and event.data["error_details"]["type"] == "PipelineStatePersistenceError"
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.USER_INPUT_RECEIVED for event in events
+    )
+    assert ("running_attempted", "a", 0, "pipeline pause confirmation received") in runner.session.calls
+
+
 @pytest.mark.asyncio
 async def test_sidecar_save_failure_emits_sidecar_failed_telemetry(tmp_path):
     runner = _build_two_step_runner(tmp_path)
     runner.session = FailingSavePipelineSession()
     runner._observability.sidecar_failed = MagicMock()
 
-    await runner._save_running("a", reason="step started")
+    with pytest.raises(RuntimeError, match="pipeline state persistence failed during save_running"):
+        await runner._save_running("a", reason="step started")
 
     runner._observability.sidecar_failed.assert_called_once_with(
         operation="save_running",
@@ -394,6 +537,203 @@ async def test_sidecar_save_failure_emits_sidecar_failed_telemetry(tmp_path):
     )
 
 
+@pytest.mark.asyncio
+async def test_resource_observed_save_failure_stops_before_continuing(tmp_path, monkeypatch):
+    runner = _build_two_step_runner(tmp_path)
+    runner.session = PipelineSession(tmp_path / "session" / "pipeline")
+    step = runner.state_machine.current_step
+    # Hook that maps the observed event onto an ObservedResource tagged with the step and attempt ids.
+    def on_resource_observed(ctx, event, *, ledger, step_id, attempt_id):
+        return ObservedResource(
+            provider=event.provider,
+            resource_type=event.resource_type,
+            resource_id=event.resource_id,
+            resource_name=event.resource_name,
+            region_id=event.region_id,
+            source_step_id=step_id,
+            source_attempt_id=attempt_id,
+            observed_action=event.action,
+            observed_at=1.0,
+        )
+    # Replacement for CleanupLedger.record_observed that always fails with OSError.
+    def fail_record_observed(self, observed):
+        raise OSError("cleanup disk full")
+
+    step.on_resource_observed = on_resource_observed
+    monkeypatch.setattr(CleanupLedger, "record_observed", fail_record_observed)
+    # Stub executor: emits one ResourceObservedEvent, then tries to complete the step.
+    async def fake_execute(step, context, session_id, user_message=None, **kwargs):
+        yield ResourceObservedEvent(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-123",
+            resource_name="demo",
+            region_id="cn-hangzhou",
+            action="CreateStack",
+        )
+        context.set_conclusion(step.conclusion_field, {"value": step.step_id})
+        yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion={"value": step.step_id})
+
+    runner._step_executor.execute = fake_execute
+
+    events = [event async for event in runner._continue_from_current()]
+    # Step "a" should fail with a persistence error; it must not complete and the pipeline must not complete.
+    assert any(
+        isinstance(event, PipelineEvent)
+        and event.type == PipelineEventType.STEP_FAILED
+        and event.step_id == "a"
+        and event.data["error_details"]["type"] == "PipelineStatePersistenceError"
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.STEP_COMPLETED and event.step_id == "a"
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.PIPELINE_COMPLETED for event in events
+    )
+
+
+@pytest.mark.asyncio
+async def test_rollback_cleanup_required_save_failure_stops_before_rollback_event(tmp_path, monkeypatch):
+    runner = _build_two_step_runner(tmp_path)
+    runner.session = PipelineSession(tmp_path / "session" / "pipeline")
+    # Hook that reports a single stack resource as needing cleanup for the rolled-back attempt.
+    def on_rollback_cleanup_required(ctx, *, ledger, from_step, from_attempt_id, to_step, reason):
+        return [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                source_step_id=from_step,
+                source_attempt_id=from_attempt_id,
+                cleanup_reason=reason,
+            )
+        ]
+    # Replacement for CleanupLedger.mark_cleanup_required that always fails with OSError.
+    def fail_mark_cleanup_required(self, resources, *, source_step_id, reason):
+        raise OSError("cleanup disk full")
+
+    runner._loaded.steps[1].on_rollback_cleanup_required = on_rollback_cleanup_required
+    monkeypatch.setattr(CleanupLedger, "mark_cleanup_required", fail_mark_cleanup_required)
+    # Stub executor: step "a" completes normally; any other step completes with a rollback request targeting "a".
+    async def fake_execute(step, context, session_id, user_message=None, **kwargs):
+        if step.step_id == "a":
+            conclusion = {"value": "a"}
+            context.set_conclusion(step.conclusion_field, conclusion)
+            yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion=conclusion)
+            return
+        conclusion = {"value": "b"}
+        context.set_conclusion(step.conclusion_field, conclusion)
+        yield StepResult(
+            step_id=step.step_id,
+            status=StepStatus.COMPLETED,
+            conclusion=conclusion,
+            rollback_request=("a", "retry"),
+        )
+
+    runner._step_executor.execute = fake_execute
+
+    events = [event async for event in runner._continue_from_current()]
+    # Step "b" should fail with a persistence error; it must not complete and no rollback event may be emitted.
+    assert any(
+        isinstance(event, PipelineEvent)
+        and event.type == PipelineEventType.STEP_FAILED
+        and event.step_id == "b"
+        and event.data["error_details"]["type"] == "PipelineStatePersistenceError"
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.STEP_COMPLETED and event.step_id == "b"
+        for event in events
+    )
+    assert not any(
+        isinstance(event, PipelineEvent) and event.type == PipelineEventType.ROLLBACK_TRIGGERED for event in events
+    )
+
+
+@pytest.mark.asyncio
+async def test_initial_sidecar_save_failure_stops_before_pipeline_init_meta(tmp_path):
+    """A failing initial save reports a persistence failure and leaves no init meta or start event."""
+    runner = _build_two_step_runner(tmp_path)
+    runner.session = FailingSavePipelineSession()
+
+    emitted = [item async for item in runner.run("start")]
+    pipeline_events = [item for item in emitted if isinstance(item, PipelineEvent)]
+
+    assert any(
+        item.type == PipelineEventType.STEP_FAILED
+        and item.data["error_details"]["type"] == "PipelineStatePersistenceError"
+        for item in pipeline_events
+    )
+    # The run must stop before recording any session meta entry or announcing the pipeline start.
+    assert runner._session_storage.meta_entries == []
+    assert not any(item.type == PipelineEventType.PIPELINE_STARTED for item in pipeline_events)
+
+
+@pytest.mark.asyncio
+async def test_session_meta_append_failure_is_best_effort_for_completed_pipeline(tmp_path, caplog):
+    """Session-meta append failures are logged and do not stop the pipeline from completing."""
+    storage = FailingAppendMetaSessionStorage()
+    runner = _build_two_step_runner(tmp_path, storage=storage)
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.pipeline_runner")
+
+    async def fake_execute(step, context, session_id, user_message=None, **kwargs):
+        # Every step completes immediately with a conclusion naming itself.
+        outcome = {"value": step.step_id}
+        context.set_conclusion(step.conclusion_field, outcome)
+        yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion=outcome)
+
+    runner._step_executor.execute = fake_execute
+
+    emitted = [item async for item in runner.run("start")]
+    pipeline_events = [item for item in emitted if isinstance(item, PipelineEvent)]
+
+    assert any(item.type == PipelineEventType.PIPELINE_STARTED for item in pipeline_events)
+    assert any(item.type == PipelineEventType.PIPELINE_COMPLETED for item in pipeline_events)
+    assert not any(item.type == PipelineEventType.STEP_FAILED for item in pipeline_events)
+    attempted_meta_types = {meta["type"] for meta in storage.append_attempts}
+    assert attempted_meta_types >= {"pipeline_init", "pipeline_step_complete"}
+    assert "Failed to append pipeline session metadata" in caplog.text
+
+
+@pytest.mark.asyncio
+async def test_rollback_session_meta_append_failure_is_best_effort(tmp_path, caplog):
+    """A failed `pipeline_rollback` meta append is logged while the rollback and pipeline still finish."""
+    storage = FailingAppendMetaSessionStorage(fail_types={"pipeline_rollback"})
+    runner = _build_two_step_runner(tmp_path, storage=storage)
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.pipeline_runner")
+    rollback_already_requested = False
+
+    async def fake_execute(step, context, session_id, user_message=None, **kwargs):
+        nonlocal rollback_already_requested
+        outcome = {"value": step.step_id}
+        context.set_conclusion(step.conclusion_field, outcome)
+        # Step "b" asks to roll back to "a" on its first run only; later runs carry no request.
+        first_b_run = step.step_id == "b" and not rollback_already_requested
+        if first_b_run:
+            rollback_already_requested = True
+        yield StepResult(
+            step_id=step.step_id,
+            status=StepStatus.COMPLETED,
+            conclusion=outcome,
+            rollback_request=("a", "retry") if first_b_run else None,
+        )
+
+    runner._step_executor.execute = fake_execute
+
+    emitted = [item async for item in runner._continue_from_current()]
+    pipeline_events = [item for item in emitted if isinstance(item, PipelineEvent)]
+
+    # The rollback happens and the run finishes without any step failure ...
+    assert any(item.type == PipelineEventType.ROLLBACK_TRIGGERED for item in pipeline_events)
+    assert any(item.type == PipelineEventType.PIPELINE_COMPLETED for item in pipeline_events)
+    assert not any(item.type == PipelineEventType.STEP_FAILED for item in pipeline_events)
+    # ... while the rollback meta append was still attempted and its failure logged.
+    assert any(meta["type"] == "pipeline_rollback" for meta in storage.append_attempts)
+    assert "Failed to append pipeline session metadata during pipeline_rollback" in caplog.text
+
+
 @pytest.mark.asyncio
 async def test_real_sidecar_save_failure_logs_once_at_runner_boundary(tmp_path, caplog, monkeypatch):
     from iac_code.pipeline.engine.session import PipelineSession
@@ -407,7 +747,8 @@ def fail_write(path, data):
     monkeypatch.setattr(runner.session, "_atomic_write_yaml", fail_write)
     caplog.set_level(logging.WARNING)
 
-    await runner._save_running("a", reason="step started")
+    with pytest.raises(RuntimeError, match="pipeline state persistence failed during save_running"):
+        await runner._save_running("a", reason="step started")
 
     sidecar_records = [record for record in caplog.records if "pipeline sidecar" in record.getMessage()]
     assert len(sidecar_records) == 1
@@ -468,7 +809,7 @@ async def fake_execute(step, context, session_id, user_message=None, **kwargs):
     assert seen_user_messages == [None]
 
 
-def test_sync_sidecar_save_failure_does_not_abort_hard_interrupt(tmp_path):
+def test_sync_sidecar_save_failure_raises_after_hard_interrupt_boundary(tmp_path):
     from iac_code.pipeline.engine.interrupt import InterruptVerdict
 
     runner = _build_two_step_runner(tmp_path)
@@ -476,11 +817,11 @@ def test_sync_sidecar_save_failure_does_not_abort_hard_interrupt(tmp_path):
     runner._observability.sidecar_failed = MagicMock()
     runner.state_machine.advance()
 
-    result = runner.apply_hard_interrupt(
-        InterruptVerdict(action="hard_interrupt", reason="changed mind", rollback_target="a")
-    )
+    with pytest.raises(RuntimeError, match="pipeline state persistence failed during save_rollback_sync"):
+        runner.apply_hard_interrupt(
+            InterruptVerdict(action="hard_interrupt", reason="changed mind", rollback_target="a")
+        )
 
-    assert result is True
     assert runner.state_machine.current_step.step_id == "a"
     assert any(call[0] == "rollback_sync_attempted" for call in runner.session.calls)
     assert runner.sidecar_status is None
@@ -1245,6 +1586,78 @@ async def failing_execute_streaming(*args, **kwargs):
         assert record.error_summary == "lost worker token=[REDACTED] [PATH]"
         assert record.error_id == failed_event.data["error_details"]["error_id"]
 
+    @pytest.mark.asyncio
+    async def test_parallel_candidate_failure_save_failure_stops_before_failed_event(self, tmp_path):
+        """A failed save of a failed candidate yields a persistence STEP_FAILED and no completion events."""
+        runner = _build_parallel_runner(tmp_path)
+        runner.session = FailingCandidateFailedPipelineSession()
+        parallel_step = runner.state_machine.current_step
+
+        async def failing_execute_streaming(*args, **kwargs):
+            raise RuntimeError("candidate worker failed")
+            yield  # unreachable; its presence alone makes this an async generator function
+
+        stub_executor = MagicMock()
+        stub_executor.current_step_executor_agent_loop = None
+        stub_executor.execute_streaming = failing_execute_streaming
+
+        with patch("iac_code.pipeline.engine.pipeline_runner.SubPipelineExecutor") as mock_sub_exec:
+            # Instantiating the patched class returns the stub whose stream raises.
+            mock_sub_exec.return_value = stub_executor
+            emitted = [item async for item in runner._execute_parallel_sub_pipeline(parallel_step)]
+
+        pipeline_events = [item for item in emitted if isinstance(item, PipelineEvent)]
+
+        assert any(
+            item.type == PipelineEventType.STEP_FAILED
+            and item.data["error_details"]["type"] == "PipelineStatePersistenceError"
+            for item in pipeline_events
+        )
+        # Neither a failed-candidate completion nor a step completion may be reported.
+        assert not any(
+            item.type == PipelineEventType.SUB_PIPELINE_COMPLETED and item.data.get("failed") is True
+            for item in pipeline_events
+        )
+        assert not any(item.type == PipelineEventType.STEP_COMPLETED for item in pipeline_events)
+        # The session recorded the attempted "running" save for the failed candidate.
+        assert ("running_attempted", "eval", 1, "parallel candidate failed") in runner.session.calls
+
+    @pytest.mark.asyncio
+    async def test_parallel_candidate_failure_save_failure_stops_outer_step(self, tmp_path):
+        """A failed save of a failed candidate stops the outer run: no step or pipeline completion."""
+        runner = _build_parallel_runner(tmp_path)
+        runner.session = FailingCandidateFailedPipelineSession()
+
+        async def failing_execute_streaming(*args, **kwargs):
+            raise RuntimeError("candidate worker failed")
+            yield  # unreachable; its presence alone makes this an async generator function
+
+        stub_executor = MagicMock()
+        stub_executor.current_step_executor_agent_loop = None
+        stub_executor.execute_streaming = failing_execute_streaming
+
+        with patch("iac_code.pipeline.engine.pipeline_runner.SubPipelineExecutor") as mock_sub_exec:
+            # Instantiating the patched class returns the stub whose stream raises.
+            mock_sub_exec.return_value = stub_executor
+            emitted = [item async for item in runner._continue_from_current()]
+
+        pipeline_events = [item for item in emitted if isinstance(item, PipelineEvent)]
+
+        assert any(
+            item.type == PipelineEventType.STEP_FAILED
+            and item.data["error_details"]["type"] == "PipelineStatePersistenceError"
+            for item in pipeline_events
+        )
+        # Neither the "eval" step nor the pipeline may be reported as completed.
+        assert not any(
+            item.type == PipelineEventType.STEP_COMPLETED and item.step_id == "eval"
+            for item in pipeline_events
+        )
+        assert not any(item.type == PipelineEventType.PIPELINE_COMPLETED for item in pipeline_events)
+        # The session saw the attempted "running" save but never a "completed" call.
+        assert not any(call[0] == "completed" for call in runner.session.calls)
+        assert ("running_attempted", "eval", 1, "parallel candidate failed") in runner.session.calls
+
     @pytest.mark.asyncio
     async def test_resolve_iterate_field_raises_for_missing_and_returns_for_present(self, tmp_path):
         """P-I16: _resolve_iterate_field raises ValueError when context field is missing,
diff --git a/tests/pipeline/engine/test_pipeline_runner_cleanup.py b/tests/pipeline/engine/test_pipeline_runner_cleanup.py
new file mode 100644
index 00000000..3463d891
--- /dev/null
+++ b/tests/pipeline/engine/test_pipeline_runner_cleanup.py
@@ -0,0 +1,308 @@
+from __future__ import annotations
+
+import logging
+
+import pytest
+import yaml
+
+from iac_code.pipeline.engine.cleanup import CleanupLedger, CleanupResource, ObservedResource
+from iac_code.pipeline.engine.context import PipelineContext
+from iac_code.pipeline.engine.events import PipelineEventType
+from iac_code.pipeline.engine.pipeline_runner import PipelineRunner, PipelineStatePersistenceError
+from iac_code.pipeline.engine.session import PipelineSession
+from iac_code.pipeline.engine.step_spec import LoadedPipeline, StepSpec
+from iac_code.types.stream_events import ResourceObservedEvent
+
+
+def _runner(tmp_path) -> PipelineRunner:
+    """Build a bare `PipelineRunner` for the cleanup tests.
+
+    `__new__` bypasses `__init__`, so only the session, context and an empty pipeline are assigned by hand.
+    """
+    empty_pipeline = LoadedPipeline(name="test", steps=[], context_dependencies={}, max_rollbacks=3, skills={})
+
+    bare_runner = PipelineRunner.__new__(PipelineRunner)
+    bare_runner.session = PipelineSession(tmp_path / "session" / "pipeline")
+    bare_runner.context = PipelineContext({})
+    bare_runner._loaded = empty_pipeline
+    return bare_runner
+
+
+def test_runner_persists_resource_observed_returned_by_step_hook(tmp_path) -> None:
+    """The `ObservedResource` returned by a step's `on_resource_observed` hook is stored in the ledger."""
+    runner = _runner(tmp_path)
+    stack_created = ResourceObservedEvent(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        resource_name="demo",
+        region_id="cn-hangzhou",
+        action="CreateStack",
+    )
+
+    def on_resource_observed(ctx, event, *, ledger, step_id, attempt_id):
+        # The runner is expected to pass its own context and a `CleanupLedger`.
+        assert ctx is runner.context
+        assert isinstance(ledger, CleanupLedger)
+        return ObservedResource(
+            provider=event.provider,
+            resource_type=event.resource_type,
+            resource_id=event.resource_id,
+            resource_name=event.resource_name,
+            region_id=event.region_id,
+            source_step_id=step_id,
+            source_attempt_id=attempt_id,
+            observed_action=event.action,
+            observed_at=1.0,
+        )
+
+    deploying = StepSpec(
+        step_id="deploying",
+        conclusion_field="deployment",
+        forward=None,
+        prompt_file="deploying.md",
+    )
+    deploying.on_resource_observed = on_resource_observed
+
+    runner._handle_resource_observed(deploying, stack_created, attempt_id="att_0001")
+
+    # Exactly one resource is recorded, tagged with the step and attempt handed to the runner.
+    (recorded,) = runner.cleanup_ledger().observed_resources()
+    assert recorded.resource_id == "stack-123"
+    assert recorded.source_step_id == "deploying"
+    assert recorded.source_attempt_id == "att_0001"
+
+
+def test_runner_raises_cleanup_observed_write_failure(tmp_path, monkeypatch, caplog) -> None:
+    """A ledger write error while recording an observed resource is logged and raised as a persistence error."""
+    runner = _runner(tmp_path)
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.pipeline_runner")
+
+    stack_created = ResourceObservedEvent(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        resource_name="demo",
+        region_id="cn-hangzhou",
+        action="CreateStack",
+    )
+
+    def on_resource_observed(ctx, event, *, ledger, step_id, attempt_id):
+        # Mirror the event's identifying fields onto the observed resource.
+        mirrored = ("provider", "resource_type", "resource_id", "resource_name", "region_id")
+        return ObservedResource(
+            **{attr: getattr(event, attr) for attr in mirrored},
+            source_step_id=step_id,
+            source_attempt_id=attempt_id,
+            observed_action=event.action,
+            observed_at=1.0,
+        )
+
+    def fail_record_observed(self, observed):
+        raise OSError("cleanup disk full")
+
+    # Every `record_observed` call now fails with the simulated OS error.
+    monkeypatch.setattr(CleanupLedger, "record_observed", fail_record_observed)
+
+    deploying = StepSpec(
+        step_id="deploying",
+        conclusion_field="deployment",
+        forward=None,
+        prompt_file="deploying.md",
+    )
+    deploying.on_resource_observed = on_resource_observed
+
+    with pytest.raises(PipelineStatePersistenceError) as exc_info:
+        runner._handle_resource_observed(deploying, stack_created, attempt_id="att_0001")
+
+    assert exc_info.value.step_id == "deploying"
+    # The log names the failed operation, the step and the underlying OS error.
+    expected_fragments = ("Failed to persist observed cleanup resource", "step_id=deploying", "cleanup disk full")
+    for fragment in expected_fragments:
+        assert fragment in caplog.text
+
+
+def test_runner_marks_cleanup_required_from_rollback_hook(tmp_path) -> None:
+    """Resources returned by the rollback hook become pending cleanup entries persisted to `cleanup.yaml`."""
+    runner = _runner(tmp_path)
+    runner.cleanup_ledger().record_observed(
+        ObservedResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-123",
+            resource_name="demo",
+            region_id="cn-hangzhou",
+            source_step_id="deploying",
+            source_attempt_id="att_0001",
+            observed_action="CreateStack",
+        )
+    )
+
+    def on_rollback_cleanup_required(ctx, *, ledger, from_step, from_attempt_id, to_step, reason):
+        # The hook must receive the runner's context plus the exact rollback coordinates.
+        assert ctx is runner.context
+        assert (from_step, from_attempt_id) == ("deploying", "att_0001")
+        assert (to_step, reason) == ("confirm_and_select", "invalid selection")
+        first_observed = ledger.observed_resources()[0]
+        return [CleanupResource.from_observed(first_observed, reason=reason)]
+
+    deploying = StepSpec(
+        step_id="deploying",
+        conclusion_field="deployment",
+        forward=None,
+        prompt_file="deploying.md",
+    )
+    deploying.on_rollback_cleanup_required = on_rollback_cleanup_required
+
+    runner._mark_rollback_cleanup_required(
+        deploying, "confirm_and_select", "invalid selection", from_attempt_id="att_0001"
+    )
+
+    (pending,) = runner.cleanup_ledger().pending_resources()
+    assert pending.resource_id == "stack-123"
+    assert pending.cleanup_reason == "invalid selection"
+    ledger_file = runner.session.session_dir / "cleanup.yaml"
+    history = yaml.safe_load(ledger_file.read_text(encoding="utf-8"))["history"]
+    assert [entry["type"] for entry in history] == ["cleanup_required"]
+
+
+def test_runner_raises_cleanup_required_write_failure(tmp_path, monkeypatch, caplog) -> None:
+    """A ledger write error while marking rollback cleanup is logged and raised as a persistence error."""
+    runner = _runner(tmp_path)
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.pipeline_runner")
+
+    def on_rollback_cleanup_required(ctx, *, ledger, from_step, from_attempt_id, to_step, reason):
+        stack = CleanupResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-123",
+            source_step_id=from_step,
+            source_attempt_id=from_attempt_id,
+            cleanup_reason=reason,
+        )
+        return [stack]
+
+    def fail_mark_cleanup_required(self, resources, *, source_step_id, reason):
+        raise OSError("cleanup disk full")
+
+    # Every `mark_cleanup_required` call now fails with the simulated OS error.
+    monkeypatch.setattr(CleanupLedger, "mark_cleanup_required", fail_mark_cleanup_required)
+
+    deploying = StepSpec(
+        step_id="deploying",
+        conclusion_field="deployment",
+        forward=None,
+        prompt_file="deploying.md",
+    )
+    deploying.on_rollback_cleanup_required = on_rollback_cleanup_required
+
+    with pytest.raises(PipelineStatePersistenceError) as exc_info:
+        runner._mark_rollback_cleanup_required(
+            deploying, "confirm_and_select", "invalid selection", from_attempt_id="att_0001"
+        )
+
+    assert exc_info.value.step_id == "deploying"
+    # The log names the failed operation, the step and the underlying OS error.
+    expected_fragments = ("Failed to persist rollback cleanup resources", "step_id=deploying", "cleanup disk full")
+    for fragment in expected_fragments:
+        assert fragment in caplog.text
+
+
+def test_runner_emits_warning_event_when_observed_cleanup_ledger_unavailable(tmp_path, caplog) -> None:
+    """With an unparseable `cleanup.yaml`, observing a resource yields one sanitized warning event."""
+    runner = _runner(tmp_path)
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.pipeline_runner")
+
+    # Pre-seed the ledger file with text that is not valid YAML.
+    ledger_path = runner.session.session_dir / "cleanup.yaml"
+    ledger_path.parent.mkdir(parents=True, exist_ok=True)
+    ledger_path.write_text("[broken", encoding="utf-8")
+
+    def on_resource_observed(ctx, event, *, ledger, step_id, attempt_id):
+        mirrored = ("provider", "resource_type", "resource_id", "resource_name", "region_id")
+        return ObservedResource(
+            **{attr: getattr(event, attr) for attr in mirrored},
+            source_step_id=step_id,
+            source_attempt_id=attempt_id,
+            observed_action=event.action,
+        )
+
+    deploying = StepSpec(
+        step_id="deploying",
+        conclusion_field="deployment",
+        forward=None,
+        prompt_file="deploying.md",
+    )
+    deploying.on_resource_observed = on_resource_observed
+
+    stack_created = ResourceObservedEvent(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        resource_name="demo",
+        region_id="cn-hangzhou",
+        action="CreateStack",
+    )
+
+    events = runner._handle_resource_observed(deploying, stack_created, attempt_id="att_0001")
+
+    # The broken file is left untouched and exactly one warning is returned.
+    assert ledger_path.read_text(encoding="utf-8") == "[broken"
+    assert len(events) == 1
+    warning = events[0]
+    assert warning.type == PipelineEventType.PIPELINE_WARNING
+    assert warning.step_id == "deploying"
+    assert warning.data["reason"] == "cleanup_tracking_unavailable"
+    assert warning.data["operation"] == "record_observed"
+    assert warning.data["resource_id"] == "stack-123"
+    # The payload must carry neither the ledger path nor the load error.
+    for hidden_key in ("ledger_path", "load_error"):
+        assert hidden_key not in warning.data
+    assert "cleanup tracking unavailable" in caplog.text.lower()
+
+
+def test_runner_emits_warning_event_when_required_cleanup_ledger_unavailable(tmp_path, caplog) -> None:
+    """With an unparseable `cleanup.yaml`, marking rollback cleanup yields one sanitized warning event."""
+    runner = _runner(tmp_path)
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.pipeline_runner")
+
+    ledger_path = runner.session.session_dir / "cleanup.yaml"
+    ledger_path.parent.mkdir(parents=True, exist_ok=True)
+    ledger_path.write_text("[broken", encoding="utf-8")
+
+    def on_rollback_cleanup_required(ctx, *, ledger, from_step, from_attempt_id, to_step, reason):
+        stack = CleanupResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-123",
+            source_step_id=from_step,
+            source_attempt_id=from_attempt_id,
+            cleanup_reason=reason,
+        )
+        return [stack]
+
+    deploying = StepSpec(
+        step_id="deploying",
+        conclusion_field="deployment",
+        forward=None,
+        prompt_file="deploying.md",
+    )
+    deploying.on_rollback_cleanup_required = on_rollback_cleanup_required
+
+    events = runner._mark_rollback_cleanup_required(
+        deploying, "confirm_and_select", "invalid selection", from_attempt_id="att_0001"
+    )
+
+    # The broken file is left untouched and exactly one warning is returned.
+    assert ledger_path.read_text(encoding="utf-8") == "[broken"
+    assert len(events) == 1
+    warning = events[0]
+    assert warning.type == PipelineEventType.PIPELINE_WARNING
+    assert warning.step_id == "deploying"
+    assert warning.data["reason"] == "cleanup_tracking_unavailable"
+    assert warning.data["operation"] == "mark_cleanup_required"
+    assert warning.data["resource_count"] == 1
+    # The payload must carry neither the ledger path nor the load error.
+    for hidden_key in ("ledger_path", "load_error"):
+        assert hidden_key not in warning.data
+    assert "cleanup tracking unavailable" in caplog.text.lower()
diff --git a/tests/pipeline/engine/test_pipeline_runner_interrupt.py b/tests/pipeline/engine/test_pipeline_runner_interrupt.py
index e70a9aae..4af79035 100644
--- a/tests/pipeline/engine/test_pipeline_runner_interrupt.py
+++ b/tests/pipeline/engine/test_pipeline_runner_interrupt.py
@@ -5,6 +5,7 @@
 
 import pytest
 
+from iac_code.agent.message import ImageBlock, Message, TextBlock, ToolResultBlock
 from iac_code.pipeline.engine.events import PipelineEventType
 from iac_code.pipeline.engine.interrupt import InterruptVerdict
 from iac_code.pipeline.engine.pipeline_runner import PipelineRunner, RestartInfo
@@ -23,10 +24,41 @@ def session_path(self, cwd, session_id):
         return self._path
 
 
+class FakeTranscriptStorage:  # in-memory stand-in: hands out copies of pre-registered messages
+    def __init__(self, messages_by_id=None):
+        self.messages_by_id = messages_by_id if messages_by_id else {}
+
+    def load(self, cwd, session_id):
+        return [*self.messages_by_id.get(session_id, ())]
+
+    @staticmethod
+    def repair_interrupted(messages):
+        return [*messages]
+
+
 class RecordingPipelineSession:
     def __init__(self):
         self.calls = []
 
+    async def save_running(
+        self,
+        current_step,
+        state_machine_snapshot,
+        context_snapshot,
+        pipeline_identity,
+        reason=None,
+        **kwargs,
+    ):
+        """Record the save request in `self.calls` instead of persisting it.
+
+        The recorded tuple is ``("running", current_step, current_index, reason, pipeline_name)``.
+        """
+        # `context_snapshot` and any extra keyword arguments are accepted but not recorded.
+        position = state_machine_snapshot["current_index"]
+        pipeline_name = pipeline_identity.pipeline_name
+        self.calls.append(("running", current_step, position, reason, pipeline_name))
+        )
+
     def save_rollback_sync(
         self,
         from_step,
@@ -432,6 +464,32 @@ async def test_supplement_verdict_passes_input_to_current_step(self, pipeline_ru
         judge.assert_awaited_once_with("use a smaller instance")
         cont.assert_called_once_with(user_input="use a smaller instance", resume_running_step=True)
 
+    @pytest.mark.asyncio
+    async def test_supplement_verdict_preserves_image_blocks_for_current_step(self, pipeline_runner):
+        """A supplement verdict forwards text+image input unchanged to the judge and to the current step."""
+        caption = "参考这张图"
+        image_input = [TextBlock(text=caption), ImageBlock(media_type="image/png", data="aW1hZ2U=")]
+        judge = AsyncMock(return_value=InterruptVerdict(action="supplement", reason="extra context"))
+        cont = MagicMock(return_value=_empty_stream())
+
+        with (
+            patch.object(pipeline_runner._interrupt_controller, "judge", judge),
+            patch.object(pipeline_runner, "_continue_from_current", cont),
+        ):
+            async for _ in pipeline_runner.continue_from_sidecar(user_input=image_input):
+                pass
+
+        judge.assert_awaited_once()
+        judged_input = judge.await_args.args[0]
+        assert judged_input.content == image_input
+        assert judged_input.display_text == caption
+        assert judged_input.has_images is True
+        cont.assert_called_once_with(
+            user_input=image_input,
+            user_input_display_text=caption,
+            resume_running_step=True,
+        )
+
     @pytest.mark.asyncio
     async def test_restored_parallel_continuation_judges_with_persisted_candidate_state(self, pipeline_runner):
         _seed_restored_parallel_judge_state(pipeline_runner)
@@ -1403,6 +1461,29 @@ async def test_continue_after_interrupt_passes_context(self, pipeline_runner):
         assert pipeline_runner._rollback_context is None
         await gen.aclose()
 
+    @pytest.mark.asyncio
+    async def test_continue_after_interrupt_preserves_image_source_input(self, pipeline_runner):
+        """After a hard interrupt, the rollback context is prepended to the image input for the resumed step."""
+        rollback_note = "用户要求改为WordPress网站"
+        caption = "参考这张图"
+        image_input = [TextBlock(text=caption), ImageBlock(media_type="image/png", data="aW1hZ2U=")]
+        verdict = InterruptVerdict(
+            action="hard_interrupt",
+            reason="changed mind",
+            rollback_target="a",
+            rollback_context=rollback_note,
+        )
+        pipeline_runner.apply_hard_interrupt(verdict, source_input=image_input)
+
+        expected_content = [TextBlock(text=rollback_note), *image_input]
+        expected_display = f"{rollback_note}\n\n{caption}"
+        cont = MagicMock(return_value=_empty_stream())
+        with patch.object(pipeline_runner, "_continue_from_current", cont):
+            await pipeline_runner.continue_after_interrupt().aclose()
+
+        assert pipeline_runner._rollback_context is None
+        cont.assert_called_once_with(user_input=expected_content, user_input_display_text=expected_display)
+
     def test_schedule_candidate_restart_stores_rollback_context(self, pipeline_runner):
         mock_task = MagicMock()
         mock_task.done.return_value = False
@@ -1426,6 +1507,643 @@ def test_schedule_candidate_restart_stores_rollback_context(self, pipeline_runne
 
         assert pipeline_runner._pending_candidate_restarts[0].rollback_context == "用户要求模板使用WordPress"
 
+    def test_schedule_candidate_restart_preserves_image_source_input(self, pipeline_runner):
+        mock_task = MagicMock()
+        mock_task.done.return_value = False
+        mock_task.cancel = MagicMock()
+        pipeline_runner._active_candidates[0] = {
+            "task": mock_task,
+            "current_sub_step": "template_generating",
+            "conclusions": {},
+            "name": "基础方案",
+            "agent_loop": None,
+        }
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+
+        verdict = InterruptVerdict(
+            action="hard_interrupt",
+            reason="fix template",
+            rollback_target="template_generating",
+            candidate_scope="candidate:0",
+            rollback_context="用户要求模板使用WordPress",
+        )
+        pipeline_runner._schedule_candidate_restart(verdict, source_input=image_input)
+
+        info = pipeline_runner._pending_candidate_restarts[0]
+        assert info.rollback_context == "用户要求模板使用WordPress\n\n参考这张图"
+        assert info.rollback_input == [TextBlock(text="用户要求模板使用WordPress"), *image_input]
+
+    def test_candidate_ask_user_question_keeps_tool_result_before_image_message(self, pipeline_runner):
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        tool_result_message = Message(role="user", content=[tool_result])
+        pipeline_runner._restored_ask_user_question = {
+            "candidate_index": 0,
+            "resume_messages": [tool_result_message],
+            "user_message": image_input,
+            "precompleted_tools": {"ask_user_question": {"free_text": "see image"}},
+        }
+
+        assert pipeline_runner._candidate_resume_messages_for_restored_ask_user_question(0) == [tool_result_message]
+        assert pipeline_runner._candidate_user_message_for_restored_ask_user_question(0) == image_input
+
+    def test_candidate_ask_user_question_resume_state_survives_execution_snapshot(self, pipeline_runner):
+        _seed_restored_parallel_judge_state(pipeline_runner)
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        tool_result_message = Message(role="user", content=[tool_result])
+        precompleted_tools = {"ask_user_question": {"free_text": "see image"}}
+
+        pipeline_runner._set_candidate_ask_user_question_resume_state(
+            0,
+            user_message=image_input,
+            resume_messages=[tool_result_message],
+            precompleted_tools=precompleted_tools,
+        )
+
+        restored = PipelineRunner(
+            pipeline_dir=pipeline_runner._pipeline_dir,
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            session_storage=FakeSessionStorage(),
+            session_id="restored",
+            cwd=pipeline_runner._cwd,
+        )
+        restored._execution = dict(pipeline_runner._execution)
+
+        assert restored._candidate_user_message_for_restored_ask_user_question(0) == image_input
+        assert restored._candidate_resume_messages_for_restored_ask_user_question(0) == [tool_result_message]
+        assert restored._candidate_precompleted_tools_for_restored_ask_user_question(0) == precompleted_tools
+
+    @pytest.mark.asyncio
+    async def test_restored_candidate_ask_user_question_image_resume_reaches_sub_pipeline(self, tmp_path):
+        from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+        # Write a minimal pipeline to tmp_path: one parallel step running the "per_candidate" sub-pipeline.
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "sub_a.md").write_text("sub A", encoding="utf-8")
+        (tmp_path / "pipeline.yaml").write_text(
+            dedent("""\
+            name: test
+            context_dependencies:
+              architecture: []
+              candidates_done: [architecture]
+            max_rollbacks: 3
+            sub_pipelines:
+              per_candidate:
+                iterate_over: architecture.candidates
+                context_fields_from_parent: []
+                max_rollbacks: 3
+                steps:
+                  - id: sub_a
+                    conclusion_field: sub_a_out
+                    forward: null
+                    prompt: prompts/sub_a.md
+                    description: Sub A
+            steps:
+              - id: parallel
+                conclusion_field: candidates_done
+                type: parallel_sub_pipeline
+                sub_pipeline: per_candidate
+                forward: null
+                description: Parallel
+        """),
+            encoding="utf-8",
+        )
+        runner = PipelineRunner(
+            pipeline_dir=tmp_path,
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            session_storage=FakeSessionStorage(),
+            session_id="test",
+            cwd=str(tmp_path),
+        )
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]  # expected input: one text block and one PNG image block
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        tool_result_message = Message(role="user", content=[tool_result])
+        precompleted_tools = {"ask_user_question": {"free_text": "see image"}}
+        candidates = [{"name": "方案1"}]
+        runner.context.set_conclusion("architecture", {"candidates": candidates})
+        runner._execution = {
+            "kind": "parallel_sub_pipeline",
+            "step_id": "parallel",
+            "sub_pipeline_name": "per_candidate",
+            "active_attempt_id": "attempt_parent",
+            "transcript_id": "transcript_parent",
+            "candidates": {
+                "0": {
+                    "status": "running",
+                    "candidate": candidates[0],
+                    "current_sub_step": "sub_a",
+                    "state_machine": {"current_index": 0, "completed": [], "rollback_count": 0},
+                    "context": {"fields": {}},
+                    "pending_ask_user_question_resume": {  # stored in plain-dict (serialized) form
+                        "user_message": [
+                            {"type": "text", "text": "参考这张图"},
+                            {"type": "image", "media_type": "image/png", "data": "aW1hZ2U="},
+                        ],
+                        "resume_messages": [tool_result_message.to_dict()],
+                        "precompleted_tools": precompleted_tools,
+                    },
+                },
+            },
+        }
+        runner._attempts["items"]["attempt_parent"] = {
+            "attempt_id": "attempt_parent",
+            "scope": "parent",
+            "step_id": "parallel",
+            "status": "running",
+            "transcript_id": "transcript_parent",
+        }
+        captured: dict[str, object] = {}
+
+        from iac_code.pipeline.engine import sub_pipeline_executor as spe_module
+
+        original_execute_streaming = spe_module.SubPipelineExecutor.execute_streaming
+
+        async def spy_execute_streaming(self, *args, **kwargs):
+            captured.update(kwargs)  # record the keyword arguments the runner passes in
+            yield PipelineEvent(
+                type=PipelineEventType.SUB_PIPELINE_STARTED,
+                step_id=None,
+                timestamp=0.0,
+                data={
+                    "sub_pipeline_id": "x",
+                    "candidate_index": kwargs.get("candidate_index", 0),
+                    "candidate_name": "方案",
+                    "total_steps": 1,
+                    "sub_pipeline_name": "per_candidate",
+                },
+            )
+            yield PipelineEvent(
+                type=PipelineEventType.SUB_PIPELINE_COMPLETED,
+                step_id=None,
+                timestamp=0.0,
+                data={
+                    "sub_pipeline_id": "x",
+                    "candidate_index": kwargs.get("candidate_index", 0),
+                    "failed": False,
+                    "conclusions": {},
+                },
+            )
+
+        spe_module.SubPipelineExecutor.execute_streaming = spy_execute_streaming  # undone in finally
+        try:
+            async for _event in runner._continue_from_current(user_input=None):
+                pass
+        finally:
+            spe_module.SubPipelineExecutor.execute_streaming = original_execute_streaming
+        # The spy's kwargs are compared with the block/message objects built above, not the stored dicts.
+        assert captured["user_message"] == image_input
+        assert captured["resume_messages"] == [tool_result_message]
+        assert captured["precompleted_tools"] == precompleted_tools
+
+    @pytest.mark.asyncio  # scenario: parent-step image answer round-trips through a sidecar snapshot
+    async def test_parent_ask_user_question_image_resume_state_survives_sidecar_restore(self, pipeline_runner):
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        tool_result_message = Message(role="user", content=[tool_result])
+        precompleted_tools = {"ask_user_question": {"free_text": "see image"}}
+        # Record the image input and resume state on the original runner, then snapshot it.
+        pipeline_runner._set_current_step_user_input(image_input, display_text="参考这张图")
+        pipeline_runner._set_current_step_resume_state(
+            resume_messages=[tool_result_message],
+            precompleted_tools=precompleted_tools,
+        )
+        snapshot = pipeline_runner._state_machine_snapshot_for_sidecar()
+
+        restored = PipelineRunner(
+            pipeline_dir=pipeline_runner._pipeline_dir,
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            session_storage=FakeSessionStorage(),
+            session_id="restored",
+            cwd=pipeline_runner._cwd,
+        )
+        restored.state_machine = type(pipeline_runner.state_machine).from_snapshot(
+            snapshot,
+            restored._loaded.steps,
+            max_rollbacks=restored._loaded.max_rollbacks,
+        )  # rebuild the state machine on the second runner from the snapshot
+        restored._restore_current_step_user_input_from_snapshot(snapshot)
+
+        captured: dict[str, object] = {}
+
+        async def capture_execute(*args, **kwargs):
+            captured.update(kwargs)
+            if False:  # unreachable; the yield only makes this an async generator function
+                yield None
+
+        restored._step_executor.execute = capture_execute  # capture kwargs instead of running a step
+
+        async for _event in restored._continue_from_current(user_input=None):
+            pass
+        # With user_input=None, the executor kwargs are expected to carry the snapshotted input and state.
+        assert captured["user_message"] == image_input
+        assert captured["resume_messages"] == [tool_result_message]
+        assert captured["precompleted_tools"] == precompleted_tools
+
+    @pytest.mark.asyncio  # scenario: snapshot holds one resume message, transcript holds two
+    async def test_parent_ask_user_question_restore_prefers_transcript_with_answer(self, pipeline_runner):
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        tool_result_message = Message(role="user", content=[tool_result])
+        post_answer_message = Message(role="assistant", content=[TextBlock(text="我已经读取图片")])
+        precompleted_tools = {"ask_user_question": {"free_text": "see image"}}
+        # Record the image input and a one-message resume state, then snapshot the original runner.
+        pipeline_runner._set_current_step_user_input(image_input, display_text="参考这张图")
+        pipeline_runner._set_current_step_resume_state(
+            resume_messages=[tool_result_message],
+            precompleted_tools=precompleted_tools,
+        )
+        snapshot = pipeline_runner._state_machine_snapshot_for_sidecar()
+
+        restored = PipelineRunner(
+            pipeline_dir=pipeline_runner._pipeline_dir,
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            session_storage=FakeSessionStorage(),
+            session_id="restored",
+            cwd=pipeline_runner._cwd,
+        )
+        restored.state_machine = type(pipeline_runner.state_machine).from_snapshot(
+            snapshot,
+            restored._loaded.steps,
+            max_rollbacks=restored._loaded.max_rollbacks,
+        )
+        restored._restore_current_step_user_input_from_snapshot(snapshot)
+        restored._attempts["items"]["attempt_parent"] = {
+            "attempt_id": "attempt_parent",
+            "scope": "parent",
+            "step_id": "a",
+            "status": "running",
+            "transcript_id": "transcript_parent",
+        }
+        restored._execution = {
+            "kind": "step",
+            "step_id": "a",
+            "active_attempt_id": "attempt_parent",
+            "transcript_id": "transcript_parent",
+        }
+        restored._transcript_storage = FakeTranscriptStorage(
+            {"transcript_parent": [tool_result_message, post_answer_message]}
+        )  # transcript holds the tool result plus a later assistant message
+        captured: dict[str, object] = {}
+
+        async def capture_execute(*args, **kwargs):
+            captured.update(kwargs)
+            if False:  # unreachable; the yield only makes this an async generator function
+                yield None
+
+        restored._step_executor.execute = capture_execute
+
+        async for _event in restored._continue_from_current(user_input=None):
+            pass
+        # resume_messages is expected to match the two-message transcript, not the one-message snapshot.
+        assert captured["resume_messages"] == [tool_result_message, post_answer_message]
+        assert captured["precompleted_tools"] == precompleted_tools
+
+    @pytest.mark.asyncio  # scenario: the transcript already contains the image user message
+    async def test_parent_ask_user_question_restore_does_not_replay_transcript_image_user_message(
+        self,
+        pipeline_runner,
+    ):
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        tool_result_message = Message(role="user", content=[tool_result])
+        image_message = Message(role="user", content=image_input)
+        precompleted_tools = {"ask_user_question": {"free_text": "see image"}}
+        # Record the image input and a one-message resume state, then snapshot the original runner.
+        pipeline_runner._set_current_step_user_input(image_input, display_text="参考这张图")
+        pipeline_runner._set_current_step_resume_state(
+            resume_messages=[tool_result_message],
+            precompleted_tools=precompleted_tools,
+        )
+        snapshot = pipeline_runner._state_machine_snapshot_for_sidecar()
+
+        restored = PipelineRunner(
+            pipeline_dir=pipeline_runner._pipeline_dir,
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            session_storage=FakeSessionStorage(),
+            session_id="restored",
+            cwd=pipeline_runner._cwd,
+        )
+        restored.state_machine = type(pipeline_runner.state_machine).from_snapshot(
+            snapshot,
+            restored._loaded.steps,
+            max_rollbacks=restored._loaded.max_rollbacks,
+        )
+        restored._restore_current_step_user_input_from_snapshot(snapshot)
+        restored._attempts["items"]["attempt_parent"] = {
+            "attempt_id": "attempt_parent",
+            "scope": "parent",
+            "step_id": "a",
+            "status": "running",
+            "transcript_id": "transcript_parent",
+        }
+        restored._execution = {
+            "kind": "step",
+            "step_id": "a",
+            "active_attempt_id": "attempt_parent",
+            "transcript_id": "transcript_parent",
+        }
+        restored._transcript_storage = FakeTranscriptStorage(
+            {"transcript_parent": [tool_result_message, image_message]}
+        )  # transcript holds the tool result followed by the image user message
+        captured: dict[str, object] = {}
+
+        async def capture_execute(*args, **kwargs):
+            captured.update(kwargs)
+            if False:  # unreachable; the yield only makes this an async generator function
+                yield None
+
+        restored._step_executor.execute = capture_execute
+
+        async for _event in restored._continue_from_current(user_input=None):
+            pass
+        # Expect no separate user_message; the transcript messages are passed as resume_messages.
+        assert captured["user_message"] is None
+        assert captured["resume_messages"] == [tool_result_message, image_message]
+        assert captured["precompleted_tools"] == precompleted_tools
+
+    @pytest.mark.asyncio  # scenario: allocator returns a transcript that already includes the answer
+    async def test_sub_pipeline_ask_user_question_restore_does_not_duplicate_transcript_answer(self, tmp_path):
+        from iac_code.pipeline.engine.context import PipelineContext
+        from iac_code.pipeline.engine.step_spec import LoadedPipeline, StepSpec, SubPipelineSpec
+        from iac_code.pipeline.engine.sub_pipeline_executor import SubPipelineExecutor
+        from iac_code.pipeline.engine.types import StepResult, StepStatus
+        # Build the executor directly from in-memory specs: a one-step "per_candidate" sub-pipeline.
+        step = StepSpec(
+            step_id="sub_a",
+            conclusion_field="sub_a_out",
+            forward=None,
+            prompt_file="prompts/sub_a.md",
+            description="Sub A",
+        )
+        sub_spec = SubPipelineSpec(
+            name="per_candidate",
+            steps=[step],
+            max_rollbacks=3,
+            iterate_over="architecture.candidates",
+        )
+        loaded = LoadedPipeline(
+            name="test",
+            steps=[],
+            context_dependencies={},
+            max_rollbacks=3,
+            skills={},
+            sub_pipelines={"per_candidate": sub_spec},
+        )
+        executor = SubPipelineExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            pipeline=loaded,
+            pipeline_dir=tmp_path,
+            session_storage=FakeSessionStorage(),
+            cwd=str(tmp_path),
+        )
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        tool_result_message = Message(role="user", content=[tool_result])
+        post_answer_message = Message(role="assistant", content=[TextBlock(text="我已经读取图片")])
+        captured: dict[str, object] = {}
+
+        class CapturingStepExecutor:
+            async def execute(self, step, context, session_id, **kwargs):
+                captured.update(kwargs)  # record what the sub-pipeline executor passes to the step
+                yield StepResult(
+                    step_id=step.step_id,
+                    status=StepStatus.COMPLETED,
+                    conclusion={"ok": True},
+                )
+
+        executor._make_step_executor = lambda: CapturingStepExecutor()  # inject the capturing stub
+
+        def allocate_sub_step_attempt(request):
+            return {
+                "attempt_id": "attempt_sub",
+                "transcript_id": "transcript_sub",
+                "resume_messages": [tool_result_message, post_answer_message],  # includes the caller's message
+            }
+
+        async for _event in executor.execute_streaming(
+            sub_spec=sub_spec,
+            candidate={"name": "方案1"},
+            candidate_index=0,
+            parent_context=PipelineContext({}),
+            session_id="session",
+            user_message=image_input,
+            resume_messages=[tool_result_message],
+            parent_step_id="parallel",
+            resume_state={
+                "sub_pipeline_id": "sub",
+                "state_machine": {
+                    "current_index": 0,
+                    "rollback_count": 0,
+                    "interrupt_rollback_count": 0,
+                    "step_statuses": {},
+                },
+                "context": {"fields": {}},
+                "active_attempt_id": "attempt_sub",
+                "transcript_id": "transcript_sub",
+                "current_sub_step": "sub_a",
+            },
+            sub_step_attempt_allocator=allocate_sub_step_attempt,
+            precompleted_tools={"ask_user_question": {"free_text": "see image"}},
+        ):
+            pass
+        # The allocator's list is expected as-is: tool_result_message must not appear twice.
+        assert captured["resume_messages"] == [tool_result_message, post_answer_message]
+
+    @pytest.mark.asyncio  # scenario: allocator returns a transcript that already holds the image message
+    async def test_sub_pipeline_ask_user_question_restore_does_not_replay_transcript_image_user_message(
+        self,
+        tmp_path,
+    ):
+        from iac_code.pipeline.engine.context import PipelineContext
+        from iac_code.pipeline.engine.step_spec import LoadedPipeline, StepSpec, SubPipelineSpec
+        from iac_code.pipeline.engine.sub_pipeline_executor import SubPipelineExecutor
+        from iac_code.pipeline.engine.types import StepResult, StepStatus
+        # Build the executor directly from in-memory specs: a one-step "per_candidate" sub-pipeline.
+        step = StepSpec(
+            step_id="sub_a",
+            conclusion_field="sub_a_out",
+            forward=None,
+            prompt_file="prompts/sub_a.md",
+            description="Sub A",
+        )
+        sub_spec = SubPipelineSpec(
+            name="per_candidate",
+            steps=[step],
+            max_rollbacks=3,
+            iterate_over="architecture.candidates",
+        )
+        loaded = LoadedPipeline(
+            name="test",
+            steps=[],
+            context_dependencies={},
+            max_rollbacks=3,
+            skills={},
+            sub_pipelines={"per_candidate": sub_spec},
+        )
+        executor = SubPipelineExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            pipeline=loaded,
+            pipeline_dir=tmp_path,
+            session_storage=FakeSessionStorage(),
+            cwd=str(tmp_path),
+        )
+        tool_result = ToolResultBlock(
+            tool_use_id="toolu_1",
+            content='{"selected_id":"","selected_label":"","free_text":"see image"}',
+        )
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        tool_result_message = Message(role="user", content=[tool_result])
+        image_message = Message(role="user", content=image_input)
+        captured: dict[str, object] = {}
+
+        class CapturingStepExecutor:
+            async def execute(self, step, context, session_id, **kwargs):
+                captured.update(kwargs)  # record what the sub-pipeline executor passes to the step
+                yield StepResult(
+                    step_id=step.step_id,
+                    status=StepStatus.COMPLETED,
+                    conclusion={"ok": True},
+                )
+
+        executor._make_step_executor = lambda: CapturingStepExecutor()  # inject the capturing stub
+
+        def allocate_sub_step_attempt(request):
+            return {
+                "attempt_id": "attempt_sub",
+                "transcript_id": "transcript_sub",
+                "resume_messages": [tool_result_message, image_message],  # image message already present
+            }
+
+        async for _event in executor.execute_streaming(
+            sub_spec=sub_spec,
+            candidate={"name": "方案1"},
+            candidate_index=0,
+            parent_context=PipelineContext({}),
+            session_id="session",
+            user_message=image_input,
+            resume_messages=[tool_result_message],
+            parent_step_id="parallel",
+            resume_state={
+                "sub_pipeline_id": "sub",
+                "state_machine": {
+                    "current_index": 0,
+                    "rollback_count": 0,
+                    "interrupt_rollback_count": 0,
+                    "step_statuses": {},
+                },
+                "context": {"fields": {}},
+                "active_attempt_id": "attempt_sub",
+                "transcript_id": "transcript_sub",
+                "current_sub_step": "sub_a",
+            },
+            sub_step_attempt_allocator=allocate_sub_step_attempt,
+            precompleted_tools={"ask_user_question": {"free_text": "see image"}},
+        ):
+            pass
+        # Although user_message was supplied, the step is expected to receive None plus the transcript.
+        assert captured["user_message"] is None
+        assert captured["resume_messages"] == [tool_result_message, image_message]
+
+    def test_inject_pending_question_supplement_preserves_image_blocks(self, pipeline_runner):
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        injected_messages = []
+
+        class AgentLoop:
+            def try_inject_user_message(self, message):
+                injected_messages.append(message)
+                return True
+
+        agent_loop = AgentLoop()
+        pipeline_runner._step_executor._current_agent_loop = agent_loop
+
+        injected = pipeline_runner.inject_pending_question_supplement(
+            image_input,
+            envelope={"scope": "pipeline", "inputId": "ask-toolu_1"},
+        )
+
+        assert injected is True
+        assert injected_messages == [image_input]
+
+    def test_inject_pending_question_supplement_treats_none_return_as_success(self, pipeline_runner):
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]
+        injected_messages = []
+
+        class AgentLoop:
+            def try_inject_user_message(self, message):
+                injected_messages.append(message)
+
+        agent_loop = AgentLoop()
+        pipeline_runner._step_executor._current_agent_loop = agent_loop
+
+        injected = pipeline_runner.inject_pending_question_supplement(
+            image_input,
+            envelope={"scope": "pipeline", "inputId": "ask-toolu_1"},
+        )
+
+        assert injected is True
+        assert injected_messages == [image_input]
+
 
 class TestParallelSubPipelineUserMessagePropagation:
     """Regression: `user_input` from `_continue_from_current` must reach the
@@ -1890,6 +2608,128 @@ async def spy_execute_streaming(self, *args, **kwargs):
         assert captured[1]["user_message"] == "restored restart feedback"
         assert isinstance(captured[1]["resume_state"], dict)
 
+    @pytest.mark.asyncio
+    async def test_restored_candidate_restart_preserves_image_rollback_input(self, tmp_path):
+        from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+        from iac_code.pipeline.engine.pipeline_runner import PipelineRunner
+        # Write a minimal pipeline to tmp_path: one parallel step running the "per_candidate" sub-pipeline.
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "sub_a.md").write_text("sub A", encoding="utf-8")
+        (tmp_path / "pipeline.yaml").write_text(
+            dedent("""\
+            name: test
+            context_dependencies:
+              architecture: []
+              candidates_done: [architecture]
+            max_rollbacks: 3
+            sub_pipelines:
+              per_candidate:
+                iterate_over: architecture.candidates
+                context_fields_from_parent: []
+                max_rollbacks: 3
+                steps:
+                  - id: sub_a
+                    conclusion_field: sub_a_out
+                    forward: null
+                    prompt: prompts/sub_a.md
+                    description: Sub A
+            steps:
+              - id: parallel
+                conclusion_field: candidates_done
+                type: parallel_sub_pipeline
+                sub_pipeline: per_candidate
+                forward: null
+                description: Parallel
+        """),
+            encoding="utf-8",
+        )
+        runner = PipelineRunner(
+            pipeline_dir=tmp_path,
+            provider_manager=MagicMock(),
+            base_tool_registry=MagicMock(),
+            session_storage=FakeSessionStorage(),
+            session_id="test",
+            cwd=str(tmp_path),
+        )
+        image_input = [
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ]  # expected tail of the rollback input: caption text plus PNG image
+        candidates = [{"name": "方案1"}]
+        runner.context.set_conclusion("architecture", {"candidates": candidates})
+        runner._execution = {
+            "kind": "parallel_sub_pipeline",
+            "step_id": "parallel",
+            "sub_pipeline_name": "per_candidate",
+            "active_attempt_id": "attempt_parent",
+            "transcript_id": "transcript_parent",
+            "candidates": {
+                "0": {
+                    "status": "running",
+                    "candidate": candidates[0],
+                    "current_sub_step": "sub_a",
+                    "pending_restart": {
+                        "start_from_step": "sub_a",
+                        "preserved_conclusions": {},
+                        "rollback_context": "用户要求改架构\n\n参考这张图",
+                        "rollback_input": [  # plain-dict blocks: rollback text, caption text, image
+                            {"type": "text", "text": "用户要求改架构"},
+                            {"type": "text", "text": "参考这张图"},
+                            {"type": "image", "media_type": "image/png", "data": "aW1hZ2U="},
+                        ],
+                    },
+                },
+            },
+        }
+        runner._attempts["items"]["attempt_parent"] = {
+            "attempt_id": "attempt_parent",
+            "scope": "parent",
+            "step_id": "parallel",
+            "status": "running",
+            "transcript_id": "transcript_parent",
+        }
+        captured: dict[int, dict[str, object]] = {}
+
+        from iac_code.pipeline.engine import sub_pipeline_executor as spe_module
+
+        original_execute_streaming = spe_module.SubPipelineExecutor.execute_streaming
+
+        async def spy_execute_streaming(self, *args, **kwargs):
+            captured[kwargs["candidate_index"]] = {"user_message": kwargs.get("user_message")}
+            yield PipelineEvent(
+                type=PipelineEventType.SUB_PIPELINE_STARTED,
+                step_id=None,
+                timestamp=0.0,
+                data={
+                    "sub_pipeline_id": "x",
+                    "candidate_index": kwargs.get("candidate_index", 0),
+                    "candidate_name": "方案",
+                    "total_steps": 1,
+                    "sub_pipeline_name": "per_candidate",
+                },
+            )
+            yield PipelineEvent(
+                type=PipelineEventType.SUB_PIPELINE_COMPLETED,
+                step_id=None,
+                timestamp=0.0,
+                data={
+                    "sub_pipeline_id": "x",
+                    "candidate_index": kwargs.get("candidate_index", 0),
+                    "failed": False,
+                    "conclusions": {},
+                },
+            )
+
+        spe_module.SubPipelineExecutor.execute_streaming = spy_execute_streaming  # undone in finally
+        try:
+            async for _ev in runner._continue_from_current(user_input=None):
+                if captured:  # stop as soon as the spy has been invoked once
+                    break
+        finally:
+            spe_module.SubPipelineExecutor.execute_streaming = original_execute_streaming
+        # Candidate 0 is expected to receive the stored rollback_input as block objects, image included.
+        assert captured[0]["user_message"] == [TextBlock(text="用户要求改架构"), *image_input]
+
 
 class TestSupplementTargetUnifiedFormat:
     """P-I5: _inject_supplement should accept both 'candidate:N' (new unified)
diff --git a/tests/pipeline/engine/test_pipeline_runner_sidecar_path.py b/tests/pipeline/engine/test_pipeline_runner_sidecar_path.py
index 76af42e2..41a8f952 100644
--- a/tests/pipeline/engine/test_pipeline_runner_sidecar_path.py
+++ b/tests/pipeline/engine/test_pipeline_runner_sidecar_path.py
@@ -8,7 +8,7 @@
 import pytest
 import yaml
 
-from iac_code.agent.message import Message, ToolResultBlock
+from iac_code.agent.message import ImageBlock, Message, TextBlock, ToolResultBlock
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
 from iac_code.pipeline.engine.types import StepResult, StepStatus
 
@@ -469,6 +469,40 @@ async def fake_execute(step, context, session_id, user_message=None, **_kwargs):
     assert seen_user_messages == ["选择一个已有vpc，创建一个vswitch"]
 
 
+@pytest.mark.asyncio
+async def test_continue_from_sidecar_reuses_persisted_current_step_image_input(tmp_path):
+    from iac_code.pipeline.engine.user_input import PipelineUserInput
+
+    image_input = PipelineUserInput(  # mixed text + image input attached to the current step
+        content=[
+            TextBlock(text="参考这张图"),
+            ImageBlock(media_type="image/png", data="aW1hZ2U="),
+        ],
+        display_text="参考这张图",
+        has_images=True,
+    )
+    runner = _build_two_step_runner(tmp_path)
+    runner._set_current_step_user_input(image_input)
+    await runner._save_running("s1", reason="step started")  # save running state for step "s1"
+
+    runner2 = _build_two_step_runner(tmp_path, resume_from_sidecar=True)  # second runner over the same tmp_path
+    seen_user_messages = []
+
+    async def fake_execute(step, context, session_id, user_message=None, **_kwargs):
+        seen_user_messages.append(user_message)  # capture what the runner hands to the step executor
+        conclusion = {"value": step.step_id}
+        context.set_conclusion(step.conclusion_field, conclusion)
+        yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion=conclusion)
+
+    runner2._step_executor.execute = fake_execute
+
+    async for _event in runner2.continue_from_sidecar():
+        if seen_user_messages:  # stop as soon as the first step execution has been observed
+            break
+
+    assert seen_user_messages == [image_input.content]  # the original content blocks are passed through
+
+
 @pytest.mark.asyncio
 async def test_hard_interrupt_rollback_context_survives_sidecar_restore(tmp_path):
     from iac_code.pipeline.engine.interrupt import InterruptVerdict
@@ -566,6 +600,37 @@ async def fake_continue(user_input=None, **kwargs):
     }
 
 
+@pytest.mark.asyncio
+async def test_resume_candidate_selection_extracts_index_from_structured_json(tmp_path):
+    runner = _build_runner(tmp_path)
+    runner.state_machine.current_step.ui_mode = "candidate_selection"
+    runner._waiting_input_options_by_step["s1"] = [  # selectable options registered under step id "s1"
+        {"name": "方案A", "candidate_index": 0},
+        {"name": "方案B", "candidate_index": 1},
+    ]
+
+    async def fake_continue(user_input=None, **kwargs):
+        assert kwargs == {"resume_waiting_step": True}
+        if False:  # unreachable; the bare yield only makes this function an async generator
+            yield
+
+    runner._continue_from_current = fake_continue
+    user_input = json.dumps(  # structured JSON reply instead of free text
+        {
+            "selected_candidate_index": 1,
+            "parameter_overrides": {"InstanceType": "ecs.g7.large"},
+        },
+        ensure_ascii=False,
+    )
+
+    events = [event async for event in runner.resume(user_input)]
+
+    received = next(event for event in events if isinstance(event, PipelineEvent))  # first PipelineEvent emitted
+    assert received.type == PipelineEventType.USER_INPUT_RECEIVED
+    assert received.data["selected_index"] == 1
+    assert received.data["selected_option"] == {"name": "方案B", "candidate_index": 1}
+
+
 @pytest.mark.asyncio
 async def test_resume_candidate_selection_uses_restored_context_options(tmp_path):
     runner = _build_runner(tmp_path)
diff --git a/tests/pipeline/engine/test_recovery.py b/tests/pipeline/engine/test_recovery.py
index 3e9dd837..11aaa168 100644
--- a/tests/pipeline/engine/test_recovery.py
+++ b/tests/pipeline/engine/test_recovery.py
@@ -1,6 +1,11 @@
 from __future__ import annotations
 
+import json
+import logging
+
 from iac_code.agent.message import Message, TextBlock, ToolResultBlock, ToolUseBlock
+from iac_code.pipeline.engine import completion_guard_state
+from iac_code.pipeline.engine.completion_guard_state import record_completion_guard_tool_result
 from iac_code.pipeline.engine.recovery import (
     last_successful_tool_input,
     reconstruct_completion_guard_state,
@@ -164,3 +169,87 @@ def test_reconstruct_completion_guard_state_ignores_successful_non_guard_tools()
 
     assert state["successful_tools"] == set()
     assert state["tool_results"] == {}
+
+
+def test_reconstruct_completion_guard_state_records_ros_stack_results_for_completion_guards():
+    messages = [  # one assistant tool call followed by the matching user-side tool result
+        Message(
+            role="assistant",
+            content=[
+                ToolUseBlock(
+                    id="tu_stack",
+                    name="ros_stack",
+                    input={"action": "CreateStack", "params": {"StackName": "demo"}},
+                )
+            ],
+        ),
+        Message(
+            role="user",
+            content=[
+                ToolResultBlock(
+                    tool_use_id="tu_stack",  # same id as the ToolUseBlock in the assistant message
+                    content=json.dumps(
+                        {
+                            "stack_id": "stack-123",
+                            "stack_name": "demo",
+                            "status": "CREATE_COMPLETE",
+                            "is_success": True,
+                        }
+                    ),
+                    is_error=False,
+                )
+            ],
+        ),
+    ]
+
+    state = reconstruct_completion_guard_state(messages)
+
+    assert state["successful_tools"] == {"ros_stack"}
+    assert state["tool_results"]["ros_stack"]["stack_id"] == "stack-123"
+    assert state["tool_result_records"] == [  # one record pairing the call input with the decoded result
+        {
+            "tool_name": "ros_stack",
+            "input": {"action": "CreateStack", "params": {"StackName": "demo"}},
+            "result": {
+                "stack_id": "stack-123",
+                "stack_name": "demo",
+                "status": "CREATE_COMPLETE",
+                "is_success": True,
+            },
+            "is_error": False,
+        }
+    ]
+
+
+def test_completion_guard_state_logs_json_parse_failures(caplog):
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.completion_guard_state")
+    state = {}
+
+    record_completion_guard_tool_result(  # called without pytest.raises, so it must not raise
+        state,
+        tool_name="ros_stack",
+        tool_input={"action": "CreateStack"},
+        content="{not-json",  # deliberately malformed JSON
+        is_error=False,
+    )
+
+    assert "Failed to parse completion guard state" in caplog.text  # expected log message fragment
+
+
+def test_completion_guard_state_logs_rebuild_failures(monkeypatch, caplog):
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.engine.completion_guard_state")
+
+    def fail_record(*_args, **_kwargs):  # replacement helper that always raises
+        raise RuntimeError("boom")
+
+    monkeypatch.setattr(completion_guard_state, "_record_ask_user_question", fail_record)
+
+    record_completion_guard_tool_result(  # called without pytest.raises, so it must not raise
+        {},
+        tool_name="ask_user_question",
+        tool_input={},
+        content='{"free_text": "ok"}',  # valid JSON; presumably the patched helper is what fails here
+        is_error=False,
+    )
+
+    assert "Failed to rebuild completion guard state" in caplog.text  # expected log message fragment
diff --git a/tests/pipeline/engine/test_resume_recovery.py b/tests/pipeline/engine/test_resume_recovery.py
new file mode 100644
index 00000000..6fef87b0
--- /dev/null
+++ b/tests/pipeline/engine/test_resume_recovery.py
@@ -0,0 +1,35 @@
+from iac_code.agent.message import ImageBlock, Message, TextBlock, ToolResultBlock
+from iac_code.pipeline.engine.resume_recovery import reconcile_resume_messages, user_message_already_in_resume
+
+
+def test_reconcile_resume_messages_filters_duplicate_tool_result_blocks_only():
+    existing = Message(
+        role="user",
+        content=[ToolResultBlock(tool_use_id="toolu_existing", content="done")],
+    )
+    sidecar = Message(
+        role="user",
+        content=[
+            ToolResultBlock(tool_use_id="toolu_existing", content="done"),  # duplicate of the block in `existing`
+            ToolResultBlock(tool_use_id="toolu_new", content="new"),  # only present in the sidecar message
+        ],
+    )
+
+    merged = reconcile_resume_messages([existing], [sidecar])
+
+    assert merged is not None
+    assert len(merged) == 2
+    assert merged[0] == existing
+    assert merged[1] == Message(  # sidecar message kept, minus the duplicated block
+        role="user",
+        content=[ToolResultBlock(tool_use_id="toolu_new", content="new")],
+    )
+
+
+def test_user_message_already_in_resume_matches_image_message():
+    image_message = [  # text + image blocks used both as the query and as the stored message content
+        TextBlock(text="参考这张图"),
+        ImageBlock(media_type="image/png", data="aW1hZ2U="),
+    ]
+
+    assert user_message_already_in_resume(image_message, [Message(role="user", content=image_message)]) is True
diff --git a/tests/pipeline/engine/test_session.py b/tests/pipeline/engine/test_session.py
index d10b1cc0..9b051002 100644
--- a/tests/pipeline/engine/test_session.py
+++ b/tests/pipeline/engine/test_session.py
@@ -1,5 +1,6 @@
 import json
 import logging
+from pathlib import Path
 
 import pytest
 import yaml
@@ -109,6 +110,27 @@ def fail_write(path, data):
     ]
 
 
+def test_sidecar_yaml_uses_atomic_state_write(monkeypatch, tmp_path) -> None:
+    calls = []
+
+    def fake_atomic_write_text(path, content, *, durable=True, replace_attempts=3, encoding="utf-8"):
+        calls.append((Path(path).name, durable))  # record the file name and durable flag of each write
+        Path(path).write_text(content, encoding=encoding)  # still perform a plain write of the content
+
+    monkeypatch.setattr("iac_code.pipeline.engine.session.atomic_write_text", fake_atomic_write_text)
+
+    session = PipelineSession(tmp_path / "pipeline")
+    session.save_running_sync(
+        "step",
+        {"current_index": 0, "rollback_count": 0, "step_statuses": {"step": "running"}},
+        {},
+        {"pipeline_name": "test", "step_ids": ["step"], "sub_pipeline_step_ids": {}, "pipeline_fingerprint": "fp"},
+    )
+
+    assert ("context.yaml", True) in calls  # written through the patched writer with durable=True
+    assert ("meta.yaml", True) in calls  # same requirement for the meta file
+
+
 class TestSaveRollback:
     @pytest.mark.asyncio
     async def test_updates_meta_with_target_step(self, session, session_dir):
@@ -142,6 +164,29 @@ async def test_appends_to_events_jsonl(self, session, session_dir):
         assert event["from"] == "c"
         assert event["to"] == "a"
 
+    def test_sync_does_not_append_rollback_event_when_state_save_fails(self, session, monkeypatch):
+        def fail_write(path, data):  # stand-in for session._atomic_write_yaml that always fails
+            raise OSError("disk full")
+
+        monkeypatch.setattr(session, "_atomic_write_yaml", fail_write)
+
+        with pytest.raises(OSError, match="disk full"):  # the write error must propagate to the caller
+            session.save_rollback_sync(
+                from_step="confirm",
+                to_step="intent",
+                reason="retry intent",
+                state_machine_snapshot={
+                    "current_index": 0,
+                    "rollback_count": 1,
+                    "interrupt_rollback_count": 0,
+                    "step_statuses": {"intent": "running", "confirm": "stale"},
+                },
+                context_snapshot={},
+                identity=_identity(),
+            )
+
+        assert not session.events_path.exists()  # no events file may exist after the failed save
+
     def test_sync_preserves_attempt_metadata(self, session):
         identity = _identity()
         execution = {
diff --git a/tests/pipeline/engine/test_state_machine.py b/tests/pipeline/engine/test_state_machine.py
index 6a19c214..b6cfc1dc 100644
--- a/tests/pipeline/engine/test_state_machine.py
+++ b/tests/pipeline/engine/test_state_machine.py
@@ -2,30 +2,15 @@
 
 from iac_code.pipeline.engine.state_machine import StateMachine
 from iac_code.pipeline.engine.step_spec import StepSpec
-from iac_code.pipeline.engine.types import RollbackRule, StepStatus
+from iac_code.pipeline.engine.types import StepStatus
 
 
 def _make_three_steps():
     """A → B → C pipeline."""
     return [
         StepSpec(step_id="a", conclusion_field="a", forward="b", prompt_file="a.md"),
-        StepSpec(
-            step_id="b",
-            conclusion_field="b",
-            forward="c",
-            prompt_file="b.md",
-            rollback_rules=[RollbackRule(target_step="a", condition="fix")],
-        ),
-        StepSpec(
-            step_id="c",
-            conclusion_field="c",
-            forward=None,
-            prompt_file="c.md",
-            rollback_rules=[
-                RollbackRule(target_step="a", condition="restart"),
-                RollbackRule(target_step="b", condition="revise"),
-            ],
-        ),
+        StepSpec(step_id="b", conclusion_field="b", forward="c", prompt_file="b.md"),
+        StepSpec(step_id="c", conclusion_field="c", forward=None, prompt_file="c.md"),
     ]
 
 
@@ -66,11 +51,11 @@ def test_rollback_to_allowed_target(self):
         assert sm._step_statuses["b"] == StepStatus.STALE
         assert sm._step_statuses["c"] == StepStatus.STALE
 
-    def test_rollback_to_disallowed_target_raises(self):
+    def test_rollback_to_future_target_raises(self):
         sm = StateMachine(_make_three_steps())
         sm.advance()  # a → b
         with pytest.raises(ValueError, match="Cannot rollback"):
-            sm.rollback("c", "invalid")  # b can only roll back to a
+            sm.rollback("c", "invalid")
 
     def test_max_rollbacks_exceeded(self):
         sm = StateMachine(_make_three_steps(), max_rollbacks=1)
@@ -98,14 +83,11 @@ def test_can_rollback_to(self):
         assert sm.can_rollback_to("b")
         assert not sm.can_rollback_to("nonexistent")
 
-    def test_get_rollback_options(self):
+    def test_completed_non_future_rollback_targets(self):
         sm = StateMachine(_make_three_steps())
         sm.advance()
         sm.advance()
-        options = sm.get_rollback_options()
-        assert len(options) == 2
-        targets = {r.target_step for r in options}
-        assert targets == {"a", "b"}
+        assert sm.completed_non_future_rollback_targets() == ["a", "b"]
 
     def test_completed_non_future_rollback_targets_ignore_static_rules(self):
         steps = [
@@ -118,7 +100,7 @@ def test_completed_non_future_rollback_targets_ignore_static_rules(self):
         sm.advance()  # b -> c
 
         assert sm.completed_non_future_rollback_targets() == ["a", "b"]
-        step = sm.rollback("b", "revise completed step", allow_completed_non_future=True)
+        step = sm.rollback("b", "revise completed step")
 
         assert step.step_id == "b"
 
@@ -133,7 +115,7 @@ def test_completed_non_future_rollback_rejects_future_and_uncompleted_targets(se
 
         assert sm.completed_non_future_rollback_targets() == ["a"]
         with pytest.raises(ValueError, match="Cannot rollback"):
-            sm.rollback("c", "future", allow_completed_non_future=True)
+            sm.rollback("c", "future")
 
 
 class TestInterruptRollback:
@@ -183,10 +165,9 @@ def test_interrupt_rollback_to_current_step(self):
         assert step.step_id == "b"
         assert sm._step_statuses["b"] == StepStatus.RUNNING
 
-    def test_interrupt_rollback_ignores_rollback_rules(self):
-        """interrupt_rollback should work even without rollback_rules."""
+    def test_interrupt_rollback_accepts_current_or_prior_step(self):
         sm = StateMachine(_make_three_steps())
-        sm.advance()  # a → b (b can only roll back to a via rules)
+        sm.advance()  # a → b
         sm.advance()  # b → c
         step = sm.interrupt_rollback("b", "no rule needed")
         assert step.step_id == "b"
diff --git a/tests/pipeline/engine/test_step_executor.py b/tests/pipeline/engine/test_step_executor.py
index f6f833a7..b7b62098 100644
--- a/tests/pipeline/engine/test_step_executor.py
+++ b/tests/pipeline/engine/test_step_executor.py
@@ -1,5 +1,7 @@
+import json
 import logging
 from pathlib import Path
+from types import SimpleNamespace
 from unittest.mock import MagicMock, call, patch
 
 import pytest
@@ -7,9 +9,9 @@
 from iac_code.agent.message import Message, ToolResultBlock, ToolUseBlock
 from iac_code.pipeline.engine.context import PipelineContext
 from iac_code.pipeline.engine.step_executor import StepExecutor
-from iac_code.pipeline.engine.step_spec import IncludeExcludeConfig, LoadedPipeline, StepSpec
-from iac_code.pipeline.engine.types import RollbackRule, StepResult, StepStatus
-from iac_code.tools.base import ToolContext, ToolRegistry
+from iac_code.pipeline.engine.step_spec import IncludeExcludeConfig, LoadedPipeline, StepSpec, StepSurfaceOverride
+from iac_code.pipeline.engine.types import StepResult, StepStatus
+from iac_code.tools.base import Tool, ToolContext, ToolRegistry, ToolResult
 from iac_code.types.stream_events import (
     AskUserQuestionEvent,
     MessageEndEvent,
@@ -100,6 +102,16 @@ def test_complete_step_tool_registered(self, tmp_path):
         tool_reg = executor._build_step_tools(step, ctx)
         assert tool_reg.get("complete_step") is not None
 
+    def test_agent_loop_context_marks_pipeline_mode(self, tmp_path):
+        executor = _make_executor(tmp_path)
+        step = _make_step()
+        ctx = PipelineContext(SIMPLE_DEPS)
+
+        agent_context = executor.build_agent_loop_context(step, ctx, "test_session")
+
+        assert agent_context.agent_loop is not None
+        assert agent_context.agent_loop._pipeline_mode is True  # private flag inspected directly by this test
+
     def test_full_tools_when_step_returns_none(self, tmp_path):
         registry = ToolRegistry()
 
@@ -716,6 +728,38 @@ def test_no_skill_uses_prompt_only(self, tmp_path):
         assert "# Step Prompt Only" in prompt
         assert prompt.endswith("# Step Prompt Only")
 
+    def test_surface_override_uses_surface_prompt_file(self, tmp_path):
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "confirm.md").write_text("# REPL Prompt", encoding="utf-8")
+        (tmp_path / "prompts" / "confirm.a2a.md").write_text("# A2A Prompt", encoding="utf-8")
+
+        step = StepSpec(
+            step_id="confirm_and_select",
+            conclusion_field="selected_plan",
+            forward=None,
+            prompt_file="prompts/confirm.md",  # the step's default prompt file
+            surface_overrides={"a2a": StepSurfaceOverride(prompt_file="prompts/confirm.a2a.md")},
+        )
+        pipeline = LoadedPipeline(
+            name="test",
+            steps=[step],
+            context_dependencies={"selected_plan": []},
+            max_rollbacks=3,
+            skills={},
+        )
+        executor = StepExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=ToolRegistry(),
+            pipeline=pipeline,
+            pipeline_dir=tmp_path,
+            surface="a2a",  # same key as the entry in surface_overrides
+        )
+
+        prompt = executor._build_full_system_prompt(step, PipelineContext({"selected_plan": []}))
+
+        assert "# A2A Prompt" in prompt  # content of the override file is used
+        assert "# REPL Prompt" not in prompt  # content of the default file is not
+
     def test_empty_prompt_file_with_skill(self, tmp_path):
         """When prompt_file is empty string but skill exists, just use skill content."""
         step = StepSpec(
@@ -1016,6 +1060,39 @@ def test_no_inject_tools_only_has_complete_step(self, tmp_path):
         assert registry.get("ask_user_question") is None
         assert registry.get("complete_step") is not None
 
+    def test_surface_override_can_disable_injected_tools(self, tmp_path):
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "confirm.md").write_text("Confirm.", encoding="utf-8")
+
+        step = StepSpec(
+            step_id="confirm_and_select",
+            conclusion_field="selected_plan",
+            forward=None,
+            prompt_file="prompts/confirm.md",
+            inject_tools=["show_architecture_diagram"],  # step-level default
+            surface_overrides={"a2a": StepSurfaceOverride(inject_tools=[])},  # empty list for the "a2a" surface
+        )
+        pipeline = LoadedPipeline(
+            name="test",
+            steps=[step],
+            context_dependencies={"selected_plan": []},
+            max_rollbacks=3,
+            skills={},
+        )
+        executor = StepExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=ToolRegistry(),
+            pipeline=pipeline,
+            pipeline_dir=tmp_path,
+            surface="a2a",  # same key as the entry in surface_overrides
+        )
+
+        context = PipelineContext({"selected_plan": []})
+        registry = executor._build_step_tools(step, context)
+
+        assert registry.get("show_architecture_diagram") is None  # the step-level injected tool is absent
+        assert registry.get("complete_step") is not None  # complete_step is still registered
+
     @pytest.mark.asyncio
     async def test_ask_user_question_continues_same_agent_loop_to_complete_step(self, tmp_path):
         (tmp_path / "prompts").mkdir(exist_ok=True)
@@ -1350,6 +1427,417 @@ async def stream(self, messages, system, tools=None):
         assert step_results[-1].conclusion["clarification_choice"] == "deploy_to_aliyun"
         assert "selected_id" not in step_results[-1].conclusion
 
+    @pytest.mark.asyncio
+    async def test_completion_guard_rejects_deploying_success_until_create_stack_completes(self, tmp_path):
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "deploying.md").write_text("Deploy.", encoding="utf-8")
+
+        class DummyRosStack(Tool):  # minimal "ros_stack" tool that always returns a CREATE_COMPLETE payload
+            @property
+            def name(self) -> str:
+                return "ros_stack"
+
+            @property
+            def description(self) -> str:
+                return "ROS stack"
+
+            @property
+            def input_schema(self) -> dict:
+                return {
+                    "type": "object",
+                    "required": ["action"],
+                    "properties": {"action": {"type": "string"}, "params": {"type": "object"}},
+                }
+
+            def is_read_only(self, input: dict | None = None) -> bool:
+                return True
+
+            async def execute(self, *, tool_input: dict, context: ToolContext) -> ToolResult:
+                assert tool_input["action"] == "CreateStack"  # the scripted provider only issues CreateStack
+                return ToolResult.success(
+                    json.dumps(
+                        {
+                            "stack_id": "stack-123",
+                            "stack_name": "demo",
+                            "status": "CREATE_COMPLETE",
+                            "is_success": True,
+                        }
+                    )
+                )
+
+        step = StepSpec(
+            step_id="deploying",
+            conclusion_field="deployment",
+            forward=None,
+            prompt_file="prompts/deploying.md",
+            conclusion_schema={
+                "type": "object",
+                "required": ["status"],
+                "additionalProperties": False,
+                "properties": {
+                    "stack_id": {"type": "string"},
+                    "status": {"type": "string", "enum": ["success", "failed", "cancelled"]},
+                    "error": {"type": "string"},
+                },
+            },
+            completion_guards=[  # the guard configuration exercised by this test
+                {
+                    "when_conclusion_field_equals": {"status": "success"},
+                    "required_conclusion_field": "stack_id",
+                    "require_tool_result": {
+                        "tool": "ros_stack",
+                        "action_in": ["CreateStack", "ContinueCreateStack"],
+                        "is_success": True,
+                        "status_in": ["CREATE_COMPLETE"],
+                        "match_conclusion_field": "stack_id",
+                    },
+                    "message": "部署成功必须等待 ros_stack CreateStack 返回 CREATE_COMPLETE。",
+                }
+            ],
+            max_agent_turns=8,
+        )
+        pipeline = LoadedPipeline(
+            name="test",
+            steps=[step],
+            context_dependencies={"deployment": []},
+            max_rollbacks=3,
+            skills={},
+        )
+        registry = ToolRegistry()
+        registry.register(DummyRosStack())
+
+        class Provider:  # scripted model: each stream() call replays the next canned turn
+            def __init__(self) -> None:
+                self.calls = 0
+
+            def get_model_name(self) -> str:
+                return "test-model"
+
+            async def stream(self, messages, system, tools=None):
+                self.calls += 1
+                if self.calls == 1:  # turn 1: claim success before any ros_stack call has happened
+                    yield MessageStartEvent(message_id="m1")
+                    yield ToolUseStartEvent(tool_use_id="done_bad", name="complete_step")
+                    yield ToolUseEndEvent(
+                        tool_use_id="done_bad",
+                        name="complete_step",
+                        input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+                    )
+                    yield MessageEndEvent(stop_reason="tool_use", usage=Usage())
+                    return
+
+                if self.calls == 2:  # turn 2: check the rejection is in history, then call ros_stack
+                    assert any(  # history must contain the error tool_result for "done_bad"
+                        getattr(block, "type", None) == "tool_result"
+                        and getattr(block, "tool_use_id", None) == "done_bad"
+                        and getattr(block, "is_error", False)
+                        and "CreateStack" in getattr(block, "content", "")
+                        for message in messages
+                        for block in (message.content if isinstance(message.content, list) else [])
+                    )
+                    yield MessageStartEvent(message_id="m2")
+                    yield ToolUseStartEvent(tool_use_id="stack_1", name="ros_stack")
+                    yield ToolUseEndEvent(
+                        tool_use_id="stack_1",
+                        name="ros_stack",
+                        input={"action": "CreateStack", "params": {"StackName": "demo"}},
+                    )
+                    yield MessageEndEvent(stop_reason="tool_use", usage=Usage())
+                    return
+
+                if self.calls == 3:  # turn 3: retry complete_step with the same conclusion as turn 1
+                    yield MessageStartEvent(message_id="m3")
+                    yield ToolUseStartEvent(tool_use_id="done_good", name="complete_step")
+                    yield ToolUseEndEvent(
+                        tool_use_id="done_good",
+                        name="complete_step",
+                        input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+                    )
+                    yield MessageEndEvent(stop_reason="tool_use", usage=Usage())
+                    return
+
+                yield MessageStartEvent(message_id="m4")  # any further call just ends the turn
+                yield MessageEndEvent(stop_reason="end_turn", usage=Usage())
+
+        provider = Provider()
+        executor = StepExecutor(
+            provider_manager=provider,
+            base_tool_registry=registry,
+            pipeline=pipeline,
+            pipeline_dir=tmp_path,
+        )
+
+        collected = []
+        async for event in executor.execute(step, PipelineContext({"deployment": []}), "test"):
+            collected.append(event)
+
+        complete_results = [
+            event for event in collected if isinstance(event, ToolResultEvent) and event.tool_name == "complete_step"
+        ]
+        assert provider.calls == 3  # exactly the three scripted turns were consumed
+        assert complete_results[0].is_error  # the first complete_step attempt was rejected
+        assert "CreateStack" in complete_results[0].result
+        assert complete_results[-1].is_error is False  # the last complete_step attempt was accepted
+        step_results = [event for event in collected if isinstance(event, StepResult)]
+        assert step_results[-1].status == StepStatus.COMPLETED
+        assert step_results[-1].conclusion == {"status": "success", "stack_id": "stack-123"}
+
+    @pytest.mark.asyncio
+    async def test_fresh_complete_step_recovery_preserves_create_stack_guard_state(self, tmp_path):
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "deploying.md").write_text("Deploy.", encoding="utf-8")
+
+        class DummyRosStack(Tool):  # minimal "ros_stack" tool that always returns a CREATE_COMPLETE payload
+            @property
+            def name(self) -> str:
+                return "ros_stack"
+
+            @property
+            def description(self) -> str:
+                return "ROS stack"
+
+            @property
+            def input_schema(self) -> dict:
+                return {
+                    "type": "object",
+                    "required": ["action"],
+                    "properties": {"action": {"type": "string"}, "params": {"type": "object"}},
+                }
+
+            def is_read_only(self, input: dict | None = None) -> bool:
+                return True
+
+            async def execute(self, *, tool_input: dict, context: ToolContext) -> ToolResult:
+                return ToolResult.success(
+                    json.dumps(
+                        {
+                            "stack_id": "stack-123",
+                            "stack_name": "demo",
+                            "status": "CREATE_COMPLETE",
+                            "is_success": True,
+                        }
+                    )
+                )
+
+        step = StepSpec(
+            step_id="deploying",
+            conclusion_field="deployment",
+            forward=None,
+            prompt_file="prompts/deploying.md",
+            conclusion_schema={
+                "type": "object",
+                "required": ["status"],
+                "additionalProperties": False,
+                "properties": {
+                    "stack_id": {"type": "string"},
+                    "status": {"type": "string", "enum": ["success", "failed", "cancelled"]},
+                    "error": {"type": "string"},
+                },
+            },
+            completion_guards=[  # the guard configuration exercised by this test
+                {
+                    "when_conclusion_field_equals": {"status": "success"},
+                    "required_conclusion_field": "stack_id",
+                    "require_tool_result": {
+                        "tool": "ros_stack",
+                        "action_in": ["CreateStack", "ContinueCreateStack"],
+                        "is_success": True,
+                        "status_in": ["CREATE_COMPLETE"],
+                        "match_conclusion_field": "stack_id",
+                    },
+                }
+            ],
+            max_agent_turns=8,
+        )
+        pipeline = LoadedPipeline(
+            name="test",
+            steps=[step],
+            context_dependencies={"deployment": []},
+            max_rollbacks=3,
+            skills={},
+        )
+        registry = ToolRegistry()
+        registry.register(DummyRosStack())
+
+        class Provider:  # scripted model: each stream() call replays the next canned turn
+            def __init__(self) -> None:
+                self.calls = 0
+
+            def get_model_name(self) -> str:
+                return "test-model"
+
+            async def stream(self, messages, system, tools=None):
+                self.calls += 1
+                if self.calls == 1:  # turn 1: run ros_stack CreateStack first
+                    yield MessageStartEvent(message_id="m1")
+                    yield ToolUseStartEvent(tool_use_id="stack_1", name="ros_stack")
+                    yield ToolUseEndEvent(
+                        tool_use_id="stack_1",
+                        name="ros_stack",
+                        input={"action": "CreateStack", "params": {"StackName": "demo"}},
+                    )
+                    yield MessageEndEvent(stop_reason="tool_use", usage=Usage())
+                    return
+
+                if self.calls in {2, 3}:  # turns 2-3: complete_step with empty input (no conclusion)
+                    yield MessageStartEvent(message_id=f"m{self.calls}")
+                    yield ToolUseStartEvent(tool_use_id=f"done_bad_{self.calls}", name="complete_step")
+                    yield ToolUseEndEvent(
+                        tool_use_id=f"done_bad_{self.calls}",
+                        name="complete_step",
+                        input={},
+                    )
+                    yield MessageEndEvent(stop_reason="tool_use", usage=Usage())
+                    return
+
+                if self.calls == 4:  # turn 4: complete_step with a conclusion matching the stack result
+                    yield MessageStartEvent(message_id="m4")
+                    yield ToolUseStartEvent(tool_use_id="done_good", name="complete_step")
+                    yield ToolUseEndEvent(
+                        tool_use_id="done_good",
+                        name="complete_step",
+                        input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+                    )
+                    yield MessageEndEvent(stop_reason="tool_use", usage=Usage())
+                    return
+
+                yield MessageStartEvent(message_id="m5")  # any further call just ends the turn
+                yield MessageEndEvent(stop_reason="end_turn", usage=Usage())
+
+        provider = Provider()
+        executor = StepExecutor(
+            provider_manager=provider,
+            base_tool_registry=registry,
+            pipeline=pipeline,
+            pipeline_dir=tmp_path,
+        )
+
+        collected = []
+        async for event in executor.execute(step, PipelineContext({"deployment": []}), "test"):
+            collected.append(event)
+
+        assert provider.calls == 4  # exactly the four scripted turns were consumed
+        complete_results = [
+            event for event in collected if isinstance(event, ToolResultEvent) and event.tool_name == "complete_step"
+        ]
+        assert complete_results[-1].is_error is False  # the final complete_step attempt was accepted
+        step_results = [event for event in collected if isinstance(event, StepResult)]
+        assert step_results[-1].status == StepStatus.COMPLETED
+        assert step_results[-1].conclusion == {"status": "success", "stack_id": "stack-123"}
+
+    @pytest.mark.asyncio
+    async def test_resumed_completed_step_revalidates_completion_guards(self, monkeypatch, tmp_path):
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "deploying.md").write_text("Deploy.", encoding="utf-8")
+        calls: list[str] = []  # records which FakeAgentLoop entry point ran
+
+        class FakeAgentLoop:
+            def __init__(self, **kwargs):
+                self.resume_messages = kwargs.get("resume_messages")
+
+            async def continue_streaming(self):
+                calls.append("continue")
+                yield ToolUseStartEvent(tool_use_id="stack_1", name="ros_stack")  # ros_stack call, then its result
+                yield ToolUseEndEvent(
+                    tool_use_id="stack_1",
+                    name="ros_stack",
+                    input={"action": "CreateStack", "params": {"StackName": "demo"}},
+                )
+                yield ToolResultEvent(
+                    tool_use_id="stack_1",
+                    tool_name="ros_stack",
+                    result=json.dumps(
+                        {
+                            "stack_id": "stack-123",
+                            "stack_name": "demo",
+                            "status": "CREATE_COMPLETE",
+                            "is_success": True,
+                        }
+                    ),
+                )
+                yield ToolUseStartEvent(tool_use_id="done_good", name="complete_step")  # then a fresh completion
+                yield ToolUseEndEvent(
+                    tool_use_id="done_good",
+                    name="complete_step",
+                    input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+                )
+                yield ToolResultEvent(tool_use_id="done_good", tool_name="complete_step", result="ok")
+
+            async def run_streaming(self, user_input):
+                raise AssertionError("resumed step should continue, not start a fresh prompt")
+
+        monkeypatch.setattr("iac_code.agent.agent_loop.AgentLoop", FakeAgentLoop)  # replace the loop class
+
+        step = StepSpec(
+            step_id="deploying",
+            conclusion_field="deployment",
+            forward=None,
+            prompt_file="prompts/deploying.md",
+            conclusion_schema={
+                "type": "object",
+                "required": ["status"],
+                "additionalProperties": False,
+                "properties": {
+                    "stack_id": {"type": "string"},
+                    "status": {"type": "string", "enum": ["success", "failed", "cancelled"]},
+                    "error": {"type": "string"},
+                },
+            },
+            completion_guards=[  # presumably: a success conclusion needs stack_id matched by a ros_stack result
+                {
+                    "when_conclusion_field_equals": {"status": "success"},
+                    "required_conclusion_field": "stack_id",
+                    "require_tool_result": {
+                        "tool": "ros_stack",
+                        "action_in": ["CreateStack", "ContinueCreateStack"],
+                        "is_success": True,
+                        "status_in": ["CREATE_COMPLETE"],
+                        "match_conclusion_field": "stack_id",
+                    },
+                }
+            ],
+        )
+        pipeline = LoadedPipeline(
+            name="test",
+            steps=[step],
+            context_dependencies={"deployment": []},
+            max_rollbacks=3,
+            skills={},
+        )
+        executor = StepExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=ToolRegistry(),
+            pipeline=pipeline,
+            pipeline_dir=tmp_path,
+        )
+        resume_messages = [  # earlier transcript: a complete_step call plus its "ok" result
+            Message(
+                role="assistant",
+                content=[
+                    ToolUseBlock(
+                        id="done_old",
+                        name="complete_step",
+                        input={"conclusion": {"status": "success", "stack_id": "stack-123"}},
+                    )
+                ],
+            ),
+            Message(role="user", content=[ToolResultBlock(tool_use_id="done_old", content="ok", is_error=False)]),
+        ]
+
+        collected = []
+        async for event in executor.execute(
+            step,
+            PipelineContext({"deployment": []}),
+            "test",
+            resume_messages=resume_messages,
+        ):
+            collected.append(event)
+
+        assert calls == ["continue"]  # continue_streaming ran exactly once
+        step_results = [event for event in collected if isinstance(event, StepResult)]
+        assert step_results[-1].status == StepStatus.COMPLETED
+        assert step_results[-1].conclusion == {"status": "success", "stack_id": "stack-123"}
+
 
 class TestPipelineToolsDiscovery:
     def test_inject_tool_from_pipeline_tools_dir(self, tmp_path):
@@ -1575,7 +2063,6 @@ def test_passes_rollback_targets_to_tool(self, tmp_path):
             conclusion_field="intent",
             forward="arch",
             prompt_file="prompts/intent_parsing.md",
-            rollback_rules=[RollbackRule(target_step="prev_step", condition="bad")],
         )
         executor = StepExecutor(
             provider_manager=MagicMock(),
@@ -1584,18 +2071,40 @@ def test_passes_rollback_targets_to_tool(self, tmp_path):
             pipeline_dir=tmp_path,
         )
         ctx = PipelineContext(SIMPLE_DEPS)
-        tool_reg = executor._build_step_tools(step, ctx)
+        tool_reg = executor._build_step_tools(step, ctx, rollback_targets=["prev_step"])
         complete_tool = tool_reg.get("complete_step")
         schema = complete_tool.input_schema
         assert schema["properties"]["rollback_request"]["properties"]["target_step"]["enum"] == ["prev_step"]
 
+    def test_does_not_fallback_to_static_rollback_rules(self, tmp_path):
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "intent_parsing.md").write_text("Parse.", encoding="utf-8")
+        step = StepSpec(
+            step_id="intent_parsing",
+            conclusion_field="intent",
+            forward="arch",
+            prompt_file="prompts/intent_parsing.md",
+        )  # the legacy rollback_rules attribute is attached separately on the next line
+        setattr(step, "rollback_rules", [SimpleNamespace(target_step="legacy_prev", condition="bad")])
+        executor = StepExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=ToolRegistry(),
+            pipeline=_make_pipeline(),
+            pipeline_dir=tmp_path,
+        )
+        ctx = PipelineContext(SIMPLE_DEPS)
+        tool_reg = executor._build_step_tools(step, ctx)  # no rollback_targets argument supplied
+        complete_tool = tool_reg.get("complete_step")
+
+        assert "rollback_request" not in complete_tool.input_schema["properties"]  # attribute alone adds nothing
+
 
 class TestSchemaIntegration:
     """Integration test: schema flows from StepSpec through StepExecutor to CompleteStepTool."""
 
     def test_conclusion_schema_and_rollback_targets_propagate(self, tmp_path):
         """Verify that conclusion_schema from StepSpec reaches the tool's input_schema,
-        and rollback_rules produce correct enum constraint on rollback_request.target_step."""
+        and explicit rollback targets produce correct enum constraint on rollback_request.target_step."""
         (tmp_path / "prompts").mkdir(exist_ok=True)
         (tmp_path / "prompts" / "intent_parsing.md").write_text("Do it.", encoding="utf-8")
         step = StepSpec(
@@ -1611,10 +2120,6 @@ def test_conclusion_schema_and_rollback_targets_propagate(self, tmp_path):
                     "confidence": {"type": "string", "enum": ["high", "medium", "low"]},
                 },
             },
-            rollback_rules=[
-                RollbackRule(target_step="prev_step", condition="bad_input"),
-                RollbackRule(target_step="other_step", condition="other_issue"),
-            ],
             max_conclusion_retries=3,
         )
         executor = StepExecutor(
@@ -1624,7 +2129,7 @@ def test_conclusion_schema_and_rollback_targets_propagate(self, tmp_path):
             pipeline_dir=tmp_path,
         )
         ctx = PipelineContext(SIMPLE_DEPS)
-        tool_reg = executor._build_step_tools(step, ctx)
+        tool_reg = executor._build_step_tools(step, ctx, rollback_targets=["prev_step", "other_step"])
         tool = tool_reg.get("complete_step")
         schema = tool.input_schema
 
@@ -1665,7 +2170,7 @@ def test_no_schema_falls_back_to_generic(self, tmp_path):
         assert conclusion["type"] == "object"
         assert "description" in conclusion
         assert "properties" not in conclusion
-        # No rollback when no rollback_rules
+        # No rollback unless the runner passes dynamic rollback targets.
         assert "rollback_request" not in schema["properties"]
 
 
diff --git a/tests/pipeline/engine/test_step_executor_integration.py b/tests/pipeline/engine/test_step_executor_integration.py
index cb971a7f..8150b1ab 100644
--- a/tests/pipeline/engine/test_step_executor_integration.py
+++ b/tests/pipeline/engine/test_step_executor_integration.py
@@ -108,3 +108,25 @@ def test_step_executor_defaults_keep_existing_signatures(tmp_path):
     assert executor._permission_context_getter is None
     assert executor._memory_content_getter is None
     assert executor._auto_trigger_skills == []
+
+
+def test_step_agent_loop_does_not_receive_memory_recall_service(monkeypatch, tmp_path):
+    captured_kwargs = {}  # keyword arguments the fake loop's constructor received
+
+    class FakeAgentLoop:
+        def __init__(self, **kwargs):
+            captured_kwargs.update(kwargs)
+
+    monkeypatch.setattr("iac_code.agent.agent_loop.AgentLoop", FakeAgentLoop)
+
+    executor = _make_executor(
+        tmp_path,
+        memory_content_getter=lambda: "this should not imply side recall",
+    )
+    step = _make_step()
+    ctx = PipelineContext({"x": []})
+
+    agent_context = executor.build_agent_loop_context(step, ctx, "session-1")
+
+    assert agent_context.agent_loop is not None
+    assert captured_kwargs and "memory_recall_service" not in captured_kwargs  # empty kwargs would pass vacuously
diff --git a/tests/pipeline/engine/test_step_spec.py b/tests/pipeline/engine/test_step_spec.py
index fe02d8d3..a7ea4663 100644
--- a/tests/pipeline/engine/test_step_spec.py
+++ b/tests/pipeline/engine/test_step_spec.py
@@ -6,7 +6,6 @@
     SubPipelineSpec,
     render_prompt,
 )
-from iac_code.pipeline.engine.types import RollbackRule
 
 
 class TestIncludeExcludeConfig:
@@ -93,14 +92,13 @@ def test_create_full(self):
             forward="cost_estimating",
             prompt_file="prompts/reviewing.md",
             skill="iac-aliyun-review",
-            rollback_rules=[RollbackRule(target_step="template_generating", condition="template_issue")],
             context_fields=["template"],
             enabled_when="cost_estimation",
             hooks_file="hooks/deploying.py",
         )
         assert spec.skill == "iac-aliyun-review"
         assert spec.enabled_when == "cost_estimation"
-        assert len(spec.rollback_rules) == 1
+        assert spec.context_fields == ["template"]
 
     def test_parallel_sub_pipeline_step(self):
         spec = StepSpec(
diff --git a/tests/pipeline/engine/test_sub_pipeline_executor.py b/tests/pipeline/engine/test_sub_pipeline_executor.py
index 5d24a481..8f0eccf5 100644
--- a/tests/pipeline/engine/test_sub_pipeline_executor.py
+++ b/tests/pipeline/engine/test_sub_pipeline_executor.py
@@ -5,12 +5,13 @@
 
 import pytest
 
+from iac_code.agent.message import ImageBlock, Message, ToolResultBlock, ToolUseBlock
 from iac_code.pipeline.engine.context import PipelineContext
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
 from iac_code.pipeline.engine.state_machine import StateMachine
 from iac_code.pipeline.engine.step_spec import LoadedPipeline, StepSpec, SubPipelineSpec
 from iac_code.pipeline.engine.sub_pipeline_executor import SubPipelineExecutor, SubPipelineResult
-from iac_code.pipeline.engine.types import RollbackRule, StepResult, StepStatus
+from iac_code.pipeline.engine.types import StepResult, StepStatus
 from iac_code.tools.base import ToolRegistry
 from iac_code.types.stream_events import ToolResultEvent, ToolUseEndEvent, ToolUseStartEvent
 
@@ -188,6 +189,85 @@ async def execute(
             }
         ]
 
+    @pytest.mark.asyncio
+    async def test_execute_streaming_appends_explicit_resume_messages_to_repaired_transcript(
+        self, tmp_path, monkeypatch
+    ):
+        (tmp_path / "prompts").mkdir(exist_ok=True)
+        (tmp_path / "prompts" / "template.md").write_text("Generate template", encoding="utf-8")
+        sub_spec = SubPipelineSpec(
+            name="evaluate_candidate",
+            steps=[
+                StepSpec(
+                    step_id="template_generating",
+                    conclusion_field="template",
+                    forward=None,
+                    prompt_file="prompts/template.md",
+                    skill="iac_aliyun",
+                    context_fields=["candidate", "intent"],
+                )
+            ],
+            max_rollbacks=2,
+            iterate_over="architecture.candidates",
+            context_fields_from_parent=["intent"],
+        )
+        repaired = [  # transcript passed via resume_state: only the assistant's ask_user_question call
+            Message(
+                role="assistant",
+                content=[ToolUseBlock(id="toolu_1", name="ask_user_question", input={"question": "q"})],
+            )
+        ]
+        tool_result = Message(  # explicit resume message carrying the result for toolu_1
+            role="user",
+            content=[ToolResultBlock(tool_use_id="toolu_1", content='{"free_text":"see image"}', is_error=False)],
+        )
+        image_message = [ImageBlock(media_type="image/png", data="aGVsbG8=")]  # block list, not plain text
+        captured = {}  # arguments FakeStepExecutor.execute received
+
+        class FakeStepExecutor:
+            current_agent_loop = None
+
+            async def execute(self, step, context, session_id, user_message=None, **kwargs):
+                captured["resume_messages"] = kwargs["resume_messages"]
+                captured["user_message"] = user_message
+                yield StepResult(step_id=step.step_id, status=StepStatus.COMPLETED, conclusion={"body": "ok"})
+
+        executor = SubPipelineExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=ToolRegistry(),
+            pipeline=LoadedPipeline(
+                name="test",
+                steps=[],
+                context_dependencies={"intent": []},
+                max_rollbacks=3,
+                skills={"iac_aliyun": "# IaC Skill", "iac-aliyun-cost": "# Cost Skill"},
+            ),
+            pipeline_dir=tmp_path,
+        )
+        monkeypatch.setattr(executor, "_make_step_executor", lambda: FakeStepExecutor())
+        parent_ctx = PipelineContext({"intent": []})
+        parent_ctx.set_conclusion("intent", {"type": "test"})
+
+        async for _event in executor.execute_streaming(
+            sub_spec=sub_spec,
+            candidate={"name": "Plan A"},
+            candidate_index=0,
+            parent_context=parent_ctx,
+            session_id="test_session",
+            user_message=image_message,
+            resume_messages=[tool_result],
+            resume_state={
+                "current_sub_step": "template_generating",
+                "active_attempt_id": "att_1",
+                "transcript_id": "transcript_1",
+                "resume_messages": repaired,
+            },
+        ):
+            pass
+
+        assert captured["resume_messages"] == [*repaired, tool_result]  # stored transcript first, then explicit
+        assert captured["user_message"] == image_message  # user_message reaches the step executor unchanged
+
     @pytest.mark.asyncio
     async def test_completed_sub_step_resume_state_starts_at_next_sub_step(self, tmp_path, monkeypatch):
         """A crash after persisting sub-step completion must resume at the next sub-step."""
@@ -370,7 +450,6 @@ async def test_rollback_persistence_drops_stale_target_and_downstream_conclusion
                     forward=None,
                     prompt_file="prompts/cost.md",
                     context_fields=["template"],
-                    rollback_rules=[RollbackRule(target_step="template_generating", condition="needs_template_rework")],
                 ),
             ],
             max_rollbacks=2,
diff --git a/tests/pipeline/engine/test_transcript_storage.py b/tests/pipeline/engine/test_transcript_storage.py
index 313612b4..23b0575e 100644
--- a/tests/pipeline/engine/test_transcript_storage.py
+++ b/tests/pipeline/engine/test_transcript_storage.py
@@ -4,7 +4,7 @@
 from pathlib import Path
 
 from iac_code import __version__
-from iac_code.agent.message import Message, TextBlock, ToolUseBlock
+from iac_code.agent.message import ImageBlock, Message, TextBlock, ToolUseBlock
 from iac_code.pipeline.engine.transcript_storage import PipelineTranscriptStorage
 
 
@@ -26,6 +26,21 @@ def test_append_and_load_roundtrip(tmp_path: Path):
     assert messages[1].get_text() == "hi"
 
 
+def test_pipeline_transcript_round_trips_image_blocks(tmp_path: Path):
+    storage = PipelineTranscriptStorage(tmp_path / "pipeline")
+    messages = [
+        Message(
+            role="user",
+            content=[TextBlock(text="diagram"), ImageBlock(media_type="image/png", data="aGVsbG8=")],
+        )
+    ]
+
+    storage.save("/repo", "transcript_att_0001", messages)
+    loaded = storage.load("/repo", "transcript_att_0001")
+
+    assert loaded == messages  # both the text block and the image block survive save/load
+
+
 def test_transcript_lives_inside_sidecar(tmp_path: Path):
     storage = PipelineTranscriptStorage(tmp_path / "pipeline")
 
diff --git a/tests/pipeline/engine/test_types.py b/tests/pipeline/engine/test_types.py
index 516aa869..a9ff4fa9 100644
--- a/tests/pipeline/engine/test_types.py
+++ b/tests/pipeline/engine/test_types.py
@@ -1,4 +1,4 @@
-from iac_code.pipeline.engine.types import RollbackRule, StepConfig, StepResult, StepStatus
+from iac_code.pipeline.engine.types import StepConfig, StepResult, StepStatus
 
 
 class TestStepStatus:
@@ -13,22 +13,6 @@ def test_is_str_enum(self):
         assert isinstance(StepStatus.PENDING, str)
 
 
-class TestRollbackRule:
-    def test_basic_construction(self):
-        rule = RollbackRule(target_step="intent_parsing", condition="user_request")
-        assert rule.target_step == "intent_parsing"
-        assert rule.condition == "user_request"
-        assert rule.invalidates == []
-
-    def test_with_invalidates(self):
-        rule = RollbackRule(
-            target_step="architecture_planning",
-            condition="cost_too_high",
-            invalidates=["specs", "template"],
-        )
-        assert rule.invalidates == ["specs", "template"]
-
-
 class TestStepConfig:
     def test_defaults(self):
         config = StepConfig(
@@ -38,22 +22,21 @@ def test_defaults(self):
         )
         assert config.auto_advance is True
         assert config.max_agent_turns == 50
-        assert config.rollback_rules == []
+        assert config.rollback_targets == []
 
     def test_custom_values(self):
-        rules = [RollbackRule(target_step="prev", condition="wrong")]
         config = StepConfig(
             step_id="my_step",
             conclusion_field="my_field",
             forward=None,
-            rollback_rules=rules,
+            rollback_targets=["prev"],
             auto_advance=False,
             max_agent_turns=20,
         )
         assert config.forward is None
         assert config.auto_advance is False
         assert config.max_agent_turns == 20
-        assert len(config.rollback_rules) == 1
+        assert config.rollback_targets == ["prev"]
 
 
 class TestStepResult:
diff --git a/tests/pipeline/engine/test_ui_contract.py b/tests/pipeline/engine/test_ui_contract.py
index 2a8344c9..66547906 100644
--- a/tests/pipeline/engine/test_ui_contract.py
+++ b/tests/pipeline/engine/test_ui_contract.py
@@ -22,11 +22,46 @@ def test_encode_selected_candidate_returns_json_string():
     assert payload == {"selected_candidate_name": "Same", "selected_candidate_index": 1}
 
 
+def test_encode_selected_candidate_can_include_parameter_overrides():
+    payload = json.loads(encode_selected_candidate("Same", 1, {"InstanceType": "ecs.g7.large"}))
+    assert payload == {
+        "selected_candidate_name": "Same",
+        "selected_candidate_index": 1,
+        "parameter_overrides": {"InstanceType": "ecs.g7.large"},  # third argument, emitted under this key
+    }
+
+
 def test_parse_selected_candidate_accepts_structured_json_string():
     parsed = parse_selected_candidate('{"selected_candidate_name": "Same", "selected_candidate_index": 1}')
     assert parsed is not None
     assert parsed.selected_candidate_name == "Same"
     assert parsed.selected_candidate_index == 1
+    assert parsed.parameter_overrides == {}
+
+
+def test_parse_selected_candidate_accepts_parameter_overrides():
+    parsed = parse_selected_candidate(
+        '{"selected_candidate_name": "Same", "selected_candidate_index": 1, '
+        '"parameter_overrides": {"InstanceType": "ecs.g7.large", "Optional": null}}'
+    )
+    assert parsed is not None
+    assert parsed.selected_candidate_name == "Same"
+    assert parsed.selected_candidate_index == 1
+    assert parsed.parameter_overrides == {"InstanceType": "ecs.g7.large"}  # null-valued "Optional" is dropped
+
+
+def test_parse_selected_candidate_accepts_parameters_alias_for_a2a_payloads():
+    parsed = parse_selected_candidate('{"selected_candidate_index": 1, "parameters": {"ZoneId": "cn-hangzhou-k"}}')
+    assert parsed is not None
+    assert parsed.selected_candidate_index == 1
+    assert parsed.parameter_overrides == {"ZoneId": "cn-hangzhou-k"}  # "parameters" read as parameter_overrides
+
+
+def test_parse_selected_candidate_rejects_invalid_parameter_overrides():
+    parsed = parse_selected_candidate(
+        '{"selected_candidate_name": "Same", "selected_candidate_index": 1, "parameter_overrides": "bad"}'
+    )
+    assert parsed is None  # a string-valued parameter_overrides rejects the whole payload
 
 
 def test_parse_selected_candidate_accepts_legacy_plain_name():
@@ -34,6 +69,7 @@ def test_parse_selected_candidate_accepts_legacy_plain_name():
     assert parsed is not None
     assert parsed.selected_candidate_name == "Same"
     assert parsed.selected_candidate_index is None
+    assert parsed.parameter_overrides == {}
 
 
 def test_parse_selected_candidate_extracts_zero_based_index_from_natural_language_choice():
diff --git a/tests/pipeline/engine/test_user_input.py b/tests/pipeline/engine/test_user_input.py
new file mode 100644
index 00000000..538b5d83
--- /dev/null
+++ b/tests/pipeline/engine/test_user_input.py
@@ -0,0 +1,55 @@
+from iac_code.agent.message import ImageBlock, TextBlock, ToolResultBlock
+from iac_code.pipeline.engine.user_input import (
+    PipelineUserInput,
+    content_display_text,
+    content_has_images,
+    normalize_pipeline_user_input,
+)
+
+
+def test_normalize_string_input() -> None:
+    value = normalize_pipeline_user_input("create an ecs")
+
+    assert value == PipelineUserInput(  # plain text is kept as both content and display text
+        content="create an ecs",
+        display_text="create an ecs",
+        has_images=False,
+    )
+    assert value.is_empty is False
+
+
+def test_normalize_image_only_input_is_not_empty() -> None:
+    image = ImageBlock(media_type="image/png", data="aGVsbG8=")
+
+    value = normalize_pipeline_user_input([image])
+
+    assert value.content == [image]
+    assert value.display_text == "[Image input]"  # placeholder text when the input has no text block
+    assert value.has_images is True
+    assert value.is_empty is False
+
+
+def test_content_display_text_extracts_text_and_tool_result_without_image_bytes() -> None:
+    blocks = [
+        TextBlock(text="text part"),
+        ImageBlock(media_type="image/png", data="aGVsbG8="),
+        ToolResultBlock(tool_use_id="toolu_1", content='{"answer":"ok"}'),
+    ]
+
+    assert content_has_images(blocks) is True
+    assert content_display_text(blocks) == 'text part\n{"answer":"ok"}'  # newline-joined; image adds nothing
+
+
+def test_with_prepended_text_preserves_original_image_block() -> None:
+    image = ImageBlock(media_type="image/png", data="aGVsbG8=")
+    value = normalize_pipeline_user_input([TextBlock(text="original"), image])
+
+    updated = value.with_prepended_text("rollback context")
+
+    assert updated.display_text == "rollback context\n\noriginal"  # prefix, blank line, original text
+    assert updated.has_images is True
+    assert updated.content == [
+        TextBlock(text="rollback context"),  # new block placed ahead of the original content
+        TextBlock(text="original"),
+        image,
+    ]
diff --git a/tests/pipeline/selling/skills/test_iac_aliyun_architecture_skill.py b/tests/pipeline/selling/skills/test_iac_aliyun_architecture_skill.py
index 0a491802..c29f5980 100644
--- a/tests/pipeline/selling/skills/test_iac_aliyun_architecture_skill.py
+++ b/tests/pipeline/selling/skills/test_iac_aliyun_architecture_skill.py
@@ -24,3 +24,13 @@ def test_architecture_consumes_intent_resource_lifecycle_contract():
     assert "use_existing/reference 必须作为已有资源引用" in body
     assert "不得生成 VSwitch" in body
     assert "forbidden_resources" not in body
+
+
+def test_architecture_prompt_guides_optional_memory_lookup_for_planning_context():
+    body = PROMPT_FILE.read_text(encoding="utf-8")
+
+    assert "不要读取项目文件或记忆" not in body  # "do not read project files or memory"
+    assert "read_memory({})" in body
+    assert "架构偏好" in body  # "architecture preferences"
+    assert "已有 VPC" in body  # "existing VPC"
+    assert "当前用户意图为准" in body  # "the current user intent takes precedence"
diff --git a/tests/pipeline/selling/skills/test_iac_aliyun_cost_skill.py b/tests/pipeline/selling/skills/test_iac_aliyun_cost_skill.py
index baf58fcc..51ba6007 100644
--- a/tests/pipeline/selling/skills/test_iac_aliyun_cost_skill.py
+++ b/tests/pipeline/selling/skills/test_iac_aliyun_cost_skill.py
@@ -9,6 +9,7 @@
 )
 SKILL_MD = SKILL_DIR / "SKILL.md"
 EVALS_JSON = SKILL_DIR / "evals.json"
+COST_PROMPT_MD = SKILL_DIR.parents[1] / "prompts" / "cost_estimating.md"
 
 
 def _direct_references_dir_or_skip() -> Path:
@@ -55,6 +56,20 @@ def test_description_mentions_cost(self):
         fm = _parse_frontmatter(content)
         assert "GetTemplateEstimateCost" in fm["description"] or "费用" in fm["description"]
 
+    def test_conclusion_schema_carries_deployment_parameters(self):
+        content = SKILL_MD.read_text(encoding="utf-8")
+        fm = _parse_frontmatter(content)
+        schema = fm["conclusion_schema"]  # schema taken from the parsed SKILL.md frontmatter
+        assert "deployment_parameters" in schema["required"]
+        assert schema["properties"]["deployment_parameters"]["type"] == "object"
+
+    def test_conclusion_schema_can_report_missing_deployment_parameters(self):
+        content = SKILL_MD.read_text(encoding="utf-8")
+        fm = _parse_frontmatter(content)
+        schema = fm["conclusion_schema"]  # schema taken from the parsed SKILL.md frontmatter
+        assert "missing_deployment_parameters" in schema["properties"]  # only checked as a property here
+        assert schema["properties"]["missing_deployment_parameters"]["type"] == "array"
+
 
 class TestSkillContentRosOnly:
     @pytest.fixture()
@@ -91,8 +106,61 @@ def test_modified_template_retry_limit_is_seven(self, body):
     def test_validate_template_policy_is_not_repeated(self, body):
         assert body.count("只有在修复或改写模板后") == 1
 
-    def test_contains_parameter_flattening(self, body):
-        assert "Parameters.1.ParameterKey" in body or "ParameterKey" in body
+    def test_uses_parameters_dictionary_auto_expansion(self, body):
+        assert '"Parameters": {' in body
+        assert "直接传字典格式" in body  # "pass the dictionary format directly"
+        assert "工具会自动展开" in body  # "the tool expands it automatically"
+        assert "Parameters.1.ParameterKey" not in body  # the flattened key form must be absent
+
+    def test_outputs_pricing_parameters_for_deployment(self, body):
+        assert "deployment_parameters" in body
+        assert "传递给 deploying" in body  # "passed to deploying"
+        assert "写入模板 Parameters 的 `Default`" not in body  # "write into the template Parameters' `Default`"
+        assert "沉淀参数默认值" not in body  # "persist parameter default values"
+
+    def test_contains_parameter_recommendation_flow(self, body):
+        assert "Pricing Parameter Set" in body
+        assert "Preview-Validated Pricing Parameter Set" in body
+        assert "references/template-parameter-recommendation.md" in body
+        assert "GetTemplateParameterConstraints" in body
+        assert "PreviewStack" in body
+        assert "AllowedValues" in body
+        assert "不得编造" in body  # "must not fabricate"
+        assert "外部输入" in body  # "external input"
+        assert "不执行 `PreviewStack`" not in body  # "do not run `PreviewStack`"
+        assert "写回模板的 Default 保持一致" not in body  # "match the Default written back to the template"
+
+    def test_existing_resource_parameters_can_use_api_candidates(self, body):
+        assert "VpcId、VSwitchId、SecurityGroupId、KeyPairName" in body
+        assert "API 返回候选不是编造" in body  # "API-returned candidates are not fabrication"
+        assert "先查询约束或只读资源候选" in body  # "first query constraints or read-only resource candidates"
+        assert "不要仅因参数名是 VpcId" in body  # "do not, merely because the parameter is named VpcId"
+
+    def test_preview_stack_uses_aliyun_api_not_ros_stack(self, body):
+        assert 'aliyun_api(product="ros", action="PreviewStack")' in body
+        assert "不要使用 `ros_stack` 执行 `PreviewStack`" in body  # do not run PreviewStack via ros_stack
+
+    def test_preview_stack_must_pass_stack_name_with_random_suffix(self, body):
+        assert "PreviewStack 必须传 StackName" in body  # "PreviewStack must pass StackName"
+        assert "随机串后缀" in body  # "random string suffix"
+        assert "避免重名" in body  # "avoid duplicate names"
+
+    def test_parameter_recommendation_precedes_initial_pricing(self, body):
+        assert "先直接询价" not in body  # "price directly first"
+        assert "首次询价前" in body  # "before the first pricing request"
+        assert "形成 Preview-Validated Pricing Parameter Set" in body  # "形成" = "form"
+
+    def test_preserves_preview_parameters_when_pricing_fails(self, body):
+        assert "PreviewStack 成功但询价失败" in body  # "PreviewStack succeeded but pricing failed"
+        assert "不要丢弃 Preview-Validated Pricing Parameter Set" in body  # "不要丢弃" = "do not discard"
+        assert "询价失败或外部输入缺失时填 `{}`" not in body  # "fill `{}` if pricing fails or input is missing"
+
+    def test_preview_stack_is_not_hard_gate_for_pricing(self, body):
+        assert "PreviewStack 不是硬门禁" in body  # "PreviewStack is not a hard gate"
+        assert "完整部署参数" in body  # "complete deployment parameters"
+        assert "GetTemplateEstimateCost" in body
+        assert "missing_deployment_parameters" in body
+        assert "选择阶段" in body and "parameter_overrides" in body  # "选择阶段" = "selection stage"
 
     def test_contains_template_url(self, body):
         assert "TemplateURL" in body
@@ -111,12 +179,15 @@ def test_no_doc_search_recommendation(self, body):
             if "aliyun_doc_search" in line:
                 assert "不要" in line or "不" in line or "禁" in line
 
-    def test_contains_resource_types(self, body):
-        assert "ALIYUN::ECS::VPC" in body
-        assert "ALIYUN::ECS::InstanceGroup" in body
+    def test_does_not_inline_common_resource_catalog(self, body):
+        assert "### 常用资源类型" not in body  # heading: "Common resource types"
+        assert "ALIYUN::ECS::VPC — 专有网络" not in body  # "专有网络" = "virtual private cloud"
+        assert "ALIYUN::ECS::InstanceGroup — ECS 实例" not in body  # "ECS 实例" = "ECS instance"
 
-    def test_contains_parameterization_rules(self, body):
-        assert "参数化" in body
+    def test_parameterization_details_stay_in_references(self, body):
+        assert "### 参数化规则" not in body  # heading: "Parameterization rules"
+        assert "| ECS | ZoneId, InstanceType" not in body  # a row of the inline parameter table
+        assert "references/template-parameters.md" in body
 
     def test_contains_error_handling(self, body):
         assert "失败" in body
@@ -193,6 +264,26 @@ def test_skill_content_matches_file(self):
         assert loaded.skills["iac-aliyun-cost"] == expected
 
 
+class TestCostPrompt:
+    def test_prompt_is_not_duplicate_output_reference(self):
+        body = COST_PROMPT_MD.read_text(encoding="utf-8")
+        assert "Preview-Validated Pricing Parameter Set" in body
+        assert "deployment_parameters" not in body
+        assert "询价失败但 PreviewStack 已成功" not in body  # "pricing failed but PreviewStack already succeeded"
+        assert "字段为字符串" not in body  # "the field is a string"
+
+    def test_prompt_names_preview_stack_tool_contract(self):
+        body = COST_PROMPT_MD.read_text(encoding="utf-8")
+        assert 'aliyun_api(product="ros", action="PreviewStack")' in body
+        assert "不要使用 `ros_stack` 执行 `PreviewStack`" in body  # do not run PreviewStack via ros_stack
+
+    def test_prompt_treats_preview_stack_as_soft_gate(self):
+        body = COST_PROMPT_MD.read_text(encoding="utf-8")
+        assert "优先通过" in body  # roughly "preferably via"
+        assert "不是硬门禁" in body  # "is not a hard gate"
+        assert "参数缺口" in body  # "parameter gap"
+
+
 class TestEvalsJson:
     def test_evals_file_exists(self):
         assert EVALS_JSON.exists()
@@ -201,6 +292,42 @@ def test_valid_json(self):
         data = json.loads(EVALS_JSON.read_text(encoding="utf-8"))
         assert isinstance(data, dict)
 
+    def test_evals_follow_parameter_dictionary_contract(self):
+        text = EVALS_JSON.read_text(encoding="utf-8")
+        assert "Parameters.<N>.ParameterKey" not in text
+        assert "Parameters.1.ParameterKey" not in text
+        assert "deployment_parameters" in text
+
+    def test_evals_do_not_require_validation_before_initial_pricing(self):
+        text = EVALS_JSON.read_text(encoding="utf-8")
+        assert "先校验" not in text
+
+    def test_evals_keep_preview_parameters_on_pricing_failure(self):
+        text = EVALS_JSON.read_text(encoding="utf-8")
+        assert "PreviewStack 成功但询价失败" in text
+        assert "不丢弃" in text
+
+    def test_evals_assert_preview_stack_api_tool_contract(self):
+        data = json.loads(EVALS_JSON.read_text(encoding="utf-8"))
+        checks = "\n".join(assertion["check"] for ev in data["evals"] for assertion in ev["assertions"])
+        assert 'aliyun_api(product="ros", action="PreviewStack")' in checks
+        assert "不使用 ros_stack" in checks
+
+    def test_evals_cover_existing_vpc_parameter_recommendation(self):
+        data = json.loads(EVALS_JSON.read_text(encoding="utf-8"))
+        eval_text = json.dumps(data, ensure_ascii=False)
+        assert "existing-vpc-vswitch-cost" in eval_text
+        assert "ALIYUN::ECS::VPC::VPCId" in eval_text
+        assert "VpcId" in eval_text
+        assert "API 返回候选不是编造" in eval_text
+
+    def test_evals_cover_preview_stack_soft_gate(self):
+        data = json.loads(EVALS_JSON.read_text(encoding="utf-8"))
+        eval_text = json.dumps(data, ensure_ascii=False)
+        assert "preview-soft-gate-partial-pricing" in eval_text
+        assert "PreviewStack 不是硬门禁" in eval_text
+        assert "missing_deployment_parameters" in eval_text
+
     def test_has_required_fields(self):
         data = json.loads(EVALS_JSON.read_text(encoding="utf-8"))
         assert data["skill_name"] == "iac-aliyun-cost"
diff --git a/tests/pipeline/selling/skills/test_iac_aliyun_deploying_skill.py b/tests/pipeline/selling/skills/test_iac_aliyun_deploying_skill.py
index 79c6425c..5cb964df 100644
--- a/tests/pipeline/selling/skills/test_iac_aliyun_deploying_skill.py
+++ b/tests/pipeline/selling/skills/test_iac_aliyun_deploying_skill.py
@@ -1,6 +1,7 @@
 import json
 from pathlib import Path
 
+import jsonschema
 import pytest
 import yaml
 
@@ -55,6 +56,18 @@ def test_description_mentions_ros(self):
         fm = _parse_frontmatter(content)
         assert "ROS" in fm["description"]
 
+    def test_conclusion_schema_requires_stack_id_for_success_and_error_for_failed(self):
+        content = SKILL_MD.read_text(encoding="utf-8")
+        fm = _parse_frontmatter(content)
+        schema = fm["conclusion_schema"]
+
+        jsonschema.validate({"status": "success", "stack_id": "stack-123"}, schema)
+        jsonschema.validate({"status": "failed", "error": "CREATE_FAILED"}, schema)
+        with pytest.raises(jsonschema.ValidationError):
+            jsonschema.validate({"status": "success"}, schema)
+        with pytest.raises(jsonschema.ValidationError):
+            jsonschema.validate({"status": "failed"}, schema)
+
 
 class TestSkillContentRosOnly:
     @pytest.fixture()
@@ -75,6 +88,44 @@ def test_contains_ros_stack(self, body):
     def test_contains_availability_query(self, body):
         assert "可用性查询" in body
 
+    def test_deploying_uses_parameters_without_preview_recommendation(self, body):
+        assert "部署参数装配" in body
+        assert "selected_plan.effective_deployment_parameters" in body
+        assert "CreateStack" in body
+        assert "GetTemplateParameterConstraints" not in body
+        assert "PreviewStack" not in body
+        assert "Preview-Validated Parameter Set" not in body
+        assert "参数推荐" not in body
+
+    def test_create_stack_name_has_random_suffix(self, body):
+        assert "StackName" in body
+        assert "随机串后缀" in body
+        assert "避免重名" in body
+
+    def test_prefers_cost_deployment_parameters(self, body):
+        assert "selected_plan.selected_candidate_result.cost.deployment_parameters" in body
+        assert "按以下优先级" in body
+        assert "前序成本步骤沉淀的 Default" not in body
+
+    def test_prefers_effective_deployment_parameters(self, body):
+        assert "selected_plan.effective_deployment_parameters" in body
+        assert "最终部署参数集" in body
+        assert "GetTemplateEstimateCost" not in body
+
+    def test_availability_conflict_prefers_non_user_parameters_first(self, body):
+        assert "优先调整非用户指定参数" in body
+        assert "仍无法成功创建资源栈" in body
+        assert "才可调整用户指定参数" in body
+
+    def test_skill_omits_discussion_process_terms(self, body):
+        forbidden = ["A2A", "前端", "客户端", "方案 A", "方案 B", "策略 A", "策略 B", "讨论"]
+        for phrase in forbidden:
+            assert phrase not in body
+
+    def test_does_not_mention_stack_instances(self, body):
+        assert "CreateStackInstances" not in body
+        assert "UpdateStackInstances" not in body
+
     def test_contains_template_validation(self, body):
         assert "ValidateTemplate" in body
         assert "模板校验" in body
@@ -113,13 +164,50 @@ def test_pipeline_confirmed_deploy_does_not_ask_again(self, body):
         assert "不要再次请求用户确认" in body
         assert "不得用 status: cancelled 表示等待用户确认" in body
 
+    def test_delete_requires_explicit_delete_confirmation(self, body):
+        assert "删除请求本身不等于删除确认" in body
+        assert "`delete_confirmed: true`" in body
+        assert "确认删除" in body
+        assert "未收到明确删除确认前，不得调用 `ros_stack` 的 `DeleteStack`" in body
+
 
 class TestDeployingPrompt:
     def test_pipeline_confirmed_deploy_is_direct_execution(self):
         body = DEPLOYING_PROMPT_MD.read_text(encoding="utf-8")
         assert "不要再次询问是否确认部署" in body
-        assert "不得用 status: cancelled 表示等待用户确认" in body
-        assert "只有用户明确取消部署时" in body
+        assert "不得用 status: cancelled 表示等待用户确认" not in body
+        assert "只有用户明确取消部署时" not in body
+
+    def test_prompt_defers_parameter_priority_to_skill(self):
+        body = DEPLOYING_PROMPT_MD.read_text(encoding="utf-8")
+        assert "selected_plan.selected_candidate_result.cost.deployment_parameters" not in body
+        assert "部署参数按以下优先级装配" not in body
+        assert "部署参数装配规则见技能" in body
+
+    def test_prompt_keeps_no_repricing_without_parameter_priority_duplication(self):
+        body = DEPLOYING_PROMPT_MD.read_text(encoding="utf-8")
+        assert "部署步骤不计算费用" in body
+        assert "selected_plan.effective_deployment_parameters" not in body
+        assert "GetTemplateEstimateCost" not in body
+
+    def test_prompt_does_not_repeat_parameter_adjustment_rules(self):
+        body = DEPLOYING_PROMPT_MD.read_text(encoding="utf-8")
+        assert "优先调整非用户指定参数" not in body
+        assert "仍无法成功创建资源栈" not in body
+        assert "才可调整用户指定参数" not in body
+        assert "可用区不可用 → 自动更换可用区重试" not in body
+
+    def test_prompt_omits_discussion_process_terms(self):
+        body = DEPLOYING_PROMPT_MD.read_text(encoding="utf-8")
+        forbidden = ["A2A", "前端", "客户端", "方案 A", "方案 B", "策略 A", "策略 B", "讨论"]
+        for phrase in forbidden:
+            assert phrase not in body
+
+    def test_prompt_delete_requires_explicit_delete_confirmation(self):
+        body = DEPLOYING_PROMPT_MD.read_text(encoding="utf-8")
+        assert "删除请求本身不等于删除确认" in body
+        assert "`delete_confirmed: true`" in body
+        assert "未收到明确删除确认前，不得调用 `ros_stack` 的 `DeleteStack`" in body
 
 
 class TestSkillDiscovery:
@@ -195,3 +283,18 @@ def test_eval_names_are_unique(self):
         data = json.loads(EVALS_JSON.read_text(encoding="utf-8"))
         names = [ev["name"] for ev in data["evals"]]
         assert len(names) == len(set(names))
+
+    def test_delete_evals_split_confirmation_and_execution(self):
+        data = json.loads(EVALS_JSON.read_text(encoding="utf-8"))
+        evals_by_name = {ev["name"]: ev for ev in data["evals"]}
+
+        confirmation_eval = evals_by_name["delete-stack-confirmation"]
+        confirmation_assertions = {assertion["name"] for assertion in confirmation_eval["assertions"]}
+        assert "user_confirmation" in confirmation_assertions
+        assert "uses_delete_stack" not in confirmation_assertions
+        assert "no_delete_without_confirmation" in confirmation_assertions
+
+        confirmed_eval = evals_by_name["delete-stack-confirmed"]
+        confirmed_assertions = {assertion["name"] for assertion in confirmed_eval["assertions"]}
+        assert "确认" in confirmed_eval["prompt"]
+        assert "uses_delete_stack" in confirmed_assertions
diff --git a/tests/pipeline/selling/skills/test_iac_aliyun_intent_skill.py b/tests/pipeline/selling/skills/test_iac_aliyun_intent_skill.py
index bfda5ee4..f7b64857 100644
--- a/tests/pipeline/selling/skills/test_iac_aliyun_intent_skill.py
+++ b/tests/pipeline/selling/skills/test_iac_aliyun_intent_skill.py
@@ -49,6 +49,16 @@ def test_intent_prompt_requires_question_before_completion_for_ambiguous_guidabl
     assert "不要把 `is_infra_intent`" in body
 
 
+def test_intent_prompt_guides_optional_memory_lookup_without_overriding_current_input():
+    body = PROMPT_FILE.read_text(encoding="utf-8")
+
+    assert "不要读取项目文件或记忆" not in body
+    assert "read_memory({})" in body
+    assert "已有资源" in body
+    assert "当前用户输入为准" in body
+    assert "不要因为没有相关记忆而阻塞" in body
+
+
 def test_intent_prompt_pins_extremely_vague_launch_to_detail_request():
     body = PROMPT_FILE.read_text(encoding="utf-8")
 
@@ -118,6 +128,25 @@ def test_intent_schema_captures_resource_lifecycle_fields():
     assert "forbidden_resources" not in properties
 
 
+def test_intent_schema_captures_stack_name_and_network_constraints_without_e2e_controls():
+    body = (SKILL_DIR / "SKILL.md").read_text(encoding="utf-8")
+    prompt = PROMPT_FILE.read_text(encoding="utf-8")
+    schema = _parse_frontmatter(body)["conclusion_schema"]
+    non_functional = schema["properties"]["non_functional"]["properties"]
+
+    assert non_functional["stack_name"]["type"] == "string"
+    assert "资源栈名称" in non_functional["stack_name"]["description"]
+    assert non_functional["network_constraints"]["type"] == "object"
+    assert "deployment_hold" not in non_functional
+    assert "non_functional.stack_name" in prompt
+    assert "non_functional.network_constraints" in prompt
+    assert "deployment_hold" not in body
+    assert "部署后等待用户继续" not in body
+    assert "CreateStack 的 params.StackName" not in prompt
+    assert "first/second" not in body
+    assert "first/second" not in prompt
+
+
 def test_intent_guidance_preserves_existing_resource_lifecycle():
     body = (SKILL_DIR / "SKILL.md").read_text(encoding="utf-8")
 
diff --git a/tests/pipeline/selling/skills/test_template_generating_skill.py b/tests/pipeline/selling/skills/test_template_generating_skill.py
index ae94c6dd..a184ef1a 100644
--- a/tests/pipeline/selling/skills/test_template_generating_skill.py
+++ b/tests/pipeline/selling/skills/test_template_generating_skill.py
@@ -67,15 +67,29 @@ def test_no_terraform_references(self, body):
     def test_contains_ros_template_format(self, body):
         assert "ROSTemplateFormatVersion" in body or "ROS" in body
 
-    def test_contains_parameterization_rules(self, body):
-        assert "参数化规则" in body
+    def test_parameterization_guidance_points_to_references_without_inline_table(self, body):
+        assert "库存相关属性" in body
+        assert "references/cloud-products/" in body
+        assert "| ECS | ZoneId, InstanceType" not in body
 
     def test_contains_validation_step(self, body):
         assert "ValidateTemplate" in body
 
-    def test_contains_resource_types(self, body):
-        assert "ALIYUN::ECS::VPC" in body
-        assert "ALIYUN::ECS::InstanceGroup" in body
+    def test_must_read_ros_template_reference_before_generation(self, body):
+        assert "必须" in body
+        assert "references/ros-template.md" in body
+        assert "未阅读不得生成模板" in body
+
+    def test_does_not_inline_common_resource_catalog(self, body):
+        assert "## 常用资源类型" not in body
+        assert "ALIYUN::ECS::VPC: 创建专有网络" not in body
+        assert "ALIYUN::ECS::InstanceGroup: 创建 N 个 ECS 实例" not in body
+        assert "references/ros-template.md" in body
+
+    def test_run_command_details_stay_in_reference(self, body):
+        assert "## 在实例中执行命令" not in body
+        assert "ALIYUN::ECS::RunCommand + `CommandContent`" not in body
+        assert "references/ros-template.md" in body
 
     def test_no_deploy_flow(self, body):
         assert "CreateStack" not in body
@@ -139,6 +153,30 @@ def test_full_prompt_includes_skill_base_directory(self, tmp_path):
 
         assert f"Base directory for this skill: {SKILL_DIR}" in prompt
 
+    def test_agent_loop_trusts_skill_base_directory_for_tools(self, tmp_path):
+        from iac_code.pipeline.engine.context import PipelineContext
+        from iac_code.pipeline.engine.loader import load_pipeline_dir
+        from iac_code.pipeline.engine.step_executor import StepExecutor
+        from iac_code.tools.base import ToolRegistry
+
+        pipeline_dir = SKILL_DIR.parents[1]
+        loaded = load_pipeline_dir(pipeline_dir)
+        step = next(s for s in loaded.sub_pipelines["evaluate_candidate"].steps if s.step_id == "template_generating")
+        context = PipelineContext({"candidate": []})
+        context.set_conclusion("candidate", {"output_path": "templates/example.yml"})
+
+        agent_context = StepExecutor(
+            provider_manager=MagicMock(),
+            base_tool_registry=ToolRegistry(),
+            pipeline=loaded,
+            pipeline_dir=pipeline_dir,
+            cwd=str(tmp_path),
+        ).build_agent_loop_context(step, context, "session-1")
+
+        assert agent_context.agent_loop is not None
+        assert str(SKILL_DIR) in agent_context.agent_loop._tool_context_trusted_read_directories
+        assert str(SKILL_DIR) in agent_context.agent_loop._tool_context_relative_read_directories
+
 
 class TestEvalsJson:
     def test_evals_file_exists(self):
diff --git a/tests/pipeline/selling/test_deploying_cleanup_hook.py b/tests/pipeline/selling/test_deploying_cleanup_hook.py
new file mode 100644
index 00000000..86eacfa5
--- /dev/null
+++ b/tests/pipeline/selling/test_deploying_cleanup_hook.py
@@ -0,0 +1,226 @@
+from __future__ import annotations
+
+import logging
+
+from iac_code.pipeline.engine.cleanup import CleanupLedger
+from iac_code.pipeline.engine.context import PipelineContext
+from iac_code.pipeline.selling.hooks import deploying
+from iac_code.types.stream_events import ResourceObservedEvent
+
+
+def test_deploying_hook_returns_ros_create_stack_observation_without_persisting(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ctx = PipelineContext({})
+    event = ResourceObservedEvent(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        resource_name="demo",
+        region_id="cn-hangzhou",
+        action="CreateStack",
+        tool_name="ros_stack",
+        tool_use_id="toolu-create",
+        metadata={"params": {"TemplateBody": "secret template", "Password": "secret"}},
+    )
+
+    observed = deploying.on_resource_observed(ctx, event, ledger=ledger, step_id="deploying", attempt_id="att_0001")
+
+    assert observed is not None
+    assert observed.provider == "ros"
+    assert observed.resource_type == "stack"
+    assert observed.resource_id == "stack-123"
+    assert observed.source_step_id == "deploying"
+    assert observed.source_attempt_id == "att_0001"
+    assert observed.metadata == {"tool_name": "ros_stack", "tool_use_id": "toolu-create"}
+    assert ledger.observed_resources() == []
+
+
+def test_deploying_hook_ignores_non_create_stack_observations(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ctx = PipelineContext({})
+
+    observed = deploying.on_resource_observed(
+        ctx,
+        ResourceObservedEvent(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-123",
+            action="UpdateStack",
+        ),
+        ledger=ledger,
+        step_id="deploying",
+        attempt_id="att_0001",
+    )
+
+    assert observed is None
+    assert ledger.observed_resources() == []
+
+
+def test_deploying_hook_marks_only_deploying_rollback_resources(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ctx = PipelineContext({})
+    observed = deploying.on_resource_observed(
+        ctx,
+        ResourceObservedEvent(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-123",
+            resource_name="demo",
+            region_id="cn-hangzhou",
+            action="CreateStack",
+        ),
+        ledger=ledger,
+        step_id="deploying",
+        attempt_id="att_0001",
+    )
+    assert observed is not None
+    ledger.record_observed(observed)
+
+    cleanup = deploying.on_rollback_cleanup_required(
+        ctx,
+        ledger=ledger,
+        from_step="deploying",
+        from_attempt_id="att_0001",
+        to_step="confirm_and_select",
+        reason="invalid selection",
+    )
+
+    assert len(cleanup) == 1
+    assert cleanup[0].resource_id == "stack-123"
+    assert cleanup[0].cleanup_reason == "invalid selection"
+    assert ledger.pending_resources() == []
+
+
+def test_deploying_hook_ignores_other_step_rollbacks(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ctx = PipelineContext({})
+    observed = deploying.on_resource_observed(
+        ctx,
+        ResourceObservedEvent(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-123",
+            action="CreateStack",
+        ),
+        ledger=ledger,
+        step_id="deploying",
+        attempt_id="att_0001",
+    )
+    assert observed is not None
+    ledger.record_observed(observed)
+
+    cleanup = deploying.on_rollback_cleanup_required(
+        ctx,
+        ledger=ledger,
+        from_step="confirm_and_select",
+        from_attempt_id="att_0001",
+        to_step="architecture_planning",
+        reason="retry",
+    )
+
+    assert cleanup == []
+    assert ledger.pending_resources() == []
+
+
+def test_deploying_hook_warns_when_attempt_id_missing(tmp_path, caplog) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ctx = PipelineContext({})
+    caplog.set_level(logging.WARNING, logger="iac_code.pipeline.selling.hooks.deploying")
+
+    cleanup = deploying.on_rollback_cleanup_required(
+        ctx,
+        ledger=ledger,
+        from_step="deploying",
+        from_attempt_id=None,
+        to_step="confirm_and_select",
+        reason="retry",
+    )
+
+    assert cleanup == []
+    assert "Skipping deploying cleanup hook because from_attempt_id is missing" in caplog.text
+
+
+def test_deploying_hook_marks_only_current_attempt_resources(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ctx = PipelineContext({})
+    first = deploying.on_resource_observed(
+        ctx,
+        ResourceObservedEvent(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-old",
+            region_id="cn-hangzhou",
+            action="CreateStack",
+        ),
+        ledger=ledger,
+        step_id="deploying",
+        attempt_id="att_0001",
+    )
+    second = deploying.on_resource_observed(
+        ctx,
+        ResourceObservedEvent(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-current",
+            region_id="cn-hangzhou",
+            action="CreateStack",
+        ),
+        ledger=ledger,
+        step_id="deploying",
+        attempt_id="att_0002",
+    )
+    assert first is not None
+    assert second is not None
+    ledger.record_observed(first)
+    ledger.record_observed(second)
+
+    cleanup = deploying.on_rollback_cleanup_required(
+        ctx,
+        ledger=ledger,
+        from_step="deploying",
+        from_attempt_id="att_0002",
+        to_step="confirm_and_select",
+        reason="retry current attempt",
+    )
+
+    assert [resource.resource_id for resource in cleanup] == ["stack-current"]
+
+
+def test_deploying_cleanup_ledger_does_not_persist_observed_secret_metadata(tmp_path) -> None:
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ctx = PipelineContext({})
+    observed = deploying.on_resource_observed(
+        ctx,
+        ResourceObservedEvent(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-secret",
+            resource_name="demo",
+            region_id="cn-hangzhou",
+            action="CreateStack",
+            tool_name="ros_stack",
+            tool_use_id="toolu-create",
+            metadata={"params": {"TemplateBody": "secret template body", "DbPassword": "super-secret"}},
+        ),
+        ledger=ledger,
+        step_id="deploying",
+        attempt_id="att_0001",
+    )
+    assert observed is not None
+
+    ledger.record_observed(observed)
+    cleanup = deploying.on_rollback_cleanup_required(
+        ctx,
+        ledger=ledger,
+        from_step="deploying",
+        from_attempt_id="att_0001",
+        to_step="confirm_and_select",
+        reason="rollback",
+    )
+    ledger.mark_cleanup_required(cleanup, source_step_id="deploying", reason="rollback")
+
+    text = ledger.path.read_text(encoding="utf-8")
+    assert "secret template body" not in text
+    assert "super-secret" not in text
+    assert "TemplateBody" not in text
+    assert "DbPassword" not in text
diff --git a/tests/pipeline/selling/test_deploying_hook.py b/tests/pipeline/selling/test_deploying_hook.py
index 1cff2dd9..fc716b49 100644
--- a/tests/pipeline/selling/test_deploying_hook.py
+++ b/tests/pipeline/selling/test_deploying_hook.py
@@ -35,6 +35,64 @@ def test_normalize_selected_plan_adds_resolution_metadata():
     assert normalized["selection"]["selected_candidate_index"] == 0
 
 
+def test_normalize_selected_plan_preserves_cost_deployment_parameters():
+    evaluated_candidates = [
+        {
+            "candidate": {"name": "WithParams", "output_path": "templates/a.yml"},
+            "failed": False,
+            "cost": {"deployment_parameters": {"ZoneId": "cn-hangzhou-k", "InstanceType": "ecs.g7.large"}},
+        }
+    ]
+    selected_plan = {"user_input": encode_selected_candidate("WithParams", 0), "options": []}
+
+    normalized = normalize_selected_plan(selected_plan, evaluated_candidates)
+
+    assert normalized["selection_valid"] is True
+    assert normalized["selected_candidate_result"]["cost"]["deployment_parameters"] == {
+        "ZoneId": "cn-hangzhou-k",
+        "InstanceType": "ecs.g7.large",
+    }
+
+
+def test_normalize_selected_plan_applies_user_parameter_overrides():
+    evaluated_candidates = [
+        {
+            "candidate": {"name": "WithParams", "output_path": "templates/a.yml"},
+            "failed": False,
+            "cost": {
+                "deployment_parameters": {
+                    "ZoneId": "cn-hangzhou-k",
+                    "InstanceType": "ecs.g7.large",
+                    "SystemDiskCategory": "cloud_essd",
+                }
+            },
+        }
+    ]
+    selected_plan = {
+        "user_input": encode_selected_candidate(
+            "WithParams",
+            0,
+            {"InstanceType": "ecs.c7.large", "ImageId": "centos_stream_9_x64_20G_alibase_20260414.vhd"},
+        ),
+        "options": [],
+    }
+
+    normalized = normalize_selected_plan(selected_plan, evaluated_candidates)
+
+    assert normalized["selection_valid"] is True
+    assert normalized["parameter_overrides"] == {
+        "InstanceType": "ecs.c7.large",
+        "ImageId": "centos_stream_9_x64_20G_alibase_20260414.vhd",
+    }
+    assert normalized["effective_deployment_parameters"] == {
+        "ZoneId": "cn-hangzhou-k",
+        "InstanceType": "ecs.c7.large",
+        "SystemDiskCategory": "cloud_essd",
+        "ImageId": "centos_stream_9_x64_20G_alibase_20260414.vhd",
+    }
+    assert normalized["cost_estimate_parameter_overridden"] is True
+
+
 def test_normalize_selected_plan_resolves_natural_language_zero_based_choice():
     selected_plan = {"user_input": "我选择方案0", "options": []}
     normalized = normalize_selected_plan(selected_plan, _evaluated_candidates())
diff --git a/tests/pipeline/selling/test_deploying_prompt.py b/tests/pipeline/selling/test_deploying_prompt.py
new file mode 100644
index 00000000..13c4b468
--- /dev/null
+++ b/tests/pipeline/selling/test_deploying_prompt.py
@@ -0,0 +1,49 @@
+from pathlib import Path
+
+from iac_code.pipeline.engine.context import PipelineContext
+from iac_code.pipeline.engine.loader import load_pipeline_dir
+from iac_code.pipeline.engine.step_spec import render_prompt
+
+
+def _selling_dir() -> Path:
+    return Path(__file__).resolve().parents[3] / "src" / "iac_code" / "pipeline" / "selling"
+
+
+def test_deploying_prompt_preserves_explicit_stack_name_without_e2e_controls() -> None:
+    selling_dir = _selling_dir()
+    loaded = load_pipeline_dir(selling_dir)
+    deploying_step = next(step for step in loaded.steps if step.step_id == "deploying")
+    stack_name = "iac-e2e-original-intent"
+
+    ctx = PipelineContext(loaded.context_dependencies)
+    ctx.set_conclusion(
+        "intent",
+        {
+            "requirement": f"创建 VSwitch，部署资源栈 StackName 必须精确等于 {stack_name}",
+            "non_functional": {"stack_name": stack_name},
+        },
+    )
+    ctx.set_conclusion(
+        "selected_plan",
+        {
+            "selection_valid": True,
+            "selected_candidate": {"name": "existing-vpc-vswitch", "output_path": "templates/vswitch.yml"},
+        },
+    )
+    ctx.set_conclusion("evaluated_candidates", [{"candidate": {"name": "existing-vpc-vswitch"}}])
+
+    prompt = render_prompt(
+        (selling_dir / deploying_step.prompt_file).read_text(encoding="utf-8"),
+        ctx,
+        deploying_step.context_fields,
+    )
+
+    assert "intent" in deploying_step.context_fields
+    assert stack_name in prompt
+    assert "params.StackName" in prompt
+    assert "必须精确等于该名称" in prompt
+    assert "用户未明确指定 StackName" in prompt
+    assert "禁止省略 `params.StackName`" not in prompt
+    assert "vswitch-in-existing-vpc" not in prompt
+    assert "部署后是否等待用户继续" not in prompt
+    assert "如果无法确定应使用的 StackName，不要调用 `CreateStack`" not in prompt
diff --git a/tests/pipeline/selling/test_memory_policy.py b/tests/pipeline/selling/test_memory_policy.py
new file mode 100644
index 00000000..e153c4c0
--- /dev/null
+++ b/tests/pipeline/selling/test_memory_policy.py
@@ -0,0 +1,42 @@
+from __future__ import annotations
+
+from pathlib import Path
+
+from iac_code.pipeline.engine.loader import load_pipeline_dir
+
+
+def _selling_dir() -> Path:
+    return Path(__file__).resolve().parents[3] / "src" / "iac_code" / "pipeline" / "selling"
+
+
+def _step_by_id(step_id: str):
+    loaded = load_pipeline_dir(_selling_dir())
+    return next(step for step in loaded.steps if step.step_id == step_id)
+
+
+def _sub_step_by_id(sub_pipeline_name: str, step_id: str):
+    loaded = load_pipeline_dir(_selling_dir())
+    return next(step for step in loaded.sub_pipelines[sub_pipeline_name].steps if step.step_id == step_id)
+
+
+def test_memory_read_is_available_to_steps_that_need_autonomous_context_choice() -> None:
+    intent = _step_by_id("intent_parsing")
+    architecture = _step_by_id("architecture_planning")
+
+    assert intent.tools is not None
+    assert "read_memory" in intent.tools.include
+    assert architecture.tools is not None
+    assert "read_memory" in architecture.tools.include
+
+
+def test_pipeline_steps_do_not_offer_write_memory_by_default() -> None:
+    template = _sub_step_by_id("evaluate_candidate", "template_generating")
+    cost = _sub_step_by_id("evaluate_candidate", "cost_estimating")
+    deploying = _step_by_id("deploying")
+
+    assert template.tools is not None
+    assert "write_memory" in template.tools.exclude
+    assert cost.tools is not None
+    assert "write_memory" in cost.tools.exclude
+    assert deploying.tools is not None
+    assert "write_memory" in deploying.tools.exclude
diff --git a/tests/pipeline/selling/test_terminal_ui_contract.py b/tests/pipeline/selling/test_terminal_ui_contract.py
index e6fad583..af0d60ac 100644
--- a/tests/pipeline/selling/test_terminal_ui_contract.py
+++ b/tests/pipeline/selling/test_terminal_ui_contract.py
@@ -18,18 +18,76 @@ def test_confirm_options_schema_requires_candidate_index():
     assert option_schema["properties"]["candidate_index"]["type"] == "integer"
 
 
+def test_confirm_schema_accepts_parameter_overrides():
+    loaded = load_pipeline_dir(_selling_pipeline_dir())
+    confirm = next(step for step in loaded.steps if step.step_id == "confirm_and_select")
+    schema = confirm.conclusion_schema
+    assert schema is not None
+
+    assert "parameter_overrides" in schema["properties"]
+    assert schema["properties"]["parameter_overrides"]["type"] == "object"
+
+
 def test_confirm_prompt_tells_model_to_output_candidate_index():
     prompt = (_selling_pipeline_dir() / "prompts" / "confirm_and_select.md").read_text(encoding="utf-8")
 
     assert "`options[].candidate_index`" in prompt
 
 
-def test_deploying_can_rollback_to_confirm_and_select_for_invalid_selection():
+def test_confirm_prompt_tells_model_to_preserve_parameter_overrides():
+    prompt = (_selling_pipeline_dir() / "prompts" / "confirm_and_select.md").read_text(encoding="utf-8")
+
+    assert "`parameter_overrides`" in prompt
+    assert "用户选择方案时传入" in prompt
+    assert "结构化 JSON" in prompt
+    forbidden = ["A2A", "前端", "客户端", "方案 A", "方案 B", "策略 A", "策略 B", "讨论"]
+    for phrase in forbidden:
+        assert phrase not in prompt
+
+
+def test_confirm_prompts_share_selection_contract_structure():
+    repl_prompt = (_selling_pipeline_dir() / "prompts" / "confirm_and_select.md").read_text(encoding="utf-8")
+    a2a_prompt = (_selling_pipeline_dir() / "prompts" / "confirm_and_select.a2a.md").read_text(encoding="utf-8")
+
+    shared_fragments = [
+        "## 首次执行",
+        "### 待选择结论",
+        "`complete_step.conclusion.options`",
+        "`complete_step.conclusion.user_prompt`",
+        "## 收到用户选择",
+        '"selected_candidate_index": 0',
+        "`parameter_overrides`",
+        "`parameters`",
+        "## 约束",
+        "不要在本步骤重新询价",
+        "不要修改模板 Default",
+    ]
+    for fragment in shared_fragments:
+        assert fragment in repl_prompt
+        assert fragment in a2a_prompt
+
+
+def test_confirm_a2a_surface_uses_thin_prompt_without_display_tools():
+    loaded = load_pipeline_dir(_selling_pipeline_dir())
+    confirm = next(step for step in loaded.steps if step.step_id == "confirm_and_select")
+    a2a = confirm.surface_overrides["a2a"]
+
+    assert a2a.prompt_file == "prompts/confirm_and_select.a2a.md"
+    assert a2a.inject_tools == []
+
+    prompt = (_selling_pipeline_dir() / "prompts" / "confirm_and_select.a2a.md").read_text(encoding="utf-8")
+    assert "`selected_candidate_index`" in prompt
+    assert "`parameter_overrides`" in prompt
+    assert "`complete_step.conclusion.user_prompt`" in prompt
+    assert "不要在本步骤重新询价" in prompt
+    assert "show_architecture_diagram" not in prompt
+    assert "show_candidate_detail" not in prompt
+
+
+def test_selling_steps_do_not_expose_static_rollback_rules():
     loaded = load_pipeline_dir(_selling_pipeline_dir())
-    deploying = next(step for step in loaded.steps if step.step_id == "deploying")
-    rollback_pairs = {(rule.target_step, rule.condition) for rule in deploying.rollback_rules}
 
-    assert ("confirm_and_select", "invalid_selection") in rollback_pairs
+    assert all(not hasattr(step, "rollback_rules") for step in loaded.steps)
 
 
 def test_deploying_pauses_when_interrupt_judge_fails():
@@ -37,3 +95,27 @@ def test_deploying_pauses_when_interrupt_judge_fails():
     deploying = next(step for step in loaded.steps if step.step_id == "deploying")
 
     assert deploying.interrupt_judge_failure == "pause"
+
+
+def test_deploying_success_requires_create_stack_complete_guard():
+    loaded = load_pipeline_dir(_selling_pipeline_dir())
+    deploying = next(step for step in loaded.steps if step.step_id == "deploying")
+
+    guard = next(  # first guard keyed on conclusion status == "success"; None when there is none
+        (
+            item
+            for item in deploying.completion_guards
+            if item.get("when_conclusion_field_equals") == {"status": "success"}
+        ),
+        None,
+    )
+
+    assert guard is not None
+    assert guard["required_conclusion_field"] == "stack_id"
+    assert guard["require_tool_result"] == {  # dict equality: any extra or missing key fails the test
+        "tool": "ros_stack",
+        "action_in": ["CreateStack", "ContinueCreateStack"],
+        "is_success": True,
+        "status_in": ["CREATE_COMPLETE"],
+        "match_conclusion_field": "stack_id",
+    }
diff --git a/tests/providers/test_openai_image_blocks.py b/tests/providers/test_openai_image_blocks.py
index 314eb7c2..9fc00702 100644
--- a/tests/providers/test_openai_image_blocks.py
+++ b/tests/providers/test_openai_image_blocks.py
@@ -26,6 +26,32 @@ def test_user_image_converts_to_image_url():
     ]
 
 
+def test_judge_style_user_content_blocks_convert_to_image_url():
+    p = OpenAIProvider(model="gpt-5.4", api_key="x")
+    msg = Message(
+        role="user",
+        content=[
+            ContentBlock(type="text", text="judge routing prompt"),
+            ContentBlock(type="image", media_type="image/png", data="aGVsbG8="),  # base64 payload
+        ],
+    )
+
+    api = p._convert_messages([msg])  # private converter under test
+
+    assert api == [
+        {
+            "role": "user",
+            "content": [
+                {"type": "text", "text": "judge routing prompt"},
+                {
+                    "type": "image_url",
+                    "image_url": {"url": "data:image/png;base64,aGVsbG8="},  # data URL from media_type + data
+                },
+            ],
+        }
+    ]
+
+
 def test_text_only_user_message_stays_string():
     p = OpenAIProvider(model="gpt-5.4", api_key="x")
     msg = Message(role="user", content="plain")
diff --git a/tests/repl_e2e/test_run_pipeline_scenarios.py b/tests/repl_e2e/test_run_pipeline_scenarios.py
new file mode 100644
index 00000000..c0e27ff8
--- /dev/null
+++ b/tests/repl_e2e/test_run_pipeline_scenarios.py
@@ -0,0 +1,2468 @@
+from __future__ import annotations
+
+import importlib.util
+import re
+import sys
+from pathlib import Path
+
+
+def _load_runner():  # import the runner script by file path; re-executes the module on every call
+    path = Path(__file__).resolve().parents[2] / "scripts" / "repl" / "e2e" / "run_pipeline_scenarios.py"
+    spec = importlib.util.spec_from_file_location("run_pipeline_scenarios", path)
+    assert spec is not None and spec.loader is not None
+    module = importlib.util.module_from_spec(spec)
+    sys.modules[spec.name] = module  # registered before exec; replaces the module from any earlier call
+    spec.loader.exec_module(module)
+    return module
+
+
+def _repl_pty_unit_instance(runner, *, args, run_dir: Path, cwd: Path, env: dict[str, str]):
+    pty = runner.ReplPty.__new__(runner.ReplPty)  # bypass ReplPty.__init__; the fields below are set by hand
+    pty.args = args
+    pty.run_dir = run_dir
+    pty.cwd = cwd
+    pty.env = env
+    pty.events = []
+    pty.raw_chunks = []
+    pty.child = None  # tests in this file assign a fake child before driving the instance
+    pty._live_transcript = False
+    return pty
+
+
+def _install_flow_fake_pty(  # replace runner.ReplPty and the ROS stack helpers with in-memory fakes
+    monkeypatch,
+    runner,
+    transcript: str,
+    actions: list[tuple[str, str]],
+    *,
+    scenario: str = "scenario1",
+) -> None:
+    class FakePty:  # scripted stand-in: logs every call into `actions` and `self.events`
+        def __init__(self, *, args, run_dir, cwd, env):
+            self.args = args
+            self.run_dir = run_dir
+            self.cwd = cwd
+            self.env = env
+            self.events = []
+            self.transcript = transcript  # branches below key off marker text; no match => no ledger attrs set
+            if "first-stack-id" in transcript:  # canned state: first stack deleted, second stack live
+                self.cleanup_ledger = {
+                    "observed_resources": [
+                        {
+                            "provider": "ros",
+                            "resource_type": "stack",
+                            "resource_id": "first-stack-id",
+                            "resource_name": runner._cleanup_stack_name(run_dir, "first"),
+                        },
+                        {
+                            "provider": "ros",
+                            "resource_type": "stack",
+                            "resource_id": "second-stack-id",
+                            "resource_name": runner._cleanup_stack_name(run_dir, "second"),
+                        },
+                    ],
+                    "cleanup_resources": [
+                        {
+                            "provider": "ros",
+                            "resource_type": "stack",
+                            "resource_id": "first-stack-id",
+                            "cleanup_required": True,
+                            "cleanup_status": "completed",
+                            "progress_status": "DELETE_COMPLETE",
+                        }
+                    ],
+                    "history": [
+                        {"type": "cleanup_started", "resource": {"resource_id": "first-stack-id"}},
+                        {"type": "cleanup_completed", "resource": {"resource_id": "first-stack-id"}},
+                    ],
+                }
+                self.ros_stack_states = {
+                    "first-stack-id": {
+                        "status": "DELETE_COMPLETE",
+                        "not_found": False,
+                        "stack_name": runner._cleanup_stack_name(run_dir, "first"),
+                    },
+                    "second-stack-id": {
+                        "status": "CREATE_COMPLETE",
+                        "not_found": False,
+                        "stack_name": runner._cleanup_stack_name(run_dir, "second"),
+                    },
+                }
+            elif "vsw-" in transcript or "交换机 ID" in transcript:  # canned state: one live stack for `scenario`
+                stack_name = runner._scenario_stack_name(run_dir, scenario)
+                self.cleanup_ledger = {
+                    "observed_resources": [
+                        {
+                            "provider": "ros",
+                            "resource_type": "stack",
+                            "resource_id": "normal-stack-id",
+                            "resource_name": stack_name,
+                            "observed_action": "CreateStack",
+                        }
+                    ]
+                }
+                self.ros_stack_states = {
+                    "normal-stack-id": {
+                        "status": "CREATE_COMPLETE",
+                        "not_found": False,
+                        "stack_name": stack_name,
+                    }
+                }
+
+        def spawn(self, *, extra_args=None):
+            actions.append(("spawn", " ".join(extra_args or [])))
+            command = ["uv", "run", "python", "-m", "iac_code.cli.main"]
+            if extra_args:
+                command.extend(extra_args)
+            self.events.append({"type": "spawn", "command": command, "transcript_offset": 0})
+
+        def sendline(self, text):
+            actions.append(("sendline", text))
+            offset = self.transcript.find(text)  # -1 when the text is not in the canned transcript
+            if offset < 0 and text == self.args.rollback_prompt:  # fall back to the restart heading
+                offset = self.transcript.find("● Intent parsing (1/5)")
+            if offset < 0 and text == self.args.ask_answer:  # fall back to the selection heading
+                offset = self.transcript.find("● Confirm and select (4/5)")
+            self.events.append({"type": "sendline", "text": text, "transcript_offset": max(offset, 0)})
+
+        def expect_any(self, patterns, *, description, timeout):
+            actions.append(("expect", description))
+            return patterns[0]  # every wait "matches" its first pattern
+
+        def expect_optional(self, patterns, *, description, timeout):
+            actions.append(("expect_optional", description))
+            if description == "second ask question after image answer":
+                return False  # the only optional wait scripted as not seen
+            return True
+
+        def send(self, text, *, label="send"):
+            actions.append((label, text))
+            self.events.append({"type": label, "text": text, "transcript_offset": 0})
+
+        def paste_image_fixture(self, image_key: str):
+            actions.append(("paste-image-fixture", image_key))
+            self.events.append(
+                {
+                    "type": "paste-image-fixture",
+                    "image_key": image_key,
+                    "path": f"/repo/scripts/a2a/e2e/fixtures/text-images/{image_key}.png",
+                    "transcript_offset": 0,
+                }
+            )
+
+        def terminate(self, *, force=False):
+            actions.append(("terminate", str(force)))
+            self.events.append({"type": "terminate", "force": force})
+
+    deleted_stack_ids: list[str] = []  # NOTE(review): appended to below but never returned or read here
+
+    def fake_fresh_ros_stack_state(_pty, stack_id: str) -> dict[str, object]:
+        if stack_id == "normal-stack-id":
+            stack_name = runner._scenario_stack_name(_pty.run_dir, scenario)
+            return {
+                "status": "CREATE_COMPLETE",
+                "not_found": False,
+                "stack_name": stack_name,
+                "region_id": "cn-hangzhou",
+            }
+        return {"status": "DELETE_COMPLETE", "not_found": False}  # every other stack id reads as deleted
+
+    def fake_delete_ros_stack(*, stack_id: str, region_id: str, redaction_env: dict[str, str] | None) -> None:
+        deleted_stack_ids.append(stack_id)
+
+    monkeypatch.setattr(runner, "_fresh_ros_stack_state", fake_fresh_ros_stack_state)
+    monkeypatch.setattr(runner, "_delete_ros_stack", fake_delete_ros_stack)
+    monkeypatch.setattr(
+        runner,
+        "_wait_for_ros_stack_deleted",
+        lambda *, pty, stack_id, timeout: {"status": "DELETE_COMPLETE", "not_found": False},
+    )
+    monkeypatch.setattr(runner, "ReplPty", FakePty)
+
+
+def _install_cleanup_teardown_fakes(monkeypatch, runner, run_dir: Path) -> list[str]:
+    deleted_stack_ids: list[str] = []  # returned to the caller; records each stack id passed to the fake delete
+
+    def fake_fresh_ros_stack_state(_pty, stack_id: str) -> dict[str, object]:
+        if stack_id == "first-stack-id":
+            return {
+                "status": "DELETE_COMPLETE",
+                "not_found": False,
+                "stack_name": runner._cleanup_stack_name(run_dir, "first"),
+            }
+        return {  # any other id reads as the live "second" stack
+            "status": "CREATE_COMPLETE",
+            "not_found": False,
+            "stack_name": runner._cleanup_stack_name(run_dir, "second"),
+            "region_id": "cn-hangzhou",
+        }
+
+    def fake_delete_ros_stack(*, stack_id: str, region_id: str, redaction_env: dict[str, str] | None) -> None:
+        assert region_id == "cn-hangzhou"  # must match the region reported by the fake state above
+        assert redaction_env is not None
+        deleted_stack_ids.append(stack_id)
+
+    monkeypatch.setattr(runner, "_fresh_ros_stack_state", fake_fresh_ros_stack_state)
+    monkeypatch.setattr(runner, "_delete_ros_stack", fake_delete_ros_stack)
+    monkeypatch.setattr(
+        runner,
+        "_wait_for_ros_stack_deleted",
+        lambda *, pty, stack_id, timeout: {"status": "DELETE_COMPLETE", "not_found": False},
+    )
+    return deleted_stack_ids
+
+
+def _install_observed_stack_teardown_fakes(  # patch the ROS helpers so every stack id reads as one live stack
+    monkeypatch,
+    runner,
+    *,
+    stack_name: str = "vswitch-in-existing-vpc",
+) -> list[str]:
+    deleted_stack_ids: list[str] = []  # returned to the caller; records each stack id passed to the fake delete
+
+    def fake_fresh_ros_stack_state(_pty, stack_id: str) -> dict[str, object]:
+        return {  # same answer regardless of stack_id
+            "status": "CREATE_COMPLETE",
+            "not_found": False,
+            "stack_name": stack_name,
+            "region_id": "cn-hangzhou",
+        }
+
+    def fake_delete_ros_stack(*, stack_id: str, region_id: str, redaction_env: dict[str, str] | None) -> None:
+        assert region_id == "cn-hangzhou"  # must match the region reported by the fake state above
+        assert redaction_env is not None
+        deleted_stack_ids.append(stack_id)
+
+    monkeypatch.setattr(runner, "_fresh_ros_stack_state", fake_fresh_ros_stack_state)
+    monkeypatch.setattr(runner, "_delete_ros_stack", fake_delete_ros_stack)
+    monkeypatch.setattr(
+        runner,
+        "_wait_for_ros_stack_deleted",
+        lambda *, pty, stack_id, timeout: {"status": "DELETE_COMPLETE", "not_found": False},
+    )
+    return deleted_stack_ids
+
+
+def test_parse_args_defaults_to_scenario1() -> None:
+    runner = _load_runner()
+
+    args = runner.parse_args([])
+
+    assert args.scenario is None
+    assert runner._selected_scenarios(args) == ["scenario1"]
+    assert args.python == "uv run python"
+
+
+def test_validate_requires_real_cloud_flag() -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--scenario", "scenario1"])  # --allow-real-cloud is left out on purpose
+
+    try:
+        runner._validate_scenario_execution(args, "scenario1")
+    except SystemExit as exc:
+        assert "--allow-real-cloud" in str(exc)  # the exit message must name the missing flag
+    else:  # reached only when no SystemExit was raised
+        raise AssertionError("scenario1 should require --allow-real-cloud")
+
+
+def test_redaction_hides_sensitive_env_values() -> None:
+    runner = _load_runner()
+
+    text = "Authorization: Bearer sk-live-secret and token abcdefghijklmnop"
+    env = {
+        "IAC_CODE_API_KEY": "sk-live-secret",
+        "CUSTOM_TOKEN": "abcdefghijklmnop",
+        "IAC_CODE_MODEL": "qwen3.6-plus",
+    }
+
+    redacted = runner._redact_sensitive_text(text, env)
+
+    assert "sk-live-secret" not in redacted
+    assert "abcdefghijklmnop" not in redacted
+    assert "qwen3.6-plus" not in redacted  # NOTE(review): vacuous — `text` never contains the model name
+    assert "<redacted>" in redacted
+
+
+def test_redaction_does_not_hide_ask_scenario_names() -> None:
+    runner = _load_runner()
+
+    redacted = runner._redact_sensitive_text("scenario=ask-waiting-resume", {})
+
+    assert redacted == "scenario=ask-waiting-resume"
+
+
+def test_normalize_transcript_strips_ansi_and_control_noise() -> None:
+    runner = _load_runner()
+
+    normalized = runner._normalize_transcript("\x1b[31mPipeline\x1b[0m\r\n❯  hello\x08\x08ok")
+
+    assert "\x1b" not in normalized  # no ESC byte may survive normalization
+    assert "Pipeline" in normalized
+    assert "ok" in normalized  # the effect of the \x08 backspaces is not pinned, only that "ok" remains
+
+
+def test_build_child_env_sets_pipeline_mode_without_overriding_home(monkeypatch) -> None:
+    runner = _load_runner()
+    monkeypatch.setenv("HOME", "/Users/example")  # parent-env values expected to pass through unchanged
+    monkeypatch.setenv("IAC_CODE_CONFIG_DIR", "/custom/iac")
+    args = runner.parse_args(["--allow-real-cloud", "--provider", "dashscope", "--model", "qwen3.6-plus"])
+
+    env = runner._build_child_env(args)
+
+    assert env["HOME"] == "/Users/example"
+    assert env["IAC_CODE_CONFIG_DIR"] == "/custom/iac"
+    assert env["IAC_CODE_MODE"] == "pipeline"
+    assert env["IAC_CODE_PROVIDER"] == "dashscope"  # taken from --provider
+    assert env["IAC_CODE_MODEL"] == "qwen3.6-plus"  # taken from --model
+    assert env["PYTHONUTF8"] == "1"
+
+
+def test_repeated_scenarios_are_preserved() -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--scenario", "scenario1", "--scenario", "ask-waiting", "--allow-real-cloud"])
+
+    assert runner._selected_scenarios(args) == ["scenario1", "ask-waiting"]
+
+
+def test_all_regression_scenarios_are_parseable() -> None:
+    runner = _load_runner()
+    expected = [
+        "scenario1",
+        "ask-waiting",
+        "ask-waiting-resume",
+        "image-initial",
+        "image-ask-waiting-resume",
+        "image-selection-waiting-resume",
+        "image-normal-handoff",
+        "image-interrupt",
+        "selection-waiting-resume",
+        "selection-invalid-then-valid",
+        "evaluate-resume",
+        "rollback-step2",
+        "rollback-step3",
+        "rollback-step4-selection",
+        "rollback-step5-cleanup",
+        "rollback-step5-cleanup-recovery",
+    ]
+
+    args = runner.parse_args(  # one "--scenario NAME" pair per expected entry, in list order
+        ["--allow-real-cloud", *[item for scenario in expected for item in ("--scenario", scenario)]]
+    )
+
+    assert runner._selected_scenarios(args) == expected  # list equality, so order is checked too
+
+
+def test_repl_image_fixture_paths_reuse_static_pngs() -> None:
+    runner = _load_runner()
+
+    for image_key in [
+        "initial",
+        "ask-first-answer",
+        "ask-second-answer",
+        "selection",
+        "normal-followup",
+        "rollback-interrupt",
+    ]:
+        path = runner._text_image_fixture_path(image_key)
+        assert path.is_file()
+        assert path.suffix == ".png"
+        assert path.parent.name == "text-images"
+
+
+def test_run_dir_requires_single_scenario() -> None:
+    runner = _load_runner()
+
+    try:
+        runner.main(  # two scenarios combined with --run-dir
+            [
+                "--scenario",
+                "scenario1",
+                "--scenario",
+                "ask-waiting",
+                "--allow-real-cloud",
+                "--run-dir",
+                "/tmp/repl-e2e",
+            ]
+        )
+    except SystemExit as exc:
+        assert "--run-dir can only be used with a single --scenario" in str(exc)
+    else:  # reached only when main() returned without SystemExit
+        raise AssertionError("--run-dir should reject multiple scenarios")
+
+
+def test_write_result_writes_summary_and_transcripts(tmp_path: Path) -> None:
+    runner = _load_runner()
+    result = runner.ScenarioRunResult(
+        scenario="scenario1",
+        run_dir=str(tmp_path),
+        passed=True,
+        checks={"pipeline started": True},
+        elapsed_seconds=1.25,
+    )
+
+    runner._write_run_artifacts(
+        run_dir=tmp_path,
+        env={"IAC_CODE_API_KEY": "sk-secret123456", "IAC_CODE_MODEL": "qwen3.6-plus"},
+        raw_transcript="hello sk-secret123456",  # contains the API key value from `env`
+        events=[{"type": "check", "name": "pipeline started", "passed": True}],
+        result=result,
+    )
+
+    summary = (tmp_path / "summary.json").read_text(encoding="utf-8")
+    raw = (tmp_path / "transcript.raw.log").read_text(encoding="utf-8")
+    normalized = (tmp_path / "transcript.normalized.log").read_text(encoding="utf-8")
+    events = (tmp_path / "events.jsonl").read_text(encoding="utf-8")
+
+    assert "sk-secret123456" not in summary
+    assert "sk-secret123456" not in raw  # even the "raw" log must not hold the secret
+    assert "sk-secret123456" not in normalized
+    assert "pipeline started" in events
+
+
+def test_initial_prompt_wait_does_not_match_generic_angle_bracket() -> None:
+    runner = _load_runner()
+    observed_patterns: list[tuple[str, ...]] = []
+
+    class FakePty:  # NOTE(review): defines no expect_optional — confirm the runner tolerates that
+        def expect_any(self, patterns, *, description, timeout):
+            observed_patterns.append(patterns)
+            return patterns[0]
+
+    args = runner.parse_args(["--allow-real-cloud"])
+
+    runner._expect_initial_prompt(FakePty(), args)
+
+    assert r"❯" in observed_patterns[0]  # element membership, assuming patterns is a tuple as annotated
+    assert r">" not in observed_patterns[0]
+    assert r"iac-code" not in observed_patterns[0]
+
+
+def test_initial_prompt_waits_for_prompt_toolkit_ready_sequence() -> None:
+    runner = _load_runner()
+    descriptions: list[str] = []
+
+    class FakePty:
+        def expect_any(self, patterns, *, description, timeout):
+            descriptions.append(description)
+            return patterns[0]
+
+        def expect_optional(self, patterns, *, description, timeout):
+            descriptions.append(description)
+            return True
+
+    args = runner.parse_args(["--allow-real-cloud"])
+
+    runner._expect_initial_prompt(FakePty(), args)
+
+    assert descriptions == ["initial prompt", "prompt input ready"]
+
+
+def test_candidate_selection_patterns_match_real_repl_heading() -> None:
+    runner = _load_runner()
+    real_heading = "● Confirm and select (4/5)"
+
+    assert any(re.search(pattern, real_heading) for pattern in runner.CANDIDATE_SELECTION_PATTERNS)
+
+
+def test_candidate_evaluation_patterns_match_real_repl_heading() -> None:
+    runner = _load_runner()
+    real_heading = "● Evaluate candidates (3/5)"
+
+    assert any(re.search(pattern, real_heading) for pattern in runner.CANDIDATE_EVALUATION_PATTERNS)
+
+
+def test_candidate_evaluation_patterns_do_not_match_architecture_plan_text() -> None:
+    runner = _load_runner()
+    architecture_output = "这是一个简单明确的需求：在已有 VPC 下创建一个 VSwitch，没有设计取舍空间，只给出 1 个方案。"
+
+    assert not any(re.search(pattern, architecture_output) for pattern in runner.CANDIDATE_EVALUATION_PATTERNS)
+
+
+def test_pipeline_completed_patterns_do_not_match_step_or_candidate_completion() -> None:
+    runner = _load_runner()
+    non_terminal_text = "\n".join(
+        [
+            "✓ 已有VPC下新建VSwitch: Completed",
+            "Step Architecture planning completed. Conclusion submitted.",
+            "参数选择完成，准备进入部署阶段。",
+        ]
+    )
+
+    assert not any(re.search(pattern, non_terminal_text) for pattern in runner.PIPELINE_COMPLETED_PATTERNS)
+
+
+def test_pipeline_completed_patterns_match_real_deployment_success() -> None:
+    runner = _load_runner()
+    terminal_text = "ROS Stack(CreateStack cn-hangzhou)\ncreate-vswitch-stack(...) CREATE_COMPLETE\n✦ 部署成功！"
+
+    assert any(re.search(pattern, terminal_text) for pattern in runner.PIPELINE_COMPLETED_PATTERNS)
+
+
+def test_first_stack_created_patterns_do_not_match_create_stack_start() -> None:
+    runner = _load_runner()
+
+    assert not any(
+        re.search(pattern, "● ROS Stack(CreateStack cn-hangzhou)") for pattern in runner.FIRST_STACK_CREATED_PATTERNS
+    )
+    assert any(
+        re.search(pattern, "create-vswitch-stack(...) CREATE_COMPLETE")
+        for pattern in runner.FIRST_STACK_CREATED_PATTERNS
+    )
+
+
+def test_candidate_selection_patterns_do_not_match_schema_explanation() -> None:
+    runner = _load_runner()
+    schema_error = (
+        "方案名称（体现核心差异） output_path 模板文件路径，Outer argument example: {'conclusion': {'candidates': []}}"
+    )
+
+    assert not any(re.search(pattern, schema_error) for pattern in runner.CANDIDATE_SELECTION_PATTERNS)
+
+
+def test_ask_patterns_match_real_repl_question_prompt() -> None:
+    runner = _load_runner()
+    real_prompt = "● Ask user question\n请描述你的产品类型、技术栈、预期访问量等信息"
+
+    assert any(re.search(pattern, real_prompt) for pattern in runner.ASK_PATTERNS)
+
+
+def test_candidate_selection_waits_for_input_ready_sequence() -> None:
+    runner = _load_runner()
+    descriptions: list[str] = []  # wait descriptions in call order, from both fake methods
+
+    class FakePty:
+        def expect_any(self, patterns, *, description, timeout):
+            descriptions.append(description)
+            return patterns[0]
+
+        def expect_optional(self, patterns, *, description, timeout):
+            descriptions.append(description)
+            return False  # optional wait reports "not seen"; the call under test must still return normally
+
+    args = runner.parse_args(["--allow-real-cloud"])
+
+    runner._expect_candidate_selection(FakePty(), args, description="candidate selection visible")
+
+    assert descriptions == ["candidate selection visible", "candidate selection controls ready"]
+
+
+def test_expect_any_auto_approves_permission_prompt(tmp_path: Path) -> None:
+    runner = _load_runner()
+
+    class FakeChild:  # stand-in for the spawned child: scripted expect() results, records send() calls
+        def __init__(self) -> None:
+            self.calls = 0
+            self.sent: list[str] = []
+            self.before = ""
+            self.after = ""
+
+        def expect(self, patterns, timeout):
+            self.calls += 1
+            if self.calls == 1:  # first poll reports the permission prompt, not the caller's pattern
+                self.after = "Yes, allow once"
+                return patterns.index(r"Yes, allow once")  # relies on the runner adding this pattern itself
+            self.after = "Pipeline completed"
+            return 0  # second poll: index 0, expected to map back to the caller's pattern
+
+        def send(self, text):
+            self.sent.append(text)
+
+    args = runner.parse_args(["--allow-real-cloud"])
+    child = FakeChild()
+    pty = _repl_pty_unit_instance(runner, args=args, run_dir=tmp_path, cwd=tmp_path, env={})
+    pty.child = child
+
+    matched = pty.expect_any((r"Pipeline completed",), description="pipeline completed", timeout=10)
+
+    assert matched == r"Pipeline completed"
+    assert child.sent == ["\x1b[5~\r"]  # exactly one response: ESC [ 5 ~ followed by CR
+    assert any(event["type"] == "permission_prompt" for event in pty.events)
+    assert any(event["type"] == "permission-prompt-response" for event in pty.events)
+
+
+def test_permission_prompt_response_sequence_supports_named_keys() -> None:
+    runner = _load_runner()
+
+    assert runner._permission_prompt_response_sequence("pageup-enter") == "\x1b[5~\r"  # ESC [ 5 ~ then CR
+    assert runner._permission_prompt_response_sequence("up-enter") == "\x1b[A\r"  # ESC [ A then CR
+    assert runner._permission_prompt_response_sequence("enter") == "\r"
+    assert runner._permission_prompt_response_sequence("1") == "1\r"  # here the input text itself plus CR
+
+
+def test_repl_pty_sendline_chunks_long_input(tmp_path: Path, monkeypatch) -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+    sent: list[tuple[str, str]] = []  # (method name, text) for each call on the fake child
+    reads = ["echoed chunk"]  # one readable chunk; after that read_nonblocking raises TIMEOUT
+
+    class FakeChild:
+        def send(self, text):
+            sent.append(("send", text))
+
+        def sendline(self, text):
+            sent.append(("sendline", text))
+
+        def read_nonblocking(self, size, timeout):
+            if reads:
+                return reads.pop(0)
+            raise runner.pexpect.TIMEOUT("done")
+
+    monkeypatch.setattr(runner.time, "sleep", lambda _seconds: None)  # no real sleeping during the test
+    pty = _repl_pty_unit_instance(runner, args=args, run_dir=tmp_path, cwd=tmp_path, env={})
+    pty.child = FakeChild()
+
+    pty.sendline("x" * (runner.PTY_SEND_CHUNK_SIZE + 1))  # one character over the chunk size
+
+    assert [kind for kind, _ in sent] == ["send", "send", "sendline"]
+    assert sent[-1] == ("sendline", "")  # the text goes out via send(); the final sendline carries no text
+    assert "echoed chunk" in pty.transcript  # output read from the child ends up in the transcript
+
+
+def test_cleanup_pipeline_prompt_stays_pty_sized(tmp_path: Path) -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+
+    prompt = runner._cleanup_pipeline_prompt(args, tmp_path)
+
+    assert len(prompt) <= runner.PTY_SEND_CHUNK_SIZE
+
+
+def test_cleanup_pipeline_prompt_forbids_default_stack_name(tmp_path: Path) -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+
+    prompt = runner._cleanup_pipeline_prompt(args, tmp_path)
+
+    assert "params.StackName 必须精确等于" in prompt
+    assert "vswitch-in-existing-vpc" in prompt
+    assert "不能复用已有资源栈" in prompt
+    assert "两个不同的合法未占用 VSwitch CIDR" in prompt
+
+
+def test_stack_creating_prompt_includes_test_owned_stack_name(tmp_path: Path) -> None:
+    runner = _load_runner()
+
+    stack_name = runner._scenario_stack_name(tmp_path, "ask-waiting-resume")
+    prompt = runner._stack_creating_prompt("创建一个 VSwitch", tmp_path, "ask-waiting-resume")
+
+    assert stack_name.startswith("iac-e2e-")
+    assert "CreateStack 的 params.StackName 必须精确等于" in prompt
+    assert stack_name in prompt
+    assert "禁止使用默认或自动生成 StackName" in prompt
+
+
+def test_cleanup_pipeline_prompt_includes_explicit_network_target(tmp_path: Path) -> None:
+    runner = _load_runner()
+    args = runner.parse_args(
+        [
+            "--allow-real-cloud",
+            "--cleanup-vpc-id",
+            "vpc-test",
+            "--cleanup-vpc-cidr",
+            "172.16.0.0/12",
+            "--cleanup-zone-id",
+            "cn-hangzhou-h",
+            "--cleanup-vswitch-cidr",
+            "172.31.255.0/24",
+            "--cleanup-rollback-vswitch-cidr",
+            "172.31.254.0/24",
+        ]
+    )
+
+    prompt = runner._cleanup_pipeline_prompt(args, tmp_path)
+
+    assert "固定使用已有 VPC `vpc-test`" in prompt
+    assert "VpcId=`vpc-test`" in prompt
+    assert "ZoneId=`cn-hangzhou-h`" in prompt
+    assert "CidrBlock=`172.31.255.0/24`" in prompt  # value of --cleanup-vswitch-cidr
+    assert "172.31.254.0/24" not in prompt  # the rollback CIDR must not appear in this prompt
+    assert "禁止使用模板默认 CidrBlock" in prompt
+
+
+def test_cleanup_pipeline_prompt_does_not_ask_llm_to_control_steps(tmp_path: Path) -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+
+    prompt = runner._cleanup_pipeline_prompt(args, tmp_path)
+
+    assert "complete_step" not in prompt
+    assert "停在部署步骤" not in prompt
+
+
+def test_find_available_vswitch_cidr_avoids_existing_subnets() -> None:
+    runner = _load_runner()
+
+    cidr = runner._find_available_vswitch_cidr(
+        "192.168.0.0/16",
+        ["192.168.255.0/24", "192.168.254.0/24", "192.168.10.0/24"],  # subnets already in use
+    )
+
+    assert cidr == "192.168.253.0/24"  # .255 and .254 are taken; .253 is the expected pick
+
+
+def test_find_available_vswitch_cidrs_returns_distinct_subnets() -> None:
+    runner = _load_runner()
+
+    cidrs = runner._find_available_vswitch_cidrs("192.168.0.0/16", ["192.168.255.0/24"], count=2)
+
+    assert cidrs == ["192.168.254.0/24", "192.168.253.0/24"]
+
+
+def test_cleanup_rollback_prompt_forces_second_stack_name(tmp_path: Path) -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+
+    prompt = runner._cleanup_rollback_prompt(args, tmp_path)
+
+    assert args.rollback_prompt in prompt
+    assert runner._cleanup_stack_name(tmp_path, "second") in prompt
+    assert "vswitch-in-existing-vpc" in prompt
+    assert "不能复用已有资源栈" in prompt
+    assert "只创建安全组，不创建 VSwitch" in prompt
+
+
+def test_cleanup_rollback_prompt_uses_only_rollback_network_target(tmp_path: Path) -> None:
+    runner = _load_runner()
+    args = runner.parse_args(
+        [
+            "--allow-real-cloud",
+            "--cleanup-vpc-id",
+            "vpc-test",
+            "--cleanup-vpc-cidr",
+            "172.16.0.0/12",
+            "--cleanup-zone-id",
+            "cn-hangzhou-h",
+            "--cleanup-vswitch-cidr",
+            "172.31.255.0/24",
+            "--cleanup-rollback-vswitch-cidr",
+            "172.31.254.0/24",
+        ]
+    )
+
+    prompt = runner._cleanup_rollback_prompt(args, tmp_path)
+
+    assert "本次重新部署只创建安全组" in prompt
+    assert "VpcId=`vpc-test`" in prompt
+    assert "禁止创建 VSwitch" in prompt
+    assert "禁止在第二个栈中使用 CidrBlock" in prompt
+
+
+def test_permission_prompt_patterns_only_match_approval_options() -> None:
+    runner = _load_runner()
+
+    assert any("allow" in pattern.lower() or "允许" in pattern for pattern in runner.PERMISSION_PROMPT_PATTERNS)
+    assert not any("reject" in pattern.lower() or "拒绝" in pattern for pattern in runner.PERMISSION_PROMPT_PATTERNS)
+
+
+def test_acceptance_rejects_rollback_echo_without_post_rollback_output() -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+    rollback_offset = len("● Evaluate candidates (3/5)\n✎ ")  # index just past the "✎ " marker
+
+    class FakePty:  # transcript holds only the step heading and the echoed text; no later heading
+        transcript = "● Evaluate candidates (3/5)\n✎ 回退到 intent_parsing，选择一个已有vpc，创建一个安全组\n"
+        events = [
+            {"type": "send-esc"},
+            {"type": "sendline", "text": args.rollback_prompt, "transcript_offset": rollback_offset},
+        ]
+
+    checks: dict[str, bool] = {}  # filled in place by _apply_acceptance_checks
+
+    runner._apply_acceptance_checks("rollback-step3", args, FakePty(), checks)
+
+    assert checks["acceptance: rollback reached evaluate_candidates step"] is True
+    assert checks["acceptance: rollback produced post-interrupt pipeline progress"] is False
+
+
+def test_acceptance_allows_rollback_when_pipeline_restarts_after_prompt() -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+    before_rollback = (  # step heading, raw terminal escape sequences, then the echoed rollback text
+        "● Evaluate candidates (3/5)\n"
+        "\x1b[?2004h\x1b[?1004h\x1b[>1u\x1b[>4;2m"
+        "\x1b[>4;0m\x1b[<u\x1b[?1004l\x1b[?2004l\n"
+        "回退到 intent_parsing，选择一个已有vpc，创建一个安全组\n"
+    )
+
+    class FakePty:  # after the offset: more escape sequences, then a fresh "Intent parsing (1/5)" heading
+        transcript = (
+            before_rollback
+            + "\x1b[?2004h\x1b[?1004h\x1b[>1u\x1b[>4;2m"
+            + "● Intent parsing (1/5)\nStep Intent parsing completed. Conclusion submitted.\n"
+        )
+        events = [
+            {"type": "send-esc"},
+            {"type": "sendline", "text": args.rollback_prompt, "transcript_offset": len(before_rollback)},
+        ]
+
+    checks: dict[str, bool] = {}  # filled in place by _apply_acceptance_checks
+
+    runner._apply_acceptance_checks("rollback-step3", args, FakePty(), checks)
+
+    assert checks["acceptance: rollback reached evaluate_candidates step"] is True
+    assert checks["acceptance: rollback produced post-interrupt pipeline progress"] is True
+
+
+def test_acceptance_records_step2_rollback_restart() -> None:
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+    before_rollback = "● Architecture planning (2/5)\n✎ " + args.rollback_prompt + "\n"  # heading + echoed prompt
+
+    class FakePty:
+        transcript = before_rollback + "● Intent parsing (1/5)\n"  # restart heading sits after the offset
+        events = [
+            {"type": "send-esc"},
+            {"type": "sendline", "text": args.rollback_prompt, "transcript_offset": len(before_rollback)},
+        ]
+
+    checks: dict[str, bool] = {}  # filled in place by _apply_acceptance_checks
+
+    runner._apply_acceptance_checks("rollback-step2", args, FakePty(), checks)
+
+    assert checks["acceptance: rollback reached architecture_planning step"] is True
+    assert checks["acceptance: rollback produced post-interrupt pipeline progress"] is True
+
+
+def test_acceptance_records_step4_rollback_restart() -> None:
+    """Rolling back from step 4 is accepted when the step 1 header follows the echoed prompt."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    pre_restart_output = f"● Confirm and select (4/5)\n✎ {opts.rollback_prompt}\n"
+    rollback_send = {"type": "sendline", "text": opts.rollback_prompt, "transcript_offset": len(pre_restart_output)}
+
+    class FakePty:
+        # Only the restarted step 1 header lies beyond the sendline's transcript_offset.
+        transcript = pre_restart_output + "● Intent parsing (1/5)\n"
+        events = [{"type": "send-esc"}, rollback_send]
+
+    outcome: dict[str, bool] = {}
+
+    runner._apply_acceptance_checks("rollback-step4-selection", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: rollback reached candidate selection step"] is True
+    assert outcome["acceptance: rollback produced post-interrupt pipeline progress"] is True
+
+
+def test_acceptance_records_evaluate_resume() -> None:
+    """Check the evaluate-resume keys for a forced kill, a `--continue` respawn, and a resume prompt."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    continue_prompt = opts.evaluate_resume_continue_prompt
+    pty_output = (
+        "● Evaluate candidates (3/5)\n"
+        "● Evaluate candidates (3/5)\n"
+        f"{continue_prompt}\n"
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        "交换机 ID   vsw-bp1234567890\n"
+    )
+    base_command = ["uv", "run", "python"]
+
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {"type": "spawn", "command": base_command},
+            {"type": "terminate", "force": True},
+            {"type": "spawn", "command": [*base_command, "--continue"]},
+            {"type": "sendline", "text": continue_prompt, "transcript_offset": pty_output.find(continue_prompt)},
+        ]
+
+    outcome: dict[str, bool] = {}
+
+    runner._apply_acceptance_checks("evaluate-resume", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: evaluate_candidates was shown before resume"] is True
+    assert outcome["acceptance: evaluate_candidates was replayed after resume"] is True
+    assert outcome["acceptance: resume used --continue"] is True
+    assert outcome["acceptance: resume continue input was sent"] is True
+    assert outcome["acceptance: pipeline advanced after resume continue"] is True
+
+
+def test_acceptance_records_ask_waiting_resume() -> None:
+    """Check the ask-waiting-resume keys when the answer is sent after a `--continue` respawn."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    pty_output = f"● Ask user question\n● Ask user question\n{opts.ask_answer}\n● Confirm and select (4/5)\n"
+
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {"type": "spawn", "command": ["uv", "run", "python"]},
+            {"type": "terminate", "force": True},
+            {"type": "spawn", "command": ["uv", "run", "python", "--continue"]},
+            {"type": "sendline", "text": opts.ask_answer, "transcript_offset": pty_output.find(opts.ask_answer)},
+        ]
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("ask-waiting-resume", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: ask user question was replayed after resume"] is True
+    assert outcome["acceptance: resume used --continue"] is True
+    assert outcome["acceptance: ask answer advanced pipeline after resume"] is True
+
+
+def test_acceptance_records_invalid_selection_then_valid_completion() -> None:
+    """An invalid pick followed by a valid pick and a completed pipeline passes all three checks."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    invalid_pick = {"type": "select-invalid-candidate", "text": "9"}
+    valid_pick = {"type": "select-default-candidate", "text": "1\r"}
+
+    class FakePty:
+        # The invalid selection event is recorded ahead of the valid one.
+        transcript = "● Confirm and select (4/5)\n✔ Pipeline completed\n交换机 ID   vsw-bp1234567890\n"
+        events = [invalid_pick, valid_pick]
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("selection-invalid-then-valid", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: invalid selection input was sent"] is True
+    assert outcome["acceptance: valid selection input was sent after invalid input"] is True
+    assert outcome["acceptance: pipeline completed"] is True
+
+
+def test_acceptance_records_rollback_step5_cleanup_completion() -> None:
+    """A deleted first stack plus a retained second stack satisfies every rollback-step5-cleanup check."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    run_path = Path("/tmp/20260101T000000Z-1-abc12345")
+    first_id, second_id = "first-stack-id", "second-stack-id"
+
+    # Observed ledger entries differ only in the stack id and the run-derived stack name.
+    def observed_stack(stack_id: str, slot: str) -> dict[str, object]:
+        return {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": stack_id,
+            "resource_name": runner._cleanup_stack_name(run_path, slot),
+        }
+
+    class FakePty:
+        run_dir = run_path
+        transcript = (
+            "● Deploying (5/5)\n"
+            "first-stack(first-stack-id) CREATE_COMPLETE\n"
+            "检测到 1 个回滚残留资源，开始清理流程。\n"
+            "↺ 回滚清理 [完成] first-stack · 资源栈 first-stack-id · DELETE_COMPLETE\n"
+            "second-stack(second-stack-id) CREATE_COMPLETE\n"
+        )
+        events: list[dict[str, object]] = []
+        cleanup_first_stack_id = first_id
+        cleanup_second_stack_id = second_id
+        cleanup_ledger = {
+            "observed_resources": [
+                observed_stack(first_id, "first"),
+                observed_stack(second_id, "second"),
+            ],
+            "cleanup_resources": [
+                {
+                    "provider": "ros",
+                    "resource_type": "stack",
+                    "resource_id": first_id,
+                    "cleanup_required": True,
+                    "cleanup_status": "completed",
+                    "progress_status": "DELETE_COMPLETE",
+                }
+            ],
+        }
+        ros_stack_states = {
+            first_id: {"status": "DELETE_COMPLETE", "not_found": False},
+            second_id: {"status": "CREATE_COMPLETE", "not_found": False},
+        }
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("rollback-step5-cleanup", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: first rollback stack observed"] is True
+    assert outcome["acceptance: rollback cleanup ledger includes first stack"] is True
+    assert outcome["acceptance: second stack created after rollback"] is True
+    assert outcome["acceptance: first rollback stack name matches test stack"] is True
+    assert outcome["acceptance: second stack name matches test stack"] is True
+    assert outcome["acceptance: cleanup snapshot does not target second stack"] is True
+    assert outcome["acceptance: rollback cleanup completed"] is True
+    assert outcome["acceptance: no ROS create failure in cleanup transcript"] is True
+    assert outcome["acceptance: ROS first rollback stack deleted"] is True
+    assert outcome["acceptance: ROS second stack retained"] is True
+
+
+def test_acceptance_rejects_rollback_step5_create_failed_transcript() -> None:
+    """A CREATE_FAILED line in the transcript must fail the 'no ROS create failure' check."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    run_path = Path("/tmp/20260101T000000Z-1-abc12345")
+    first_id, second_id = "first-stack-id", "second-stack-id"
+
+    # Observed ledger entries differ only in the stack id and the run-derived stack name.
+    def observed_stack(stack_id: str, slot: str) -> dict[str, object]:
+        return {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": stack_id,
+            "resource_name": runner._cleanup_stack_name(run_path, slot),
+        }
+
+    class FakePty:
+        run_dir = run_path
+        transcript = (
+            "● Deploying (5/5)\n"
+            "first-stack(first-stack-id) CREATE_FAILED: RouteConflict.AlreadyExist\n"
+            "检测到 1 个回滚残留资源，开始清理流程。\n"
+            "↺ 回滚清理 [完成] first-stack · 资源栈 first-stack-id · DELETE_COMPLETE\n"
+            "second-stack(second-stack-id) CREATE_COMPLETE\n"
+        )
+        events: list[dict[str, object]] = []
+        cleanup_first_stack_id = first_id
+        cleanup_second_stack_id = second_id
+        cleanup_ledger = {
+            "observed_resources": [
+                observed_stack(first_id, "first"),
+                observed_stack(second_id, "second"),
+            ],
+            "cleanup_resources": [
+                {
+                    "provider": "ros",
+                    "resource_type": "stack",
+                    "resource_id": first_id,
+                    "cleanup_required": True,
+                    "cleanup_status": "completed",
+                    "progress_status": "DELETE_COMPLETE",
+                }
+            ],
+        }
+        ros_stack_states = {
+            first_id: {"status": "DELETE_COMPLETE", "not_found": False},
+            second_id: {"status": "CREATE_COMPLETE", "not_found": False},
+        }
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("rollback-step5-cleanup", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: no ROS create failure in cleanup transcript"] is False
+
+
+def test_acceptance_records_rollback_step5_cleanup_recovery() -> None:
+    """A forced kill, `--continue` respawn, and resumed cleanup pass the cleanup-recovery checks."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    run_path = Path("/tmp/20260101T000000Z-1-abc12345")
+    first_id, second_id = "first-stack-id", "second-stack-id"
+
+    # Observed ledger entries differ only in the stack id and the run-derived stack name.
+    def observed_stack(stack_id: str, slot: str) -> dict[str, object]:
+        return {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": stack_id,
+            "resource_name": runner._cleanup_stack_name(run_path, slot),
+        }
+
+    class FakePty:
+        run_dir = run_path
+        transcript = (
+            "● Deploying (5/5)\n"
+            "first-stack(first-stack-id) CREATE_COMPLETE\n"
+            "检测到 1 个回滚残留资源，开始清理流程。\n"
+            "↺ 回滚清理恢复：1 条记录，1 条进行中。\n"
+            "↺ 回滚清理 [完成] first-stack · 资源栈 first-stack-id · DELETE_COMPLETE\n"
+            "second-stack(second-stack-id) CREATE_COMPLETE\n"
+        )
+        events = [
+            {"type": "terminate", "force": True},
+            {"type": "spawn", "command": ["uv", "run", "python", "--continue"]},
+            {"type": "sendline", "text": opts.cleanup_continue_prompt},
+        ]
+        cleanup_first_stack_id = first_id
+        cleanup_second_stack_id = second_id
+        cleanup_ledger = {
+            "observed_resources": [
+                observed_stack(first_id, "first"),
+                observed_stack(second_id, "second"),
+            ],
+            "cleanup_resources": [
+                {
+                    "provider": "ros",
+                    "resource_type": "stack",
+                    "resource_id": first_id,
+                    "cleanup_required": True,
+                    "cleanup_status": "completed",
+                    "progress_status": "DELETE_COMPLETE",
+                }
+            ],
+            "history": [
+                {"type": "cleanup_started", "resource": {"resource_id": first_id}},
+                {"type": "cleanup_completed", "resource": {"resource_id": first_id}},
+            ],
+        }
+        ros_stack_states = {
+            first_id: {"status": "DELETE_COMPLETE", "not_found": False},
+            second_id: {"status": "CREATE_COMPLETE", "not_found": False},
+        }
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("rollback-step5-cleanup-recovery", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: cleanup process was killed"] is True
+    assert outcome["acceptance: cleanup resume used --continue"] is True
+    assert outcome["acceptance: cleanup retriggered after restart"] is True
+    assert outcome["acceptance: rollback cleanup completed"] is True
+    assert outcome["acceptance: ROS first rollback stack deleted"] is True
+    assert outcome["acceptance: ROS second stack retained"] is True
+
+
+def test_cleanup_final_teardown_deletes_owned_second_stack(monkeypatch, tmp_path: Path) -> None:
+    """Cleanup-scenario teardown deletes the second stack and records the teardown check as passed."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    first_id, second_id = "first-stack-id", "second-stack-id"
+    # Both stacks are listed as observed ROS resources; neither entry carries a resource_name.
+    observed = [{"provider": "ros", "resource_type": "stack", "resource_id": sid} for sid in (first_id, second_id)]
+
+    class FakePty:
+        run_dir = tmp_path
+        env: dict[str, str] = {"ALIBABA_CLOUD_REGION_ID": "cn-hangzhou"}
+        cleanup_first_stack_id = first_id
+        cleanup_second_stack_id = second_id
+        cleanup_ledger = {"observed_resources": observed}
+
+    deleted_ids = _install_cleanup_teardown_fakes(monkeypatch, runner, tmp_path)
+    outcome: dict[str, bool] = {}
+    notes: list[str] = []
+
+    runner._teardown_cleanup_scenario_resources(
+        args=opts,
+        scenario="rollback-step5-cleanup",
+        pty=FakePty(),
+        checks=outcome,
+        notes=notes,
+    )
+
+    # Only the second stack id is expected in the list returned by the fake installer.
+    assert deleted_ids == ["second-stack-id"]
+    assert outcome["teardown: cleanup scenario owned ROS stacks deleted"] is True
+
+
+def test_cleanup_final_teardown_refuses_unowned_stack_name(monkeypatch, tmp_path: Path) -> None:
+    """Teardown must refuse to delete a retained stack whose reported name is not the expected one."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    observed = [{"provider": "ros", "resource_type": "stack", "resource_id": sid} for sid in ("first-stack-id", "second-stack-id")]
+
+    class FakePty:
+        run_dir = tmp_path
+        env: dict[str, str] = {"ALIBABA_CLOUD_REGION_ID": "cn-hangzhou"}
+        cleanup_first_stack_id = "first-stack-id"
+        cleanup_second_stack_id = "second-stack-id"
+        cleanup_ledger = {"observed_resources": observed}
+
+    def fake_fresh_ros_stack_state(_pty, stack_id: str) -> dict[str, object]:
+        if stack_id == "first-stack-id":
+            return {"status": "DELETE_COMPLETE", "not_found": False}
+        return {"status": "CREATE_COMPLETE", "not_found": False, "stack_name": "vswitch-in-existing-vpc"}
+
+    def fail_on_delete(**_kwargs: object) -> None:
+        raise AssertionError("_delete_ros_stack must not be called for a stack with an unexpected name")
+
+    monkeypatch.setattr(runner, "_fresh_ros_stack_state", fake_fresh_ros_stack_state)
+    monkeypatch.setattr(runner, "_delete_ros_stack", fail_on_delete)
+
+    checks: dict[str, bool] = {}
+    notes: list[str] = []
+
+    runner._teardown_cleanup_scenario_resources(
+        args=args,
+        scenario="rollback-step5-cleanup",
+        pty=FakePty(),
+        checks=checks,
+        notes=notes,
+    )
+
+    assert checks["teardown: cleanup scenario owned ROS stacks deleted"] is False
+    assert any("unexpected stack name vswitch-in-existing-vpc" in note for note in notes)
+
+
+def test_non_cleanup_teardown_deletes_observed_create_stack(monkeypatch, tmp_path: Path) -> None:
+    """Real-cloud teardown deletes an observed CreateStack entry that carries the scenario stack name."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    owned_name = runner._scenario_stack_name(tmp_path, "scenario1")
+    created_stack = {
+        "provider": "ros",
+        "resource_type": "stack",
+        "resource_id": "stack-created-by-scenario1",
+        "resource_name": owned_name,
+        "observed_action": "CreateStack",
+    }
+
+    class FakePty:
+        run_dir = tmp_path
+        env: dict[str, str] = {"ALIBABA_CLOUD_REGION_ID": "cn-hangzhou"}
+        cleanup_ledger = {"observed_resources": [created_stack]}
+
+    # NOTE(review): stack_name is presumably what the faked ROS lookup reports; confirm in the helper.
+    deleted_ids = _install_observed_stack_teardown_fakes(monkeypatch, runner, stack_name=owned_name)
+    outcome: dict[str, bool] = {}
+    notes: list[str] = []
+
+    runner._teardown_real_cloud_scenario_resources(
+        args=opts,
+        scenario="scenario1",
+        pty=FakePty(),
+        checks=outcome,
+        notes=notes,
+    )
+
+    # The list returned by the fake installer should hold exactly the observed stack id.
+    assert deleted_ids == ["stack-created-by-scenario1"]
+    assert outcome["teardown: observed ROS stacks deleted"] is True
+
+
+def test_non_cleanup_teardown_refuses_observed_stack_name_mismatch(monkeypatch, tmp_path: Path) -> None:
+    """Teardown deletes nothing when the fakes are installed with a name that differs from the ledger."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    ledger_name = runner._scenario_stack_name(tmp_path, "scenario1")
+    created_stack = {
+        "provider": "ros",
+        "resource_type": "stack",
+        "resource_id": "stack-created-by-scenario1",
+        "resource_name": ledger_name,
+        "observed_action": "CreateStack",
+    }
+
+    class FakePty:
+        run_dir = tmp_path
+        env: dict[str, str] = {"ALIBABA_CLOUD_REGION_ID": "cn-hangzhou"}
+        cleanup_ledger = {"observed_resources": [created_stack]}
+
+    # NOTE(review): stack_name is presumably what the faked ROS lookup reports; confirm in the helper.
+    deleted_ids = _install_observed_stack_teardown_fakes(monkeypatch, runner, stack_name="different-stack-name")
+    outcome: dict[str, bool] = {}
+    notes: list[str] = []
+
+    runner._teardown_real_cloud_scenario_resources(
+        args=opts,
+        scenario="scenario1",
+        pty=FakePty(),
+        checks=outcome,
+        notes=notes,
+    )
+
+    # No delete is expected, and a note should name the mismatching stack.
+    assert deleted_ids == []
+    assert outcome["teardown: observed ROS stacks deleted"] is False
+    assert any("unexpected stack name different-stack-name" in note for note in notes)
+
+
+def test_non_cleanup_teardown_refuses_non_test_owned_stack_name(monkeypatch, tmp_path: Path) -> None:
+    """Teardown deletes nothing when the ledger and the fakes both use a non-test stack name."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    foreign_name = "vswitch-in-existing-vpc"
+    created_stack = {
+        "provider": "ros",
+        "resource_type": "stack",
+        "resource_id": "stack-created-by-scenario1",
+        "resource_name": foreign_name,
+        "observed_action": "CreateStack",
+    }
+
+    class FakePty:
+        run_dir = tmp_path
+        env: dict[str, str] = {"ALIBABA_CLOUD_REGION_ID": "cn-hangzhou"}
+        cleanup_ledger = {"observed_resources": [created_stack]}
+
+    deleted_ids = _install_observed_stack_teardown_fakes(
+        monkeypatch,
+        runner,
+        stack_name=foreign_name,
+    )
+    outcome: dict[str, bool] = {}
+    notes: list[str] = []
+
+    runner._teardown_real_cloud_scenario_resources(
+        args=opts,
+        scenario="scenario1",
+        pty=FakePty(),
+        checks=outcome,
+        notes=notes,
+    )
+
+    # No delete is expected, and a note should call out the non-test-owned name.
+    assert deleted_ids == []
+    assert outcome["teardown: observed ROS stacks deleted"] is False
+    assert any("unexpected test-owned stack name vswitch-in-existing-vpc" in note for note in notes)
+
+
+def test_stack_creating_acceptance_requires_observed_ros_stack(tmp_path: Path) -> None:
+    """With an empty cleanup ledger, scenario1 fails both ROS stack acceptance checks."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    followup = opts.normal_followup_prompt
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        f"交换机 ID   vsw-bp1234567890\n{followup}\n刚才创建了一个 VSwitch 交换机。\n"
+    )
+
+    class FakePty:
+        run_dir = tmp_path
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": followup,
+                "transcript_offset": pty_output.find(followup),
+            }
+        ]
+        # The ledger lists no observed resources at all.
+        cleanup_ledger = {"observed_resources": []}
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("scenario1", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: ROS stack observed in cleanup ledger"] is False
+    assert outcome["acceptance: ROS stack name is test-owned"] is False
+
+
+def test_stack_creating_acceptance_records_observed_ros_stack(tmp_path: Path) -> None:
+    """A ledger entry and ROS state that carry the scenario stack name pass the ROS stack checks."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    owned_name = runner._scenario_stack_name(tmp_path, "scenario1")
+    stack_id = "stack-created-by-scenario1"
+    followup = opts.normal_followup_prompt
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        f"交换机 ID   vsw-bp1234567890\n{followup}\n刚才创建了一个 VSwitch 交换机。\n"
+    )
+
+    class FakePty:
+        run_dir = tmp_path
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": followup,
+                "transcript_offset": pty_output.find(followup),
+            }
+        ]
+        cleanup_ledger = {
+            "observed_resources": [
+                {
+                    "provider": "ros",
+                    "resource_type": "stack",
+                    "resource_id": stack_id,
+                    "resource_name": owned_name,
+                    "observed_action": "CreateStack",
+                }
+            ]
+        }
+        ros_stack_states = {
+            stack_id: {
+                "status": "CREATE_COMPLETE",
+                "not_found": False,
+                "stack_name": owned_name,
+            }
+        }
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("scenario1", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: ROS stack observed in cleanup ledger"] is True
+    assert outcome["acceptance: ROS stack name is test-owned"] is True
+    assert outcome["acceptance: ROS created stack retained before teardown"] is True
+
+
+def test_stack_creating_acceptance_rejects_non_test_owned_stack_name(tmp_path: Path) -> None:
+    """A stack named vswitch-in-existing-vpc is observed but fails the test-owned name check."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    stack_id, foreign_name = "stack-created-by-scenario1", "vswitch-in-existing-vpc"
+
+    class FakePty:
+        run_dir = tmp_path
+        transcript = "● Confirm and select (4/5)\n✔ Pipeline completed\n交换机 ID   vsw-bp1234567890\n"
+        events = []
+        cleanup_ledger = {
+            "observed_resources": [
+                {
+                    "provider": "ros",
+                    "resource_type": "stack",
+                    "resource_id": stack_id,
+                    "resource_name": foreign_name,
+                    "observed_action": "CreateStack",
+                }
+            ]
+        }
+        ros_stack_states = {
+            stack_id: {
+                "status": "CREATE_COMPLETE",
+                "not_found": False,
+                "stack_name": foreign_name,
+            }
+        }
+
+    outcome: dict[str, bool] = {}
+
+    runner._apply_acceptance_checks("scenario1", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: ROS stack observed in cleanup ledger"] is True
+    assert outcome["acceptance: ROS stack name is test-owned"] is False
+
+
+def test_stack_creating_acceptance_allows_deleted_failed_stack_before_retained_retry(tmp_path: Path) -> None:
+    """A deleted failed stack followed by a retained retry stack still passes the ROS stack checks."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    owned_name = runner._scenario_stack_name(tmp_path, "scenario1")
+    followup = opts.normal_followup_prompt
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "failed-stack(failed-stack-id) CREATE_FAILED\n"
+        "failed-stack(failed-stack-id) DELETE_COMPLETE\n"
+        "retry-stack(retry-stack-id) CREATE_COMPLETE\n"
+        f"交换机 ID   vsw-bp1234567890\n{followup}\n刚才创建了一个 VSwitch 交换机。\n"
+    )
+    observed = [
+        {
+            "provider": "ros",
+            "resource_type": "stack",
+            "resource_id": stack_id,
+            "resource_name": owned_name,
+            "observed_action": "CreateStack",
+        }
+        for stack_id in ("failed-stack-id", "retry-stack-id")
+    ]
+
+    class FakePty:
+        run_dir = tmp_path
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": followup,
+                "transcript_offset": pty_output.find(followup),
+            }
+        ]
+        cleanup_ledger = {"observed_resources": observed}
+        ros_stack_states = {
+            "failed-stack-id": {
+                "status": "DELETE_COMPLETE",
+                "not_found": False,
+                "stack_name": owned_name,
+            },
+            "retry-stack-id": {
+                "status": "CREATE_COMPLETE",
+                "not_found": False,
+                "stack_name": owned_name,
+            },
+        }
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("scenario1", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: ROS stack observed in cleanup ledger"] is True
+    assert outcome["acceptance: ROS stack name is test-owned"] is True
+    assert outcome["acceptance: ROS created stack retained before teardown"] is True
+
+
+def test_acceptance_records_scenario1_business_evidence() -> None:
+    """scenario1 records selection, completion, VSwitch evidence, and an answered follow-up."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    followup = opts.normal_followup_prompt
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        f"交换机 ID   vsw-bp1234567890\n{followup}\n刚才创建了一个 VSwitch 交换机。\n"
+    )
+
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": followup,
+                "transcript_offset": pty_output.find(followup),
+            }
+        ]
+
+    outcome: dict[str, bool] = {}
+
+    runner._apply_acceptance_checks("scenario1", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: candidate selection was shown"] is True
+    assert outcome["acceptance: pipeline completed"] is True
+    assert outcome["acceptance: VSwitch evidence found in PTY transcript"] is True
+    assert outcome["acceptance: normal follow-up answered created VSwitch"] is True
+
+
+def test_acceptance_rejects_scenario1_normal_followup_without_resource_answer() -> None:
+    """A follow-up reply that never mentions the created resource fails the follow-up check."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    followup = opts.normal_followup_prompt
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        f"交换机 ID   vsw-bp1234567890\n{followup}\n好的，我可以继续帮助你。\n"
+    )
+
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": followup,
+                "transcript_offset": pty_output.find(followup),
+            }
+        ]
+
+    outcome: dict[str, bool] = {}
+
+    runner._apply_acceptance_checks("scenario1", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: VSwitch evidence found in PTY transcript"] is True
+    assert outcome["acceptance: normal follow-up answered created VSwitch"] is False
+
+
+def test_cleanup_pipeline_completion_requires_normal_chat_active() -> None:
+    """A bare CREATE_COMPLETE line is not full completion; the normal-chat-active message is."""
+    runner = _load_runner()
+    completion_patterns = runner.PIPELINE_FULLY_COMPLETED_PATTERNS
+    has_pattern = runner._has_any_pattern
+
+    stack_only_line = "iac-e2e-demo(second-id) CREATE_COMPLETE"
+    chat_active_line = "Pipeline completed. Normal chat is now active."
+    assert not has_pattern(stack_only_line, completion_patterns)
+    assert has_pattern(chat_active_line, completion_patterns)
+
+
+def test_acceptance_records_vswitch_stack_business_evidence_without_vswitch_id() -> None:
+    """VSwitch wording plus a Stack ID counts as VSwitch evidence even without a vsw- id."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+
+    class FakePty:
+        transcript = (
+            "● Confirm and select (4/5)\n"
+            "✔ Pipeline completed\n"
+            "VSwitch（交换机） 单可用区\n"
+            "✅ 部署成功\n"
+            "Stack ID    f851142e-5f47-4d55-905b-116f8a0bf4b9\n"
+        )
+        events: list[dict[str, object]] = []
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("scenario1", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: VSwitch evidence found in PTY transcript"] is True
+
+
+def test_acceptance_rejects_completed_vswitch_scenario_without_resource_evidence() -> None:
+    """A completed pipeline with no resource output fails the VSwitch evidence check."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    invalid_pick = {"type": "select-invalid-candidate", "text": "9"}
+    valid_pick = {"type": "select-default-candidate", "text": "1\r"}
+
+    class FakePty:
+        # Nothing follows the completion marker: no VSwitch id and no stack output.
+        transcript = "● Confirm and select (4/5)\n✔ Pipeline completed\n"
+        events = [invalid_pick, valid_pick]
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("selection-invalid-then-valid", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: pipeline completed"] is True
+    assert outcome["acceptance: VSwitch evidence found in PTY transcript"] is False
+
+
+def test_acceptance_rejects_rollback_security_group_target_from_echo_only() -> None:
+    """The echoed rollback prompt alone must not satisfy the post-rollback security group check."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    prompt = opts.rollback_prompt
+    pty_output = f"● Evaluate candidates (3/5)\n{prompt}\n● Intent parsing (1/5)\n"
+
+    class FakePty:
+        # Nothing follows the echoed prompt except the step 1 header.
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": prompt,
+                "transcript_offset": pty_output.find(prompt),
+            }
+        ]
+
+    outcome: dict[str, bool] = {}
+    runner._apply_acceptance_checks("rollback-step3", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: rollback produced post-interrupt pipeline progress"] is True
+    assert outcome["acceptance: post-rollback target is security group"] is False
+
+
+def test_acceptance_records_rollback_security_group_target_after_prompt() -> None:
+    """SecurityGroup output printed after the rollback prompt passes both post-rollback target checks."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    prompt = opts.rollback_prompt
+    pty_output = (
+        "● Evaluate candidates (3/5)\n"
+        f"{prompt}\n"
+        "● Intent parsing (1/5)\n"
+        "Step Intent parsing completed. Conclusion submitted.\n"
+        "本轮目标资源为 ALIYUN::ECS::SecurityGroup 安全组。\n"
+    )
+
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": prompt,
+                "transcript_offset": pty_output.find(prompt),
+            }
+        ]
+
+    outcome: dict[str, bool] = {}
+
+    runner._apply_acceptance_checks("rollback-step3", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: post-rollback target is security group"] is True
+    assert outcome["acceptance: post-rollback target is not VSwitch"] is True
+
+
+def test_post_rollback_security_group_target_waits_for_slow_candidate_evaluation() -> None:
+    """With --stream-timeout 600, expect a single expect_any call that uses a 300.0 timeout."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud", "--stream-timeout", "600"])
+    seen_timeouts: list[float] = []
+
+    class FakePty:
+        def expect_any(self, patterns, *, description, timeout):
+            seen_timeouts.append(timeout)
+            return patterns[0]
+
+    outcome: dict[str, bool] = {}
+    runner._expect_post_rollback_security_group_target(FakePty(), opts, outcome)
+
+    assert seen_timeouts == [300.0]
+    assert outcome["post-rollback security group target visible"] is True
+
+
+def test_acceptance_allows_post_rollback_forbidden_vswitch_context() -> None:
+    """Post-rollback output that names VSwitch only as forbidden still passes both target checks."""
+    runner = _load_runner()
+    opts = runner.parse_args(["--allow-real-cloud"])
+    prompt = opts.rollback_prompt
+    pty_output = (
+        "● Architecture planning (2/5)\n"
+        f"{prompt}\n"
+        "● Intent parsing (1/5)\n"
+        "Step Intent parsing completed. Conclusion submitted.\n"
+        "resource_intents: SecurityGroup=create, VSwitch=forbid。\n"
+        "在用户指定的已有VPC中创建一个安全组，安全组挂载在该VPC下，不创建新的VSwitch。\n"
+    )
+
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": prompt,
+                "transcript_offset": pty_output.find(prompt),
+            }
+        ]
+
+    outcome: dict[str, bool] = {}
+
+    runner._apply_acceptance_checks("rollback-step2", opts, FakePty(), outcome)
+
+    assert outcome["acceptance: post-rollback target is security group"] is True
+    assert outcome["acceptance: post-rollback target is not VSwitch"] is True
+
+
+def test_acceptance_allows_post_rollback_change_reason_mentions_old_vswitch_target() -> None:
+    """A change reason that names the old VSwitch target still passes both target checks."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        f"{args.rollback_prompt}\n"
+        "╭─ Interrupt handling ─╮\n"
+        "用户明确要求回退到intent_parsing并将需求从创建 VSwitch\n"
+        "改为创建安全组，意图发生根本改变。\n"
+        "● Intent parsing (1/5)\n"
+        "Step Intent parsing completed. Conclusion submitted.\n"
+        "● Evaluate candidates (3/5)\n"
+        "✓ 已有VPC创建安全组: Completed\n"
+    )
+    prompt_offset = pty_output.find(args.rollback_prompt)
+
+    # Minimal PTY stand-in exposing just `transcript` and `events`.
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": args.rollback_prompt,
+                "transcript_offset": prompt_offset,
+            }
+        ]
+
+    checks: dict[str, bool] = {}
+    runner._apply_acceptance_checks("rollback-step4-selection", args, FakePty(), checks)
+
+    assert checks["acceptance: post-rollback target is security group"] is True
+    assert checks["acceptance: post-rollback target is not VSwitch"] is True
+
+
+def test_acceptance_allows_post_rollback_english_no_vswitch_context() -> None:
+    """An English "with no VSwitch" planning note still passes both target checks."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        f"{args.rollback_prompt}\n"
+        "● Intent parsing (1/5)\n"
+        "Step Intent parsing completed. Conclusion submitted.\n"
+        "● Architecture planning (2/5)\n"
+        "create a security group in an existing VPC, with no VSwitch. Only one candidate is needed.\n"
+        "● Evaluate candidates (3/5)\n"
+        "✓ 已有VPC新建安全组: Completed\n"
+    )
+    prompt_offset = pty_output.find(args.rollback_prompt)
+
+    # Minimal PTY stand-in exposing just `transcript` and `events`.
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": args.rollback_prompt,
+                "transcript_offset": prompt_offset,
+            }
+        ]
+
+    checks: dict[str, bool] = {}
+    runner._apply_acceptance_checks("rollback-step4-selection", args, FakePty(), checks)
+
+    assert checks["acceptance: post-rollback target is security group"] is True
+    assert checks["acceptance: post-rollback target is not VSwitch"] is True
+
+
+def test_acceptance_rejects_post_rollback_positive_vswitch_target() -> None:
+    """A VSwitch target stated after the rollback prompt fails the not-VSwitch acceptance check."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud"])
+    pty_output = (
+        "● Architecture planning (2/5)\n"
+        f"{args.rollback_prompt}\n"
+        "● Intent parsing (1/5)\n"
+        "Step Intent parsing completed. Conclusion submitted.\n"
+        "本轮目标资源为 ALIYUN::ECS::VSwitch 交换机。\n"
+    )
+    prompt_offset = pty_output.find(args.rollback_prompt)
+
+    # Minimal PTY stand-in exposing just `transcript` and `events`.
+    class FakePty:
+        transcript = pty_output
+        events = [
+            {
+                "type": "sendline",
+                "text": args.rollback_prompt,
+                "transcript_offset": prompt_offset,
+            }
+        ]
+
+    checks: dict[str, bool] = {}
+    runner._apply_acceptance_checks("rollback-step2", args, FakePty(), checks)
+
+    assert checks["acceptance: post-rollback target is not VSwitch"] is False
+
+
+def test_run_with_pty_writes_acceptance_checks_after_callback_failure(monkeypatch, tmp_path: Path) -> None:
+    """A raising scenario callback still yields exit code 1 and a summary naming the transcript check."""
+    runner = _load_runner()
+
+    class FakePty:
+        def __init__(self, *, args, run_dir, cwd, env):
+            self.transcript = "captured transcript"
+            self.events = []
+
+        def spawn(self, *, extra_args=None):
+            pass
+
+        def terminate(self, *, force=False):
+            pass
+
+    def failing_callback(_pty, _checks):
+        raise RuntimeError("boom")
+
+    monkeypatch.setattr(runner, "ReplPty", FakePty)
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+
+    exit_code = runner._run_with_pty(args, "scenario1", failing_callback)
+    assert exit_code == 1
+    assert "acceptance: PTY transcript captured" in (tmp_path / "summary.json").read_text(encoding="utf-8")
+
+
+def test_scenario1_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """Scenario 1 exits 0 after sending the stack-owned prompt, default selection, follow-up and /exit."""
+    runner = _load_runner()
+    actions: list[tuple[str, str]] = []
+
+    class FakePty:
+        def __init__(self, *, args, run_dir, cwd, env):
+            owned_stack = runner._scenario_stack_name(run_dir, "scenario1")
+            self.run_dir = run_dir
+            self.env = env
+            self.events = []
+            self.transcript = (
+                "● Confirm and select (4/5)\n"
+                "✔ Pipeline completed\n"
+                "交换机 ID   vsw-bp1234567890\n"
+                f"{args.normal_followup_prompt}\n"
+                "刚才创建了一个 VSwitch 交换机。\n"
+            )
+            # One observed ROS stack, created under the scenario-owned stack name.
+            created_stack = {
+                "provider": "ros",
+                "resource_type": "stack",
+                "resource_id": "normal-stack-id",
+                "resource_name": owned_stack,
+                "observed_action": "CreateStack",
+            }
+            self.cleanup_ledger = {"observed_resources": [created_stack]}
+            self.ros_stack_states = {
+                "normal-stack-id": {"status": "CREATE_COMPLETE", "not_found": False, "stack_name": owned_stack}
+            }
+
+        def spawn(self, *, extra_args=None):
+            actions.append(("spawn", ""))
+
+        def sendline(self, text):
+            actions.append(("sendline", text))
+            sent_at = self.transcript.find(text)
+            self.events.append({"type": "sendline", "text": text, "transcript_offset": sent_at})
+
+        def expect_any(self, patterns, *, description, timeout):
+            actions.append(("expect", description))
+            return patterns[0]
+
+        def expect_optional(self, patterns, *, description, timeout):
+            actions.append(("expect_optional", description))
+            return True
+
+        def send(self, text, *, label="send"):
+            actions.append((label, text))
+
+        def terminate(self, *, force=False):
+            actions.append(("terminate", str(force)))
+
+    monkeypatch.setattr(runner, "ReplPty", FakePty)
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    stack_owned_initial = runner._stack_creating_prompt(args.initial_prompt, tmp_path, "scenario1")
+    teardown_stack_name = runner._scenario_stack_name(tmp_path, "scenario1")
+    _install_observed_stack_teardown_fakes(monkeypatch, runner, stack_name=teardown_stack_name)
+
+    assert runner.run_scenario1(args, "scenario1") == 0
+
+    # Every key interaction must have gone through the fake PTY.
+    for expected_action in (
+        ("sendline", stack_owned_initial),
+        ("select-default-candidate", f"{runner.DEFAULT_SELECTION_PROMPT}\r"),
+        ("sendline", runner.DEFAULT_NORMAL_FOLLOWUP_PROMPT),
+        ("sendline", "/exit"),
+    ):
+        assert expected_action in actions
+
+
+def test_image_initial_pastes_static_prompt_image(monkeypatch, tmp_path: Path) -> None:
+    """The image-initial scenario pastes the `initial` fixture instead of typing the initial prompt."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = "● Confirm and select (4/5)\n✔ Pipeline completed\n交换机 ID   vsw-bp1234567890\n"
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario="image-initial")
+
+    assert runner.run_image_initial(args, "image-initial") == 0
+
+    # Compare only the interaction kinds that define this flow, in the order they happened.
+    tracked_kinds = {"expect", "sendline", "paste-image-fixture", "select-default-candidate"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("paste-image-fixture", "initial"),
+        ("sendline", runner._stack_name_constraint(tmp_path, "image-initial")),
+        ("expect", "pipeline started"),
+        ("expect", "candidate selection visible"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed after image initial"),
+        ("sendline", "/exit"),
+    ]
+    # The plain-text initial prompt must never be typed in this scenario.
+    assert ("sendline", args.initial_prompt) not in actions
+
+
+def test_image_ask_waiting_resume_pastes_static_answer_image(monkeypatch, tmp_path: Path) -> None:
+    """After --continue, the replayed question is answered with the `ask-first-answer` image fixture."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        "● Ask user question\n"
+        "● Ask user question\n"
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        "交换机 ID   vsw-bp1234567890\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario="image-ask-waiting-resume")
+
+    assert runner.run_image_ask_waiting_resume(args, "image-ask-waiting-resume") == 0
+
+    # Compare only the interaction kinds that define this flow, in the order they happened.
+    tracked_kinds = {"expect", "spawn", "terminate", "sendline", "paste-image-fixture", "select-default-candidate"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("spawn", ""),
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", args.ask_prompt),
+        ("expect", "ask question visible before kill"),
+        ("terminate", "True"),
+        ("spawn", "--continue"),
+        ("expect", "ask question replayed"),
+        ("expect", "ask image answer input ready after resume"),
+        ("paste-image-fixture", "ask-first-answer"),
+        ("sendline", runner._stack_name_constraint(tmp_path, "image-ask-waiting-resume")),
+        ("expect", "pipeline continued after ask image resume"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed after ask image resume"),
+        ("sendline", "/exit"),
+        ("terminate", "False"),
+    ]
+    # The typed text answer must never be sent in this scenario.
+    assert ("sendline", args.ask_answer) not in actions
+
+
+def test_image_selection_waiting_resume_starts_with_image_and_recovers_selection(monkeypatch, tmp_path: Path) -> None:
+    """Image selection resume starts from the image fixture and recovers the selection after --continue."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        "● Confirm and select (4/5)\n● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        "交换机 ID   vsw-bp1234567890\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario="image-selection-waiting-resume")
+
+    assert runner.run_image_selection_waiting_resume(args, "image-selection-waiting-resume") == 0
+
+    tracked_kinds = {"expect", "spawn", "terminate", "sendline", "paste-image-fixture", "select-default-candidate"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("spawn", ""),
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("paste-image-fixture", "initial"),
+        ("sendline", runner._stack_name_constraint(tmp_path, "image-selection-waiting-resume")),
+        ("expect", "candidate selection visible before image resume kill"),
+        ("terminate", "True"),
+        ("spawn", "--continue"),
+        ("expect", "candidate selection replayed after image resume"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed after image selection resume"),
+        ("sendline", "/exit"),
+        ("terminate", "False"),
+    ]
+
+
+def test_image_normal_handoff_pastes_static_followup_image(monkeypatch, tmp_path: Path) -> None:
+    """After the pipeline completes, the follow-up is submitted as the `normal-followup` image fixture."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        "Pipeline completed. Normal chat is now active.\n"
+        "[Image #1]\n"
+        "刚才创建了一个 VSwitch 交换机。\n"
+        "交换机 ID   vsw-bp1234567890\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario="image-normal-handoff")
+    stack_owned_initial = runner._stack_creating_prompt(args.initial_prompt, tmp_path, "image-normal-handoff")
+
+    assert runner.run_image_normal_handoff(args, "image-normal-handoff") == 0
+
+    # Compare only the interaction kinds that define this flow, in the order they happened.
+    tracked_kinds = {"expect", "sendline", "paste-image-fixture", "submit-image", "select-default-candidate"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", stack_owned_initial),
+        ("expect", "pipeline started"),
+        ("expect", "candidate selection visible"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline fully completed"),
+        ("expect", "normal prompt input ready"),
+        ("paste-image-fixture", "normal-followup"),
+        ("submit-image", "\r"),
+        ("expect", "normal image follow-up answered created VSwitch"),
+        ("sendline", "/exit"),
+    ]
+    # The typed follow-up prompt must never be sent in this scenario.
+    assert ("sendline", args.normal_followup_prompt) not in actions
+
+
+def test_image_interrupt_pastes_static_rollback_image(monkeypatch, tmp_path: Path) -> None:
+    """The interrupt scenario submits the rollback request as the `rollback-interrupt` image fixture."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        "● Evaluate candidates (3/5)\n"
+        "[Image #1]\n"
+        "● Intent parsing (1/5)\n"
+        "目标资源为 ALIYUN::ECS::SecurityGroup 安全组。\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario="image-interrupt")
+
+    assert runner.run_image_interrupt(args, "image-interrupt") == 0
+
+    # Compare only the interaction kinds that define this flow, in the order they happened.
+    tracked_kinds = {"expect", "send-esc", "sendline", "paste-image-fixture", "submit-image"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", args.initial_prompt),
+        ("expect", "candidate evaluation visible"),
+        ("expect", "parallel interrupt input ready"),
+        ("send-esc", "\x1b"),
+        ("expect", "parallel interrupt text input ready"),
+        ("paste-image-fixture", "rollback-interrupt"),
+        ("submit-image", "\r"),
+        ("expect", "post-rollback pipeline progress visible"),
+        ("expect", "post-rollback security group target visible"),
+        ("sendline", "/exit"),
+    ]
+    # The typed rollback prompt must never be sent in this scenario.
+    assert ("sendline", args.rollback_prompt) not in actions
+
+
+def test_rollback_step3_sends_rollback_prompt_without_waiting_for_visible_interrupt(
+    monkeypatch, tmp_path: Path
+) -> None:
+    """Rollback at step 3 sends the rollback prompt without waiting on the visible-interrupt prompts."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+
+    class FakePty:
+        def __init__(self, *, args, run_dir, cwd, env):
+            self.transcript = (
+                "● Evaluate candidates (3/5)\n"
+                "回退到 intent_parsing，选择一个已有vpc，创建一个安全组\n"
+                "● Intent parsing (1/5)\n"
+                "目标资源为 ALIYUN::ECS::SecurityGroup 安全组。\n"
+            )
+            self.events = []
+
+        def spawn(self, *, extra_args=None):
+            actions.append(("spawn", ""))
+
+        def sendline(self, text):
+            actions.append(("sendline", text))
+            sent_at = self.transcript.find("● Intent parsing (1/5)") if text == args.rollback_prompt else 0
+            self.events.append({"type": "sendline", "text": text, "transcript_offset": sent_at})
+
+        def expect_any(self, patterns, *, description, timeout):
+            # The scenario must not wait on these prompts; fail loudly if it does.
+            if description in {"candidate evaluation activity visible", "interrupt input visible"}:
+                raise AssertionError(description)
+            actions.append(("expect", description))
+            return patterns[0]
+
+        def expect_optional(self, patterns, *, description, timeout):
+            actions.append(("expect_optional", description))
+            return True
+
+        def send(self, text, *, label="send"):
+            actions.append((label, text))
+            self.events.append({"type": label, "transcript_offset": self.transcript.find("回退到")})
+
+        def terminate(self, *, force=False):
+            actions.append(("terminate", str(force)))
+
+    monkeypatch.setattr(runner, "ReplPty", FakePty)
+    assert runner.run_rollback_step3(args, "rollback-step3") == 0
+
+    assert [(kind, text) for kind, text in actions if kind in {"expect", "send-esc"}] == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("expect", "candidate evaluation visible"),
+        ("expect", "parallel interrupt input ready"),
+        ("send-esc", "\x1b"),
+        ("expect", "parallel interrupt text input ready"),
+        ("expect", "post-rollback pipeline progress visible"),
+        ("expect", "post-rollback security group target visible"),
+    ]
+    assert ("sendline", args.rollback_prompt) in actions
+
+
+def test_rollback_step3_waits_for_interrupt_text_input_ready_after_escape(monkeypatch, tmp_path: Path) -> None:
+    """Rollback at step 3 waits for the interrupt text input after ESC before sending the prompt."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+
+    class FakePty:
+        def __init__(self, *, args, run_dir, cwd, env):
+            self.transcript = (
+                "● Evaluate candidates (3/5)\n"
+                "回退到 intent_parsing，选择一个已有vpc，创建一个安全组\n"
+                "● Intent parsing (1/5)\n"
+                "目标资源为 ALIYUN::ECS::SecurityGroup 安全组。\n"
+            )
+            self.events = []
+
+        def spawn(self, *, extra_args=None):
+            actions.append(("spawn", ""))
+
+        def sendline(self, text):
+            actions.append(("sendline", text))
+            sent_at = self.transcript.find("● Intent parsing (1/5)") if text == args.rollback_prompt else 0
+            self.events.append({"type": "sendline", "text": text, "transcript_offset": sent_at})
+
+        def expect_any(self, patterns, *, description, timeout):
+            actions.append(("expect", description))
+            return patterns[0]
+
+        def expect_optional(self, patterns, *, description, timeout):
+            actions.append(("expect_optional", description))
+            return True
+
+        def send(self, text, *, label="send"):
+            actions.append((label, text))
+            self.events.append({"type": label, "transcript_offset": self.transcript.find("回退到")})
+
+        def terminate(self, *, force=False):
+            actions.append(("terminate", str(force)))
+
+    monkeypatch.setattr(runner, "ReplPty", FakePty)
+    assert runner.run_rollback_step3(args, "rollback-step3") == 0
+
+    esc_at = actions.index(("send-esc", "\x1b"))
+    ready_at = actions.index(("expect", "parallel interrupt text input ready"))
+    assert esc_at < ready_at
+    assert ready_at < actions.index(("sendline", args.rollback_prompt))
+
+
+def test_rollback_step2_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """Rollback at step 2 issues the expected expect/ESC/sendline sequence and exits 0."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        f"● Architecture planning (2/5)\n✎ {args.rollback_prompt}\n"
+        "● Intent parsing (1/5)\n目标资源为 ALIYUN::ECS::SecurityGroup 安全组。\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions)
+
+    assert runner.run_rollback_step2(args, "rollback-step2") == 0
+
+    observed_flow = [(kind, text) for kind, text in actions if kind in {"expect", "send-esc", "sendline"}]
+    assert observed_flow == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", args.initial_prompt),
+        ("expect", "architecture planning visible"),
+        ("send-esc", "\x1b"),
+        ("expect", "interrupt input visible"),
+        ("expect", "interrupt prompt input ready"),
+        ("sendline", args.rollback_prompt),
+        ("expect", "post-rollback pipeline progress visible"),
+        ("expect", "post-rollback security group target visible"),
+        ("sendline", "/exit"),
+    ]
+
+
+def test_rollback_step4_selection_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """Rollback from candidate selection issues the expected expect/ESC/sendline sequence and exits 0."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        f"● Confirm and select (4/5)\n{args.rollback_prompt}\n"
+        "● Intent parsing (1/5)\n目标资源为 ALIYUN::ECS::SecurityGroup 安全组。\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions)
+
+    assert runner.run_rollback_step4_selection(args, "rollback-step4-selection") == 0
+
+    observed_flow = [(kind, text) for kind, text in actions if kind in {"expect", "send-esc", "sendline"}]
+    assert observed_flow == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", args.initial_prompt),
+        ("expect", "candidate selection visible"),
+        ("expect", "candidate selection input ready"),
+        ("send-esc", "\x1b"),
+        ("expect", "candidate selection interrupt text input ready"),
+        ("sendline", args.rollback_prompt),
+        ("expect", "post-rollback pipeline progress visible"),
+        ("expect", "post-rollback security group target visible"),
+        ("sendline", "/exit"),
+    ]
+
+
+def test_evaluate_resume_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """Evaluate resume force-terminates during evaluation, continues, and completes the pipeline."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        "● Evaluate candidates (3/5)\n"
+        "● Evaluate candidates (3/5)\n"
+        f"{args.evaluate_resume_continue_prompt}\n"
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        "交换机 ID   vsw-bp1234567890\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario="evaluate-resume")
+    stack_owned_initial = runner._stack_creating_prompt(args.initial_prompt, tmp_path, "evaluate-resume")
+
+    assert runner.run_evaluate_resume(args, "evaluate-resume") == 0
+
+    # Compare only the interaction kinds that define this flow, in the order they happened.
+    tracked_kinds = {"expect", "spawn", "terminate", "sendline", "select-default-candidate"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("spawn", ""),
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", stack_owned_initial),
+        ("expect", "candidate evaluation visible"),
+        ("expect", "parallel interrupt input ready"),
+        ("terminate", "True"),
+        ("spawn", "--continue"),
+        ("expect", "candidate evaluation replayed after resume"),
+        ("expect", "evaluate resume prompt input ready"),
+        ("sendline", args.evaluate_resume_continue_prompt),
+        ("expect", "candidate selection visible after resume continue"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed after evaluate resume"),
+        ("sendline", "/exit"),
+        ("terminate", "False"),
+    ]
+
+
+def test_ask_waiting_resume_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """Ask-waiting resume force-terminates at the question, continues, answers, and completes."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    stack_owned_answer = runner._stack_creating_prompt(args.ask_answer, tmp_path, "ask-waiting-resume")
+    pty_output = (
+        "● Ask user question\n"
+        "● Ask user question\n"
+        f"{stack_owned_answer}\n"
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        "交换机 ID   vsw-bp1234567890\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario="ask-waiting-resume")
+
+    assert runner.run_ask_waiting_resume(args, "ask-waiting-resume") == 0
+
+    tracked_kinds = {"expect", "spawn", "terminate", "sendline", "select-default-candidate"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("spawn", ""),
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", args.ask_prompt),
+        ("expect", "ask question visible before kill"),
+        ("terminate", "True"),
+        ("spawn", "--continue"),
+        ("expect", "ask question replayed"),
+        ("expect", "ask answer input ready after resume"),
+        ("sendline", stack_owned_answer),
+        ("expect", "pipeline continued after ask resume"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed after ask resume"),
+        ("sendline", "/exit"),
+        ("terminate", "False"),
+    ]
+
+
+def test_selection_invalid_then_valid_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """An invalid candidate choice followed by the default choice still completes the pipeline."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    scenario = "selection-invalid-then-valid"
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "✔ Pipeline completed\n"
+        "交换机 ID   vsw-bp1234567890\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions, scenario=scenario)
+    stack_owned_initial = runner._stack_creating_prompt(args.initial_prompt, tmp_path, scenario)
+
+    assert runner.run_selection_invalid_then_valid(args, scenario) == 0
+
+    # Compare only the interaction kinds that define this flow, in the order they happened.
+    tracked_kinds = {"expect", "sendline", "select-invalid-candidate", "select-default-candidate"}
+    observed_flow = [(kind, text) for kind, text in actions if kind in tracked_kinds]
+    assert observed_flow == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", stack_owned_initial),
+        ("expect", "candidate selection visible"),
+        ("select-invalid-candidate", "9"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed"),
+        ("sendline", "/exit"),
+    ]
+
+
+def test_rollback_step5_cleanup_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """Step-5 cleanup redeploys after rollback; `deleted_stack_ids` ends up holding only the second stack."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "first-stack(first-stack-id) CREATE_COMPLETE\n"
+        "● Confirm and select (4/5)\n"
+        "second-stack(second-stack-id) CREATE_COMPLETE\n"
+        "检测到 1 个回滚残留资源，开始清理流程。\n"
+        "↺ 回滚清理 [完成] first-stack · 资源栈 first-stack-id · DELETE_COMPLETE\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions)
+
+    def fake_network_target(_args, _run_dir):
+        return runner.CleanupNetworkTarget(
+            vpc_id="vpc-test",
+            vpc_cidr="172.16.0.0/12",
+            zone_id="cn-hangzhou-h",
+            vswitch_cidr="172.31.255.0/24",
+            rollback_vswitch_cidr="172.31.254.0/24",
+        )
+
+    def fake_latest_stack_id(_pty, *, exclude):
+        return "second-stack-id" if "first-stack-id" in exclude else "first-stack-id"
+
+    monkeypatch.setattr(runner, "_ensure_cleanup_network_target", fake_network_target)
+    monkeypatch.setattr(runner, "_wait_for_latest_observed_stack_id", lambda *_, **__: "first-stack-id")
+    monkeypatch.setattr(runner, "_cleanup_target_stack_ids", lambda *_, **__: ["first-stack-id"])
+    monkeypatch.setattr(runner, "_wait_for_cleanup_resource_status", lambda *_, **__: None)
+    monkeypatch.setattr(runner, "_latest_observed_stack_id", fake_latest_stack_id)
+    deleted_stack_ids = _install_cleanup_teardown_fakes(monkeypatch, runner, tmp_path)
+
+    assert runner.run_rollback_step5_cleanup(args, "rollback-step5-cleanup") == 0
+    assert deleted_stack_ids == ["second-stack-id"]
+
+    tracked_kinds = {"expect", "send-esc", "sendline", "select-default-candidate"}
+    observed_flow = [
+        (kind, text)
+        for kind, text in actions
+        if kind in tracked_kinds or (kind, text) == ("expect_optional", "cleanup completed")
+    ]
+    assert observed_flow == [
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", runner._cleanup_pipeline_prompt(args, tmp_path)),
+        ("expect", "initial candidate selection visible"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "first stack create started"),
+        ("send-esc", "\x1b"),
+        ("expect", "deploying interrupt input ready"),
+        ("sendline", runner._cleanup_rollback_prompt(args, tmp_path)),
+        ("expect", "post-rollback candidate selection visible"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed after second deployment"),
+        ("sendline", args.normal_followup_prompt),
+        ("expect", "cleanup started"),
+        ("expect_optional", "cleanup completed"),
+        ("expect", "post-cleanup prompt input ready"),
+        ("sendline", "/exit"),
+    ]
+
+
+def test_rollback_step5_cleanup_recovery_runs_expected_terminal_flow(monkeypatch, tmp_path: Path) -> None:
+    """Step-5 cleanup recovery resumes after a forced restart; `deleted_stack_ids` holds only the second stack."""
+    runner = _load_runner()
+    args = runner.parse_args(["--allow-real-cloud", "--run-dir", str(tmp_path)])
+    actions: list[tuple[str, str]] = []
+    pty_output = (
+        "● Confirm and select (4/5)\n"
+        "first-stack(first-stack-id) CREATE_COMPLETE\n"
+        "● Confirm and select (4/5)\n"
+        "second-stack(second-stack-id) CREATE_COMPLETE\n"
+        "检测到 1 个回滚残留资源，开始清理流程。\n"
+        "↺ 回滚清理恢复：1 条记录，1 条进行中。\n"
+        "↺ 回滚清理 [完成] first-stack · 资源栈 first-stack-id · DELETE_COMPLETE\n"
+    )
+    _install_flow_fake_pty(monkeypatch, runner, pty_output, actions)
+
+    def fake_network_target(_args, _run_dir):
+        return runner.CleanupNetworkTarget(
+            vpc_id="vpc-test",
+            vpc_cidr="172.16.0.0/12",
+            zone_id="cn-hangzhou-h",
+            vswitch_cidr="172.31.255.0/24",
+            rollback_vswitch_cidr="172.31.254.0/24",
+        )
+
+    def fake_latest_stack_id(_pty, *, exclude):
+        return "second-stack-id" if "first-stack-id" in exclude else "first-stack-id"
+
+    monkeypatch.setattr(runner, "_ensure_cleanup_network_target", fake_network_target)
+    monkeypatch.setattr(runner, "_wait_for_latest_observed_stack_id", lambda *_, **__: "first-stack-id")
+    monkeypatch.setattr(runner, "_cleanup_target_stack_ids", lambda *_, **__: ["first-stack-id"])
+    monkeypatch.setattr(runner, "_latest_observed_stack_id", fake_latest_stack_id)
+    deleted_stack_ids = _install_cleanup_teardown_fakes(monkeypatch, runner, tmp_path)
+
+    assert runner.run_rollback_step5_cleanup_recovery(args, "rollback-step5-cleanup-recovery") == 0
+    assert deleted_stack_ids == ["second-stack-id"]
+
+    tracked_kinds = {"expect", "spawn", "terminate", "send-esc", "sendline", "select-default-candidate"}
+    observed_flow = [
+        (kind, text)
+        for kind, text in actions
+        if kind in tracked_kinds or (kind, text) == ("expect_optional", "cleanup completed")
+    ]
+    assert observed_flow == [
+        ("spawn", ""),
+        ("expect", "initial prompt"),
+        ("expect", "prompt input ready"),
+        ("sendline", runner._cleanup_pipeline_prompt(args, tmp_path)),
+        ("expect", "initial candidate selection visible"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "first stack create started"),
+        ("send-esc", "\x1b"),
+        ("expect", "deploying interrupt input ready"),
+        ("sendline", runner._cleanup_rollback_prompt(args, tmp_path)),
+        ("expect", "post-rollback candidate selection visible"),
+        ("select-default-candidate", f"{args.selection_prompt}\r"),
+        ("expect", "pipeline completed after second deployment"),
+        ("sendline", args.normal_followup_prompt),
+        ("expect", "cleanup started before kill"),
+        ("terminate", "True"),
+        ("spawn", "--continue"),
+        ("expect", "cleanup resume summary"),
+        ("expect_optional", "cleanup completed"),
+        ("expect", "post-cleanup prompt input ready"),
+        ("sendline", "/exit"),
+        ("terminate", "False"),
+    ]
diff --git a/tests/services/test_context_manager.py b/tests/services/test_context_manager.py
index 83bf6ff8..5489bb89 100644
--- a/tests/services/test_context_manager.py
+++ b/tests/services/test_context_manager.py
@@ -1,6 +1,11 @@
 from types import SimpleNamespace
 
 from iac_code.agent.message import TextBlock, ToolResultBlock, ToolUseBlock
+from iac_code.pipeline.engine.cleanup import (
+    CLEANUP_PROMPT_METADATA_TYPE,
+    create_cleanup_prompt_message,
+    is_cleanup_prompt_message,
+)
 from iac_code.services.context_manager import ContextManager, get_context_window_config
 
 
@@ -133,6 +138,50 @@ def test_build_compaction_prompt_excludes_recalled_memory_messages(self):
         assert "hidden memory body" not in prompt
         assert "hidden-topic.md" not in prompt
 
+    def test_build_compaction_prompt_excludes_cleanup_prompt_messages(self):
+        cm = ContextManager(system_prompt="sys", model="qwen")
+        cm.add_raw_message(  # raw dict tagged with the cleanup-prompt metadata type
+            {
+                "role": "user",
+                "content": "cleanup hidden prompt",
+                "metadata": {"type": CLEANUP_PROMPT_METADATA_TYPE, "source": "pipeline_cleanup"},
+            }
+        )
+        for i in range(6):  # six ordinary user/assistant turns after the tagged message
+            cm.add_user_message(f"User message {i}")
+            cm.add_assistant_message([TextBlock(text=f"Assistant response {i}")])
+
+        prompt = cm.build_compaction_prompt()
+
+        assert "User message 0" in prompt  # an ordinary turn is part of the prompt
+        assert "cleanup hidden prompt" not in prompt  # the tagged message is left out
+
+    def test_apply_compaction_preserves_cleanup_prompt_messages(self):
+        cm = ContextManager(system_prompt="sys", model="qwen")
+        cleanup_message = create_cleanup_prompt_message("cleanup hidden prompt")
+        cm.add_raw_message(cleanup_message.to_dict())  # added first, before the ordinary turns
+        for i in range(6):
+            cm.add_user_message(f"User message {i}")
+            cm.add_assistant_message([TextBlock(text=f"Assistant response {i}")])
+
+        cm.apply_compaction("summary")
+
+        messages = cm.get_messages()
+        assert any(  # a cleanup prompt with the original text must still be present
+            is_cleanup_prompt_message(message) and message.content == "cleanup hidden prompt" for message in messages
+        )
+        assert messages[0].content == "[Conversation Summary]\nsummary"  # summary is the first message
+
+    def test_remove_cleanup_prompt_messages_removes_hidden_prompts(self):
+        cm = ContextManager(system_prompt="sys", model="qwen")
+        cm.add_user_message("real prompt")  # ordinary message that must survive
+        cm.add_raw_message(create_cleanup_prompt_message("cleanup hidden prompt").to_dict())
+
+        removed = cm.remove_cleanup_prompt_messages()  # return value is checked as a count below
+
+        assert removed == 1  # exactly one cleanup prompt was added above
+        assert [message.content for message in cm.get_messages()] == ["real prompt"]
+
     def test_apply_compaction_preserves_recent(self):
         cm = ContextManager(system_prompt="sys", model="qwen")
         for i in range(6):
@@ -298,3 +347,18 @@ def test_compaction_surfaced_files_come_from_retained_metadata_only():
     cm.apply_compaction("Summary mentions old.md and recent.md")
 
     assert cm.get_surfaced_memory_files() == {"recent.md"}
+
+
+def test_add_raw_message_preserves_metadata():
+    cm = ContextManager(system_prompt="sys", model="qwen")
+
+    msg = cm.add_raw_message(  # the returned message is inspected directly below
+        {
+            "role": "user",
+            "content": "hidden cleanup prompt",
+            "metadata": {"type": CLEANUP_PROMPT_METADATA_TYPE, "source": "pipeline_cleanup"},
+        }
+    )
+
+    assert msg.metadata == {"type": CLEANUP_PROMPT_METADATA_TYPE, "source": "pipeline_cleanup"}
+    assert cm.get_messages()[0].metadata["type"] == CLEANUP_PROMPT_METADATA_TYPE  # stored copy as well
diff --git a/tests/services/test_session_index.py b/tests/services/test_session_index.py
index 503b1046..1d395e3d 100644
--- a/tests/services/test_session_index.py
+++ b/tests/services/test_session_index.py
@@ -2,12 +2,16 @@
 
 from __future__ import annotations
 
+import json
 import os
+import subprocess
+import sys
 import time
 
 import pytest
 
 from iac_code.agent.message import Message, TextBlock, ToolResultBlock, create_recalled_memory_message
+from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
 from iac_code.services.session_index import (
     SessionIndex,
     extract_first_json_string_field,
@@ -131,6 +135,37 @@ def test_skips_recalled_memory_user_messages(self, storage):
 
         assert meta.first_prompt == "real prompt"
 
+    def test_cleanup_prompt_last_prompt_meta_is_ignored(self, storage):
+        cwd = "/proj/cp-last"
+        storage.append(cwd, "scp-last", Message(role="user", content="real prompt"), git_branch=None)
+        storage.append_meta(  # add a "last-prompt" meta record after the real user message
+            cwd,
+            "scp-last",
+            {
+                "type": "last-prompt",  # the text below is a rollback cleanup notice written in Chinese
+                "last_prompt": "检测到 pipeline rollback 后仍需要清理的云资源。只有确认 DELETE_COMPLETE 才算完成。",
+            },
+        )
+
+        meta = read_lite_metadata(storage.session_path(cwd, "scp-last"))
+
+        assert meta.last_prompt is None  # the cleanup text is not reported as the last prompt
+        assert meta.first_prompt == "real prompt"  # first prompt is still the real one
+
+    def test_skips_cleanup_prompt_user_messages(self, storage):
+        cwd = "/proj/cp-first"
+        storage.append(  # the cleanup prompt is written before the real user prompt
+            cwd,
+            "scp-first",
+            create_cleanup_prompt_message("cleanup hidden prompt"),
+            git_branch=None,
+        )
+        storage.append(cwd, "scp-first", Message(role="user", content="real prompt"), git_branch=None)
+
+        meta = read_lite_metadata(storage.session_path(cwd, "scp-first"))
+
+        assert meta.first_prompt == "real prompt"  # the earlier cleanup prompt is skipped
+
 
 # ---------------------------------------------------------------------------
 # SessionIndex
@@ -138,6 +173,20 @@ def test_skips_recalled_memory_user_messages(self, storage):
 
 
 class TestSessionIndex:
+    def test_session_services_do_not_import_pipeline_engine_modules(self):  # checked in a child interpreter
+        script = """
+import json
+import sys
+
+import iac_code.services.session_index
+import iac_code.services.session_storage
+
+print(json.dumps(sorted(name for name in sys.modules if name.startswith("iac_code.pipeline.engine"))))
+"""
+        result = subprocess.run([sys.executable, "-c", script], check=True, capture_output=True, text=True)
+
+        assert json.loads(result.stdout) == []  # no iac_code.pipeline.engine* name ended up in sys.modules
+
     def test_list_for_cwd_filters_by_project(self, tmp_path):
         storage = SessionStorage(projects_dir=tmp_path)
         storage.append("/a", "id-a", Message(role="user", content="one"), git_branch=None)
@@ -179,6 +228,79 @@ def test_directory_session_metadata_name_takes_precedence(self, tmp_path):
         assert entry.auto_title == "first prompt"
         assert entry.is_legacy is False
 
+    def test_user_prompt_mentioning_cleanup_terms_is_not_hidden(self, tmp_path):
+        storage = SessionStorage(projects_dir=tmp_path)
+        prompt = "How do I verify DELETE_COMPLETE for deleted stacks?"  # ordinary question, no metadata
+        storage.append("/p", "cleanup-terms", Message(role="user", content=prompt), git_branch=None)
+
+        entry = SessionIndex(projects_dir=tmp_path).list_for_cwd("/p")[0]  # only session under /p
+
+        assert entry.title == prompt  # title is the prompt, unchanged
+        assert entry.auto_title == prompt
+
+    def test_user_prompt_mentioning_cleanup_required_is_not_hidden(self, tmp_path):
+        storage = SessionStorage(projects_dir=tmp_path)
+        prompt = "What does cleanup required mean in Terraform?"  # contains the words "cleanup required"
+        storage.append("/p", "cleanup-required", Message(role="user", content=prompt), git_branch=None)
+
+        entry = SessionIndex(projects_dir=tmp_path).list_for_cwd("/p")[0]  # only session under /p
+
+        assert entry.title == prompt  # title is the prompt, unchanged
+        assert entry.auto_title == prompt
+
+    def test_user_prompt_mentioning_strict_whitelist_is_not_hidden(self, tmp_path):
+        storage = SessionStorage(projects_dir=tmp_path)
+        prompt = "严格白名单策略怎么配置？"  # "How do I configure a strict whitelist policy?"
+        storage.append("/p", "strict-whitelist", Message(role="user", content=prompt), git_branch=None)
+
+        entry = SessionIndex(projects_dir=tmp_path).list_for_cwd("/p")[0]  # only session under /p
+
+        assert entry.title == prompt  # title is the prompt, unchanged
+        assert entry.auto_title == prompt
+
+    def test_user_prompt_mentioning_resources_to_clean_is_not_hidden(self, tmp_path):
+        storage = SessionStorage(projects_dir=tmp_path)
+        prompt = "待清理资源怎么配置提醒？"  # "How do I set up reminders for resources pending cleanup?"
+        storage.append("/p", "resources-to-clean", Message(role="user", content=prompt), git_branch=None)
+
+        entry = SessionIndex(projects_dir=tmp_path).list_for_cwd("/p")[0]  # only session under /p
+
+        assert entry.title == prompt  # title is the prompt, unchanged
+        assert entry.auto_title == prompt
+
+    def test_legacy_cleanup_prompt_last_prompt_meta_is_ignored(self, tmp_path):
+        storage = SessionStorage(projects_dir=tmp_path)
+        cwd = "/proj/cp-last-legacy"
+        storage.append(cwd, "scp-last-legacy", Message(role="user", content="real prompt"), git_branch=None)
+        storage.append_meta(  # meta record carries only the English cleanup text, no cleanup type tag
+            cwd,
+            "scp-last-legacy",
+            {
+                "type": "last-prompt",
+                "last_prompt": "Pipeline rollback cleanup required for leftover resources.",
+            },
+        )
+
+        meta = read_lite_metadata(storage.session_path(cwd, "scp-last-legacy"))
+
+        assert meta.last_prompt is None  # the cleanup text is not reported as the last prompt
+        assert meta.first_prompt == "real prompt"  # first prompt is still the real one
+
+    def test_skips_legacy_cleanup_prompt_user_messages(self, tmp_path):
+        storage = SessionStorage(projects_dir=tmp_path)
+        cwd = "/proj/cp-first-legacy"
+        storage.append(  # first message on disk: cleanup text in a plain Message
+            cwd,
+            "scp-first-legacy",
+            Message(role="user", content="Rollback cleanup required for stack-123."),  # no metadata passed
+            git_branch=None,
+        )
+        storage.append(cwd, "scp-first-legacy", Message(role="user", content="real prompt"), git_branch=None)
+
+        meta = read_lite_metadata(storage.session_path(cwd, "scp-first-legacy"))
+
+        assert meta.first_prompt == "real prompt"  # the earlier cleanup text is skipped
+
     def test_legacy_session_still_indexed(self, tmp_path):
         storage = SessionStorage(projects_dir=tmp_path)
         legacy_path = storage.legacy_session_path("/legacy", "legacy")
diff --git a/tests/services/test_session_storage.py b/tests/services/test_session_storage.py
index 00489581..12cbf943 100644
--- a/tests/services/test_session_storage.py
+++ b/tests/services/test_session_storage.py
@@ -11,6 +11,7 @@
     create_recalled_memory_message,
     get_recalled_memory_files,
 )
+from iac_code.pipeline.engine.cleanup import CLEANUP_PROMPT_METADATA_TYPE, create_cleanup_prompt_message
 from iac_code.services.session_metadata import SESSION_JSONL_FILENAME, SESSION_METADATA_FILENAME
 from iac_code.services.session_storage import SessionStorage
 from iac_code.services.session_usage import SessionUsageStore
@@ -106,6 +107,68 @@ def test_tool_use_preserved(self, storage, sample_messages):
         assert len(tool_uses) == 1
         assert tool_uses[0].name == "read_file"
 
+    def test_save_preserves_existing_cleanup_prompt_message(self, storage):
+        cleanup = create_cleanup_prompt_message("cleanup hidden prompt")
+        storage.append(CWD, "cleanup-save", cleanup, git_branch="main")  # written before save() runs
+
+        storage.save(
+            CWD,
+            "cleanup-save",
+            [Message(role="user", content="later"), Message(role="assistant", content="done")],
+            git_branch="main",
+            preserve_cleanup_prompts=True,  # the saved list itself has no cleanup prompt
+        )
+
+        loaded = storage.load(CWD, "cleanup-save")
+        assert [message.content for message in loaded] == ["later", "done", "cleanup hidden prompt"]
+        assert loaded[-1].metadata["type"] == CLEANUP_PROMPT_METADATA_TYPE  # kept prompt comes last
+
+    def test_save_does_not_duplicate_existing_cleanup_prompt_message(self, storage):
+        cleanup = create_cleanup_prompt_message("cleanup hidden prompt")
+        storage.append(CWD, "cleanup-save-once", cleanup, git_branch="main")  # written before save() runs
+
+        storage.save(
+            CWD,
+            "cleanup-save-once",
+            [cleanup, Message(role="assistant", content="done")],  # same cleanup prompt is saved again
+            git_branch="main",
+            preserve_cleanup_prompts=True,
+        )
+
+        loaded = storage.load(CWD, "cleanup-save-once")
+        cleanup_messages = [
+            message for message in loaded if message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE
+        ]
+        assert len(cleanup_messages) == 1  # not stored a second time
+
+    def test_save_updates_cleanup_prompt_status_without_represerving_pending_prompt(self, storage, tmp_path):
+        cleanup = create_cleanup_prompt_message(
+            "cleanup hidden prompt",
+            cleanup_ledger_path=tmp_path / "cleanup.yaml",
+            cleanup_status="pending",  # status of the copy appended first
+        )
+        storage.append(CWD, "cleanup-status", cleanup, git_branch="main")
+
+        completed = create_cleanup_prompt_message(
+            "cleanup hidden prompt",
+            cleanup_ledger_path=tmp_path / "cleanup.yaml",
+            cleanup_status="completed",  # same text and ledger path, different status
+        )
+        storage.save(
+            CWD,
+            "cleanup-status",
+            [completed, Message(role="assistant", content="done")],
+            git_branch="main",
+            preserve_cleanup_prompts=True,
+        )
+
+        loaded = storage.load(CWD, "cleanup-status")
+        cleanup_messages = [
+            message for message in loaded if message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE
+        ]
+        assert len(cleanup_messages) == 1  # the pending copy is not kept alongside
+        assert cleanup_messages[0].metadata["cleanupStatus"] == "completed"  # the saved status wins
+
     def test_find_session_anywhere(self, storage):
         storage.append("/tmp/a", "id-aa", Message(role="user", content="from a"), git_branch=None)
         storage.append("/tmp/b", "id-bb", Message(role="user", content="from b"), git_branch=None)
@@ -239,3 +302,64 @@ def test_rename_to_existing_name_is_noop(storage):
     storage.rename_session(CWD, "same", "deploy-prod", git_branch=None)
 
     assert storage.rename_session(CWD, "same", "deploy-prod", git_branch=None) == "unchanged"
+
+
+def test_save_does_not_scan_old_file_unless_preserving_cleanup_prompts(tmp_path, monkeypatch):
+    storage = SessionStorage(projects_dir=tmp_path)
+    storage.append("/tmp/project", "sid", Message(role="user", content="old"))
+
+    def fail_load(cwd, session_id):  # replacement for storage.load that fails the test if called
+        raise AssertionError("save should not load existing messages")
+
+    monkeypatch.setattr(storage, "load", fail_load)  # patched on this instance only
+
+    storage.save("/tmp/project", "sid", [Message(role="user", content="new")])  # no preserve flag
+
+    assert [message.content for message in SessionStorage(projects_dir=tmp_path).load("/tmp/project", "sid")] == ["new"]
+
+
+def test_save_can_preserve_cleanup_prompts_when_requested(tmp_path):
+    storage = SessionStorage(projects_dir=tmp_path)
+    cleanup = create_cleanup_prompt_message("cleanup stack-123", cleanup_ledger_path=tmp_path / "cleanup.yaml")
+    storage.append("/tmp/project", "sid", cleanup)  # written before save() runs
+
+    storage.save(
+        "/tmp/project",
+        "sid",
+        [Message(role="user", content="new")],  # the saved list has no cleanup prompt
+        preserve_cleanup_prompts=True,
+    )
+
+    loaded = SessionStorage(projects_dir=tmp_path).load("/tmp/project", "sid")  # read via a fresh instance
+    assert [message.content for message in loaded] == ["new", "cleanup stack-123"]  # cleanup kept last
+
+
+def test_append_uses_locked_jsonl_helper(tmp_path, monkeypatch):
+    storage = SessionStorage(projects_dir=tmp_path)
+    calls = []
+
+    def fake_append(path, records, *, durable=False):  # records each call instead of writing
+        calls.append((path.name, list(records), durable))
+
+    monkeypatch.setattr("iac_code.services.session_storage.append_jsonl_locked", fake_append)
+
+    storage.append("/tmp/project", "sid", Message(role="user", content="hello"), git_branch="main")
+
+    assert calls[0][0] == "session.jsonl"  # file name of the path handed to the helper
+    assert calls[0][1][0]["content"] == "hello"  # first record of the first call
+    assert calls[0][1][0]["git_branch"] == "main"  # branch is part of the record
+
+
+def test_legacy_migration_keeps_directory_session_when_present(tmp_path):
+    storage = SessionStorage(projects_dir=tmp_path)
+    directory = storage.session_dir("/tmp/project", "sid")
+    directory.mkdir(parents=True)  # directory-format session is created first
+    directory_path = directory / "session.jsonl"
+    directory_path.write_text('{"role":"user","content":"directory"}\n', encoding="utf-8")
+    legacy_path = storage.legacy_session_path("/tmp/project", "sid")  # legacy file for the same session id
+    legacy_path.parent.mkdir(parents=True, exist_ok=True)
+    legacy_path.write_text('{"role":"user","content":"legacy"}\n', encoding="utf-8")
+
+    assert storage._ensure_directory_format("/tmp/project", "sid") == directory  # returns the directory
+
+    assert directory_path.read_text(encoding="utf-8") == '{"role":"user","content":"directory"}\n'
diff --git a/tests/test_agent/test_image_block.py b/tests/test_agent/test_image_block.py
index cd2b5c82..43bb33b5 100644
--- a/tests/test_agent/test_image_block.py
+++ b/tests/test_agent/test_image_block.py
@@ -10,7 +10,20 @@ def test_image_block_serializes_round_trip():
     block = ImageBlock(media_type="image/png", data="aGVsbG8=")
     assert block.type == "image"
     payload = block.model_dump()
-    assert payload == {"type": "image", "media_type": "image/png", "data": "aGVsbG8="}
+    assert payload == {"type": "image", "media_type": "image/png", "data": "aGVsbG8=", "ref_id": None}
+
+
+def test_message_with_image_blocks_deserializes_round_trip():
+    msg = Message(
+        role="user",
+        content=[TextBlock(text="see"), ImageBlock(media_type="image/png", data="aGVsbG8=")],
+    )
+
+    loaded = Message.from_dict(msg.to_dict())  # serialize to a dict and back
+
+    assert loaded == msg  # round trip compares equal to the original
+    assert isinstance(loaded.content, list)
+    assert isinstance(loaded.content[1], ImageBlock)  # second block comes back as an ImageBlock
 
 
 def test_message_with_blocks_to_api_format_keeps_image():
@@ -24,6 +37,7 @@ def test_message_with_blocks_to_api_format_keeps_image():
     api = msg.to_api_format()
     assert api["content"][1]["type"] == "image"
     assert api["content"][1]["data"] == "x"
+    assert "ref_id" not in api["content"][1]
 
 
 def test_conversation_add_user_message_accepts_blocks():
diff --git a/tests/tools/cloud/aliyun/test_aliyun_api.py b/tests/tools/cloud/aliyun/test_aliyun_api.py
index af4cd38b..f130ec4f 100644
--- a/tests/tools/cloud/aliyun/test_aliyun_api.py
+++ b/tests/tools/cloud/aliyun/test_aliyun_api.py
@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 
+import asyncio
 import json
 from unittest.mock import MagicMock, patch
 
@@ -12,6 +13,7 @@
 from iac_code.tools.base import ToolContext
 from iac_code.tools.cloud.aliyun import aliyun_api as aliyun_api_module
 from iac_code.tools.cloud.aliyun.aliyun_api import AliyunApi
+from iac_code.types.stream_events import ResourceObservedEvent
 
 
 @pytest.fixture
@@ -363,6 +365,50 @@ async def test_successful_call(self, api: AliyunApi, context: ToolContext, mock_
         assert data == {"Instances": []}
         mock_client.call_api.assert_called_once()
 
+    @pytest.mark.asyncio
+    async def test_ros_create_stack_emits_resource_observed_event(self, api: AliyunApi, mock_credentials) -> None:
+        queue: asyncio.Queue = asyncio.Queue()  # handed to the tool as ToolContext.event_queue
+        context = ToolContext(event_queue=queue, tool_use_id="toolu-create")
+        mock_client = MagicMock()
+        mock_client.call_api.return_value = {  # canned response returned by the mocked client
+            "body": {
+                "RequestId": "req-1",
+                "StackId": "stack-id-123",
+            }
+        }
+
+        with patch("iac_code.tools.cloud.aliyun.aliyun_api.OpenApiClient", return_value=mock_client):
+            result = await api.execute(
+                tool_input={
+                    "product": "ros",
+                    "action": "CreateStack",
+                    "params": {
+                        "StackName": "iac-e2e-stack",
+                        "TemplateBody": "ROSTemplateFormatVersion: '2015-09-01'\nResources: {}\n",
+                    },
+                    "region_id": "cn-hangzhou",
+                },
+                context=context,
+            )
+
+        assert result.is_error is False
+        events = []
+        while not queue.empty():  # drain everything that was put on the queue
+            events.append(await queue.get())
+
+        assert len(events) == 1  # exactly one event is expected
+        event = events[0]
+        assert isinstance(event, ResourceObservedEvent)
+        assert event.provider == "ros"
+        assert event.resource_type == "stack"
+        assert event.resource_id == "stack-id-123"  # matches StackId in the mocked response
+        assert event.resource_name == "iac-e2e-stack"  # matches StackName in the request params
+        assert event.region_id == "cn-hangzhou"  # matches region_id in the tool input
+        assert event.action == "CreateStack"
+        assert event.tool_name == "aliyun_api"
+        assert event.tool_use_id == "toolu-create"  # matches tool_use_id on the ToolContext
+        assert event.metadata == {}
+
     @pytest.mark.asyncio
     async def test_explicit_version(self, api: AliyunApi, context: ToolContext, mock_credentials) -> None:
         mock_client = MagicMock()
@@ -558,8 +604,57 @@ async def test_uppercase_product_works(self, api: AliyunApi, context: ToolContex
 
 class TestAliyunApiHooks:
     @pytest.mark.asyncio
-    async def test_hook_blocks_validate_with_wrong_resource_types(
+    async def test_ros_template_body_is_rejected_before_cloud_call(
+        self, api: AliyunApi, context: ToolContext, mock_credentials
+    ) -> None:
+        with patch("iac_code.tools.cloud.aliyun.aliyun_api.OpenApiClient") as mock_open_api_client:
+            result = await api.execute(
+                tool_input={
+                    "product": "ros",
+                    "action": "ValidateTemplate",
+                    "params": {"TemplateBody": "{}"},  # inline template body
+                    "region_id": "cn-hangzhou",
+                },
+                context=ToolContext(pipeline_mode=True),  # explicit pipeline-mode context, not the fixture
+            )
+
+        assert result.is_error is True
+        assert "TemplateBody" in result.content  # error text names the parameter that was passed
+        assert "TemplateURL" in result.content  # error text also mentions TemplateURL
+        mock_open_api_client.assert_not_called()  # the patched client class was never instantiated
+
+    @pytest.mark.asyncio
+    async def test_ros_template_body_is_allowed_outside_pipeline(
         self, api: AliyunApi, context: ToolContext, mock_credentials
+    ) -> None:
+        template = json.dumps(  # minimal template with a single VPC resource
+            {
+                "ROSTemplateFormatVersion": "2015-09-01",
+                "Resources": {
+                    "Vpc": {"Type": "ALIYUN::ECS::VPC", "Properties": {}},
+                },
+            }
+        )
+        mock_client = MagicMock()
+        mock_client.call_api.return_value = {"body": {"Description": "Valid"}}
+
+        with patch("iac_code.tools.cloud.aliyun.aliyun_api.OpenApiClient", return_value=mock_client):
+            result = await api.execute(
+                tool_input={
+                    "product": "ros",
+                    "action": "ValidateTemplate",
+                    "params": {"TemplateBody": template},  # inline template body
+                    "region_id": "cn-hangzhou",
+                },
+                context=context,  # fixture context; presumably not in pipeline mode - TODO confirm
+            )
+
+        assert result.is_error is False
+        mock_client.call_api.assert_called_once()  # the request reached the mocked client
+
+    @pytest.mark.asyncio
+    async def test_hook_blocks_validate_with_wrong_resource_types(
+        self, api: AliyunApi, context: ToolContext, mock_credentials, tmp_path
     ) -> None:
         template = json.dumps(
             {
@@ -570,11 +665,13 @@ async def test_hook_blocks_validate_with_wrong_resource_types(
                 },
             }
         )
+        template_file = tmp_path / "wrong-resource-types.json"
+        template_file.write_text(template, encoding="utf-8")
         result = await api.execute(
             tool_input={
                 "product": "ros",
                 "action": "ValidateTemplate",
-                "params": {"TemplateBody": template},
+                "params": {"TemplateURL": str(template_file)},
                 "region_id": "cn-hangzhou",
             },
             context=context,
@@ -585,7 +682,7 @@ async def test_hook_blocks_validate_with_wrong_resource_types(
 
     @pytest.mark.asyncio
     async def test_hook_passes_correct_resource_types(
-        self, api: AliyunApi, context: ToolContext, mock_credentials
+        self, api: AliyunApi, context: ToolContext, mock_credentials, tmp_path
     ) -> None:
         template = json.dumps(
             {
@@ -595,6 +692,8 @@ async def test_hook_passes_correct_resource_types(
                 },
             }
         )
+        template_file = tmp_path / "correct-resource-types.json"
+        template_file.write_text(template, encoding="utf-8")
         mock_client = MagicMock()
         mock_client.call_api.return_value = {"body": {"Description": "Valid"}}
 
@@ -603,7 +702,7 @@ async def test_hook_passes_correct_resource_types(
                 tool_input={
                     "product": "ros",
                     "action": "ValidateTemplate",
-                    "params": {"TemplateBody": template},
+                    "params": {"TemplateURL": str(template_file)},
                     "region_id": "cn-hangzhou",
                 },
                 context=context,
diff --git a/tests/tools/cloud/aliyun/test_ros_stack.py b/tests/tools/cloud/aliyun/test_ros_stack.py
index f765dd60..8f9d2269 100644
--- a/tests/tools/cloud/aliyun/test_ros_stack.py
+++ b/tests/tools/cloud/aliyun/test_ros_stack.py
@@ -13,10 +13,7 @@
 from iac_code.tools.cloud.aliyun.ros_stack import RosStack
 from iac_code.types.stream_events import StackProgressEvent
 
-_MINIMAL_TEMPLATE_BODY = (
-    '{"ROSTemplateFormatVersion": "2015-09-01", '
-    '"Resources": {"Vpc": {"Type": "ALIYUN::ECS::VPC", "Properties": {"CidrBlock": "192.168.0.0/16"}}}}'
-)
+_REMOTE_TEMPLATE_URL = "oss://iac-code-test/template.json"
 
 
 @pytest.fixture
@@ -118,7 +115,7 @@ async def test_execute_create_stack(self, tool: RosStack, mock_credentials) -> N
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ctx,
@@ -144,6 +141,64 @@ async def test_execute_create_stack(self, tool: RosStack, mock_credentials) -> N
         assert first.resources[0]["name"] == "Vpc"
         assert first.resources[0]["resource_type"] == "ALIYUN::ECS::VPC"
 
+    @pytest.mark.asyncio
+    async def test_template_body_is_rejected_before_create_stack(self, tool: RosStack, mock_credentials) -> None:
+        mock_client = MagicMock()
+
+        with patch("iac_code.tools.cloud.aliyun.ros_stack.RosClientFactory") as mock_factory:
+            mock_factory.create.return_value = mock_client
+            result = await tool.execute(
+                tool_input={
+                    "action": "CreateStack",
+                    "params": {"StackName": "test", "TemplateBody": "{}"},  # inline template body
+                    "region_id": "cn-hangzhou",
+                },
+                context=ToolContext(pipeline_mode=True),  # pipeline mode enabled
+            )
+
+        assert result.is_error is True
+        assert "TemplateBody" in result.content  # error text names the parameter that was passed
+        assert "TemplateURL" in result.content  # error text also mentions TemplateURL
+        mock_client.create_stack.assert_not_called()  # no create_stack call was made on the client
+
+    @pytest.mark.asyncio
+    async def test_template_body_is_allowed_outside_pipeline(self, tool: RosStack, mock_credentials) -> None:
+        mock_client = MagicMock()
+
+        create_response = MagicMock()
+        create_response.body.stack_id = "stack-123"
+        mock_client.create_stack.return_value = create_response
+
+        get_stack_response = MagicMock()
+        get_stack_response.body.to_map.return_value = {
+            "StackId": "stack-123",
+            "StackName": "test",
+            "Status": "CREATE_COMPLETE",  # status reported by the mocked get_stack
+            "StatusReason": "",
+        }
+        mock_client.get_stack.return_value = get_stack_response
+
+        list_resources_response = MagicMock()
+        list_resources_response.body.to_map.return_value = {"Resources": []}  # no stack resources
+        mock_client.list_stack_resources.return_value = list_resources_response
+
+        with (
+            patch("iac_code.tools.cloud.aliyun.ros_stack.RosClientFactory") as mock_factory,
+            patch("iac_code.tools.cloud.aliyun.api_hooks.run_hooks", return_value=None),  # hooks stubbed
+        ):
+            mock_factory.create.return_value = mock_client
+            result = await tool.execute(
+                tool_input={
+                    "action": "CreateStack",
+                    "params": {"StackName": "test", "TemplateBody": "{}"},  # inline template body
+                    "region_id": "cn-hangzhou",
+                },
+                context=ToolContext(),  # default context; pipeline_mode is not passed
+            )
+
+        assert result.is_error is False
+        mock_client.create_stack.assert_called_once()  # the request reached create_stack
+
     @pytest.mark.asyncio
     async def test_create_stack_emits_success_telemetry_only_after_terminal_success(
         self, tool: RosStack, mock_credentials
@@ -188,7 +243,7 @@ def record_event(event_name: str, metadata: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -240,7 +295,7 @@ def flaky_log_event(event_name: str, metadata: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -281,7 +336,7 @@ async def test_create_stack_polling_cancellation_cleans_context_and_emits_cancel
                 await tool.execute(
                     tool_input={
                         "action": "CreateStack",
-                        "params": {"StackName": "test", "TemplateBody": "{}"},
+                        "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                         "region_id": "cn-hangzhou",
                     },
                     context=ToolContext(),
@@ -337,7 +392,7 @@ def flaky_log_event(event_name: str, metadata: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -382,7 +437,7 @@ def flaky_add_metric(name: str, value: int, attrs: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -393,7 +448,7 @@ def flaky_add_metric(name: str, value: int, attrs: dict | None = None) -> None:
 
     @pytest.mark.asyncio
     async def test_create_stack_non_string_resource_type_does_not_prevent_api_call(
-        self, tool: RosStack, mock_credentials
+        self, tool: RosStack, mock_credentials, tmp_path
     ) -> None:
         mock_client = MagicMock()
 
@@ -415,6 +470,8 @@ async def test_create_stack_non_string_resource_type_does_not_prevent_api_call(
         mock_client.list_stack_resources.return_value = list_resources_response
 
         template_body = json.dumps({"Resources": {"R": {"Type": 123}}})
+        template_file = tmp_path / "non-string-resource-type.json"
+        template_file.write_text(template_body, encoding="utf-8")
 
         with (
             patch("iac_code.tools.cloud.aliyun.ros_stack.RosClientFactory") as mock_factory,
@@ -424,7 +481,7 @@ async def test_create_stack_non_string_resource_type_does_not_prevent_api_call(
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": template_body},
+                    "params": {"StackName": "test", "TemplateURL": str(template_file)},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -436,7 +493,7 @@ async def test_create_stack_non_string_resource_type_does_not_prevent_api_call(
         assert data["status"] == "CREATE_COMPLETE"
 
     @pytest.mark.asyncio
-    async def test_create_stack_none_template_body_does_not_prevent_api_call(
+    async def test_create_stack_template_url_does_not_require_template_body(
         self, tool: RosStack, mock_credentials
     ) -> None:
         mock_client = MagicMock()
@@ -466,7 +523,7 @@ async def test_create_stack_none_template_body_does_not_prevent_api_call(
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": None},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -475,7 +532,7 @@ async def test_create_stack_none_template_body_does_not_prevent_api_call(
         assert result.is_error is False
         mock_client.create_stack.assert_called_once()
         request = mock_client.create_stack.call_args.args[0]
-        assert request.template_body is None
+        assert request.to_map()["TemplateURL"] == _REMOTE_TEMPLATE_URL
         data = json.loads(result.content)
         assert data["status"] == "CREATE_COMPLETE"
 
@@ -514,7 +571,7 @@ async def test_create_stack_rollback_emits_failure_telemetry(self, tool: RosStac
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -557,7 +614,7 @@ async def test_create_stack_import_create_complete_is_terminal_success(
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -600,7 +657,7 @@ async def test_create_stack_import_create_rollback_complete_is_terminal_error(
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -651,7 +708,7 @@ def record_event(event_name: str, metadata: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "UpdateStack",
-                    "params": {"StackId": "stack-123", "TemplateBody": "{}"},
+                    "params": {"StackId": "stack-123", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -707,7 +764,7 @@ async def test_update_stack_ignores_create_complete_from_previous_operation(
             result = await tool.execute(
                 tool_input={
                     "action": "UpdateStack",
-                    "params": {"StackId": "stack-123", "TemplateBody": "{}"},
+                    "params": {"StackId": "stack-123", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -747,7 +804,7 @@ async def test_update_stack_resource_error_with_stale_create_complete_is_not_ter
             result = await tool.execute(
                 tool_input={
                     "action": "UpdateStack",
-                    "params": {"StackId": "stack-123", "TemplateBody": "{}"},
+                    "params": {"StackId": "stack-123", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -793,7 +850,7 @@ def flaky_log_event(event_name: str, metadata: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "UpdateStack",
-                    "params": {"StackId": "stack-123", "TemplateBody": "{}"},
+                    "params": {"StackId": "stack-123", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -804,7 +861,7 @@ def flaky_log_event(event_name: str, metadata: dict | None = None) -> None:
 
     @pytest.mark.asyncio
     async def test_update_stack_non_string_resource_type_does_not_prevent_api_call(
-        self, tool: RosStack, mock_credentials
+        self, tool: RosStack, mock_credentials, tmp_path
     ) -> None:
         mock_client = MagicMock()
 
@@ -826,6 +883,8 @@ async def test_update_stack_non_string_resource_type_does_not_prevent_api_call(
         mock_client.list_stack_resources.return_value = list_resources_response
 
         template_body = json.dumps({"Resources": {"R": {"Type": 123}}})
+        template_file = tmp_path / "update-non-string-resource-type.json"
+        template_file.write_text(template_body, encoding="utf-8")
 
         with (
             patch("iac_code.tools.cloud.aliyun.ros_stack.RosClientFactory") as mock_factory,
@@ -835,7 +894,7 @@ async def test_update_stack_non_string_resource_type_does_not_prevent_api_call(
             result = await tool.execute(
                 tool_input={
                     "action": "UpdateStack",
-                    "params": {"StackId": "stack-123", "TemplateBody": template_body},
+                    "params": {"StackId": "stack-123", "TemplateURL": str(template_file)},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -847,7 +906,7 @@ async def test_update_stack_non_string_resource_type_does_not_prevent_api_call(
         assert data["status"] == "UPDATE_COMPLETE"
 
     @pytest.mark.asyncio
-    async def test_update_stack_none_template_body_does_not_prevent_api_call(
+    async def test_update_stack_template_url_does_not_require_template_body(
         self, tool: RosStack, mock_credentials
     ) -> None:
         mock_client = MagicMock()
@@ -877,7 +936,7 @@ async def test_update_stack_none_template_body_does_not_prevent_api_call(
             result = await tool.execute(
                 tool_input={
                     "action": "UpdateStack",
-                    "params": {"StackId": "stack-123", "TemplateBody": None},
+                    "params": {"StackId": "stack-123", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -886,7 +945,7 @@ async def test_update_stack_none_template_body_does_not_prevent_api_call(
         assert result.is_error is False
         mock_client.update_stack.assert_called_once()
         request = mock_client.update_stack.call_args.args[0]
-        assert request.template_body is None
+        assert request.to_map()["TemplateURL"] == _REMOTE_TEMPLATE_URL
         data = json.loads(result.content)
         assert data["status"] == "UPDATE_COMPLETE"
 
@@ -925,7 +984,7 @@ async def test_update_stack_rollback_emits_failure_telemetry(self, tool: RosStac
             result = await tool.execute(
                 tool_input={
                     "action": "UpdateStack",
-                    "params": {"StackId": "stack-123", "TemplateBody": "{}"},
+                    "params": {"StackId": "stack-123", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -1145,10 +1204,10 @@ async def test_stale_create_or_update_context_is_not_consumed_by_delete_stack_te
         action_response.body.stack_id = "stack-123"
         if stale_action == "CreateStack":
             mock_client.create_stack.return_value = action_response
-            stale_params = {"StackName": "test", "TemplateBody": "{}"}
+            stale_params = {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL}
         else:
             mock_client.update_stack.return_value = action_response
-            stale_params = {"StackId": "stack-123", "TemplateBody": "{}"}
+            stale_params = {"StackId": "stack-123", "TemplateURL": _REMOTE_TEMPLATE_URL}
 
         delete_get_stack_response = MagicMock()
         delete_get_stack_response.body.to_map.return_value = {
@@ -1278,7 +1337,7 @@ async def test_terminal_status_emits_deployment_telemetry_when_resource_polling_
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -1325,7 +1384,7 @@ def flaky_log_event(event_name: str, metadata: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -1375,7 +1434,7 @@ def flaky_log_event(event_name: str, metadata: dict | None = None) -> None:
             result = await tool.execute(
                 tool_input={
                     "action": "CreateStack",
-                    "params": {"StackName": "test", "TemplateBody": "{}"},
+                    "params": {"StackName": "test", "TemplateURL": _REMOTE_TEMPLATE_URL},
                     "region_id": "cn-hangzhou",
                 },
                 context=ToolContext(),
@@ -1412,8 +1471,8 @@ async def test_continue_create_stack(self, stack):
     @pytest.mark.parametrize(
         ("action", "params", "sdk_method"),
         [
-            ("CreateStack", {"StackName": "n", "TemplateBody": "{}"}, "create_stack"),
-            ("UpdateStack", {"StackId": "sx", "TemplateBody": "{}"}, "update_stack"),
+            ("CreateStack", {"StackName": "n", "TemplateURL": _REMOTE_TEMPLATE_URL}, "create_stack"),
+            ("UpdateStack", {"StackId": "sx", "TemplateURL": _REMOTE_TEMPLATE_URL}, "update_stack"),
             ("ContinueCreateStack", {"StackId": "sx"}, "continue_create_stack"),
             ("DeleteStack", {"StackId": "sx"}, "delete_stack"),
         ],
@@ -1452,7 +1511,17 @@ async def test_template_url_local_file_read(self, stack, tmp_path):
         assert result == "stack-fake"
 
     @pytest.mark.asyncio
-    async def test_template_body_dict_to_json(self, stack):
+    async def test_template_body_dict_is_rejected_in_pipeline(self, stack):
+        with pytest.raises(ValueError, match="TemplateURL"):
+            await stack.call_action(
+                "CreateStack",
+                {"StackName": "n", "TemplateBody": {"ROSTemplateFormatVersion": "2015-09-01"}},
+                "cn-hangzhou",
+                pipeline_mode=True,
+            )
+
+    @pytest.mark.asyncio
+    async def test_template_body_dict_to_json_outside_pipeline(self, stack):
         result = await stack.call_action(
             "CreateStack",
             {"StackName": "n", "TemplateBody": {"ROSTemplateFormatVersion": "2015-09-01"}},
@@ -1534,7 +1603,7 @@ async def test_create_stack_parameters_survive_hooks_for_typed_sdk(self, monkeyp
             "CreateStack",
             {
                 "StackName": "n",
-                "TemplateBody": _MINIMAL_TEMPLATE_BODY,
+                "TemplateURL": _REMOTE_TEMPLATE_URL,
                 "Parameters": [
                     {"ParameterKey": "VpcId", "ParameterValue": "vpc-123"},
                     {"ParameterKey": "ZoneId", "ParameterValue": "cn-hangzhou-h"},
@@ -1562,7 +1631,7 @@ async def test_create_stack_flat_parameters_are_restored_for_typed_sdk(self, mon
             "CreateStack",
             {
                 "StackName": "n",
-                "TemplateBody": _MINIMAL_TEMPLATE_BODY,
+                "TemplateURL": _REMOTE_TEMPLATE_URL,
                 "Parameters.1.ParameterKey": "VpcId",
                 "Parameters.1.ParameterValue": "vpc-123",
             },
@@ -1587,7 +1656,7 @@ async def test_update_stack_flat_parameters_are_restored_for_typed_sdk(self, mon
             "UpdateStack",
             {
                 "StackId": "stack-123",
-                "TemplateBody": _MINIMAL_TEMPLATE_BODY,
+                "TemplateURL": _REMOTE_TEMPLATE_URL,
                 "Parameters.1.ParameterKey": "VpcId",
                 "Parameters.1.ParameterValue": "vpc-123",
             },
diff --git a/tests/tools/cloud/test_base_stack.py b/tests/tools/cloud/test_base_stack.py
index 04a0356a..206fae2f 100644
--- a/tests/tools/cloud/test_base_stack.py
+++ b/tests/tools/cloud/test_base_stack.py
@@ -10,7 +10,7 @@
 from iac_code.tools.base import ToolContext
 from iac_code.tools.cloud.base_stack import BaseCloudStack
 from iac_code.tools.cloud.types import ResourceStatus, StackStatus
-from iac_code.types.stream_events import StackProgressEvent
+from iac_code.types.stream_events import ResourceObservedEvent, StackProgressEvent
 
 
 class MockCloudStack(BaseCloudStack):
@@ -82,6 +82,11 @@ def is_action_success(self, action: str, status: StackStatus) -> bool:
         return action == "DeleteStack" and status.status == "DELETE_COMPLETE"
 
 
+class EmptyStackIdCloudStack(MockCloudStack):
+    async def call_action(self, action: str, params: dict, region: str) -> str:
+        return ""
+
+
 class HookCapturingCloudStack(MockCloudStack):
     def __init__(self) -> None:
         super().__init__()
@@ -215,6 +220,53 @@ async def test_execute_emits_progress_events_to_queue(self, stack: MockCloudStac
         assert first.stack_id == "stack-id-123"
         assert first.stack_name == "test-stack"
 
+    @pytest.mark.asyncio
+    async def test_execute_emits_resource_observed_before_progress(self, stack: MockCloudStack) -> None:
+        queue: asyncio.Queue = asyncio.Queue()
+        context = ToolContext(event_queue=queue, tool_use_id="toolu-create")
+
+        await stack.execute(
+            tool_input={
+                "action": "CreateStack",
+                "params": {"StackName": "test", "TemplateBody": "secret template", "DbPassword": "super-secret"},
+                "region_id": "cn-hangzhou",
+            },
+            context=context,
+        )
+
+        events = []
+        while not queue.empty():
+            events.append(await queue.get())
+
+        assert isinstance(events[0], ResourceObservedEvent)
+        assert events[0].provider == "mock"
+        assert events[0].resource_type == "stack"
+        assert events[0].resource_id == "stack-id-123"
+        assert events[0].resource_name == "test"
+        assert events[0].region_id == "cn-hangzhou"
+        assert events[0].action == "CreateStack"
+        assert events[0].tool_name == "mock_stack"
+        assert events[0].tool_use_id == "toolu-create"
+        assert events[0].metadata == {}
+        assert any(isinstance(event, StackProgressEvent) for event in events[1:])
+
+    @pytest.mark.asyncio
+    async def test_execute_does_not_emit_resource_observed_for_empty_stack_id(self) -> None:
+        stack = EmptyStackIdCloudStack()
+        queue: asyncio.Queue = asyncio.Queue()
+        context = ToolContext(cwd="/tmp", event_queue=queue, tool_use_id="toolu-1")
+
+        await stack.execute(
+            tool_input={"action": "CreateStack", "params": {}},
+            context=context,
+        )
+
+        events = []
+        while not queue.empty():
+            events.append(await queue.get())
+
+        assert not any(isinstance(event, ResourceObservedEvent) for event in events)
+
     @pytest.mark.asyncio
     async def test_execute_invalid_action_returns_error(self, stack: MockCloudStack, context: ToolContext) -> None:
         result = await stack.execute(
diff --git a/tests/tools/test_base.py b/tests/tools/test_base.py
index 8f8f6c2c..3018336a 100644
--- a/tests/tools/test_base.py
+++ b/tests/tools/test_base.py
@@ -19,6 +19,13 @@ def test_custom_cwd(self):
         ctx = ToolContext(cwd="/tmp")
         assert ctx.cwd == "/tmp"
 
+    def test_tool_use_id_positional_compatibility(self):
+        """Adding fields must not shift the existing tool_use_id positional slot."""
+        ctx = ToolContext("/tmp", None, [], [], "toolu-1")
+
+        assert ctx.tool_use_id == "toolu-1"
+        assert ctx.relative_read_directories == []
+
 
 class TestToolResult:
     """Tests for ToolResult."""
diff --git a/tests/tools/test_path_safety.py b/tests/tools/test_path_safety.py
index 3f4f90fc..a9051e54 100644
--- a/tests/tools/test_path_safety.py
+++ b/tests/tools/test_path_safety.py
@@ -147,3 +147,23 @@ def test_windows_root_containment_is_case_insensitive(monkeypatch, tmp_path):
     child = root / "src" / "app.py"
 
     assert _path_is_under(str(child).upper(), str(root).lower())
+
+
+def test_macos_case_insensitive_root_containment_allows_differently_cased_project_path(monkeypatch, tmp_path):
+    import iac_code.tools.path_safety as path_safety
+
+    monkeypatch.setattr(path_safety.sys, "platform", "darwin")
+    monkeypatch.setattr(path_safety, "_path_case_sensitive", lambda _root: False, raising=False)
+    cwd = tmp_path / "Project"
+    child = cwd / "src" / "app.py"
+    child.parent.mkdir(parents=True)
+    child.write_text("print('ok')", encoding="utf-8")
+
+    result = check_read_path(
+        str(child).upper(),
+        cwd=str(cwd).lower(),
+        additional_directories=[],
+        trusted_read_directories=[],
+    )
+
+    assert result.behavior == "allow"
diff --git a/tests/tools/test_read_file.py b/tests/tools/test_read_file.py
index 1f0ffa08..b4871c6d 100644
--- a/tests/tools/test_read_file.py
+++ b/tests/tools/test_read_file.py
@@ -1,5 +1,7 @@
 """Tests for the ReadFile tool."""
 
+import ntpath
+
 import pytest
 
 from iac_code.tools.base import ToolContext
@@ -25,6 +27,30 @@ def test_tool_properties(self, read_file_tool):
     def test_supports_blanket_allow_is_false(self, read_file_tool):
         assert read_file_tool.supports_blanket_allow is False
 
+    def test_path_is_under_windows_case_insensitive(self, monkeypatch):
+        monkeypatch.setattr("iac_code.tools.path_safety.sys.platform", "win32")
+        from iac_code.tools.read_file import _path_is_under
+
+        assert _path_is_under("C:\\Users\\Alice\\project\\file.txt", "c:/users/alice/project")
+
+    def test_path_is_under_windows_ntpath_separator_normalization(self, monkeypatch):
+        import iac_code.tools.path_safety as path_safety
+        import iac_code.tools.read_file as read_file
+
+        monkeypatch.setattr(path_safety.sys, "platform", "win32")
+        monkeypatch.setattr(path_safety.os, "path", ntpath)
+
+        assert read_file._path_is_under("C:\\Users\\Alice\\project\\file.txt", "c:/users/alice/project")
+
+    def test_path_is_under_darwin_case_insensitive_volume(self, monkeypatch):
+        import iac_code.tools.path_safety as path_safety
+        import iac_code.tools.read_file as read_file
+
+        monkeypatch.setattr(path_safety.sys, "platform", "darwin")
+        monkeypatch.setattr(path_safety, "_path_case_sensitive", lambda _root: False, raising=False)
+
+        assert read_file._path_is_under("/Users/Alice/project/file.txt", "/users/alice/project")
+
     @pytest.mark.asyncio
     async def test_read_normal_file(self, tmp_path, read_file_tool):
         """Test reading a normal file."""
@@ -122,6 +148,64 @@ async def test_read_file_in_subdirectory(self, tmp_path, read_file_tool):
         assert result.is_error is False
         assert "Nested content" in result.content
 
+    @pytest.mark.asyncio
+    async def test_relative_path_falls_back_to_relative_read_directory(self, tmp_path, read_file_tool):
+        """Skill reference links should resolve from explicit relative read roots when absent from cwd."""
+        workspace = tmp_path / "workspace"
+        workspace.mkdir()
+        skill_root = tmp_path / "skill"
+        reference = skill_root / "references" / "template-parameters.md"
+        reference.parent.mkdir(parents=True)
+        reference.write_text("Parameter reference content", encoding="utf-8")
+
+        context = ToolContext(cwd=str(workspace), relative_read_directories=[str(skill_root)])
+        result = await read_file_tool.execute(
+            tool_input={"path": "references/template-parameters.md"},
+            context=context,
+        )
+
+        assert result.is_error is False
+        assert "Parameter reference content" in result.content
+        assert f"File: {reference}" in result.content
+
+    @pytest.mark.asyncio
+    async def test_relative_path_does_not_fall_back_to_trusted_read_directory(self, tmp_path, read_file_tool):
+        """Trusted read roots should allow explicit reads without changing relative lookup semantics."""
+        workspace = tmp_path / "workspace"
+        workspace.mkdir()
+        trusted_root = tmp_path / "trusted"
+        reference = trusted_root / "references" / "template-parameters.md"
+        reference.parent.mkdir(parents=True)
+        reference.write_text("Trusted reference content", encoding="utf-8")
+
+        context = ToolContext(cwd=str(workspace), trusted_read_directories=[str(trusted_root)])
+        result = await read_file_tool.execute(
+            tool_input={"path": "references/template-parameters.md"},
+            context=context,
+        )
+
+        assert result.is_error is True
+        assert f"File not found: {workspace / 'references' / 'template-parameters.md'}" in result.content
+
+    @pytest.mark.asyncio
+    async def test_relative_path_does_not_fall_back_to_additional_directory(self, tmp_path, read_file_tool):
+        """Additional directories should not change relative path lookup semantics."""
+        workspace = tmp_path / "workspace"
+        workspace.mkdir()
+        shared_root = tmp_path / "shared"
+        reference = shared_root / "references" / "template-parameters.md"
+        reference.parent.mkdir(parents=True)
+        reference.write_text("Shared reference content", encoding="utf-8")
+
+        context = ToolContext(cwd=str(workspace), additional_directories=[str(shared_root)])
+        result = await read_file_tool.execute(
+            tool_input={"path": "references/template-parameters.md"},
+            context=context,
+        )
+
+        assert result.is_error is True
+        assert f"File not found: {workspace / 'references' / 'template-parameters.md'}" in result.content
+
     @pytest.mark.asyncio
     async def test_read_file_start_line_only(self, tmp_path, read_file_tool):
         """Test reading with only start_line specified."""
diff --git a/tests/tools/test_tool_context.py b/tests/tools/test_tool_context.py
new file mode 100644
index 00000000..5728edfe
--- /dev/null
+++ b/tests/tools/test_tool_context.py
@@ -0,0 +1,9 @@
+from iac_code.tools.base import ToolContext
+
+
+def test_tool_context_positional_tool_use_id_compatibility() -> None:
+    context = ToolContext("/tmp/project", None, "toolu-1")
+
+    assert context.cwd == "/tmp/project"
+    assert context.event_queue is None
+    assert context.tool_use_id == "toolu-1"
diff --git a/tests/tools/test_tool_executor.py b/tests/tools/test_tool_executor.py
index c78e12bc..4cfe73c3 100644
--- a/tests/tools/test_tool_executor.py
+++ b/tests/tools/test_tool_executor.py
@@ -113,6 +113,42 @@ async def execute(self, *, tool_input, context):
         assert len(results) == 5
         assert all(r.content == "read result" for r in results)
 
+    async def test_preserves_tool_context_read_roots(self):
+        class CapturingReadTool(FakeReadTool):
+            async def execute(self, *, tool_input, context):
+                roots = ",".join(context.trusted_read_directories)
+                return ToolResult.success(roots)
+
+        read_tool = CapturingReadTool()
+        registry = MagicMock()
+        registry.get = lambda name: read_tool
+        executor = ToolExecutor(registry=registry)
+
+        results = await executor.execute_batch(
+            [ToolCallRequest(id="read-1", name="read", input={})],
+            ToolContext(trusted_read_directories=["/tmp/skill-root"]),
+        )
+
+        assert results[0].content == "/tmp/skill-root"
+
+    async def test_preserves_tool_context_relative_read_roots(self):
+        class CapturingReadTool(FakeReadTool):
+            async def execute(self, *, tool_input, context):
+                roots = ",".join(context.relative_read_directories)
+                return ToolResult.success(roots)
+
+        read_tool = CapturingReadTool()
+        registry = MagicMock()
+        registry.get = lambda name: read_tool
+        executor = ToolExecutor(registry=registry)
+
+        results = await executor.execute_batch(
+            [ToolCallRequest(id="read-1", name="read", input={})],
+            ToolContext(relative_read_directories=["/tmp/skill-root"]),
+        )
+
+        assert results[0].content == "/tmp/skill-root"
+
     async def test_serial_order(self):
         order = []
 
@@ -190,6 +226,21 @@ async def execute(self, *, tool_input, context):
         assert tool.seen_context_queues == {"first": first_queue, "second": second_queue}
         assert tool._event_queue is None
 
+    async def test_pipeline_mode_is_preserved_in_derived_tool_context(self):
+        class ContextAwareTool(FakeReadTool):
+            async def execute(self, *, tool_input, context):
+                return ToolResult.success(str(context.pipeline_mode))
+
+        tool = ContextAwareTool()
+        registry = MagicMock()
+        registry.get = lambda name: tool
+        executor = ToolExecutor(registry=registry)
+        calls = [ToolCallRequest(id="a", name="read", input={})]
+
+        results = await executor.execute_batch(calls, ToolContext(pipeline_mode=True))
+
+        assert results[0].content == "True"
+
 
 class FakeStrictTool(Tool):
     @property
diff --git a/tests/ui/core/test_prompt_input.py b/tests/ui/core/test_prompt_input.py
index 7a6e1afb..54f003c5 100644
--- a/tests/ui/core/test_prompt_input.py
+++ b/tests/ui/core/test_prompt_input.py
@@ -520,6 +520,39 @@ def read_key(self):
         assert aggregator.updated == [("h", 1), ("hi", 2)]
         assert out.getvalue().endswith("\n")
 
+    def test_input_loop_initializes_next_image_id_from_store(self, monkeypatch):
+        import iac_code.ui.core.prompt_input as prompt_mod
+
+        events = iter([_key("enter")])
+
+        class FakeCapture:
+            def __enter__(self):
+                return self
+
+            def __exit__(self, *args):
+                return False
+
+            def read_key(self):
+                return next(events, None)
+
+        class FakeImageStore:
+            def next_image_id(self):
+                return 8
+
+        out = StringIO()
+        monkeypatch.setattr(prompt_mod, "sys", SimpleNamespace(stdout=out))
+        monkeypatch.setattr(
+            prompt_mod.shutil,
+            "get_terminal_size",
+            lambda *args, **kwargs: os.terminal_size((40, 24)),
+        )
+        monkeypatch.setattr("iac_code.ui.core.raw_input.RawInputCapture", FakeCapture)
+
+        inp = make_input(image_store=FakeImageStore())
+
+        assert inp._input_loop("❯ ") == ""
+        assert inp.next_paste_id() == 8
+
     def test_input_loop_returns_none_on_ctrl_c_with_empty_buffer(self, monkeypatch):
         import iac_code.ui.core.prompt_input as prompt_mod
 
diff --git a/tests/ui/dialogs/test_resume_picker.py b/tests/ui/dialogs/test_resume_picker.py
index 301f6ead..ccf3ab29 100644
--- a/tests/ui/dialogs/test_resume_picker.py
+++ b/tests/ui/dialogs/test_resume_picker.py
@@ -10,6 +10,7 @@
 from rich.console import Console as RichConsole
 
 from iac_code.agent.message import Message, create_recalled_memory_message
+from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
 from iac_code.services.session_index import SessionEntry, SessionIndex
 from iac_code.services.session_storage import SessionStorage
 from iac_code.ui.core.key_event import KeyEvent
@@ -116,6 +117,7 @@ def test_fallback_preview_hides_recalled_memory_messages(self):
             [
                 Message(role="user", content="visible question"),
                 create_recalled_memory_message("# Recalled Memory\nPrefer ROS YAML.", ["ros-yaml.md"]),
+                create_cleanup_prompt_message("cleanup hidden prompt"),
                 Message(role="assistant", content="visible answer"),
             ],
         )
@@ -125,6 +127,7 @@ def test_fallback_preview_hides_recalled_memory_messages(self):
         assert "visible answer" in output
         assert "Prefer ROS YAML" not in output
         assert "Relevant persistent memories" not in output
+        assert "cleanup hidden prompt" not in output
 
     def test_supplied_entries_are_not_reloaded_when_toggling_all_projects(self):
         index = MagicMock()
diff --git a/tests/ui/test_pipeline_interrupt_ui.py b/tests/ui/test_pipeline_interrupt_ui.py
index 2b376ff8..dec9ac2a 100644
--- a/tests/ui/test_pipeline_interrupt_ui.py
+++ b/tests/ui/test_pipeline_interrupt_ui.py
@@ -704,6 +704,33 @@ def test_render_pipeline_event_does_not_mutate_pipeline_step_names(self, mock_re
 
 
 class TestPipelineEventStyles:
+    def test_render_pipeline_warning_prints_non_terminal_warning(self, mock_repl):
+        from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+
+        printed = []
+
+        class CaptureConsole:
+            def print(self, *args, **kwargs):
+                if args:
+                    printed.extend(str(arg) for arg in args)
+                else:
+                    printed.append("")
+
+        mock_repl.renderer = SimpleNamespace(console=CaptureConsole())
+
+        mock_repl._render_pipeline_event(
+            PipelineEvent(
+                type=PipelineEventType.PIPELINE_WARNING,
+                step_id="deploying",
+                timestamp=0,
+                data={"reason": "cleanup_tracking_unavailable"},
+            )
+        )
+
+        rendered = "\n".join(printed)
+        assert "cleanup_tracking_unavailable" in rendered
+        assert "yellow" in rendered
+
     def test_render_pipeline_event_uses_slate_sky_label_styles(self, mock_repl):
         from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
         from iac_code.ui.pipeline_styles import PIPELINE_STEP_HEADER_STYLE, PIPELINE_TITLE_STYLE
diff --git a/tests/ui/test_renderer_helpers.py b/tests/ui/test_renderer_helpers.py
index 5359834e..f172cca8 100644
--- a/tests/ui/test_renderer_helpers.py
+++ b/tests/ui/test_renderer_helpers.py
@@ -6,7 +6,8 @@
 import pytest
 from rich.console import Console
 
-from iac_code.agent.message import Message, create_recalled_memory_message
+from iac_code.agent.message import ImageBlock, Message, TextBlock, create_recalled_memory_message
+from iac_code.pipeline.engine.cleanup import CLEANUP_PROMPT_METADATA_TYPE
 from iac_code.tools.base import Tool, ToolContext, ToolRegistry, ToolResult
 from iac_code.tools.read_file import ReadFileTool
 from iac_code.types.stream_events import StackInstancesProgressEvent, StackProgressEvent
@@ -35,6 +36,18 @@ def make_console(width: int = 80, height: int = 12) -> Console:
     )
 
 
+def make_link_console(width: int = 80, height: int = 12) -> Console:
+    return Console(
+        file=StringIO(),  # in-memory sink so tests can inspect the raw output
+        width=width,
+        height=height,
+        force_terminal=True,  # emit terminal control codes even though the file is not a TTY
+        color_system="standard",
+        legacy_windows=False,
+        _environ={},  # empty mapping passed as Rich's environment override
+    )
+
+
 class DemoTool(Tool):
     @property
     def name(self) -> str:
@@ -181,6 +194,70 @@ def test_replay_history_hides_recalled_memory_messages(self):
         assert "Prefer ROS YAML" not in output
         assert "Relevant persistent memories" not in output
 
+    def test_replay_history_hides_pipeline_cleanup_prompt(self):
+        renderer = make_renderer()
+
+        renderer.replay_history(
+            [
+                Message(role="user", content="visible question"),
+                Message(  # user message tagged as a cleanup prompt through its metadata type
+                    role="user",
+                    content="hidden cleanup prompt",
+                    metadata={"type": CLEANUP_PROMPT_METADATA_TYPE},
+                ),
+                Message(role="assistant", content="visible answer"),
+            ]
+        )
+
+        output = renderer.console.file.getvalue()
+        assert "visible question" in output
+        assert "visible answer" in output
+        assert "hidden cleanup prompt" not in output  # the tagged message must not be replayed
+
+    def test_replay_history_does_not_link_plain_image_refs_without_image_blocks(self):
+        console = make_link_console()
+        registry = ToolRegistry()
+        renderer = Renderer(
+            console,
+            registry,
+            status_callback=lambda: "ready",
+            image_path_resolver=lambda image_id: f"/tmp/session-image-{image_id}.png",
+        )
+
+        renderer.replay_history([Message(role="user", content="see [Image #1]")])  # plain string, no ImageBlock
+
+        output = console.file.getvalue()
+        assert "[Image #1]" in output  # the literal text is still shown
+        assert "\x1b]8;" not in output  # no OSC 8 hyperlink escape sequence was emitted
+        assert "file:///tmp/session-image-1.png" not in output
+
+    def test_replay_history_renders_structured_image_blocks_as_image_refs(self):
+        console = make_link_console()
+        registry = ToolRegistry()
+        renderer = Renderer(
+            console,
+            registry,
+            status_callback=lambda: "ready",
+            image_block_path_resolver=lambda block: f"/tmp/session-image-{block.ref_id}.png",
+        )
+
+        renderer.replay_history(
+            [
+                Message(
+                    role="user",
+                    content=[  # structured content: a text block followed by an image block
+                        TextBlock(text="see "),
+                        ImageBlock(media_type="image/png", data="aGVsbG8=", ref_id=8),
+                    ],
+                )
+            ]
+        )
+
+        output = console.file.getvalue()
+        assert "see " in output
+        assert "[Image #8]" in output  # label carries the block's ref_id
+        assert renderer._file_url("/tmp/session-image-8.png") in output  # resolver path shows up as a file URL
+
     def test_any_segment_has_verbose_content(self):
         renderer = make_renderer()
         segments = [
diff --git a/tests/ui/test_repl_integration.py b/tests/ui/test_repl_integration.py
index 441f498a..01b9de84 100644
--- a/tests/ui/test_repl_integration.py
+++ b/tests/ui/test_repl_integration.py
@@ -449,6 +449,375 @@ def test_swap_session_refreshes_session_name_and_renders_banner():
     repl.console.print.assert_called_once_with("banner")
 
 
+def test_swap_session_marks_completed_cleanup_prompt(tmp_path: Path):
+    from iac_code.agent.message import Message
+    from iac_code.pipeline.engine.cleanup import (
+        CleanupLedger,
+        CleanupResource,
+        create_cleanup_prompt_message,
+    )
+    from iac_code.services.session_storage import SessionStorage
+    from iac_code.ui.repl import InlineREPL
+
+    cwd = str(tmp_path / "repo")
+    Path(cwd).mkdir()
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    new_session_id = "new-session"  # session the REPL is swapped to
+    ledger = CleanupLedger(storage.session_dir(cwd, new_session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-deleted",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None  # precondition: the ledger yields a prompt at this point
+    storage.append(  # persist the cleanup prompt message with status "pending"
+        cwd,
+        new_session_id,
+        create_cleanup_prompt_message(cleanup_prompt.prompt, cleanup_ledger_path=ledger.path, cleanup_status="pending"),
+    )
+    storage.append(cwd, new_session_id, Message(role="assistant", content="cleanup finished"))
+    ledger.update_resource(  # after the prompt was stored, the ledger records the resource as completed
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-deleted",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; collaborators are stubbed by hand below
+    repl._original_cwd = cwd
+    repl._session_id = "old-session"
+    repl._session_storage = storage
+    repl._agent_loop = SimpleNamespace(replace_session=Mock())
+    repl._load_current_session_name = Mock(return_value=None)
+    repl._load_pipeline_display_replay_model = Mock(return_value=None)
+    repl.current_git_branch = Mock(return_value="main")
+    repl.store = SimpleNamespace(get_state=Mock(return_value=SimpleNamespace(model="test-model", cwd=cwd)))
+    repl.console = SimpleNamespace(file=SimpleNamespace(write=Mock(), flush=Mock()), print=Mock())
+    repl.renderer = SimpleNamespace(replay_history=Mock())
+
+    repl.swap_session(new_session_id)
+
+    messages = storage.load(cwd, new_session_id)  # re-read what is persisted after the swap
+    cleanup_messages = [message for message in messages if message.metadata.get("type") == "pipeline_cleanup_prompt"]
+    assert cleanup_messages[0].metadata["cleanupStatus"] == "completed"  # stored status is no longer "pending"
+
+
+def test_swap_session_prints_cleanup_resume_summary(tmp_path: Path):
+    from iac_code.agent.message import Message
+    from iac_code.pipeline.engine.cleanup import (
+        CleanupLedger,
+        CleanupResource,
+        create_cleanup_prompt_message,
+    )
+    from iac_code.services.session_storage import SessionStorage
+    from iac_code.ui.repl import InlineREPL
+
+    cwd = str(tmp_path / "repo")
+    Path(cwd).mkdir()
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    new_session_id = "new-session"  # session the REPL is swapped to
+    ledger = CleanupLedger(storage.session_dir(cwd, new_session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-deleted",
+                resource_name="demo-stack",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None  # precondition: the ledger yields a prompt at this point
+    storage.append(  # persist the cleanup prompt message with status "pending"
+        cwd,
+        new_session_id,
+        create_cleanup_prompt_message(cleanup_prompt.prompt, cleanup_ledger_path=ledger.path, cleanup_status="pending"),
+    )
+    storage.append(cwd, new_session_id, Message(role="assistant", content="cleanup finished"))
+    ledger.update_resource(  # the single tracked resource is recorded as completed
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-deleted",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; collaborators are stubbed by hand below
+    repl._original_cwd = cwd
+    repl._session_id = "old-session"
+    repl._session_storage = storage
+    repl._agent_loop = SimpleNamespace(replace_session=Mock())
+    repl._load_current_session_name = Mock(return_value=None)
+    repl._load_pipeline_display_replay_model = Mock(return_value=None)
+    repl.current_git_branch = Mock(return_value="main")
+    repl.store = SimpleNamespace(get_state=Mock(return_value=SimpleNamespace(model="test-model", cwd=cwd)))
+    repl.console = SimpleNamespace(file=SimpleNamespace(write=Mock(), flush=Mock()), print=Mock())
+    repl.renderer = SimpleNamespace(replay_history=Mock(), print_system_message=Mock())
+
+    repl.swap_session(new_session_id)
+
+    rendered = "\n".join(call.args[0] for call in repl.renderer.print_system_message.call_args_list)
+    assert "↺ Rollback cleanup resume: all 1 records are completed." in rendered  # one-line summary
+    assert "Rollback cleanup [Completed] demo-stack" not in rendered  # per-resource line is absent
+    assert "stack-deleted" not in rendered  # resource id is not printed
+    assert "status=" not in rendered  # no raw key=value fields in the output
+    assert "progress=" not in rendered
+    replayed = repl.renderer.replay_history.call_args.args[0]  # messages handed to the renderer for replay
+    assert all(message.metadata.get("type") != "pipeline_cleanup_prompt" for message in replayed)
+
+
+def test_swap_session_prints_cleanup_resume_summary_for_completed_prompt(tmp_path: Path):
+    from iac_code.agent.message import Message
+    from iac_code.pipeline.engine.cleanup import (
+        CleanupLedger,
+        CleanupResource,
+        create_cleanup_prompt_message,
+    )
+    from iac_code.services.session_storage import SessionStorage
+    from iac_code.ui.repl import InlineREPL
+
+    cwd = str(tmp_path / "repo")
+    Path(cwd).mkdir()
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    new_session_id = "new-session"  # session the REPL is swapped to
+    ledger = CleanupLedger(storage.session_dir(cwd, new_session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-deleted",
+                resource_name="demo-stack",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None  # precondition: the ledger yields a prompt at this point
+    storage.append(
+        cwd,
+        new_session_id,
+        create_cleanup_prompt_message(
+            cleanup_prompt.prompt,
+            cleanup_ledger_path=ledger.path,
+            cleanup_status="completed",  # the prompt is persisted as already completed
+        ),
+    )
+    storage.append(cwd, new_session_id, Message(role="assistant", content="cleanup finished"))
+    ledger.update_resource(  # the single tracked resource is recorded as completed
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-deleted",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; collaborators are stubbed by hand below
+    repl._original_cwd = cwd
+    repl._session_id = "old-session"
+    repl._session_storage = storage
+    repl._agent_loop = SimpleNamespace(replace_session=Mock())
+    repl._load_current_session_name = Mock(return_value=None)
+    repl._load_pipeline_display_replay_model = Mock(return_value=None)
+    repl.current_git_branch = Mock(return_value="main")
+    repl.store = SimpleNamespace(get_state=Mock(return_value=SimpleNamespace(model="test-model", cwd=cwd)))
+    repl.console = SimpleNamespace(file=SimpleNamespace(write=Mock(), flush=Mock()), print=Mock())
+    repl.renderer = SimpleNamespace(replay_history=Mock(), print_system_message=Mock())
+
+    repl.swap_session(new_session_id)
+
+    rendered = "\n".join(call.args[0] for call in repl.renderer.print_system_message.call_args_list)
+    assert "↺ Rollback cleanup resume: all 1 records are completed." in rendered  # summary is still printed
+    assert "Rollback cleanup [Completed] demo-stack" not in rendered  # per-resource line is absent
+    assert "DELETE_COMPLETE" not in rendered  # raw progress status is not printed
+
+
+def test_swap_session_prints_failed_cleanup_resume_summary(tmp_path: Path):
+    from iac_code.agent.message import Message
+    from iac_code.pipeline.engine.cleanup import (
+        CleanupLedger,
+        CleanupResource,
+        create_cleanup_prompt_message,
+    )
+    from iac_code.services.session_storage import SessionStorage
+    from iac_code.ui.repl import InlineREPL
+
+    cwd = str(tmp_path / "repo")
+    Path(cwd).mkdir()
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    new_session_id = "new-session"  # session the REPL is swapped to
+    ledger = CleanupLedger(storage.session_dir(cwd, new_session_id) / "pipeline" / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-failed",
+                resource_name="failed-stack",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None  # precondition: the ledger yields a prompt at this point
+    storage.append(  # persist the cleanup prompt message with status "pending"
+        cwd,
+        new_session_id,
+        create_cleanup_prompt_message(cleanup_prompt.prompt, cleanup_ledger_path=ledger.path, cleanup_status="pending"),
+    )
+    storage.append(cwd, new_session_id, Message(role="assistant", content="cleanup failed"))
+    ledger.update_resource(  # the single tracked resource is recorded as failed
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-failed",
+        region_id="cn-hangzhou",
+        cleanup_status="failed",
+        progress_status="DELETE_FAILED",
+        last_error="DELETE_FAILED: stack still has dependency",  # text the summary is expected to surface
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; collaborators are stubbed by hand below
+    repl._original_cwd = cwd
+    repl._session_id = "old-session"
+    repl._session_storage = storage
+    repl._agent_loop = SimpleNamespace(replace_session=Mock())
+    repl._load_current_session_name = Mock(return_value=None)
+    repl._load_pipeline_display_replay_model = Mock(return_value=None)
+    repl.current_git_branch = Mock(return_value="main")
+    repl.store = SimpleNamespace(get_state=Mock(return_value=SimpleNamespace(model="test-model", cwd=cwd)))
+    repl.console = SimpleNamespace(file=SimpleNamespace(write=Mock(), flush=Mock()), print=Mock())
+    repl.renderer = SimpleNamespace(replay_history=Mock(), print_system_message=Mock())
+
+    repl.swap_session(new_session_id)
+
+    rendered = "\n".join(call.args[0] for call in repl.renderer.print_system_message.call_args_list)
+    assert "↺ Rollback cleanup resume: 1 records, 1 failed." in rendered  # headline with counts
+    assert "  [Failed] failed-stack" in rendered  # failed record appears as an indented detail line
+    assert "↺ Rollback cleanup [Failed] failed-stack" not in rendered  # detail line has no headline prefix
+    assert "stack stack-failed · cn-hangzhou" in rendered  # resource type, id and region are shown
+    assert "DELETE_FAILED" in rendered
+    assert "dependency" in rendered  # part of last_error
+    assert "status=" not in rendered  # no raw key=value fields in the output
+    assert "progress=" not in rendered
+    replayed = repl.renderer.replay_history.call_args.args[0]  # messages handed to the renderer for replay
+    assert all(message.metadata.get("type") != "pipeline_cleanup_prompt" for message in replayed)
+
+
+def test_pipeline_visible_resume_messages_hides_pending_cleanup_prompt():
+    from iac_code.agent.message import Message
+    from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
+    from iac_code.ui.repl import InlineREPL
+
+    cleanup = create_cleanup_prompt_message("hidden cleanup prompt", cleanup_status="pending")
+    messages = [Message(role="user", content="visible"), cleanup, Message(role="assistant", content="answer")]
+
+    visible = InlineREPL._pipeline_visible_resume_messages(messages)  # called on the class, no instance needed
+
+    assert [message.content for message in visible] == ["visible", "answer"]  # order kept, prompt dropped
+
+
+def test_swap_session_clears_stale_cleanup_ledger_path_before_pruning(tmp_path: Path):
+    from iac_code.agent.message import Message
+    from iac_code.pipeline.engine.cleanup import (
+        CleanupLedger,
+        CleanupResource,
+        ObservedResource,
+        create_cleanup_prompt_message,
+    )
+    from iac_code.services.session_storage import SessionStorage
+    from iac_code.ui.repl import InlineREPL
+
+    cwd = str(tmp_path / "repo")
+    Path(cwd).mkdir()
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+
+    old_ledger = CleanupLedger(tmp_path / "old-cleanup.yaml")  # separate ledger used as the stale one
+    old_ledger.record_observed(
+        ObservedResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="old-stack",
+            region_id="cn-hangzhou",
+            observed_action="CreateStack",
+        )
+    )
+
+    new_session_id = "new-session"  # session the REPL is swapped to
+    new_ledger = CleanupLedger(storage.session_dir(cwd, new_session_id) / "pipeline" / "cleanup.yaml")
+    new_ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-deleted",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = new_ledger.build_pending_prompt()
+    assert cleanup_prompt is not None  # precondition: the new ledger yields a prompt at this point
+    storage.append(  # persist the cleanup prompt message with status "pending"
+        cwd,
+        new_session_id,
+        create_cleanup_prompt_message(
+            cleanup_prompt.prompt,
+            cleanup_ledger_path=new_ledger.path,
+            cleanup_status="pending",
+        ),
+    )
+    storage.append(cwd, new_session_id, Message(role="assistant", content="cleanup finished"))
+    new_ledger.update_resource(  # the new session's resource is recorded as completed
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-deleted",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; collaborators are stubbed by hand below
+    repl._original_cwd = cwd
+    repl._session_id = "old-session"
+    repl._pipeline_cleanup_ledger_path = old_ledger.path  # stale value the swap is expected to clear
+    repl._session_storage = storage
+    repl._agent_loop = SimpleNamespace(replace_session=Mock())
+    repl._load_current_session_name = Mock(return_value=None)
+    repl._load_pipeline_display_replay_model = Mock(return_value=None)
+    repl.current_git_branch = Mock(return_value="main")
+    repl.store = SimpleNamespace(get_state=Mock(return_value=SimpleNamespace(model="test-model", cwd=cwd)))
+    repl.console = SimpleNamespace(file=SimpleNamespace(write=Mock(), flush=Mock()), print=Mock())
+    repl.renderer = SimpleNamespace(replay_history=Mock())
+
+    repl.swap_session(new_session_id)
+
+    messages = storage.load(cwd, new_session_id)  # re-read what is persisted after the swap
+    cleanup_messages = [message for message in messages if message.metadata.get("type") == "pipeline_cleanup_prompt"]
+    assert cleanup_messages[0].metadata["cleanupStatus"] == "completed"  # status reflects the new ledger
+    assert not hasattr(repl, "_pipeline_cleanup_ledger_path")  # attribute is gone, not merely reassigned
+
+
 def test_swap_session_refreshes_session_trusted_read_directories(monkeypatch, tmp_path):
     from iac_code.state.app_state import AppState
     from iac_code.types.permissions import ToolPermissionContext
@@ -494,6 +863,7 @@ def test_swap_session_refreshes_session_trusted_read_directories(monkeypatch, tm
 
 def test_extract_last_user_text_skips_recalled_memory_message():
     from iac_code.agent.message import Message, create_recalled_memory_message
+    from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
     from iac_code.ui.repl import InlineREPL
 
     text = InlineREPL._extract_last_user_text(
@@ -501,6 +871,7 @@ def test_extract_last_user_text_skips_recalled_memory_message():
             Message(role="user", content="real prompt"),
             Message(role="assistant", content="answer"),
             create_recalled_memory_message("# Recalled Memory\nhidden prompt", ["topic.md"]),
+            create_cleanup_prompt_message("cleanup hidden prompt"),
         ]
     )
 
@@ -509,6 +880,7 @@ def test_extract_last_user_text_skips_recalled_memory_message():
 
 def test_history_search_messages_skips_recalled_memory_messages_and_leaked_entries():
     from iac_code.agent.message import RECALLED_MEMORY_MARKER, Message, create_recalled_memory_message
+    from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
     from iac_code.ui.repl import InlineREPL
 
     repl = InlineREPL.__new__(InlineREPL)
@@ -525,6 +897,7 @@ def test_history_search_messages_skips_recalled_memory_messages_and_leaked_entri
             get_messages=Mock(
                 return_value=[
                     create_recalled_memory_message("# Recalled Memory\nhidden context", ["topic.md"]),
+                    create_cleanup_prompt_message("cleanup hidden prompt"),
                     Message(role="user", content="context prompt"),
                 ]
             )
diff --git a/tests/ui/test_repl_parallel_auto_approve.py b/tests/ui/test_repl_parallel_auto_approve.py
index 98e4c43f..2ec2829c 100644
--- a/tests/ui/test_repl_parallel_auto_approve.py
+++ b/tests/ui/test_repl_parallel_auto_approve.py
@@ -292,6 +292,79 @@ async def stream():
         await asyncio.wait_for(repl._render_parallel_tabs(stream()), timeout=5.0)
 
 
+@pytest.mark.asyncio
+async def test_parallel_tabs_escape_interrupt_forwards_pipeline_user_input(monkeypatch, fake_live):
+    from iac_code.agent.message import ImageBlock, TextBlock
+    from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+    from iac_code.pipeline.engine.user_input import PipelineUserInput
+    from iac_code.ui.core.key_event import KeyEvent
+
+    image_input = PipelineUserInput(  # interrupt payload mixing a text block and an image block
+        content=[
+            TextBlock(text="change"),
+            ImageBlock(media_type="image/png", data="aGVsbG8="),
+        ],
+        display_text="change [Image #1]",
+        has_images=True,
+    )
+
+    repl = _make_repl(prompt_result=True)
+    repl._pipeline_waiting_input = False
+    repl._read_pipeline_interrupt_input = AsyncMock(return_value=image_input)
+    repl._handle_mid_pipeline_message = AsyncMock(return_value=(False, "feedback"))
+
+    pause_called = asyncio.Event()  # set as a side effect of pause_agent_loops being called
+    repl._pipeline.pause_agent_loops = MagicMock(side_effect=pause_called.set)
+    repl._pipeline.resume_agent_loops = MagicMock()
+
+    class FakeCapture:  # replaces RawInputCapture: yields one Escape key, then only None
+        def __init__(self, *args, **kwargs):
+            self._sent = False
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, *args):
+            return False
+
+        def read_key(self, timeout):
+            if self._sent:
+                if timeout:
+                    time.sleep(min(timeout, 0.05))  # bounded wait, at most 50 ms
+                return None
+            self._sent = True
+            return KeyEvent(key="escape", char="\x1b")
+
+    monkeypatch.setattr("iac_code.ui.core.raw_input.RawInputCapture", FakeCapture)
+
+    async def stream():
+        yield PipelineEvent(
+            type=PipelineEventType.SUB_PIPELINE_STARTED,
+            step_id=None,
+            timestamp=time.time(),
+            data={
+                "sub_pipeline_id": "sub_test_escape",
+                "candidate_index": 0,
+                "candidate_name": "方案1",
+                "total_steps": 1,
+                "sub_pipeline_name": "test",
+            },
+        )
+        await asyncio.wait_for(pause_called.wait(), timeout=1.0)  # hold the stream until the pause happens
+        yield PipelineEvent(
+            type=PipelineEventType.STEP_COMPLETED,
+            step_id=None,
+            timestamp=time.time(),
+            data={},
+        )
+
+    interrupted = await asyncio.wait_for(repl._render_parallel_tabs(stream()), timeout=5.0)
+
+    assert interrupted is False  # matches the False flag returned by the mocked message handler
+    repl._read_pipeline_interrupt_input.assert_awaited_once()
+    repl._handle_mid_pipeline_message.assert_awaited_once_with(image_input, suppress_render=True)
+
+
 @pytest.mark.asyncio
 async def test_parallel_permission_prompt_exception_denies_and_resumes_ui(fake_live, key_reader_tasks):
     repl = _make_repl(prompt_result=True)
diff --git a/tests/ui/test_repl_parallel_tabs_lifecycle.py b/tests/ui/test_repl_parallel_tabs_lifecycle.py
index eb985608..9f3e69b9 100644
--- a/tests/ui/test_repl_parallel_tabs_lifecycle.py
+++ b/tests/ui/test_repl_parallel_tabs_lifecycle.py
@@ -152,6 +152,97 @@ async def aclose(self):
     assert outer_idx < recur_idx, f"outer_aclose must come BEFORE recursive call, got order: {aclose_order!r}"
 
 
+@pytest.mark.asyncio
+async def test_candidate_selection_clears_waiting_flag_before_recursive_render(monkeypatch):
+    from io import StringIO
+
+    from rich.console import Console
+
+    from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+    from iac_code.types.stream_events import DiagramEvent
+    from iac_code.ui.core.key_event import KeyEvent
+    from iac_code.ui.repl import InlineREPL
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; collaborators are stubbed by hand below
+    repl.renderer = MagicMock()
+    repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
+    repl.store = MagicMock()
+    repl._pipeline_waiting_input = False
+    repl._render_interrupt_feedback_inline = MagicMock()
+    repl._render_pipeline_event = MagicMock()
+
+    recursive_waiting_flags: list[bool] = []  # flag value seen on each call of the fake stream renderer
+
+    async def fake_render_pipeline_stream(_stream):
+        recursive_waiting_flags.append(repl._pipeline_waiting_input)
+
+    repl._render_pipeline_stream = fake_render_pipeline_stream
+
+    pipeline = MagicMock()
+    pipeline.resume = MagicMock(return_value=MagicMock(name="new_stream_after_resume"))
+    pipeline.state_machine = MagicMock(is_complete=False)
+    pipeline.pause_agent_loops = MagicMock()
+    pipeline.resume_agent_loops = MagicMock()
+    repl._pipeline = pipeline
+
+    class FakeLive:  # no-op replacement patched in for iac_code.ui.repl.Live
+        def __init__(self, *args, **kwargs):
+            pass
+
+        def start(self):
+            pass
+
+        def stop(self):
+            pass
+
+        def update(self, *args, **kwargs):
+            pass
+
+    monkeypatch.setattr("iac_code.ui.repl.Live", FakeLive)
+
+    class FakeCapture:  # returns Enter once, and only after _pipeline_waiting_input becomes truthy
+        def __init__(self, *args, **kwargs):
+            self._fired = False
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, *args):
+            return False
+
+        def read_key(self, timeout):
+            if self._fired:
+                if timeout:
+                    time.sleep(min(timeout, 0.05))  # bounded wait, at most 50 ms
+                return None
+            deadline = time.time() + (timeout if timeout else 1.0)  # poll window; 1.0 s when timeout is falsy
+            while time.time() < deadline:
+                if repl._pipeline_waiting_input:
+                    self._fired = True
+                    return KeyEvent(key="enter", char="")
+                time.sleep(0.01)
+            return None
+
+    monkeypatch.setattr("iac_code.ui.core.raw_input.RawInputCapture", FakeCapture)
+
+    async def stream():
+        yield DiagramEvent(
+            candidate_name="c1",
+            template_content="ROSTemplateFormatVersion: '2015-09-01'",
+            mermaid_source="graph TD; A-->B",
+        )
+        yield PipelineEvent(
+            type=PipelineEventType.USER_INPUT_REQUIRED,
+            step_id="confirm_and_select",
+            timestamp=time.time(),
+            data={"options": [{"name": "c1"}]},
+        )
+
+    await asyncio.wait_for(repl._render_candidate_selection_tabs(stream()), timeout=5.0)
+
+    assert recursive_waiting_flags == [False]  # rendered exactly once, with the waiting flag already False
+
+
 @pytest.mark.asyncio
 async def test_user_input_required_escape_empty_input_returns_to_candidate_selection(monkeypatch):
     """ESC in candidate selection opens supplement input; empty ESC cancels back to selection."""
@@ -160,6 +251,7 @@ async def test_user_input_required_escape_empty_input_returns_to_candidate_selec
     from rich.console import Console
 
     from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+    from iac_code.pipeline.engine.user_input import PipelineUserInput
     from iac_code.types.stream_events import DiagramEvent
     from iac_code.ui.core.key_event import KeyEvent
     from iac_code.ui.repl import InlineREPL
@@ -169,6 +261,9 @@ async def test_user_input_required_escape_empty_input_returns_to_candidate_selec
     repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
     repl.store = MagicMock()
     repl._pipeline_waiting_input = False
+    repl._read_pipeline_interrupt_input = AsyncMock(
+        return_value=PipelineUserInput(content="", display_text="", has_images=False)
+    )
     repl._handle_mid_pipeline_message = AsyncMock(return_value=(False, ""))
     repl._render_pipeline_stream = AsyncMock()
 
@@ -207,7 +302,6 @@ def update(self, *args, **kwargs):
     key_events = deque(
         [
             ("key:escape:selection", KeyEvent(key="escape", char="\x1b")),
-            ("key:escape:input_cancel", KeyEvent(key="escape", char="\x1b")),
             ("key:enter:selection", KeyEvent(key="enter", char="")),
         ]
     )
@@ -253,14 +347,14 @@ async def stream():
     )
 
     repl._handle_mid_pipeline_message.assert_not_awaited()
+    repl._read_pipeline_interrupt_input.assert_awaited_once()
     pipeline.pause_agent_loops.assert_called()
     pipeline.resume_agent_loops.assert_called()
     pipeline.resume.assert_called_once()
     assert resumed_payloads == [{"selected_candidate_name": "c1", "selected_candidate_index": None}]
 
     assert events.index("key:escape:selection") < events.index("pause")
-    assert events.index("pause") < events.index("key:escape:input_cancel")
-    assert events.index("key:escape:input_cancel") < events.index("resume")
+    assert events.index("pause") < events.index("resume")
     assert events.index("resume") < events.index("key:enter:selection")
     assert events.index("key:enter:selection") < events.index("pipeline_resume")
 
@@ -272,6 +366,7 @@ async def test_user_input_required_hard_interrupt_clears_waiting_flag(monkeypatc
     from rich.console import Console
 
     from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+    from iac_code.pipeline.engine.user_input import PipelineUserInput
     from iac_code.types.stream_events import DiagramEvent
     from iac_code.ui.core.key_event import KeyEvent
     from iac_code.ui.repl import InlineREPL
@@ -281,6 +376,8 @@ async def test_user_input_required_hard_interrupt_clears_waiting_flag(monkeypatc
     repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
     repl.store = MagicMock()
     repl._pipeline_waiting_input = False
+    interrupt_input = PipelineUserInput(content="换", display_text="换", has_images=False)
+    repl._read_pipeline_interrupt_input = AsyncMock(return_value=interrupt_input)
     repl._handle_mid_pipeline_message = AsyncMock(return_value=(True, "已切换方案"))
     repl._render_interrupt_feedback_inline = MagicMock()
 
@@ -308,8 +405,6 @@ def update(self, *args, **kwargs):
     key_events = deque(
         [
             KeyEvent(key="escape", char="\x1b"),
-            KeyEvent(key="x", char="换"),
-            KeyEvent(key="enter", char=""),
         ]
     )
 
@@ -350,11 +445,110 @@ async def stream():
 
     assert result is True
     assert repl._pipeline_waiting_input is False
+    repl._handle_mid_pipeline_message.assert_awaited_once_with(interrupt_input, suppress_render=True)
     pipeline.resume.assert_not_called()
     pipeline.pause_agent_loops.assert_called()
     pipeline.resume_agent_loops.assert_called()
 
 
+@pytest.mark.asyncio
+async def test_user_input_required_escape_interrupt_forwards_pipeline_user_input(monkeypatch):
+    from io import StringIO
+
+    from rich.console import Console
+
+    from iac_code.agent.message import ImageBlock, TextBlock
+    from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+    from iac_code.pipeline.engine.user_input import PipelineUserInput
+    from iac_code.types.stream_events import DiagramEvent
+    from iac_code.ui.core.key_event import KeyEvent
+    from iac_code.ui.repl import InlineREPL
+
+    image_input = PipelineUserInput(
+        content=[
+            TextBlock(text="change"),
+            ImageBlock(media_type="image/png", data="aGVsbG8="),
+        ],
+        display_text="change [Image #1]",
+        has_images=True,
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)
+    repl.renderer = MagicMock()
+    repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
+    repl.store = MagicMock()
+    repl._pipeline_waiting_input = False
+    repl._read_pipeline_interrupt_input = AsyncMock(return_value=image_input)
+    repl._handle_mid_pipeline_message = AsyncMock(return_value=(False, "feedback"))
+    repl._render_pipeline_stream = AsyncMock()
+
+    pipeline = MagicMock()
+    pipeline.resume = MagicMock(return_value=MagicMock(name="resumed_stream_after_selection"))
+    pipeline.pause_agent_loops = MagicMock()
+    pipeline.resume_agent_loops = MagicMock()
+    repl._pipeline = pipeline
+
+    class FakeLive:
+        def __init__(self, *args, **kwargs):
+            pass
+
+        def start(self):
+            pass
+
+        def stop(self):
+            pass
+
+        def update(self, *args, **kwargs):
+            pass
+
+    monkeypatch.setattr("iac_code.ui.repl.Live", FakeLive)
+
+    key_events = deque(
+        [
+            KeyEvent(key="escape", char="\x1b"),
+            KeyEvent(key="enter", char=""),
+        ]
+    )
+
+    class FakeCapture:
+        def __init__(self, *args, **kwargs):
+            pass
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, *args):
+            return False
+
+        def read_key(self, timeout):
+            deadline = time.time() + (timeout if timeout else 1.0)
+            while time.time() < deadline:
+                if repl._pipeline_waiting_input and key_events:
+                    return key_events.popleft()
+                time.sleep(0.01)
+            return None
+
+    monkeypatch.setattr("iac_code.ui.core.raw_input.RawInputCapture", FakeCapture)
+
+    async def stream():
+        yield DiagramEvent(
+            candidate_name="c1",
+            template_content="ROSTemplateFormatVersion: '2015-09-01'",
+            mermaid_source="graph TD; A-->B",
+        )
+        yield PipelineEvent(
+            type=PipelineEventType.USER_INPUT_REQUIRED,
+            step_id=None,
+            timestamp=time.time(),
+            data={"candidates": [{"name": "c1"}]},
+        )
+
+    await asyncio.wait_for(repl._render_candidate_selection_tabs(stream()), timeout=5.0)
+
+    repl._read_pipeline_interrupt_input.assert_awaited_once()
+    repl._handle_mid_pipeline_message.assert_awaited_once_with(image_input, suppress_render=True)
+
+
 @pytest.mark.asyncio
 async def test_user_input_required_ctrl_c_cancels_candidate_selection(monkeypatch):
     """Ctrl+C inside the candidate-selection UI should abort the pipeline,
diff --git a/tests/ui/test_repl_pipeline_handoff.py b/tests/ui/test_repl_pipeline_handoff.py
index e2cc4684..a8513d82 100644
--- a/tests/ui/test_repl_pipeline_handoff.py
+++ b/tests/ui/test_repl_pipeline_handoff.py
@@ -6,7 +6,7 @@
 import time
 from io import StringIO
 from pathlib import Path
-from unittest.mock import AsyncMock, MagicMock
+from unittest.mock import AsyncMock, MagicMock, call
 
 import pytest
 import yaml
@@ -14,7 +14,16 @@
 
 from iac_code.agent.message import Message
 from iac_code.pipeline.config import RunMode
+from iac_code.pipeline.engine.cleanup import (
+    CLEANUP_PROMPT_METADATA_TYPE,
+    CleanupLedger,
+    CleanupResource,
+    ObservedResource,
+    create_cleanup_prompt_message,
+)
 from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+from iac_code.pipeline.engine.user_input import PipelineUserInput
+from iac_code.types.stream_events import StackProgressEvent, ToolResultEvent, ToolUseEndEvent
 
 
 async def _empty_stream():
@@ -31,6 +40,18 @@ def _pipeline_completed_event(**data) -> PipelineEvent:
     )
 
 
+def _pipeline_persistence_failure_event(step_id: str) -> PipelineEvent:
+    return PipelineEvent(
+        type=PipelineEventType.STEP_FAILED,
+        step_id=step_id,
+        timestamp=time.time(),
+        data={
+            "error": "Pipeline state persistence failed.",
+            "error_details": {"type": "PipelineStatePersistenceError"},
+        },
+    )
+
+
 def _make_repl_for_handoff(
     terminal_event: PipelineEvent,
     *,
@@ -280,7 +301,12 @@ async def test_completed_pipeline_handoff_switches_to_normal_and_clears_state():
         injected,
         git_branch="main",
     )
-    pipeline.mark_normal_handoff.assert_called_once_with(status="succeeded", failed_reason=None)
+    pipeline.mark_normal_handoff.assert_has_calls(
+        [
+            call(status="pending", failed_reason=None),
+            call(status="succeeded", failed_reason=None),
+        ]
+    )
     pipeline.clear_sidecar.assert_not_called()
     pipeline.mark_user_aborted.assert_not_called()
     assert repl._pipeline is None
@@ -288,176 +314,1635 @@ async def test_completed_pipeline_handoff_switches_to_normal_and_clears_state():
 
 
 @pytest.mark.asyncio
-async def test_early_exit_handoff_clears_incomplete_state_without_user_abort():
-    terminal_event = _pipeline_completed_event(early_exit=True)
-    repl, pipeline, _injected = _make_repl_for_handoff(
-        terminal_event,
-        should_switch_to_normal=True,
-        is_complete=False,
+async def test_completed_pipeline_handoff_starts_hidden_cleanup_prompt(tmp_path: Path):
+    terminal_event = _pipeline_completed_event()
+    repl, pipeline, _injected = _make_repl_for_handoff(terminal_event, should_switch_to_normal=True)
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    observed = ObservedResource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        resource_name="demo",
+        region_id="cn-hangzhou",
+        source_step_id="deploying",
+        source_attempt_id="att_0001",
+        observed_action="CreateStack",
+    )
+    ledger.mark_cleanup_required(
+        [CleanupResource.from_observed(observed, reason="rollback")],
+        source_step_id="deploying",
+        reason="rollback",
     )
+    pipeline.cleanup_ledger = MagicMock(return_value=ledger)
 
-    await repl._handle_pipeline_chat("start")
+    def add_raw_message(raw):
+        return Message(role=raw["role"], content=raw["content"], metadata=raw.get("metadata", {}))
 
-    assert repl._runtime_mode == RunMode.NORMAL
-    pipeline.mark_normal_handoff.assert_called_once_with(status="succeeded", failed_reason=None)
-    pipeline.clear_sidecar.assert_not_called()
-    pipeline.mark_user_aborted.assert_not_called()
-    assert repl._pipeline is None
-    assert repl._pipeline_waiting_input is False
+    repl._agent_loop.context_manager.add_raw_message.side_effect = add_raw_message
 
+    async def cleanup_stream():
+        yield ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="ros_stack",
+            input={"action": "DeleteStack", "region_id": "cn-hangzhou", "params": {"StackId": "stack-123"}},
+        )
+        yield ToolResultEvent(
+            tool_use_id="toolu-delete",
+            tool_name="ros_stack",
+            result='{"stack_id":"stack-123","status":"DELETE_COMPLETE","is_success":true}',
+            is_error=False,
+        )
 
-@pytest.mark.asyncio
-async def test_failed_terminal_event_does_not_handoff_and_failed_cleanup_remains():
-    terminal_event = _pipeline_completed_event(failed=True)
-    repl, pipeline, _injected = _make_repl_for_handoff(
-        terminal_event,
-        should_switch_to_normal=False,
-        is_complete=False,
-        sidecar_status="failed",
-    )
+    repl._agent_loop.continue_streaming = MagicMock(return_value=cleanup_stream())
+
+    async def consume_cleanup_events(events, **_kwargs):
+        async for _event in events:
+            pass
+        return (0.0, [], "")
+
+    repl.renderer.run_streaming_output = AsyncMock(side_effect=consume_cleanup_events)
+    repl._normalize_streaming_output_result = MagicMock(return_value=(0.0, [], ""))
 
     await repl._handle_pipeline_chat("start")
 
-    assert repl._runtime_mode == RunMode.PIPELINE
-    repl._agent_loop.context_manager.add_raw_message.assert_not_called()
-    repl._session_storage.append.assert_not_called()
-    pipeline.clear_sidecar.assert_not_called()
-    pipeline.mark_normal_handoff.assert_not_called()
-    pipeline.mark_user_aborted.assert_not_called()
-    assert repl._pipeline is None
-    assert repl._pipeline_waiting_input is False
+    repl.renderer.print_system_message.assert_any_call(
+        "\nDetected 1 rollback cleanup resources; starting cleanup.",
+        style="yellow",
+    )
+    raw_cleanup_call = repl._agent_loop.context_manager.add_raw_message.call_args_list[-1].args[0]
+    assert raw_cleanup_call["role"] == "user"
+    assert raw_cleanup_call["metadata"]["type"] == CLEANUP_PROMPT_METADATA_TYPE
+    assert "stack-123" in raw_cleanup_call["content"]
+    repl.renderer.record_user_turn.assert_called_once_with("start")
+    repl.renderer.run_streaming_output.assert_awaited_once()
+    assert ledger.cleanup_resources()[0].cleanup_status == "completed"
 
 
-@pytest.mark.asyncio
-async def test_handoff_injection_failure_still_switches_to_normal_and_preserves_sidecar():
-    terminal_event = _pipeline_completed_event()
-    repl, pipeline, _injected = _make_repl_for_handoff(terminal_event, should_switch_to_normal=True)
-    repl._agent_loop.context_manager.add_raw_message.side_effect = RuntimeError("context unavailable")
+def test_cleanup_resource_status_message_is_single_line_badge_style() -> None:
+    from iac_code.ui.repl import InlineREPL
 
-    await repl._handle_pipeline_chat("start")
+    resource = CleanupResource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="9b124deb-1ef2-46b1-8375-de8b76df2660",
+        resource_name="basic-vpc-network",
+        region_id="cn-hangzhou",
+        cleanup_status="in_progress",
+        progress_status="CREATE_COMPLETE",
+    )
 
-    assert repl._runtime_mode == RunMode.NORMAL
-    repl._session_storage.append.assert_not_called()
-    repl.renderer.print_system_message.assert_called()
-    pipeline.mark_normal_handoff.assert_called_once_with(
-        status="failed",
-        failed_reason="context unavailable",
+    message = InlineREPL._cleanup_resource_status_message(resource)
+
+    assert message == (
+        "↺ Rollback cleanup [Checking] basic-vpc-network · stack 9b124deb…2660 · "
+        "cn-hangzhou · CREATE_COMPLETE; deletion required"
     )
-    pipeline.clear_sidecar.assert_not_called()
-    pipeline.mark_user_aborted.assert_not_called()
-    pipeline.resume.assert_called_once_with("start")
-    pipeline.run.assert_not_called()
-    assert repl._pipeline is None
-    assert repl._pipeline_waiting_input is False
+    assert "\n" not in message
+    assert "status=" not in message
+    assert "progress=" not in message
 
 
 @pytest.mark.asyncio
-async def test_handoff_persistence_failure_still_switches_to_normal_and_preserves_sidecar():
-    terminal_event = _pipeline_completed_event()
-    repl, pipeline, _injected = _make_repl_for_handoff(terminal_event, should_switch_to_normal=True)
-    repl._session_storage.append.side_effect = RuntimeError("disk unavailable")
+async def test_normal_resume_continues_existing_cleanup_prompt_without_duplicate(tmp_path: Path):
+    from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
+    from iac_code.ui.repl import InlineREPL
 
-    await repl._handle_pipeline_chat("start")
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                cleanup_status="in_progress",
+                progress_status="DELETE_REQUESTED",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None
 
-    assert repl._runtime_mode == RunMode.NORMAL
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl.renderer._last_streaming_errors = []
+    repl.store = MagicMock()
+    repl._session_storage = MagicMock()
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._streaming_error_log = []
+
+    existing_prompt_message = create_cleanup_prompt_message(cleanup_prompt.prompt)
+    repl._session_storage.load.return_value = [existing_prompt_message]
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[existing_prompt_message])
+    repl._agent_loop.context_manager.add_raw_message = MagicMock()
+
+    async def cleanup_stream():
+        yield ToolUseEndEvent(
+            tool_use_id="toolu-get",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "GetStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+        yield ToolResultEvent(
+            tool_use_id="toolu-get",
+            tool_name="aliyun_api",
+            result='{"Stack":{"StackId":"stack-123","StackStatus":"DELETE_COMPLETE"}}',
+            is_error=False,
+        )
+
+    repl._agent_loop.continue_streaming = MagicMock(return_value=cleanup_stream())
+
+    async def consume_cleanup_events(events, **_kwargs):
+        async for _event in events:
+            pass
+        return (0.0, [], "")
+
+    repl.renderer.run_streaming_output = AsyncMock(side_effect=consume_cleanup_events)
+    repl._normalize_streaming_output_result = MagicMock(return_value=(0.0, [], ""))
+
+    assert await repl._maybe_start_normal_chat_cleanup_on_startup() is True
+
+    repl.renderer.print_system_message.assert_any_call(
+        "\nDetected 1 rollback cleanup resources; starting cleanup.",
+        style="yellow",
+    )
+    assert any(
+        "DELETE_COMPLETE" in call.args[0] and call.kwargs.get("style") == "green"
+        for call in repl.renderer.print_system_message.call_args_list
+    )
     repl._agent_loop.context_manager.add_raw_message.assert_called_once()
-    repl.renderer.print_system_message.assert_called()
-    pipeline.mark_normal_handoff.assert_called_once_with(
-        status="failed",
-        failed_reason="disk unavailable",
+    repl._session_storage.append.assert_not_called()
+    assert ledger.cleanup_resources()[0].cleanup_status == "completed"
+
+
+def test_normal_chat_finds_cleanup_ledger_from_prompt_metadata(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None
+    cleanup_message = create_cleanup_prompt_message(
+        cleanup_prompt.prompt,
+        cleanup_ledger_path=ledger.path,
+        cleanup_status="pending",
     )
-    pipeline.clear_sidecar.assert_not_called()
-    pipeline.mark_user_aborted.assert_not_called()
-    assert repl._pipeline is None
-    assert repl._pipeline_waiting_input is False
 
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = [cleanup_message]
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[])
 
-@pytest.mark.asyncio
-async def test_outer_stream_returns_candidate_selection_terminal_event():
+    restored = repl._cleanup_ledger_for_normal_chat()
+
+    assert restored is not None
+    assert restored.path == ledger.path
+
+
+def test_normal_chat_ignores_observed_only_cleanup_ledger(tmp_path: Path):
     from iac_code.ui.repl import InlineREPL
 
-    terminal_event = _pipeline_completed_event()
+    session_dir = tmp_path / "session"
+    ledger = CleanupLedger(session_dir / "pipeline" / "cleanup.yaml")
+    ledger.record_observed(
+        ObservedResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-success",
+            region_id="cn-hangzhou",
+            observed_action="CreateStack",
+            source_step_id="deploying",
+        )
+    )
+
     repl = InlineREPL.__new__(InlineREPL)
-    repl._pipeline = MagicMock()
-    repl._pipeline_step_names = []
-    repl._pipeline_completed_indices = set()
-    repl._update_pipeline_state_from_event = MagicMock()
-    repl._render_pipeline_event = MagicMock()
-    repl._render_candidate_selection_tabs = AsyncMock(return_value=terminal_event)
-    repl._restart_pipeline_stream_after_interrupt = AsyncMock(return_value=_empty_stream())
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = []
+    repl._session_storage.session_dir.return_value = session_dir
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[])
 
-    async def stream():
-        yield PipelineEvent(
-            type=PipelineEventType.STEP_STARTED,
-            step_id="select",
-            timestamp=time.time(),
-            data={"index": 1, "total": 1, "ui_mode": "candidate_selection"},
+    assert repl._cleanup_ledger_for_normal_chat() is None
+
+
+def test_normal_chat_ignores_observed_only_explicit_cleanup_ledger(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.record_observed(
+        ObservedResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-success",
+            region_id="cn-hangzhou",
+            observed_action="CreateStack",
+            source_step_id="deploying",
         )
+    )
 
-    result = await repl._render_pipeline_stream(stream())
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = []
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[])
 
-    assert result is terminal_event
-    repl._restart_pipeline_stream_after_interrupt.assert_not_awaited()
+    assert repl._cleanup_ledger_for_normal_chat() is None
+    assert not hasattr(repl, "_pipeline_cleanup_ledger_path")
 
 
-@pytest.mark.asyncio
-async def test_outer_stream_returns_parallel_tabs_terminal_event():
+def test_normal_chat_fallback_continues_past_observed_only_cleanup_ledger(monkeypatch, tmp_path: Path):
     from iac_code.ui.repl import InlineREPL
 
-    terminal_event = _pipeline_completed_event()
+    pipeline_cwd = "/pipeline-workspace"
+    original_cwd = "/workspace"
+    session_id = "session-1"
+    pipeline_dir = tmp_path / "pipeline-session"
+    original_dir = tmp_path / "original-session"
+    observed_ledger = CleanupLedger(pipeline_dir / "pipeline" / "cleanup.yaml")
+    observed_ledger.record_observed(
+        ObservedResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-success",
+            region_id="cn-hangzhou",
+            observed_action="CreateStack",
+            source_step_id="deploying",
+        )
+    )
+    pending_ledger = CleanupLedger(original_dir / "pipeline" / "cleanup.yaml")
+    pending_ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-leftover",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    monkeypatch.setattr("iac_code.pipeline.config.get_working_directory", lambda: pipeline_cwd)
+
     repl = InlineREPL.__new__(InlineREPL)
-    repl._pipeline = MagicMock()
-    repl._pipeline_step_names = []
-    repl._pipeline_completed_indices = set()
-    repl._update_pipeline_state_from_event = MagicMock()
-    repl._render_pipeline_event = MagicMock()
-    repl._render_parallel_tabs = AsyncMock(return_value=terminal_event)
-    repl._restart_pipeline_stream_after_interrupt = AsyncMock(return_value=_empty_stream())
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = []
+    repl._session_storage.session_dir.side_effect = lambda cwd, _session_id: (
+        pipeline_dir if cwd == pipeline_cwd else original_dir
+    )
+    repl._original_cwd = original_cwd
+    repl._session_id = session_id
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[])
 
-    async def stream():
-        yield PipelineEvent(
-            type=PipelineEventType.STEP_STARTED,
-            step_id="parallel",
-            timestamp=time.time(),
-            data={
-                "index": 1,
-                "total": 1,
-                "ui_mode": "default",
-                "step_type": "parallel_sub_pipeline",
-            },
+    restored = repl._cleanup_ledger_for_normal_chat()
+
+    assert restored is not None
+    assert restored.path == pending_ledger.path
+
+
+def test_normal_chat_legacy_prompt_prefers_pending_ledger_across_cwds(monkeypatch, tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    pipeline_cwd = "/pipeline-workspace"
+    original_cwd = "/workspace"
+    session_id = "session-1"
+    pipeline_dir = tmp_path / "pipeline-session"
+    original_dir = tmp_path / "original-session"
+    observed_ledger = CleanupLedger(pipeline_dir / "pipeline" / "cleanup.yaml")
+    observed_ledger.record_observed(
+        ObservedResource(
+            provider="ros",
+            resource_type="stack",
+            resource_id="stack-success",
+            region_id="cn-hangzhou",
+            observed_action="CreateStack",
+            source_step_id="deploying",
         )
+    )
+    pending_ledger = CleanupLedger(original_dir / "pipeline" / "cleanup.yaml")
+    pending_ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-leftover",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    legacy_prompt = create_cleanup_prompt_message("legacy cleanup prompt without ledger path")
+    monkeypatch.setattr("iac_code.pipeline.config.get_working_directory", lambda: pipeline_cwd)
 
-    result = await repl._render_pipeline_stream(stream())
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = [legacy_prompt]
+    repl._session_storage.session_dir.side_effect = lambda cwd, _session_id: (
+        pipeline_dir if cwd == pipeline_cwd else original_dir
+    )
+    repl._original_cwd = original_cwd
+    repl._session_id = session_id
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[])
 
-    assert result is terminal_event
-    repl._restart_pipeline_stream_after_interrupt.assert_not_awaited()
+    restored = repl._cleanup_ledger_for_normal_chat()
+
+    assert restored is not None
+    assert restored.path == pending_ledger.path
 
 
 @pytest.mark.asyncio
-async def test_render_parallel_tabs_returns_consumed_pipeline_completed_event(monkeypatch):
+async def test_cleanup_start_persists_prompt_when_runtime_has_prompt_but_session_does_not(tmp_path: Path):
     from iac_code.ui.repl import InlineREPL
 
-    terminal_event = _pipeline_completed_event()
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                cleanup_status="in_progress",
+                progress_status="DELETE_REQUESTED",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = ledger.build_pending_prompt()
+    assert cleanup_prompt is not None
+    existing_prompt_message = create_cleanup_prompt_message(cleanup_prompt.prompt)
+
     repl = InlineREPL.__new__(InlineREPL)
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
     repl.renderer = MagicMock()
-    repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
-    repl._pipeline = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl.renderer._last_streaming_errors = []
+    repl.store = MagicMock()
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = []
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._streaming_error_log = []
 
-    class FakeLive:
-        def start(self):
-            pass
+    injected = create_cleanup_prompt_message(cleanup_prompt.prompt)
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[existing_prompt_message])
+    repl._agent_loop.context_manager.add_raw_message = MagicMock(return_value=injected)
+    repl._agent_loop.continue_streaming = MagicMock(return_value=_empty_stream())
 
-        def stop(self):
+    async def consume_cleanup_events(events, **_kwargs):
+        async for _event in events:
             pass
+        return (0.0, [], "")
 
-        def update(self, *args, **kwargs):
-            pass
+    repl.renderer.run_streaming_output = AsyncMock(side_effect=consume_cleanup_events)
+    repl._normalize_streaming_output_result = MagicMock(return_value=(0.0, [], ""))
 
-    monkeypatch.setattr(InlineREPL, "_create_parallel_live", lambda self: FakeLive(), raising=False)
+    assert await repl._start_pipeline_cleanup_from_ledger(ledger) is True
 
-    async def stream():
-        yield terminal_event
+    repl._session_storage.append.assert_called_once_with(
+        "/workspace",
+        "session-1",
+        injected,
+        git_branch="main",
+    )
 
-    result = await repl._render_parallel_tabs(stream())
 
-    assert result is terminal_event
+@pytest.mark.asyncio
+async def test_normal_startup_prunes_completed_cleanup_prompt(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                cleanup_status="completed",
+                progress_status="DELETE_COMPLETE",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(return_value=1)
+
+    assert await repl._maybe_start_normal_chat_cleanup_on_startup() is False
+
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages.assert_called_once_with()
+
+
+@pytest.mark.asyncio
+async def test_normal_startup_replays_completed_cleanup_history_before_pruning(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                resource_name="demo",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-123",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(return_value=1)
+
+    assert await repl._maybe_start_normal_chat_cleanup_on_startup() is False
+
+    rendered = "\n".join(call.args[0] for call in repl.renderer.print_system_message.call_args_list)
+    assert "↺ Rollback cleanup resume: all 1 records are completed." in rendered
+    assert "Rollback cleanup [Completed] demo" not in rendered
+    assert "stack stack-123 · cn-hangzhou" not in rendered
+    assert "status=" not in rendered
+    assert "progress=" not in rendered
+
+
+def test_cleanup_resume_summary_collapses_history_to_latest_resource_state(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")  # ledger file lives under pytest's tmp dir
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-1234567890",
+                resource_name="demo-stack",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    ledger.update_resource(  # first of three successive updates to the same stack
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-1234567890",
+        region_id="cn-hangzhou",
+        cleanup_status="started",
+        progress_status="DELETE_STARTED",
+    )
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-1234567890",
+        region_id="cn-hangzhou",
+        cleanup_status="in_progress",
+        progress_status="DELETE_IN_PROGRESS",
+    )
+    ledger.update_resource(  # last update; the assertions below expect only this state to be shown
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-1234567890",
+        region_id="cn-hangzhou",
+        cleanup_status="failed",
+        progress_status="DELETE_FAILED",
+        last_error="DELETE_FAILED",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()  # captures every printed summary line
+
+    repl._print_cleanup_resume_summary()
+
+    rendered = "\n".join(call.args[0] for call in repl.renderer.print_system_message.call_args_list)
+    assert "↺ Rollback cleanup resume: 1 records, 1 failed." in rendered  # stack is counted once
+    assert rendered.count("  [Failed] demo-stack") == 1  # exactly one indented detail line
+    assert "↺ Rollback cleanup [Failed] demo-stack" not in rendered  # no per-resource "↺" line
+    assert "  [Deleting] demo-stack" not in rendered  # presumably the label of the earlier in_progress state
+    assert "DELETE_FAILED" in rendered
+
+
+def test_cleanup_resume_summary_collapses_completed_resources_and_indents_actionable_details(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(  # three stacks; each gets a different final status below
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-completed",
+                resource_name="completed-stack",
+                region_id="cn-hangzhou",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-failed",
+                resource_name="failed-stack",
+                region_id="cn-hangzhou",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-running",
+                resource_name="running-stack",
+                region_id="cn-hangzhou",
+            ),
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-completed",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-failed",
+        region_id="cn-hangzhou",
+        cleanup_status="failed",
+        progress_status="DELETE_FAILED",
+        last_error="DELETE_FAILED",
+    )
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-running",
+        region_id="cn-hangzhou",
+        cleanup_status="in_progress",
+        progress_status="DELETE_IN_PROGRESS",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+
+    repl._print_cleanup_resume_summary()
+
+    calls = repl.renderer.print_system_message.call_args_list
+    assert calls[0].args[0] == "↺ Rollback cleanup resume: 3 records, 1 failed, 1 in progress, 1 completed."
+    assert calls[0].kwargs["style"] == "yellow"  # the header is the first printed message
+    assert not any("completed-stack" in call.args[0] for call in calls[1:])  # no detail line names it
+    assert any("  [Failed] failed-stack" in call.args[0] and call.kwargs["style"] == "red" for call in calls)
+    assert any("  [Deleting] running-stack" in call.args[0] and call.kwargs["style"] == "yellow" for call in calls)
+
+
+def test_cleanup_resume_summary_shows_only_pending_detail_when_completed_resources_exist(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-completed-1",
+                resource_name="completed-one",
+                region_id="cn-hangzhou",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-completed-2",
+                resource_name="completed-two",
+                region_id="cn-hangzhou",
+            ),
+            CleanupResource(  # never updated below, so it keeps its initial status
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-pending",
+                resource_name="pending-stack",
+                region_id="cn-hangzhou",
+            ),
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-completed-1",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-completed-2",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+
+    repl._print_cleanup_resume_summary()
+
+    calls = repl.renderer.print_system_message.call_args_list
+    rendered = "\n".join(call.args[0] for call in calls)  # all printed messages, one per line
+    assert calls[0].args[0] == "↺ Rollback cleanup resume: 3 records, 1 pending, 2 completed."
+    assert rendered.count("  [Pending] pending-stack") == 1  # exactly one detail line
+    assert "completed-one" not in rendered  # completed stacks appear only in the header count
+    assert "completed-two" not in rendered
+
+
+@pytest.mark.asyncio
+async def test_completed_cleanup_marks_session_prompt_completed(tmp_path: Path):
+    from iac_code.services.session_storage import SessionStorage
+    from iac_code.ui.repl import InlineREPL
+
+    cwd = str(tmp_path / "workspace")
+    session_id = "session-1"
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                cleanup_status="completed",  # the only resource is registered as already completed
+                progress_status="DELETE_COMPLETE",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    cleanup_prompt = create_cleanup_prompt_message(  # copy persisted to session storage
+        "cleanup prompt for stack-123",
+        cleanup_ledger_path=ledger.path,
+        cleanup_status="pending",
+    )
+    storage = SessionStorage(projects_dir=tmp_path / "projects")
+    storage.append(cwd, session_id, cleanup_prompt, git_branch="main")
+    runtime_prompt = create_cleanup_prompt_message(  # separate object returned by the mocked context
+        "cleanup prompt for stack-123",
+        cleanup_ledger_path=ledger.path,
+        cleanup_status="pending",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl._session_storage = storage
+    repl._original_cwd = cwd
+    repl._session_id = session_id
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[runtime_prompt])
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(return_value=1)
+
+    assert await repl._maybe_start_normal_chat_cleanup_on_startup() is False
+
+    loaded = storage.load(cwd, session_id)  # re-read what was persisted
+    assert loaded[0].metadata["cleanupStatus"] == "completed"  # stored prompt flipped from "pending"
+    assert runtime_prompt.metadata["cleanupStatus"] == "completed"  # in-memory prompt flipped too
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages.assert_called_once_with()
+
+
+@pytest.mark.asyncio
+async def test_normal_startup_keeps_cleanup_prompt_when_cleanup_ledger_is_corrupt(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated "[" stands in for a corrupt ledger
+    ledger = CleanupLedger(path)
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(return_value=1)
+
+    assert await repl._maybe_start_normal_chat_cleanup_on_startup() is False
+
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages.assert_not_called()  # prompt kept
+    repl.renderer.print_system_message.assert_called_once()  # exactly one message is printed
+
+
+@pytest.mark.asyncio
+async def test_cleanup_observer_does_not_mutate_corrupt_ledger_or_prune_prompt(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated "[" stands in for a corrupt ledger
+    ledger = CleanupLedger(path)
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(return_value=1)
+
+    async def events():  # single DeleteStack tool-use event fed to the observer
+        yield ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "DeleteStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+
+    async for _event in repl._wrap_cleanup_observer(events(), ledger=ledger):  # drain the wrapped stream
+        pass
+    repl._prune_cleanup_prompts_if_no_pending_cleanup(ledger)
+
+    assert path.exists()  # the corrupt file is still in place
+    assert not list(tmp_path.glob("cleanup.yaml.corrupt*"))  # and no "cleanup.yaml.corrupt*" file was created
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages.assert_not_called()
+
+
+@pytest.mark.asyncio
+async def test_normal_chat_blocks_agent_execution_when_cleanup_ledger_is_corrupt_with_prompt(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    path = tmp_path / "cleanup.yaml"
+    path.write_text("[broken", encoding="utf-8")  # unterminated "[" stands in for a corrupt ledger
+    cleanup_message = create_cleanup_prompt_message("cleanup prompt for stack-123")
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[cleanup_message])
+    repl._agent_loop.run_streaming = MagicMock()
+
+    assert await repl._handle_chat("hello") == []  # the chat call returns an empty list
+
+    repl._agent_loop.run_streaming.assert_not_called()  # the user prompt never reaches the agent
+    repl.renderer.print_system_message.assert_called_once()  # exactly one message is printed
+
+
+@pytest.mark.asyncio
+async def test_normal_chat_blocks_agent_execution_when_cleanup_ledger_is_missing_with_prompt(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    cleanup_message = create_cleanup_prompt_message("cleanup prompt for stack-123")
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = tmp_path / "missing-cleanup.yaml"  # this file is never created
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = [cleanup_message]
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl._streaming_draft_input = ""  # starts empty so the final assertion proves it was written
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(return_value=[cleanup_message])
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock()
+    repl._agent_loop.run_streaming = MagicMock()
+
+    assert await repl._handle_chat("hello") == []
+
+    repl._agent_loop.run_streaming.assert_not_called()  # the user prompt never reaches the agent
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages.assert_not_called()  # prompt kept
+    repl.renderer.print_system_message.assert_called_once()
+    assert repl._streaming_draft_input == "hello"  # the typed text is kept as the draft input
+
+
+@pytest.mark.asyncio
+async def test_normal_chat_runs_pending_cleanup_before_user_prompt(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                cleanup_status="in_progress",  # registered mid-cleanup, i.e. not yet completed
+                progress_status="DELETE_REQUESTED",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    calls: list[object] = []  # records the order in which the two agent-loop entry points run
+    messages: list[Message] = []  # stand-in for the context manager's message list
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl.renderer.record_user_turn = MagicMock()
+    repl.renderer._last_streaming_errors = []
+    repl.store = MagicMock()
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = []
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._streaming_error_log = []
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(side_effect=lambda: messages)
+
+    def add_raw_message(raw):  # mirrors a raw dict into `messages` as a Message
+        message = Message(role=raw["role"], content=raw["content"], metadata=raw.get("metadata", {}))
+        messages.append(message)
+        return message
+
+    repl._agent_loop.context_manager.add_raw_message = MagicMock(side_effect=add_raw_message)
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(
+        side_effect=lambda: messages.clear() or 0  # list.clear() returns None, so the lambda yields 0
+    )
+
+    async def cleanup_stream():  # one progress event reporting the stack as deleted
+        yield StackProgressEvent(
+            stack_id="stack-123",
+            stack_name="demo",
+            status="DELETE_COMPLETE",
+            progress_percentage=100,
+            elapsed_seconds=1.0,
+            resources=[],
+        )
+
+    async def user_stream():
+        if False:  # unreachable yield: makes this an async generator that produces nothing
+            yield None
+
+    def continue_streaming():
+        calls.append("cleanup")
+        return cleanup_stream()
+
+    def run_streaming(prompt, **_kwargs):
+        calls.append(("user", prompt))
+        return user_stream()
+
+    repl._agent_loop.continue_streaming = MagicMock(side_effect=continue_streaming)
+    repl._agent_loop.run_streaming = MagicMock(side_effect=run_streaming)
+
+    async def consume_events(events, **_kwargs):  # drains the stream in place of real rendering
+        async for _event in events:
+            pass
+        return (0.0, [], "")
+
+    repl.renderer.run_streaming_output = AsyncMock(side_effect=consume_events)
+    repl._normalize_streaming_output_result = MagicMock(return_value=(0.0, [], ""))
+
+    assert await repl._handle_chat("please continue") == []
+
+    assert calls == ["cleanup", ("user", "please continue")]  # cleanup ran first, then the user prompt
+    repl.renderer.record_user_turn.assert_called_once_with("please continue")
+    assert ledger.pending_resources() == []  # nothing is left pending after the DELETE_COMPLETE event
+
+
+@pytest.mark.asyncio
+async def test_cleanup_observer_prints_status_transitions_and_persists_history(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                resource_name="demo",
+                region_id="cn-hangzhou",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+
+    async def cleanup_events():  # DeleteStack call + result, then GetStack call + result
+        yield ToolUseEndEvent(
+            tool_use_id="toolu-delete",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "DeleteStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+        yield ToolResultEvent(
+            tool_use_id="toolu-delete",  # same id as the DeleteStack tool use above
+            tool_name="aliyun_api",
+            result='{"RequestId":"req-1"}',
+            is_error=False,
+        )
+        yield ToolUseEndEvent(
+            tool_use_id="toolu-get",
+            name="aliyun_api",
+            input={
+                "product": "ros",
+                "action": "GetStack",
+                "region_id": "cn-hangzhou",
+                "params": {"StackId": "stack-123"},
+            },
+        )
+        yield ToolResultEvent(
+            tool_use_id="toolu-get",  # same id as the GetStack tool use above
+            tool_name="aliyun_api",
+            result='{"StackId":"stack-123","Status":"DELETE_COMPLETE"}',
+            is_error=False,
+        )
+
+    async for _event in repl._wrap_cleanup_observer(cleanup_events(), ledger=ledger):  # drain the wrapped stream
+        pass
+
+    rendered = "\n".join(call.args[0] for call in repl.renderer.print_system_message.call_args_list)
+    assert "stack-123" in rendered
+    assert "DELETE_STARTED" in rendered  # each of these three statuses must appear in the printed text
+    assert "DELETE_REQUESTED" in rendered
+    assert "DELETE_COMPLETE" in rendered
+
+    history_types = [entry["type"] for entry in ledger._load()["history"]]  # reads via the private loader
+    assert history_types == [  # exact order of the persisted history entries
+        "cleanup_required",
+        "cleanup_started",
+        "cleanup_progress",
+        "cleanup_completed",
+    ]
+
+
+@pytest.mark.asyncio
+async def test_normal_chat_preserves_user_prompt_when_cleanup_remains_pending(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-123",
+                region_id="cn-hangzhou",
+                cleanup_status="in_progress",  # registered mid-cleanup, i.e. not yet completed
+                progress_status="DELETE_REQUESTED",
+            )
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    messages: list[Message] = []  # stand-in for the context manager's message list
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl.renderer.record_user_turn = MagicMock()
+    repl.renderer._last_streaming_errors = []
+    repl.store = MagicMock()
+    repl._session_storage = MagicMock()
+    repl._session_storage.load.return_value = []
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._streaming_error_log = []
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(side_effect=lambda: messages)
+
+    def add_raw_message(raw):  # mirrors a raw dict into `messages` as a Message
+        message = Message(role=raw["role"], content=raw["content"], metadata=raw.get("metadata", {}))
+        messages.append(message)
+        return message
+
+    repl._agent_loop.context_manager.add_raw_message = MagicMock(side_effect=add_raw_message)
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(
+        side_effect=lambda: messages.clear() or 0  # list.clear() returns None, so the lambda yields 0
+    )
+    repl._agent_loop.continue_streaming = MagicMock(return_value=_empty_stream())  # presumably yields no events
+    repl._agent_loop.run_streaming = MagicMock()
+
+    async def consume_events(events, **_kwargs):  # drains the stream in place of real rendering
+        async for _event in events:
+            pass
+        return (0.0, [], "")
+
+    repl.renderer.run_streaming_output = AsyncMock(side_effect=consume_events)
+    repl._normalize_streaming_output_result = MagicMock(return_value=(0.0, [], ""))
+
+    assert await repl._handle_chat("please continue") == []
+
+    repl._agent_loop.continue_streaming.assert_called_once()  # the cleanup turn was attempted
+    repl._agent_loop.run_streaming.assert_not_called()  # the user prompt was not sent to the agent
+    repl.renderer.record_user_turn.assert_not_called()
+    assert repl._streaming_draft_input == "please continue"  # attribute is not set by this test's setup
+    assert ledger.pending_resources()  # the stack is still pending afterwards
+
+
+@pytest.mark.asyncio
+async def test_pipeline_cleanup_start_replaces_stale_runtime_cleanup_prompt(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-done",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-pending",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            ),
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    stale_prompt = ledger.build_pending_prompt()  # built before "stack-done" is marked completed
+    assert stale_prompt is not None
+    messages = [create_cleanup_prompt_message(stale_prompt.prompt)]  # context starts with the stale prompt
+    ledger.update_resource(  # from here on the stale prompt no longer matches the ledger
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-done",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl.renderer._last_streaming_errors = []
+    repl.store = MagicMock()
+    repl._session_storage = MagicMock()
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._streaming_error_log = []
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(side_effect=lambda: messages)
+
+    def add_raw_message(raw):  # mirrors a raw dict into `messages` as a Message
+        message = Message(role=raw["role"], content=raw["content"], metadata=raw.get("metadata", {}))
+        messages.append(message)
+        return message
+
+    def remove_cleanup_prompt_messages():  # empties `messages` and reports how many were dropped
+        removed = len(messages)
+        messages.clear()
+        return removed
+
+    repl._agent_loop.context_manager.add_raw_message = MagicMock(side_effect=add_raw_message)
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(
+        side_effect=remove_cleanup_prompt_messages
+    )
+
+    async def empty_stream():
+        if False:  # unreachable yield: makes this an async generator that produces nothing
+            yield None
+
+    repl._agent_loop.continue_streaming = MagicMock(return_value=empty_stream())
+
+    async def consume_cleanup_events(events, **_kwargs):  # drains the stream in place of real rendering
+        async for _event in events:
+            pass
+        return (0.0, [], "")
+
+    repl.renderer.run_streaming_output = AsyncMock(side_effect=consume_cleanup_events)
+    repl._normalize_streaming_output_result = MagicMock(return_value=(0.0, [], ""))
+
+    assert await repl._start_pipeline_cleanup_from_ledger(ledger) is True
+
+    cleanup_messages = [message for message in messages if message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE]
+    assert len(cleanup_messages) == 1  # exactly one cleanup prompt is left in the context
+    assert "stack-pending" in cleanup_messages[0].content  # it names the still-pending stack
+    assert "stack-done" not in cleanup_messages[0].content  # and not the completed one
+
+
+@pytest.mark.asyncio
+async def test_pipeline_cleanup_start_removes_stale_prompt_even_when_latest_prompt_exists(tmp_path: Path):
+    from iac_code.ui.repl import InlineREPL
+
+    ledger = CleanupLedger(tmp_path / "cleanup.yaml")
+    ledger.mark_cleanup_required(
+        [
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-done",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            ),
+            CleanupResource(
+                provider="ros",
+                resource_type="stack",
+                resource_id="stack-pending",
+                region_id="cn-hangzhou",
+                source_step_id="deploying",
+            ),
+        ],
+        source_step_id="deploying",
+        reason="rollback",
+    )
+    stale_prompt = ledger.build_pending_prompt()  # built before "stack-done" is marked completed
+    assert stale_prompt is not None
+    stale_message = create_cleanup_prompt_message(stale_prompt.prompt)
+    ledger.update_resource(
+        provider="ros",
+        resource_type="stack",
+        resource_id="stack-done",
+        region_id="cn-hangzhou",
+        cleanup_status="completed",
+        progress_status="DELETE_COMPLETE",
+    )
+    latest_prompt = ledger.build_pending_prompt()  # built after the update, from the current ledger
+    assert latest_prompt is not None
+    latest_message = create_cleanup_prompt_message(latest_prompt.prompt)
+    messages = [stale_message, latest_message]  # context starts with both prompts present
+
+    repl = InlineREPL.__new__(InlineREPL)  # skip __init__; only the attributes set below exist
+    repl._runtime_mode = RunMode.NORMAL
+    repl._pipeline_cleanup_ledger_path = ledger.path
+    repl.renderer = MagicMock()
+    repl.renderer.print_system_message = MagicMock()
+    repl.renderer._last_streaming_errors = []
+    repl.store = MagicMock()
+    repl._session_storage = MagicMock()
+    repl._original_cwd = "/workspace"
+    repl._session_id = "session-1"
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._streaming_error_log = []
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.get_messages = MagicMock(side_effect=lambda: messages)
+
+    def add_raw_message(raw):  # mirrors a raw dict into `messages` as a Message
+        message = Message(role=raw["role"], content=raw["content"], metadata=raw.get("metadata", {}))
+        messages.append(message)
+        return message
+
+    def remove_cleanup_prompt_messages():  # empties `messages` and reports how many were dropped
+        removed = len(messages)
+        messages.clear()
+        return removed
+
+    repl._agent_loop.context_manager.add_raw_message = MagicMock(side_effect=add_raw_message)
+    repl._agent_loop.context_manager.remove_cleanup_prompt_messages = MagicMock(
+        side_effect=remove_cleanup_prompt_messages
+    )
+
+    async def empty_stream():
+        if False:  # unreachable yield: makes this an async generator that produces nothing
+            yield None
+
+    repl._agent_loop.continue_streaming = MagicMock(return_value=empty_stream())
+
+    async def consume_cleanup_events(events, **_kwargs):  # drains the stream in place of real rendering
+        async for _event in events:
+            pass
+        return (0.0, [], "")
+
+    repl.renderer.run_streaming_output = AsyncMock(side_effect=consume_cleanup_events)
+    repl._normalize_streaming_output_result = MagicMock(return_value=(0.0, [], ""))
+
+    assert await repl._start_pipeline_cleanup_from_ledger(ledger) is True
+
+    cleanup_messages = [message for message in messages if message.metadata.get("type") == CLEANUP_PROMPT_METADATA_TYPE]
+    assert len(cleanup_messages) == 1  # the stale duplicate is gone; one prompt remains
+    assert cleanup_messages[0].content == latest_prompt.prompt  # and it carries the latest prompt text
+
+
+@pytest.mark.asyncio
+async def test_early_exit_handoff_clears_incomplete_state_without_user_abort():
+    terminal_event = _pipeline_completed_event(early_exit=True)  # helper defined elsewhere in this file
+    repl, pipeline, _injected = _make_repl_for_handoff(
+        terminal_event,
+        should_switch_to_normal=True,
+        is_complete=False,  # the pipeline is set up as not complete
+    )
+
+    await repl._handle_pipeline_chat("start")
+
+    assert repl._runtime_mode == RunMode.NORMAL  # the REPL ends up in normal mode
+    pipeline.mark_normal_handoff.assert_has_calls(  # ordered: "pending" first, then "succeeded"
+        [
+            call(status="pending", failed_reason=None),
+            call(status="succeeded", failed_reason=None),
+        ]
+    )
+    pipeline.clear_sidecar.assert_not_called()
+    pipeline.mark_user_aborted.assert_not_called()  # early exit is not recorded as a user abort
+    assert repl._pipeline is None  # the pipeline reference is dropped
+    assert repl._pipeline_waiting_input is False
+
+
+@pytest.mark.asyncio
+async def test_failed_terminal_event_does_not_handoff_and_failed_cleanup_remains():
+    terminal_event = _pipeline_completed_event(failed=True)  # helper defined elsewhere in this file
+    repl, pipeline, _injected = _make_repl_for_handoff(
+        terminal_event,
+        should_switch_to_normal=False,
+        is_complete=False,
+        sidecar_status="failed",
+    )
+
+    await repl._handle_pipeline_chat("start")
+
+    assert repl._runtime_mode == RunMode.PIPELINE  # the REPL stays in pipeline mode
+    repl._agent_loop.context_manager.add_raw_message.assert_not_called()  # nothing is added to the context
+    repl._session_storage.append.assert_not_called()  # and nothing is appended to session storage
+    pipeline.clear_sidecar.assert_not_called()
+    pipeline.mark_normal_handoff.assert_not_called()  # no handoff status is recorded at all
+    pipeline.mark_user_aborted.assert_not_called()
+    assert repl._pipeline is None  # the pipeline reference is still dropped
+    assert repl._pipeline_waiting_input is False
+
+
+@pytest.mark.asyncio
+async def test_handoff_injection_failure_still_switches_to_normal_and_preserves_sidecar():
+    terminal_event = _pipeline_completed_event()  # helper defined elsewhere in this file
+    repl, pipeline, _injected = _make_repl_for_handoff(terminal_event, should_switch_to_normal=True)
+    repl._agent_loop.context_manager.add_raw_message.side_effect = RuntimeError("context unavailable")
+
+    await repl._handle_pipeline_chat("start")
+
+    assert repl._runtime_mode == RunMode.NORMAL  # the mode still switches despite the injected error
+    repl._session_storage.append.assert_not_called()  # nothing is appended once add_raw_message raises
+    repl.renderer.print_system_message.assert_called()  # at least one message is printed
+    pipeline.mark_normal_handoff.assert_has_calls(  # ordered: "pending" first, then "failed"
+        [
+            call(status="pending", failed_reason=None),
+            call(status="failed", failed_reason="context unavailable"),  # reason is the exception text
+        ]
+    )
+    pipeline.clear_sidecar.assert_not_called()  # the sidecar is left in place
+    pipeline.mark_user_aborted.assert_not_called()
+    pipeline.resume.assert_called_once_with(PipelineUserInput(content="start", display_text="start", has_images=False))
+    pipeline.run.assert_not_called()  # the pipeline is resumed, never run
+    assert repl._pipeline is None
+    assert repl._pipeline_waiting_input is False
+
+
+@pytest.mark.asyncio
+async def test_handoff_summary_append_failure_still_switches_to_normal_and_preserves_sidecar():
+    terminal_event = _pipeline_completed_event()  # helper defined elsewhere in this file
+    repl, pipeline, _injected = _make_repl_for_handoff(terminal_event, should_switch_to_normal=True)
+    repl._session_storage.append.side_effect = RuntimeError("disk unavailable")  # storage write fails
+
+    await repl._handle_pipeline_chat("start")
+
+    assert repl._runtime_mode == RunMode.NORMAL  # the mode still switches despite the injected error
+    repl._agent_loop.context_manager.add_raw_message.assert_called_once()  # the context was written once
+    repl.renderer.print_system_message.assert_called()  # at least one message is printed
+    pipeline.mark_normal_handoff.assert_has_calls(  # ordered: "pending" first, then "failed"
+        [
+            call(status="pending", failed_reason=None),
+            call(status="failed", failed_reason="disk unavailable"),  # reason is the exception text
+        ]
+    )
+    pipeline.clear_sidecar.assert_not_called()  # the sidecar is left in place
+    pipeline.mark_user_aborted.assert_not_called()
+    assert repl._pipeline is None
+    assert repl._pipeline_waiting_input is False
+
+
+@pytest.mark.asyncio
+async def test_outer_stream_returns_candidate_selection_terminal_event():
+    """``_render_pipeline_stream`` hands back the event returned by the candidate-selection renderer."""
+    from iac_code.ui.repl import InlineREPL
+
+    completed = _pipeline_completed_event()
+    repl = InlineREPL.__new__(InlineREPL)  # bypass __init__; instance state is set by hand below
+    repl._render_candidate_selection_tabs = AsyncMock(return_value=completed)
+    repl._restart_pipeline_stream_after_interrupt = AsyncMock(return_value=_empty_stream())
+    repl._update_pipeline_state_from_event = MagicMock()
+    repl._render_pipeline_event = MagicMock()
+    repl._pipeline = MagicMock()
+    repl._pipeline_completed_indices = set()
+    repl._pipeline_step_names = []
+
+    async def candidate_step_stream():
+        yield PipelineEvent(
+            type=PipelineEventType.STEP_STARTED,
+            step_id="select",
+            timestamp=time.time(),
+            data={"index": 1, "total": 1, "ui_mode": "candidate_selection"},
+        )
+
+    returned = await repl._render_pipeline_stream(candidate_step_stream())
+    assert returned is completed
+    repl._restart_pipeline_stream_after_interrupt.assert_not_awaited()
+
+
+@pytest.mark.asyncio
+async def test_outer_stream_returns_parallel_tabs_terminal_event():
+    """``_render_pipeline_stream`` hands back the event returned by the parallel-tabs renderer."""
+    from iac_code.ui.repl import InlineREPL
+
+    completed = _pipeline_completed_event()
+    repl = InlineREPL.__new__(InlineREPL)  # bypass __init__; instance state is set by hand below
+    repl._render_parallel_tabs = AsyncMock(return_value=completed)
+    repl._restart_pipeline_stream_after_interrupt = AsyncMock(return_value=_empty_stream())
+    repl._update_pipeline_state_from_event = MagicMock()
+    repl._render_pipeline_event = MagicMock()
+    repl._pipeline = MagicMock()
+    repl._pipeline_completed_indices = set()
+    repl._pipeline_step_names = []
+
+    async def parallel_step_stream():
+        yield PipelineEvent(
+            type=PipelineEventType.STEP_STARTED,
+            step_id="parallel",
+            timestamp=time.time(),
+            data={
+                "index": 1,
+                "total": 1,
+                "ui_mode": "default",
+                "step_type": "parallel_sub_pipeline",
+            },
+        )
+
+    returned = await repl._render_pipeline_stream(parallel_step_stream())
+    assert returned is completed
+    repl._restart_pipeline_stream_after_interrupt.assert_not_awaited()
+
+
+@pytest.mark.asyncio
+async def test_outer_stream_returns_candidate_selection_persistence_failure_without_marking_completed():
+    """Candidate-selection persistence failure is returned as-is and marks no step completed."""
+    from iac_code.ui.repl import InlineREPL
+
+    persistence_failure = _pipeline_persistence_failure_event("select")
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._render_candidate_selection_tabs = AsyncMock(return_value=persistence_failure)
+    repl._restart_pipeline_stream_after_interrupt = AsyncMock(return_value=_empty_stream())
+    repl._update_pipeline_state_from_event = InlineREPL._update_pipeline_state_from_event.__get__(repl)
+    repl._render_pipeline_event = MagicMock()
+    repl._pipeline = MagicMock()
+    repl._pipeline_completed_indices = set()
+    repl._pipeline_step_names = []
+
+    async def started_then_select_stream():
+        yield PipelineEvent(
+            type=PipelineEventType.PIPELINE_STARTED,
+            step_id=None,
+            timestamp=time.time(),
+            data={"step_names": ["select"]},
+        )
+        yield PipelineEvent(
+            type=PipelineEventType.STEP_STARTED,
+            step_id="select",
+            timestamp=time.time(),
+            data={"index": 1, "total": 1, "ui_mode": "candidate_selection"},
+        )
+
+    returned = await repl._render_pipeline_stream(started_then_select_stream())
+    assert returned is persistence_failure
+    assert repl._pipeline_completed_indices == set()
+
+
+@pytest.mark.asyncio
+async def test_outer_stream_returns_parallel_tabs_persistence_failure_without_marking_completed():
+    """Parallel-tabs persistence failure is returned as-is and marks no step completed."""
+    from iac_code.ui.repl import InlineREPL
+
+    persistence_failure = _pipeline_persistence_failure_event("parallel")
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._render_parallel_tabs = AsyncMock(return_value=persistence_failure)
+    repl._restart_pipeline_stream_after_interrupt = AsyncMock(return_value=_empty_stream())
+    repl._update_pipeline_state_from_event = InlineREPL._update_pipeline_state_from_event.__get__(repl)
+    repl._render_pipeline_event = MagicMock()
+    repl._pipeline = MagicMock()
+    repl._pipeline_completed_indices = set()
+    repl._pipeline_step_names = []
+
+    async def started_then_parallel_stream():
+        yield PipelineEvent(
+            type=PipelineEventType.PIPELINE_STARTED,
+            step_id=None,
+            timestamp=time.time(),
+            data={"step_names": ["parallel"]},
+        )
+        yield PipelineEvent(
+            type=PipelineEventType.STEP_STARTED,
+            step_id="parallel",
+            timestamp=time.time(),
+            data={
+                "index": 1,
+                "total": 1,
+                "ui_mode": "default",
+                "step_type": "parallel_sub_pipeline",
+            },
+        )
+
+    returned = await repl._render_pipeline_stream(started_then_parallel_stream())
+    assert returned is persistence_failure
+    assert repl._pipeline_completed_indices == set()
+
+
+@pytest.mark.asyncio
+async def test_render_parallel_tabs_returns_consumed_pipeline_completed_event(monkeypatch):
+    """``_render_parallel_tabs`` returns the terminal event it read from the stream."""
+    from iac_code.ui.repl import InlineREPL
+
+    completed = _pipeline_completed_event()
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._pipeline = MagicMock()
+    repl.renderer = MagicMock()
+    repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
+
+    class SilentLive:  # no-op object handed out by the patched _create_parallel_live
+        def start(self):
+            return None
+
+        def stop(self):
+            return None
+
+        def update(self, *args, **kwargs):
+            return None
+
+    monkeypatch.setattr(InlineREPL, "_create_parallel_live", lambda self: SilentLive(), raising=False)
+
+    async def terminal_only_stream():
+        yield completed
+
+    returned = await repl._render_parallel_tabs(terminal_only_stream())
+    assert returned is completed
+
+
+@pytest.mark.asyncio
+async def test_render_candidate_selection_tabs_returns_consumed_persistence_failure_event(monkeypatch):
+    """The candidate-selection renderer returns the persistence failure and sets the failure flag."""
+    from iac_code.ui.repl import InlineREPL
+
+    persistence_failure = _pipeline_persistence_failure_event("select")
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._pipeline = MagicMock()
+    repl._pipeline_display_recorder = None
+    repl._pipeline_state_persistence_failed = False
+    repl._pipeline_waiting_input = False
+    repl.renderer = MagicMock()
+    repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
+
+    class SilentLive:  # no-op replacement patched in for iac_code.ui.repl.Live
+        def __init__(self, *args, **kwargs):
+            return None
+
+        def start(self):
+            return None
+
+        def stop(self):
+            return None
+
+        def update(self, *args, **kwargs):
+            return None
+
+    class KeylessCapture:  # context manager whose read_key always returns None
+        def __init__(self, *args, **kwargs):
+            return None
+
+        def __enter__(self):
+            return self
+
+        def __exit__(self, *args):
+            return False
+
+        def read_key(self, timeout):
+            return None
+
+    monkeypatch.setattr("iac_code.ui.core.raw_input.RawInputCapture", KeylessCapture)
+    monkeypatch.setattr("iac_code.ui.repl.Live", SilentLive)
+
+    async def failure_only_stream():
+        yield persistence_failure
+
+    returned = await repl._render_candidate_selection_tabs(failure_only_stream())
+    assert returned is persistence_failure
+    assert repl._pipeline_state_persistence_failed is True
+
+
+@pytest.mark.asyncio
+async def test_render_parallel_tabs_returns_consumed_persistence_failure_event(monkeypatch):
+    """``_render_parallel_tabs`` returns the persistence failure and sets the failure flag."""
+    from iac_code.ui.repl import InlineREPL
+
+    persistence_failure = _pipeline_persistence_failure_event("parallel")
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._pipeline = MagicMock()
+    repl._pipeline_display_recorder = None
+    repl._pipeline_state_persistence_failed = False
+    repl.renderer = MagicMock()
+    repl.renderer.console = Console(file=StringIO(), width=120, force_terminal=True)
+
+    class SilentLive:  # no-op object handed out by the patched _create_parallel_live
+        def start(self):
+            return None
+
+        def stop(self):
+            return None
+
+        def update(self, *args, **kwargs):
+            return None
+
+    monkeypatch.setattr(InlineREPL, "_create_parallel_live", lambda self: SilentLive(), raising=False)
+
+    async def failure_only_stream():
+        yield persistence_failure
+
+    returned = await repl._render_parallel_tabs(failure_only_stream())
+    assert returned is persistence_failure
+    assert repl._pipeline_state_persistence_failed is True
diff --git a/tests/ui/test_repl_pipeline_image_warning.py b/tests/ui/test_repl_pipeline_image_warning.py
index 6e14fff1..45c28653 100644
--- a/tests/ui/test_repl_pipeline_image_warning.py
+++ b/tests/ui/test_repl_pipeline_image_warning.py
@@ -1,64 +1,141 @@
-"""U-I4: pipeline mode must warn before dropping pasted images."""
+"""Pipeline REPL input should preserve image blocks while keeping text-only feedback."""
 
 from __future__ import annotations
 
+from io import StringIO
 from unittest.mock import AsyncMock, MagicMock
 
 import pytest
+from rich.console import Console
 
+from iac_code.agent.message import ImageBlock, TextBlock
 from iac_code.pipeline.config import RunMode
+from iac_code.pipeline.engine.interrupt import InterruptVerdict
+from iac_code.pipeline.engine.user_input import PipelineUserInput
 from iac_code.ui.core.prompt_input import PromptInputResult
 from iac_code.utils.image.pasted_content import PastedContent
 
 
-@pytest.mark.asyncio
-async def test_pipeline_mode_warns_when_pasted_image_present(monkeypatch):
-    """Image in pasted_contents should trigger a yellow print_system_message before drop."""
-    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
-
+def _image_prompt(text: str = "describe [Image #1]") -> PromptInputResult:
     pc = PastedContent(id=1, type="image", content="iVBORw0KGgo=", media_type="image/png")
-    user_input = PromptInputResult(text="describe this image", pasted_contents={1: pc})
+    return PromptInputResult(text=text, pasted_contents={1: pc})  # one pasted image/png entry, keyed by id 1
 
+
+@pytest.mark.asyncio
+async def test_pipeline_prompt_input_forwards_image_blocks() -> None:
     from iac_code.ui.repl import InlineREPL
 
     repl = InlineREPL.__new__(InlineREPL)
     repl._runtime_mode = RunMode.PIPELINE
-    repl.renderer = MagicMock()
     repl._handle_pipeline_chat = AsyncMock()
 
-    await repl._handle_chat(user_input)
+    await repl._handle_chat(_image_prompt())  # prompt text plus one pasted image
 
-    # Verify the warning went to renderer.print_system_message (consistent with
-    # other image warnings at repl.py:2250, 2258, 2275).
-    repl.renderer.print_system_message.assert_called_once()
-    call = repl.renderer.print_system_message.call_args
-    # First positional arg is the message (or `msg` kwarg).
-    msg_arg = call.args[0] if call.args else call.kwargs.get("msg") or call.kwargs.get("message")
-    assert msg_arg is not None, f"could not extract message from call: {call!r}"
-    assert "image" in msg_arg.lower(), f"image warning text missing: {msg_arg!r}"
-    # Style must be yellow.
-    assert call.kwargs.get("style") == "yellow", f"expected style='yellow', got {call.kwargs!r}"
-
-    # Pipeline handler still invoked (warning is non-blocking).
     repl._handle_pipeline_chat.assert_awaited_once()
+    pipeline_input = repl._handle_pipeline_chat.await_args.args[0]  # first positional arg of the awaited call
+    assert isinstance(pipeline_input, PipelineUserInput)
+    assert pipeline_input.display_text == "describe [Image #1]"
+    assert pipeline_input.has_images is True
+    assert isinstance(pipeline_input.content, list)
+    assert any(isinstance(block, ImageBlock) for block in pipeline_input.content)
+    assert any(isinstance(block, TextBlock) for block in pipeline_input.content)
 
 
 @pytest.mark.asyncio
-async def test_pipeline_mode_no_warning_when_no_images(monkeypatch):
-    """Text-only pipeline input should NOT trigger the image warning."""
-    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
-
-    pc = PastedContent(id=1, type="text", content="some pasted text")
-    user_input = PromptInputResult(text="hi", pasted_contents={1: pc})
-
+async def test_pipeline_prompt_input_uses_plain_text_when_no_images() -> None:
     from iac_code.ui.repl import InlineREPL
 
     repl = InlineREPL.__new__(InlineREPL)
     repl._runtime_mode = RunMode.PIPELINE
-    repl.renderer = MagicMock()
     repl._handle_pipeline_chat = AsyncMock()
 
+    user_input = PromptInputResult(  # the only pasted item is text, so no image is involved
+        text="hi",
+        pasted_contents={1: PastedContent(id=1, type="text", content="some pasted text")},
+    )
     await repl._handle_chat(user_input)
 
-    repl.renderer.print_system_message.assert_not_called()
-    repl._handle_pipeline_chat.assert_awaited_once()
+    pipeline_input = repl._handle_pipeline_chat.await_args.args[0]  # first positional arg of the awaited call
+    assert isinstance(pipeline_input, PipelineUserInput)
+    assert pipeline_input.content == "hi"
+    assert pipeline_input.display_text == "hi"
+    assert pipeline_input.has_images is False
+
+
+def test_pipeline_visible_user_turn_persists_image_blocks_for_resume() -> None:
+    """The visible user turn keeps its text and image blocks and is appended to session storage."""
+    from iac_code.ui.repl import InlineREPL
+
+    stored_message = {"role": "user", "content": "visible"}
+    text_block = TextBlock(text="describe ")
+    image_block = ImageBlock(media_type="image/png", data="base64-bytes")
+    pipeline_input = PipelineUserInput(
+        content=[text_block, image_block],
+        display_text="describe [Image #1]",
+        has_images=True,
+    )
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._session_id = "session-1"
+    repl._original_cwd = "/tmp/project"
+    repl._session_storage = MagicMock()
+    repl.current_git_branch = MagicMock(return_value="branch")
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager.add_raw_message = MagicMock(return_value=stored_message)
+
+    repl._persist_pipeline_visible_user_turn(pipeline_input)
+
+    # The raw message handed to the context manager carries the blocks themselves.
+    raw_message = repl._agent_loop.context_manager.add_raw_message.call_args.args[0]
+    assert raw_message["role"] == "user"
+    raw_content = raw_message["content"]
+    assert isinstance(raw_content, list)
+    assert any(isinstance(block, TextBlock) for block in raw_content)
+    assert any(isinstance(block, ImageBlock) for block in raw_content)
+    # Storage receives whatever add_raw_message returned, not the raw input.
+    repl._session_storage.append.assert_called_once_with(
+        "/tmp/project", "session-1", stored_message, git_branch="branch"
+    )
+
+
+@pytest.mark.asyncio
+async def test_pipeline_mid_interrupt_forwards_image_blocks() -> None:
+    """A mid-pipeline message with a pasted image reaches the interrupt handler as content blocks."""
+    from iac_code.ui.repl import InlineREPL
+
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._pipeline = MagicMock()
+    repl._pipeline.handle_user_interrupt = AsyncMock(return_value=InterruptVerdict(action="continue", reason=""))
+    repl.console = Console(file=StringIO(), width=120, force_terminal=True)
+
+    _restart, feedback = await repl._handle_mid_pipeline_message(_image_prompt(), suppress_render=True)
+
+    forwarded = repl._pipeline.handle_user_interrupt.await_args.args[0]
+    assert isinstance(forwarded, PipelineUserInput)
+    assert isinstance(forwarded.content, list)
+    assert any(isinstance(block, ImageBlock) for block in forwarded.content)
+    assert forwarded.has_images is True
+    assert forwarded.display_text == "describe [Image #1]"
+    # Feedback shows the placeholder text, not the pasted image content.
+    assert "describe [Image #1]" in feedback and "iVBORw0KGgo=" not in feedback
+
+
+@pytest.mark.asyncio
+async def test_pipeline_interrupt_reader_preserves_pasted_images() -> None:
+    """The interrupt reader returns input that still carries the pasted image as a content block."""
+    from iac_code.ui.repl import InlineREPL
+
+    class StubPrompt:  # get_input yields placeholder text; make_result yields the image prompt
+        def make_result(self):
+            return _image_prompt()
+
+        async def get_input(self, *, prompt: str, transient: bool):
+            return "describe [Image #1]"
+
+    repl = InlineREPL.__new__(InlineREPL)
+    repl._prompt_input = StubPrompt()
+
+    interrupt_input = await repl._read_pipeline_interrupt_input()
+    assert interrupt_input.has_images is True
+    assert interrupt_input.display_text == "describe [Image #1]"
+    assert isinstance(interrupt_input.content, list)
+    assert any(isinstance(block, ImageBlock) for block in interrupt_input.content)
diff --git a/tests/ui/test_repl_pipeline_memory.py b/tests/ui/test_repl_pipeline_memory.py
new file mode 100644
index 00000000..8f6d12a7
--- /dev/null
+++ b/tests/ui/test_repl_pipeline_memory.py
@@ -0,0 +1,20 @@
+from __future__ import annotations
+
+from pathlib import Path
+
+REPL_SOURCE = Path(__file__).resolve().parents[2] / "src" / "iac_code" / "ui" / "repl.py"  # repo root, not cwd
+
+
+def test_repl_pipeline_creation_does_not_pass_full_memory_prompt_content() -> None:
+    """The REPL source must not reference ``get_prompt_content()`` in any of the listed forms."""
+    repl_text = REPL_SOURCE.read_text(encoding="utf-8")
+    assert "get_prompt_content()" not in repl_text
+    assert "memory_content_getter=(lambda: self._memory_manager.get_prompt_content()" not in repl_text
+    assert 'lambda: self._memory_manager.get_prompt_content() if self._memory_manager else ""' not in repl_text
+
+
+def test_repl_pipeline_creation_uses_explicit_pipeline_memory_policy_helper() -> None:
+    """The REPL source defines the helper and passes it as ``memory_content_getter`` exactly three times."""
+    repl_text = REPL_SOURCE.read_text(encoding="utf-8")
+    assert "def _pipeline_memory_content_getter(" in repl_text
+    assert repl_text.count("memory_content_getter=self._pipeline_memory_content_getter(),") == 3
diff --git a/tests/ui/test_repl_pipeline_sidecar_restore.py b/tests/ui/test_repl_pipeline_sidecar_restore.py
index 5756afe7..f37899d8 100644
--- a/tests/ui/test_repl_pipeline_sidecar_restore.py
+++ b/tests/ui/test_repl_pipeline_sidecar_restore.py
@@ -1,8 +1,11 @@
-from unittest.mock import AsyncMock, MagicMock, patch
+from unittest.mock import AsyncMock, MagicMock, call, patch
 
 import pytest
 
 from iac_code.agent.message import Message
+from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+from iac_code.pipeline.engine.pipeline_runner import PipelineStatePersistenceError
+from iac_code.pipeline.engine.user_input import PipelineUserInput
 
 
 @pytest.fixture
@@ -12,6 +15,8 @@ def repl_for_sidecar_restore(tmp_path):
     repl = InlineREPL.__new__(InlineREPL)
     repl._pipeline = None
     repl._pipeline_waiting_input = False
+    repl._pipeline_state_persistence_failed = False
+    repl._pipeline_state_persistence_warning_rendered = False
     repl._session_id = "sid"
     repl._original_cwd = str(tmp_path)
     repl._provider_manager = MagicMock()
@@ -24,6 +29,7 @@ def repl_for_sidecar_restore(tmp_path):
     repl.renderer = MagicMock()
     repl.renderer.record_user_turn = MagicMock()
     repl.renderer.print_system_message = MagicMock()
+    repl.console = MagicMock()
     repl.store = MagicMock()
     repl.store.get_state.return_value.permission_context = None
     repl.store.set_state = MagicMock()
@@ -33,6 +39,231 @@ def repl_for_sidecar_restore(tmp_path):
     return repl
 
 
+def test_normal_handoff_save_failure_does_not_switch_or_append(repl_for_sidecar_restore):
+    """If marking the handoff ``pending`` fails to persist, nothing is injected and the mode stays PIPELINE."""
+    from iac_code.pipeline.config import RunMode
+
+    repl = repl_for_sidecar_restore
+    save_error = PipelineStatePersistenceError("pipeline state persistence failed during save_normal_handoff")
+    completed = PipelineEvent(
+        type=PipelineEventType.PIPELINE_COMPLETED,
+        step_id=None,
+        timestamp=1.0,
+        data={"total_steps": 1},
+    )
+    runner = MagicMock()
+    runner.mark_normal_handoff.side_effect = save_error
+    runner.build_normal_handoff_summary.return_value = "handoff summary"
+    runner.should_switch_to_normal.return_value = True
+    repl._pipeline = runner
+    repl._runtime_mode = RunMode.PIPELINE
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.add_raw_message = MagicMock()
+
+    outcome = repl._handoff_pipeline_to_normal(completed)
+    assert outcome == "persistence_failed"
+    assert repl._runtime_mode == RunMode.PIPELINE
+    assert repl._pipeline_state_persistence_failed is True
+    runner.mark_normal_handoff.assert_called_once_with(status="pending", failed_reason=None)
+    runner.build_normal_handoff_summary.assert_not_called()
+    repl._agent_loop.context_manager.add_raw_message.assert_not_called()
+    repl._session_storage.append.assert_not_called()
+    repl.renderer.print_system_message.assert_called_once_with(
+        "Pipeline state persistence failed. Normal chat handoff was not marked durable.",
+        style="yellow",
+    )
+
+
+def test_finalize_handoff_persistence_failure_keeps_pipeline_paused(repl_for_sidecar_restore):
+    """A handoff persistence failure during finalize pauses the agent loops and keeps the pipeline attached."""
+    from iac_code.pipeline.config import RunMode
+
+    repl = repl_for_sidecar_restore
+    save_error = PipelineStatePersistenceError("pipeline state persistence failed during save_normal_handoff")
+    completed = PipelineEvent(
+        type=PipelineEventType.PIPELINE_COMPLETED,
+        step_id=None,
+        timestamp=1.0,
+        data={"total_steps": 1},
+    )
+    runner = MagicMock()
+    runner.pause_agent_loops = MagicMock()
+    runner.mark_user_aborted = MagicMock()
+    runner.mark_normal_handoff.side_effect = save_error
+    runner.should_switch_to_normal.return_value = True
+    repl._pipeline = runner
+    repl._runtime_mode = RunMode.PIPELINE
+
+    repl._finalize_pipeline_after_render(completed)
+    runner.pause_agent_loops.assert_called_once_with()
+    runner.mark_user_aborted.assert_not_called()
+    assert repl._pipeline is runner
+    assert repl._runtime_mode == RunMode.PIPELINE
+    assert repl._pipeline_state_persistence_failed is True
+
+
+def test_handoff_append_failure_and_failed_metadata_failure_does_not_record_success(repl_for_sidecar_restore):
+    """Append failure plus a failing ``failed`` mark yields "persistence_failed" and stays in PIPELINE."""
+    from iac_code.pipeline.config import RunMode
+
+    repl = repl_for_sidecar_restore
+    completed = PipelineEvent(
+        type=PipelineEventType.PIPELINE_COMPLETED,
+        step_id=None,
+        timestamp=1.0,
+        data={"total_steps": 1},
+    )
+    expected_marks = [
+        call(status="pending", failed_reason=None),
+        call(status="failed", failed_reason="disk unavailable"),
+    ]
+    runner = MagicMock()
+    runner.should_switch_to_normal.return_value = True
+    runner.build_normal_handoff_summary.return_value = "handoff summary"
+    # The first mark succeeds; the second one raises the persistence error.
+    runner.mark_normal_handoff.side_effect = [
+        None,
+        PipelineStatePersistenceError("pipeline state persistence failed during save_normal_handoff"),
+    ]
+    repl._pipeline = runner
+    repl._runtime_mode = RunMode.PIPELINE
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._session_storage.append.side_effect = RuntimeError("disk unavailable")
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.add_raw_message.return_value = Message(role="user", content="handoff summary")
+
+    outcome = repl._handoff_pipeline_to_normal(completed)
+
+    assert outcome == "persistence_failed"
+    assert repl._runtime_mode == RunMode.PIPELINE
+    assert repl._pipeline_state_persistence_failed is True
+    # Exactly two marks were attempted: "pending", then "failed" with the append error text.
+    runner.mark_normal_handoff.assert_has_calls(expected_marks)
+    assert runner.mark_normal_handoff.call_count == 2
+
+
+def test_finalize_persistence_failure_event_does_not_mark_user_aborted(repl_for_sidecar_restore):
+    """After a persistence-failure event is recorded, finalize pauses the pipeline instead of aborting it."""
+    repl = repl_for_sidecar_restore
+    failure = PipelineEvent(
+        type=PipelineEventType.STEP_FAILED,
+        step_id="collect",
+        timestamp=1.0,
+        data={
+            "error": "Pipeline state persistence failed.",
+            "error_details": {"type": "PipelineStatePersistenceError"},
+        },
+    )
+    runner = MagicMock(sidecar_status=None)
+    runner.state_machine.is_complete = False
+    runner.pause_agent_loops = MagicMock()
+    runner.mark_user_aborted = MagicMock()
+    repl._pipeline_waiting_input = False
+    repl._pipeline = runner
+
+    repl._record_pipeline_display_event(failure)
+    repl._finalize_pipeline_after_render(None)
+    runner.pause_agent_loops.assert_called_once_with()
+    runner.mark_user_aborted.assert_not_called()
+    assert repl._pipeline is runner
+    assert repl._pipeline_state_persistence_failed is True
+    repl.renderer.print_system_message.assert_called_once_with(
+        "Pipeline state persistence failed. The pipeline is paused; do not continue until state is durable.",
+        style="yellow",
+    )
+
+
+def test_finalize_user_abort_persistence_failure_keeps_pipeline_paused(repl_for_sidecar_restore):
+    """If saving the user-abort mark fails, finalize warns, pauses the agent loops and keeps the pipeline."""
+    repl = repl_for_sidecar_restore
+    save_error = PipelineStatePersistenceError("pipeline state persistence failed during save_user_aborted_sync")
+    runner = MagicMock(sidecar_status=None)
+    runner.state_machine.is_complete = False
+    runner.pause_agent_loops = MagicMock()
+    runner.mark_user_aborted.side_effect = save_error
+    repl._last_interrupt_paused = False
+    repl._pipeline_waiting_input = False
+    repl._pipeline = runner
+
+    repl._finalize_pipeline_after_render(None)
+
+    runner.mark_user_aborted.assert_called_once_with("pipeline interrupted by user or renderer cancellation")
+    runner.pause_agent_loops.assert_called_once_with()
+    assert repl._pipeline is runner
+    assert repl._pipeline_state_persistence_failed is True
+    repl.renderer.print_system_message.assert_called_once_with(
+        "Pipeline state persistence failed. The pipeline is paused; do not continue until state is durable.",
+        style="yellow",
+    )
+
+
+@pytest.mark.asyncio
+async def test_mid_pipeline_pause_save_failure_warns_and_stays_paused(repl_for_sidecar_restore):
+    """If persisting a paused verdict fails, the REPL warns and does not resume the agent loops."""
+    from iac_code.pipeline.engine.interrupt import InterruptVerdict
+
+    repl = repl_for_sidecar_restore
+    paused_verdict = InterruptVerdict(action="continue", reason="judge failed", paused=True)
+    runner = MagicMock()
+    runner.pause_agent_loops = MagicMock()
+    runner.resume_agent_loops = MagicMock()
+    runner.handle_user_interrupt = AsyncMock(return_value=paused_verdict)
+    # Saving the pause is the step that fails.
+    runner.save_interrupt_pause = AsyncMock(
+        side_effect=PipelineStatePersistenceError("pipeline state persistence failed during save_waiting_input")
+    )
+    repl._pipeline_waiting_input = False
+    repl._last_interrupt_paused = False
+    repl._pipeline = runner
+
+    needs_restart, feedback = await repl._handle_mid_pipeline_message("等等", suppress_render=True)
+
+    assert needs_restart is False
+    assert feedback == ""
+    assert repl._last_interrupt_paused is True
+    assert repl._pipeline_waiting_input is False
+    runner.save_interrupt_pause.assert_awaited_once_with(paused_verdict)
+    runner.resume_agent_loops.assert_not_called()
+    repl.renderer.print_system_message.assert_called_once_with(
+        "Pipeline state persistence failed. The pipeline is paused; do not continue until state is durable.",
+        style="yellow",
+    )
+
+
+@pytest.mark.asyncio
+async def test_mid_pipeline_hard_interrupt_save_failure_warns_and_stays_paused(repl_for_sidecar_restore):
+    """If applying a hard interrupt fails to persist, the REPL warns and does not resume the agent loops."""
+    from iac_code.pipeline.engine.interrupt import InterruptVerdict
+
+    repl = repl_for_sidecar_restore
+    hard_verdict = InterruptVerdict(action="hard_interrupt", reason="changed mind", rollback_target="intent")
+    runner = MagicMock()
+    runner.pause_agent_loops = MagicMock()
+    runner.resume_agent_loops = MagicMock()
+    runner.handle_user_interrupt = AsyncMock(return_value=hard_verdict)
+    # Applying the hard interrupt is the step that fails.
+    runner.apply_hard_interrupt = MagicMock(
+        side_effect=PipelineStatePersistenceError("pipeline state persistence failed during save_rollback_sync")
+    )
+    repl._last_interrupt_paused = False
+    repl._pipeline = runner
+
+    needs_restart, feedback = await repl._handle_mid_pipeline_message("换方案", suppress_render=True)
+
+    assert needs_restart is False
+    assert feedback == ""
+    assert repl._last_interrupt_paused is True
+    runner.apply_hard_interrupt.assert_called_once_with(hard_verdict)
+    runner.resume_agent_loops.assert_not_called()
+    repl.renderer.print_system_message.assert_called_once_with(
+        "Pipeline state persistence failed. The pipeline is paused; do not continue until state is durable.",
+        style="yellow",
+    )
+
+
 @pytest.mark.asyncio
 async def test_fresh_pipeline_persists_visible_user_turn_to_root_session(monkeypatch, repl_for_sidecar_restore):
     monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
@@ -141,7 +372,9 @@ async def test_restored_waiting_input_routes_current_message_to_resume(monkeypat
     with patch("iac_code.pipeline.create_pipeline", return_value=pipeline):
         await repl_for_sidecar_restore._handle_pipeline_chat("方案一")
 
-    pipeline.resume.assert_called_once_with("方案一")
+    pipeline.resume.assert_called_once_with(
+        PipelineUserInput(content="方案一", display_text="方案一", has_images=False)
+    )
     pipeline.run.assert_not_called()
     pipeline.continue_from_sidecar.assert_not_called()
 
@@ -244,6 +477,56 @@ async def fake_resume_selection():
     assert repl_for_sidecar_restore._pipeline_waiting_input is True
 
 
+@pytest.mark.asyncio
+async def test_startup_waiting_candidate_selection_starts_cleanup_after_terminal_handoff(
+    monkeypatch,
+    repl_for_sidecar_restore,
+):
+    """Startup resume that ends in a terminal event must trigger pipeline cleanup for that pipeline."""
+    monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
+    from iac_code.pipeline.config import RunMode
+    from iac_code.pipeline.engine.events import PipelineEvent, PipelineEventType
+    from iac_code.ui.repl import InlineREPL
+
+    repl = repl_for_sidecar_restore
+    completed = PipelineEvent(
+        type=PipelineEventType.PIPELINE_COMPLETED,
+        step_id=None,
+        timestamp=1.0,
+        data={"total_steps": 1},
+    )
+    handoff_message = Message(role="user", content="handoff summary")
+    runner = MagicMock(sidecar_status="completed", display_transcript_path=None)
+    runner.sidecar_restore_result = MagicMock(ok=True, status="waiting_input", reason=None)
+    runner.restore_from_sidecar = AsyncMock()
+    runner.continue_from_sidecar = MagicMock(return_value=_empty_stream())
+    runner.resume = MagicMock(return_value=_empty_stream())
+    runner.run = MagicMock(return_value=_empty_stream())
+    runner.state_machine.is_complete = True
+    runner.state_machine.current_step.ui_mode = "candidate_selection"
+    runner.state_machine.current_step.step_id = "confirm_and_select"
+    runner.should_switch_to_normal = MagicMock(return_value=True)
+    runner.build_normal_handoff_summary = MagicMock(return_value="handoff summary")
+    runner.mark_normal_handoff = MagicMock()
+    runner.mark_user_aborted = MagicMock()
+    repl._runtime_mode = RunMode.PIPELINE
+    repl.current_git_branch = MagicMock(return_value="main")
+    repl._agent_loop = MagicMock()
+    repl._agent_loop.context_manager = MagicMock()
+    repl._agent_loop.context_manager.add_raw_message = MagicMock(return_value=handoff_message)
+    repl._render_pipeline_display_replay_on_startup = MagicMock()
+    # The mocked candidate-selection resume returns the PIPELINE_COMPLETED event.
+    repl._resume_waiting_candidate_selection_from_sidecar = AsyncMock(return_value=completed)
+    repl._maybe_start_pipeline_cleanup = AsyncMock(return_value=True)
+    _seed_sidecar(repl, "waiting_input")
+
+    with patch("iac_code.pipeline.create_pipeline", return_value=runner):
+        handled = await InlineREPL._resume_pipeline_sidecar_on_startup(repl)
+
+    assert handled is True
+    repl._maybe_start_pipeline_cleanup.assert_awaited_once_with(runner)
+
+
 @pytest.mark.asyncio
 async def test_startup_running_pipeline_replays_history_without_continuing(monkeypatch, repl_for_sidecar_restore):
     monkeypatch.setenv("IAC_CODE_MODE", "pipeline")
@@ -296,7 +579,9 @@ async def test_restored_running_routes_to_continue_without_user_prompt(monkeypat
     with patch("iac_code.pipeline.create_pipeline", return_value=pipeline):
         await repl_for_sidecar_restore._handle_pipeline_chat("hello after crash")
 
-    pipeline.continue_from_sidecar.assert_called_once_with(user_input="hello after crash")
+    pipeline.continue_from_sidecar.assert_called_once_with(
+        user_input=PipelineUserInput(content="hello after crash", display_text="hello after crash", has_images=False)
+    )
     pipeline.run.assert_not_called()
     pipeline.resume.assert_not_called()
 
@@ -325,7 +610,9 @@ async def test_restored_running_uses_pipeline_working_directory(monkeypatch, tmp
         await repl_for_sidecar_restore._handle_pipeline_chat("hello after crash")
 
     pipeline.restore_from_sidecar.assert_awaited_once()
-    pipeline.continue_from_sidecar.assert_called_once_with(user_input="hello after crash")
+    pipeline.continue_from_sidecar.assert_called_once_with(
+        user_input=PipelineUserInput(content="hello after crash", display_text="hello after crash", has_images=False)
+    )
     pipeline.run.assert_not_called()
     pipeline.resume.assert_not_called()
 
@@ -344,7 +631,29 @@ async def test_corrupt_sidecar_starts_fresh(monkeypatch, repl_for_sidecar_restor
     with patch("iac_code.pipeline.create_pipeline", return_value=pipeline):
         await repl_for_sidecar_restore._handle_pipeline_chat("fresh")
 
-    pipeline.run.assert_called_once_with("fresh")
+    pipeline.run.assert_called_once_with(PipelineUserInput(content="fresh", display_text="fresh", has_images=False))
+    repl_for_sidecar_restore.renderer.print_system_message.assert_called()
+
+
+@pytest.mark.asyncio
+async def test_confirm_pipeline_resume_handles_corrupt_meta(tmp_path, repl_for_sidecar_restore):
+    """A meta file containing "[broken" yields "discard" and a printed system message."""
+    broken_meta = tmp_path / "meta.yaml"
+    broken_meta.write_text("[broken", encoding="utf-8")
+    repl = repl_for_sidecar_restore
+
+    assert await repl._confirm_pipeline_resume(broken_meta) == "discard"
+    repl.renderer.print_system_message.assert_called()
+
+
+@pytest.mark.asyncio
+async def test_confirm_pipeline_resume_discards_non_mapping_meta(tmp_path, repl_for_sidecar_restore):
+    """Meta content that is a top-level list ("- not", "- metadata") yields "discard"."""
+    meta_path = tmp_path / "meta.yaml"
+    meta_path.write_text("- not\n- metadata\n", encoding="utf-8")
+    choice = await repl_for_sidecar_restore._confirm_pipeline_resume(meta_path)
+
+    assert choice == "discard"
     repl_for_sidecar_restore.renderer.print_system_message.assert_called()
 
 
@@ -363,7 +672,7 @@ async def test_discarded_sidecar_starts_fresh_without_restore(monkeypatch, repl_
         await repl_for_sidecar_restore._handle_pipeline_chat("fresh")
 
     pipeline.restore_from_sidecar.assert_not_called()
-    pipeline.run.assert_called_once_with("fresh")
+    pipeline.run.assert_called_once_with(PipelineUserInput(content="fresh", display_text="fresh", has_images=False))
 
 
 def _seed_sidecar(repl, status: str) -> None:
diff --git a/tests/ui/test_repl_runtime_mode.py b/tests/ui/test_repl_runtime_mode.py
index f428476a..cbaab96e 100644
--- a/tests/ui/test_repl_runtime_mode.py
+++ b/tests/ui/test_repl_runtime_mode.py
@@ -7,6 +7,7 @@
 import pytest
 
 from iac_code.pipeline.config import RunMode
+from iac_code.pipeline.engine.user_input import PipelineUserInput
 
 
 def _make_repl_for_normal_chat():
@@ -35,7 +36,9 @@ async def test_handle_chat_uses_instance_runtime_mode_when_environment_is_normal
 
     await repl._handle_chat("hello")
 
-    repl._handle_pipeline_chat.assert_awaited_once_with("hello")
+    repl._handle_pipeline_chat.assert_awaited_once_with(
+        PipelineUserInput(content="hello", display_text="hello", has_images=False)
+    )
     repl._agent_loop.run_streaming.assert_not_called()
 
 
diff --git a/tests/ui/test_repl_status.py b/tests/ui/test_repl_status.py
index 9240c2fc..7c9df131 100644
--- a/tests/ui/test_repl_status.py
+++ b/tests/ui/test_repl_status.py
@@ -2,6 +2,7 @@
 from unittest.mock import MagicMock
 
 from iac_code.agent.message import Message, ToolResultBlock, create_recalled_memory_message
+from iac_code.pipeline.engine.cleanup import create_cleanup_prompt_message
 from iac_code.state.app_state import AppState, AppStateStore
 from iac_code.ui.repl import InlineREPL
 
@@ -25,6 +26,7 @@ def test_count_user_turns_ignores_recalled_memory_messages() -> None:
     messages = [
         Message(role="user", content="first"),
         create_recalled_memory_message("# Recalled Memory\nPrefer ROS YAML.", ["ros-yaml.md"]),
+        create_cleanup_prompt_message("cleanup hidden prompt"),
         Message(role="assistant", content="answer"),
         Message(role="user", content="second"),
     ]
@@ -68,6 +70,7 @@ def test_status_snapshot_uses_agent_loop_and_original_cwd(monkeypatch) -> None:
     }
     repl._agent_loop.context_manager.get_messages.return_value = [
         Message(role="user", content="first"),
+        create_cleanup_prompt_message("cleanup hidden prompt"),
         Message(role="assistant", content="answer"),
     ]
 
diff --git a/tests/ui/test_repl_swap_session_pipeline.py b/tests/ui/test_repl_swap_session_pipeline.py
index 3db133d4..e731328b 100644
--- a/tests/ui/test_repl_swap_session_pipeline.py
+++ b/tests/ui/test_repl_swap_session_pipeline.py
@@ -6,6 +6,7 @@
 import pytest
 
 from iac_code.pipeline.config import RunMode
+from iac_code.pipeline.engine.user_input import PipelineUserInput
 
 
 def _make_repl_with_pipeline(tmp_path: Path, session_id_old: str, session_id_new: str):
@@ -297,7 +298,9 @@ async def test_swap_session_running_resume_routes_next_message_to_interrupt_judg
 
     await repl._handle_pipeline_chat("change the plan")
 
-    fake_pipeline.continue_from_sidecar.assert_called_once_with(user_input="change the plan")
+    fake_pipeline.continue_from_sidecar.assert_called_once_with(
+        user_input=PipelineUserInput(content="change the plan", display_text="change the plan", has_images=False)
+    )
     fake_pipeline.resume.assert_not_called()
 
 
@@ -337,7 +340,9 @@ async def test_swap_session_waiting_input_resume_routes_next_message_to_resume(t
 
     await repl._handle_pipeline_chat("option A")
 
-    fake_pipeline.resume.assert_called_once_with("option A")
+    fake_pipeline.resume.assert_called_once_with(
+        PipelineUserInput(content="option A", display_text="option A", has_images=False)
+    )
     fake_pipeline.continue_from_sidecar.assert_not_called()
 
 
diff --git a/tests/utils/image/test_processor.py b/tests/utils/image/test_processor.py
index d247696e..9adc5dca 100644
--- a/tests/utils/image/test_processor.py
+++ b/tests/utils/image/test_processor.py
@@ -26,6 +26,7 @@ def test_image_at_arbitrary_position_produces_interleaved_blocks():
     assert len(blocks) == 3
     assert isinstance(blocks[0], TextBlock) and blocks[0].text == "look at "
     assert isinstance(blocks[1], ImageBlock)
+    assert blocks[1].ref_id == 1
     assert isinstance(blocks[2], TextBlock) and blocks[2].text == " please"
 
 
diff --git a/tests/utils/image/test_store.py b/tests/utils/image/test_store.py
index 277989e2..9de65473 100644
--- a/tests/utils/image/test_store.py
+++ b/tests/utils/image/test_store.py
@@ -24,6 +24,28 @@ def test_store_writes_per_session_file_with_0o600(tmp_path, monkeypatch):
         assert stat.S_IMODE(p.stat().st_mode) == 0o600
 
 
+def test_get_path_discovers_cached_file_after_store_recreated(tmp_path, monkeypatch):
+    """A fresh ImageStore for the same session id finds the image an earlier instance stored."""
+    monkeypatch.setattr("iac_code.utils.image.store._get_base_dir", lambda: tmp_path / "image-cache")
+    original_store = ImageStore(session_id="sess-a")
+    pasted = PastedContent(id=7, type="image", content="aGVsbG8=", media_type="image/png")
+    stored_path = original_store.store(pasted)
+    assert stored_path is not None
+
+    reopened_store = ImageStore(session_id="sess-a")
+    assert reopened_store.get_path(7) == stored_path
+
+
+def test_next_image_id_skips_existing_cached_files_after_store_recreated(tmp_path, monkeypatch):
+    """After image id 1 is stored, a fresh store for the same session hands out id 2."""
+    monkeypatch.setattr("iac_code.utils.image.store._get_base_dir", lambda: tmp_path / "image-cache")
+    original_store = ImageStore(session_id="sess-a")
+    pasted = PastedContent(id=1, type="image", content="MQ==", media_type="image/png")
+    assert original_store.store(pasted) is not None
+
+    assert ImageStore(session_id="sess-a").next_image_id() == 2
+
+
 @pytest.mark.skipif(sys.platform == "win32", reason="POSIX modes are not meaningful on Windows")
 def test_store_directories_are_owner_only(tmp_path, monkeypatch):
     monkeypatch.setattr("iac_code.utils.image.store._get_base_dir", lambda: tmp_path / "image-cache")
diff --git a/tests/utils/test_state_io.py b/tests/utils/test_state_io.py
new file mode 100644
index 00000000..af5511bf
--- /dev/null
+++ b/tests/utils/test_state_io.py
@@ -0,0 +1,238 @@
+from __future__ import annotations
+
+import errno
+import gc
+import json
+import os
+import sys
+import types
+import weakref
+from pathlib import Path
+
+import pytest
+
+from iac_code.utils.state_io import append_jsonl_locked, atomic_write_json, atomic_write_text, safe_replace
+
+
+def test_atomic_write_text_replaces_file_and_removes_temp(tmp_path: Path) -> None:
+    """A durable atomic write swaps in the new text and leaves no matching temp file."""
+    target = tmp_path / "state.txt"
+    target.write_text("old", encoding="utf-8")
+    atomic_write_text(target, "new", durable=True)
+
+    assert target.read_text(encoding="utf-8") == "new"
+    assert next(tmp_path.glob(".state.txt.*.tmp"), None) is None
+
+
+def test_atomic_write_json_fails_without_overwriting_target(tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+    """When os.replace raises PermissionError, the error propagates and the old JSON survives."""
+    original_text = '{"ok": true}\n'
+    target = tmp_path / "state.json"
+    target.write_text(original_text, encoding="utf-8")
+
+    def always_locked(src: str, dst: str) -> None:
+        raise PermissionError("locked")
+
+    monkeypatch.setattr("iac_code.utils.state_io.os.replace", always_locked)
+    with pytest.raises(PermissionError, match="locked"):
+        atomic_write_json(target, {"ok": False}, durable=True, replace_attempts=1)
+    assert target.read_text(encoding="utf-8") == original_text
+    assert next(tmp_path.glob(".state.json.*.tmp"), None) is None
+
+
+def test_atomic_write_json_rejects_invalid_replace_attempts_without_overwriting_target(tmp_path: Path) -> None:
+    """replace_attempts=0 raises ValueError; the existing JSON is kept and no temp file is left."""
+    target = tmp_path / "state.json"
+    target.write_text('{"ok": true}\n', encoding="utf-8")
+    with pytest.raises(ValueError, match="attempts must be >= 1"):
+        atomic_write_json(target, {"ok": False}, durable=True, replace_attempts=0)
+
+    assert target.read_text(encoding="utf-8") == '{"ok": true}\n'
+    assert next(tmp_path.glob(".state.json.*.tmp"), None) is None
+
+
+def test_append_jsonl_locked_writes_one_complete_line_per_record(tmp_path: Path) -> None:
+    """Two appended records come back as exactly two parseable JSON lines, in order."""
+    target = tmp_path / "session.jsonl"
+    append_jsonl_locked(target, [{"a": 1}, {"b": 2}], durable=False)
+
+    parsed = list(map(json.loads, target.read_text(encoding="utf-8").splitlines()))
+    assert parsed == [{"a": 1}, {"b": 2}]
+
+
+def test_path_lock_registry_reuses_held_lock_for_same_path(tmp_path: Path) -> None:
+    """Nested lock_for() calls on one path yield the very same lock object."""
+    from iac_code.utils.path_locks import PathLockRegistry
+
+    lock_registry = PathLockRegistry()
+    target = tmp_path / "state.jsonl"
+
+    with lock_registry.lock_for(target) as outer, lock_registry.lock_for(target) as inner:
+        assert inner is outer
+
+
+def test_path_lock_registry_releases_stale_locks_after_callers_drop_references(tmp_path: Path) -> None:
+    """Once the caller drops its reference, the registry must not keep the lock object alive."""
+    from iac_code.utils.path_locks import PathLockRegistry
+
+    registry = PathLockRegistry()
+    path = tmp_path / "state.jsonl"
+    with registry.lock_for(path) as first:
+        ref = weakref.ref(first)
+
+    # Drop this test's only strong reference, then collect and prune before checking.
+    del first
+    gc.collect()
+    registry.prune()
+    assert ref() is None
+
+
+def test_safe_replace_cross_device_fallback_copies_then_unlinks_source(
+    tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+) -> None:
+    """An EXDEV failure on replacing from src still ends with dst written and src removed."""
+    from iac_code.utils import state_io
+
+    legacy = tmp_path / "legacy.jsonl"
+    target = tmp_path / "session" / "session.jsonl"
+    target.parent.mkdir()
+    legacy.write_text("legacy", encoding="utf-8")
+    genuine_replace = os.replace  # captured before the patch below swaps it out
+
+    def exdev_when_moving_legacy(_src: str | Path, _dst: str | Path) -> None:
+        if Path(_src) != legacy:
+            genuine_replace(_src, _dst)
+            return
+        raise OSError(errno.EXDEV, "Invalid cross-device link")
+
+    monkeypatch.setattr(state_io.os, "replace", exdev_when_moving_legacy)
+    safe_replace(legacy, target)
+
+    assert target.read_text(encoding="utf-8") == "legacy"
+    assert not legacy.exists()
+
+
+def test_safe_replace_cross_device_fallback_retries_transient_final_replace_lock(
+    tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+) -> None:
+    """With attempts=2, a PermissionError on the first counted replace is retried and the move completes."""
+    from iac_code.utils import state_io
+
+    src = tmp_path / "legacy.jsonl"
+    dst = tmp_path / "session" / "session.jsonl"
+    dst.parent.mkdir()
+    src.write_text("legacy", encoding="utf-8")
+    real_replace = os.replace
+    final_replace_attempts = 0
+
+    def fail_exdev_then_transient_final_lock(_src: str | Path, _dst: str | Path) -> None:
+        nonlocal final_replace_attempts
+        src_path = Path(_src)
+        if src_path == src:
+            raise OSError(errno.EXDEV, "Invalid cross-device link")
+        # Sources named ".<dst.name>.*" beside dst are counted; presumably safe_replace's staged copy.
+        if src_path.parent == dst.parent and src_path.name.startswith(f".{dst.name}."):
+            final_replace_attempts += 1
+            if final_replace_attempts == 1:
+                raise PermissionError("target locked")
+        real_replace(_src, _dst)
+
+    monkeypatch.setattr(state_io.os, "replace", fail_exdev_then_transient_final_lock)
+    safe_replace(src, dst, attempts=2, delay=0)
+    assert final_replace_attempts == 2
+    assert dst.read_text(encoding="utf-8") == "legacy"
+    assert not src.exists()
+
+
+def test_durable_append_jsonl_fsyncs_parent_directory_for_new_file(
+    tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+) -> None:
+    """A durable append that creates the file calls fsync_parent_dir once, with that path."""
+    target = tmp_path / "session.jsonl"
+    fsynced: list[Path] = []
+    # list.append stands in for fsync_parent_dir and records each argument it receives.
+    monkeypatch.setattr("iac_code.utils.state_io.fsync_parent_dir", fsynced.append)
+
+    append_jsonl_locked(target, [{"created": True}], durable=True)
+    assert fsynced == [target]
+
+
+def test_append_jsonl_locked_fails_loudly_when_posix_lock_acquisition_fails(
+    tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+) -> None:
+    """A failing exclusive flock surfaces as RuntimeError and no JSONL file is left behind."""
+    if sys.platform == "win32":
+        pytest.skip("POSIX fcntl lock path is not available on Windows")
+
+    import fcntl  # deferred until after the skip; fcntl is POSIX-only
+
+    target = tmp_path / "session.jsonl"
+
+    def refuse_exclusive_lock(fd: int, operation: int) -> None:
+        if operation != fcntl.LOCK_EX:
+            return
+        raise OSError("lock unavailable")
+
+    monkeypatch.setattr(fcntl, "flock", refuse_exclusive_lock)
+    with pytest.raises(RuntimeError, match="could not acquire append lock"):
+        append_jsonl_locked(target, [{"a": 1}])
+    assert not target.exists()
+
+
+def test_windows_append_lock_seeks_before_lock_and_unlock(tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+    """On a simulated win32 platform the lock helper seeks to 0 before locking and before unlocking one byte."""
+    from iac_code.utils import state_io
+
+    events: list[tuple[str, int] | tuple[str, int, int]] = []
+    # Minimal file stand-in: a context manager with a fixed fileno that records seek() calls.
+    class FakeLockFile:
+        def __enter__(self) -> FakeLockFile:
+            return self
+
+        def __exit__(self, exc_type: object, exc: object, traceback: object) -> None:
+            return None
+
+        def fileno(self) -> int:
+            return 42
+
+        def seek(self, offset: int) -> None:
+            events.append(("seek", offset))
+
+    def fake_open(self: Path, mode: str = "r", *args: object, **kwargs: object) -> FakeLockFile:
+        return FakeLockFile()
+
+    def fake_locking(fd: int, mode: int, nbytes: int) -> None:
+        events.append(("locking", mode, nbytes))
+
+    fake_msvcrt = types.SimpleNamespace(LK_LOCK=1, LK_UNLCK=2, locking=fake_locking)
+    monkeypatch.setattr("iac_code.utils.state_io.sys.platform", "win32")
+    monkeypatch.setitem(sys.modules, "msvcrt", fake_msvcrt)
+    monkeypatch.setattr(Path, "open", fake_open)
+    with state_io._cross_process_append_lock(tmp_path / "session.jsonl"):
+        events.append(("yield", 0))
+
+    assert events == [
+        ("seek", 0),
+        ("locking", 1, 1),  # mode 1 is the fake LK_LOCK
+        ("yield", 0),
+        ("seek", 0),
+        ("locking", 2, 1),  # mode 2 is the fake LK_UNLCK
+    ]
+
+
+def test_parent_directory_fsync_is_best_effort(tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+    """atomic_write_text still succeeds when every fsync call after the first raises OSError."""
+    target = tmp_path / "state.txt"
+    seen_fds: list[int] = []
+    genuine_fsync = os.fsync
+
+    def fsync_first_call_only(fd: int) -> None:
+        seen_fds.append(fd)
+        if len(seen_fds) == 1:
+            genuine_fsync(fd)
+            return
+        raise OSError("directory fsync unsupported")
+
+    monkeypatch.setattr("iac_code.utils.state_io.os.fsync", fsync_first_call_only)
+    atomic_write_text(target, "ok", durable=True)
+    assert target.read_text(encoding="utf-8") == "ok"
diff --git a/uv.lock b/uv.lock
index 9ab6d240..155cbd66 100644
--- a/uv.lock
+++ b/uv.lock
@@ -1310,6 +1310,7 @@ http = [
 [package.dev-dependencies]
 dev = [
     { name = "babel" },
+    { name = "pexpect" },
     { name = "pre-commit" },
     { name = "pytest" },
     { name = "pytest-asyncio" },
@@ -1364,6 +1365,7 @@ provides-extras = ["http", "a2a", "a2a-signing", "a2a-grpc", "a2a-redis", "diagr
 [package.metadata.requires-dev]
 dev = [
     { name = "babel", specifier = ">=2.14.0" },
+    { name = "pexpect", specifier = ">=4.9.0" },
     { name = "pre-commit", specifier = ">=4.0" },
     { name = "pytest", specifier = ">=8.0" },
     { name = "pytest-asyncio", specifier = ">=0.23.0" },
@@ -1978,6 +1980,18 @@ wheels = [
     { url = "https://mirrors.aliyun.com/pypi/packages/7a/c2/920ef838e2f0028c8262f16101ec09ebd5969864e5a64c4c05fad0617c56/packaging-26.1-py3-none-any.whl", hash = "sha256:5d9c0669c6285e491e0ced2eee587eaf67b670d94a19e94e3984a481aba6802f" },
 ]
 
+[[package]]
+name = "pexpect"
+version = "4.9.0"
+source = { registry = "https://mirrors.aliyun.com/pypi/simple/" }
+dependencies = [
+    { name = "ptyprocess" },
+]
+sdist = { url = "https://mirrors.aliyun.com/pypi/packages/42/92/cc564bf6381ff43ce1f4d06852fc19a2f11d180f23dc32d9588bee2f149d/pexpect-4.9.0.tar.gz", hash = "sha256:ee7d41123f3c9911050ea2c2dac107568dc43b2d3b0c7557a33212c398ead30f" }
+wheels = [
+    { url = "https://mirrors.aliyun.com/pypi/packages/9e/c3/059298687310d527a58bb01f3b1965787ee3b40dce76752eda8b44e9a2c5/pexpect-4.9.0-py2.py3-none-any.whl", hash = "sha256:7236d1e080e4936be2dc3e326cec0af72acf9212a7e1d060210e70a47e253523" },
+]
+
 [[package]]
 name = "pillow"
 version = "12.2.0"
@@ -2251,6 +2265,15 @@ wheels = [
     { url = "https://mirrors.aliyun.com/pypi/packages/c4/72/02445137af02769918a93807b2b7890047c32bfb9f90371cbc12688819eb/protobuf-6.33.6-py3-none-any.whl", hash = "sha256:77179e006c476e69bf8e8ce866640091ec42e1beb80b213c3900006ecfba6901" },
 ]
 
+[[package]]
+name = "ptyprocess"
+version = "0.7.0"
+source = { registry = "https://mirrors.aliyun.com/pypi/simple/" }
+sdist = { url = "https://mirrors.aliyun.com/pypi/packages/20/e5/16ff212c1e452235a90aeb09066144d0c5a6a8c0834397e03f5224495c4e/ptyprocess-0.7.0.tar.gz", hash = "sha256:5c5d0a3b48ceee0b48485e0c26037c0acd7d29765ca3fbb5cb3831d347423220" }
+wheels = [
+    { url = "https://mirrors.aliyun.com/pypi/packages/22/a6/858897256d0deac81a172289110f31629fc4cee19b6f01283303e18c8db3/ptyprocess-0.7.0-py2.py3-none-any.whl", hash = "sha256:4b41f3967fce3af57cc7e94b888626c18bf37a083e3651ca8feeb66d492fef35" },
+]
+
 [[package]]
 name = "pyasn1"
 version = "0.6.3"
diff --git a/website/docusaurus.config.ts b/website/docusaurus.config.ts
index 37f298b4..7e90b0d1 100644
--- a/website/docusaurus.config.ts
+++ b/website/docusaurus.config.ts
@@ -110,6 +110,11 @@ const config: Config = {
           label: 'CLI',
           position: 'left',
         },
+        {
+          to: '/docs/automation/pipeline-mode',
+          label: 'Pipeline',
+          position: 'left',
+        },
         {
           href: 'https://github.com/aliyun/iac-code',
           label: 'GitHub',
@@ -135,6 +140,10 @@ const config: Config = {
               label: 'CLI Overview',
               to: '/docs/cli/usage',
             },
+            {
+              label: 'Pipeline Mode',
+              to: '/docs/automation/pipeline-mode',
+            },
             {
               label: 'Slash Commands',
               to: '/docs/cli/commands',
diff --git a/website/i18n/de/docusaurus-theme-classic/footer.json b/website/i18n/de/docusaurus-theme-classic/footer.json
index 05a8961b..d3581b02 100644
--- a/website/i18n/de/docusaurus-theme-classic/footer.json
+++ b/website/i18n/de/docusaurus-theme-classic/footer.json
@@ -11,6 +11,10 @@
     "message": "CLI-Uebersicht",
     "description": "The label of footer link with label=CLI Overview linking to /docs/cli/usage"
   },
+  "link.item.label.Pipeline Mode": {
+    "message": "Pipeline-Modus",
+    "description": "The label of footer link with label=Pipeline Mode linking to /docs/automation/pipeline-mode"
+  },
   "link.item.label.Slash Commands": {
     "message": "Slash-Befehle",
     "description": "The label of footer link with label=Slash Commands linking to /docs/cli/commands"
diff --git a/website/i18n/de/docusaurus-theme-classic/navbar.json b/website/i18n/de/docusaurus-theme-classic/navbar.json
index 88d7385e..2616618e 100644
--- a/website/i18n/de/docusaurus-theme-classic/navbar.json
+++ b/website/i18n/de/docusaurus-theme-classic/navbar.json
@@ -15,6 +15,10 @@
     "message": "CLI",
     "description": "Navbar item with label CLI"
   },
+  "item.label.Pipeline": {
+    "message": "Pipeline",
+    "description": "Navbar item with label Pipeline"
+  },
   "item.label.GitHub": {
     "message": "GitHub",
     "description": "Navbar item with label GitHub"
diff --git a/website/i18n/es/docusaurus-theme-classic/footer.json b/website/i18n/es/docusaurus-theme-classic/footer.json
index 8d7e93f5..bf53da1e 100644
--- a/website/i18n/es/docusaurus-theme-classic/footer.json
+++ b/website/i18n/es/docusaurus-theme-classic/footer.json
@@ -11,6 +11,10 @@
     "message": "Vision general del CLI",
     "description": "The label of footer link with label=CLI Overview linking to /docs/cli/usage"
   },
+  "link.item.label.Pipeline Mode": {
+    "message": "Modo Pipeline",
+    "description": "The label of footer link with label=Pipeline Mode linking to /docs/automation/pipeline-mode"
+  },
   "link.item.label.Slash Commands": {
     "message": "Comandos slash",
     "description": "The label of footer link with label=Slash Commands linking to /docs/cli/commands"
diff --git a/website/i18n/es/docusaurus-theme-classic/navbar.json b/website/i18n/es/docusaurus-theme-classic/navbar.json
index b86da3d4..5c9d595b 100644
--- a/website/i18n/es/docusaurus-theme-classic/navbar.json
+++ b/website/i18n/es/docusaurus-theme-classic/navbar.json
@@ -15,6 +15,10 @@
     "message": "CLI",
     "description": "Navbar item with label CLI"
   },
+  "item.label.Pipeline": {
+    "message": "Pipeline",
+    "description": "Navbar item with label Pipeline"
+  },
   "item.label.GitHub": {
     "message": "GitHub",
     "description": "Navbar item with label GitHub"
diff --git a/website/i18n/fr/docusaurus-theme-classic/footer.json b/website/i18n/fr/docusaurus-theme-classic/footer.json
index 1ec6c8a4..5782c8d2 100644
--- a/website/i18n/fr/docusaurus-theme-classic/footer.json
+++ b/website/i18n/fr/docusaurus-theme-classic/footer.json
@@ -11,6 +11,10 @@
     "message": "Aperçu CLI",
     "description": "The label of footer link with label=CLI Overview linking to /docs/cli/usage"
   },
+  "link.item.label.Pipeline Mode": {
+    "message": "Mode Pipeline",
+    "description": "The label of footer link with label=Pipeline Mode linking to /docs/automation/pipeline-mode"
+  },
   "link.item.label.Slash Commands": {
     "message": "Commandes slash",
     "description": "The label of footer link with label=Slash Commands linking to /docs/cli/commands"
diff --git a/website/i18n/fr/docusaurus-theme-classic/navbar.json b/website/i18n/fr/docusaurus-theme-classic/navbar.json
index fc29c746..ba44e3ed 100644
--- a/website/i18n/fr/docusaurus-theme-classic/navbar.json
+++ b/website/i18n/fr/docusaurus-theme-classic/navbar.json
@@ -15,6 +15,10 @@
     "message": "CLI",
     "description": "Navbar item with label CLI"
   },
+  "item.label.Pipeline": {
+    "message": "Pipeline",
+    "description": "Navbar item with label Pipeline"
+  },
   "item.label.GitHub": {
     "message": "GitHub",
     "description": "Navbar item with label GitHub"
diff --git a/website/i18n/ja/docusaurus-theme-classic/footer.json b/website/i18n/ja/docusaurus-theme-classic/footer.json
index c4d1d35f..b5b37bbb 100644
--- a/website/i18n/ja/docusaurus-theme-classic/footer.json
+++ b/website/i18n/ja/docusaurus-theme-classic/footer.json
@@ -11,6 +11,10 @@
     "message": "CLI 概要",
     "description": "The label of footer link with label=CLI Overview linking to /docs/cli/usage"
   },
+  "link.item.label.Pipeline Mode": {
+    "message": "Pipeline モード",
+    "description": "The label of footer link with label=Pipeline Mode linking to /docs/automation/pipeline-mode"
+  },
   "link.item.label.Slash Commands": {
     "message": "スラッシュコマンド",
     "description": "The label of footer link with label=Slash Commands linking to /docs/cli/commands"
diff --git a/website/i18n/ja/docusaurus-theme-classic/navbar.json b/website/i18n/ja/docusaurus-theme-classic/navbar.json
index b5c3ea04..2fc393e8 100644
--- a/website/i18n/ja/docusaurus-theme-classic/navbar.json
+++ b/website/i18n/ja/docusaurus-theme-classic/navbar.json
@@ -15,6 +15,10 @@
     "message": "CLI",
     "description": "Navbar item with label CLI"
   },
+  "item.label.Pipeline": {
+    "message": "Pipeline",
+    "description": "Navbar item with label Pipeline"
+  },
   "item.label.GitHub": {
     "message": "GitHub",
     "description": "Navbar item with label GitHub"
diff --git a/website/i18n/pt/docusaurus-theme-classic/footer.json b/website/i18n/pt/docusaurus-theme-classic/footer.json
index 4f39ec05..e2af9390 100644
--- a/website/i18n/pt/docusaurus-theme-classic/footer.json
+++ b/website/i18n/pt/docusaurus-theme-classic/footer.json
@@ -11,6 +11,10 @@
     "message": "Visao geral do CLI",
     "description": "The label of footer link with label=CLI Overview linking to /docs/cli/usage"
   },
+  "link.item.label.Pipeline Mode": {
+    "message": "Modo pipeline",
+    "description": "The label of footer link with label=Pipeline Mode linking to /docs/automation/pipeline-mode"
+  },
   "link.item.label.Slash Commands": {
     "message": "Comandos slash",
     "description": "The label of footer link with label=Slash Commands linking to /docs/cli/commands"
diff --git a/website/i18n/pt/docusaurus-theme-classic/navbar.json b/website/i18n/pt/docusaurus-theme-classic/navbar.json
index 098fb5cc..b9a4b5ed 100644
--- a/website/i18n/pt/docusaurus-theme-classic/navbar.json
+++ b/website/i18n/pt/docusaurus-theme-classic/navbar.json
@@ -15,6 +15,10 @@
     "message": "CLI",
     "description": "Navbar item with label CLI"
   },
+  "item.label.Pipeline": {
+    "message": "Pipeline",
+    "description": "Navbar item with label Pipeline"
+  },
   "item.label.GitHub": {
     "message": "GitHub",
     "description": "Navbar item with label GitHub"
diff --git a/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json b/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json
index 900ef5ea..828afa27 100644
--- a/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json
+++ b/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json
@@ -11,6 +11,10 @@
     "message": "CLI 概览",
     "description": "The label of footer link with label=CLI Overview linking to /docs/cli/usage"
   },
+  "link.item.label.Pipeline Mode": {
+    "message": "Pipeline 模式",
+    "description": "The label of footer link with label=Pipeline Mode linking to /docs/automation/pipeline-mode"
+  },
   "link.item.label.Slash Commands": {
     "message": "Slash 命令",
     "description": "The label of footer link with label=Slash Commands linking to /docs/cli/commands"
diff --git a/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json b/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json
index 6713df9b..1d24647c 100644
--- a/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json
+++ b/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json
@@ -15,6 +15,10 @@
     "message": "CLI",
     "description": "Navbar item with label CLI"
   },
+  "item.label.Pipeline": {
+    "message": "Pipeline",
+    "description": "Navbar item with label Pipeline"
+  },
   "item.label.GitHub": {
     "message": "GitHub",
     "description": "Navbar item with label GitHub"
diff --git a/website/src/clientModules/docsNavigation.test.cjs b/website/src/clientModules/docsNavigation.test.cjs
new file mode 100644
index 00000000..792c342f
--- /dev/null
+++ b/website/src/clientModules/docsNavigation.test.cjs
@@ -0,0 +1,42 @@
+const assert = require('node:assert/strict');
+const fs = require('node:fs');
+const path = require('node:path');
+const test = require('node:test');
+
+const websiteRoot = path.resolve(__dirname, '../..');
+const pipelineDocPath = '/docs/automation/pipeline-mode';
+
+// Read a website file as UTF-8 text; `segments` are joined onto the website root.
+const readWebsiteFile = (...segments) =>
+  fs.readFileSync(path.join(websiteRoot, ...segments), 'utf8');
+
+// Parse a classic-theme translation JSON file (navbar.json, footer.json) for `locale`.
+const readLocaleJson = (locale, fileName) =>
+  JSON.parse(readWebsiteFile('i18n', locale, 'docusaurus-theme-classic', fileName));
+
+test('global navigation exposes Pipeline documentation directly', () => {
+  // Both labels must be present, with exactly two links to the pipeline doc.
+  const configSource = readWebsiteFile('docusaurus.config.ts');
+  assert.match(configSource, /label:\s*'Pipeline'/);
+  assert.match(configSource, /label:\s*'Pipeline Mode'/);
+  assert.equal([...configSource.matchAll(new RegExp(`to:\\s*'${pipelineDocPath}'`, 'g'))].length, 2);
+});
+
+test('localized navbar and footer include Pipeline documentation labels', () => {
+  // locale -> [expected navbar label, expected footer label]
+  const expectedLabels = new Map([
+    ['zh-Hans', ['Pipeline', 'Pipeline 模式']],
+    ['ja', ['Pipeline', 'Pipeline モード']],
+    ['fr', ['Pipeline', 'Mode Pipeline']],
+    ['de', ['Pipeline', 'Pipeline-Modus']],
+    ['es', ['Pipeline', 'Modo Pipeline']],
+    ['pt', ['Pipeline', 'Modo pipeline']],
+  ]);
+
+  expectedLabels.forEach(([navbarLabel, footerLabel], locale) => {
+    const navbarEntry = readLocaleJson(locale, 'navbar.json')['item.label.Pipeline'];
+    const footerEntry = readLocaleJson(locale, 'footer.json')['link.item.label.Pipeline Mode'];
+    assert.equal(navbarEntry?.message, navbarLabel);
+    assert.equal(footerEntry?.message, footerLabel);
+  });
+});